In [5]:
import os
import pandas as pd

In [2]:
def concatenate_csv_files(input_folder, output_file):
    # Get a list of all CSV files in the input folder
    csv_files = [file for file in os.listdir(input_folder) if file.endswith('.csv')]

    # Check if there are any CSV files
    if not csv_files:
        print("No CSV files found in the input folder.")
        return

    # Read the first CSV file to get the column names
    first_csv = pd.read_csv(os.path.join(input_folder, csv_files[0]))
    columns = list(first_csv.columns)

    # Create an empty DataFrame to store the concatenated data
    result_df = pd.DataFrame(columns=columns)

    # Concatenate all CSV files
    for csv_file in csv_files:
        current_csv = pd.read_csv(os.path.join(input_folder, csv_file))
        result_df = pd.concat([result_df, current_csv], ignore_index=True)

    # Write the concatenated data to the output CSV file
    result_df.to_csv(output_file, index=False)
    print(f"Concatenation completed. Result saved to {output_file}")

In [3]:
# Get the current directory (should be 'csvConcat')
current_dir = os.getcwd()

# Get the parent directory
parent_dir = os.path.dirname(current_dir)

# Construct the path to the 'DemoFiles/csv' folder
demo_files_dir = os.path.join(parent_dir, 'DemoFiles', 'csv')

print(demo_files_dir)

D:\000 PICT Projects\BE project\GEPCS\DemoFiles\csv


In [4]:
output_file = 'output.csv'
concatenate_csv_files(demo_files_dir, output_file)

  result_df = pd.concat([result_df, current_csv], ignore_index=True)


Concatenation completed. Result saved to output.csv


In [6]:
# New Modified code

def concatenate_csv_files(input_folder, output_file):
    # Get a list of all CSV files in the input folder
    csv_files = [file for file in os.listdir(input_folder) if file.endswith('.csv')]

    # Check if there are any CSV files
    if not csv_files:
        print("No CSV files found in the input folder.")
        return

    # Read the first CSV file to get the column names
    first_csv = pd.read_csv(os.path.join(input_folder, csv_files[0]))
    columns = list(first_csv.columns)

    # Create an empty DataFrame to store the concatenated data
    result_df = pd.DataFrame(columns=columns)

    # Concatenate all CSV files
    for csv_file in csv_files:
        current_csv = pd.read_csv(os.path.join(input_folder, csv_file))
        result_df = pd.concat([result_df, current_csv], ignore_index=True)

    # Remove rows with missing data
    result_df = result_df.dropna()

    # Write the concatenated data to the output CSV file
    result_df.to_csv(output_file, index=False)
    print(f"Concatenation completed. Result saved to {output_file}")

# Get the current directory (should be 'csvConcat')
current_dir = os.getcwd()

# Get the parent directory
parent_dir = os.path.dirname(current_dir)

# Construct the path to the 'DemoFiles/csv' folder
demo_files_dir = os.path.join(parent_dir, 'DemoFiles', 'csv')

print(demo_files_dir)

output_file = 'output.csv'
concatenate_csv_files(demo_files_dir, output_file)

D:\000 PICT Projects\BE project\GEPCS\DemoFiles\csv


  result_df = pd.concat([result_df, current_csv], ignore_index=True)


Concatenation completed. Result saved to output.csv


In [9]:
# Modified 2

def concatenate_csv_files(input_folder, output_file):
    # Get a list of all CSV files in the input folder
    csv_files = [file for file in os.listdir(input_folder) if file.endswith('.csv')]

    # Check if there are any CSV files
    if not csv_files:
        print("No CSV files found in the input folder.")
        return

    # Read the first CSV file to get the column names and dtypes
    first_csv = pd.read_csv(os.path.join(input_folder, csv_files[0]))
    columns = list(first_csv.columns)
    dtypes = first_csv.dtypes

    # Create an empty DataFrame with the same column names and dtypes
    result_df = pd.DataFrame(columns=columns).astype(dtypes)

    # Concatenate all CSV files
    for csv_file in csv_files:
        current_csv = pd.read_csv(os.path.join(input_folder, csv_file))
        result_df = pd.concat([result_df, current_csv], ignore_index=True)

    # Remove rows with missing data
    result_df = result_df.dropna()

    # Write the concatenated data to the output CSV file
    result_df.to_csv(output_file, index=False)
    print(f"Concatenation completed. Result saved to {output_file}")

# Get the current directory (should be 'csvConcat')
current_dir = os.getcwd()

# Get the parent directory
parent_dir = os.path.dirname(current_dir)

# Construct the path to the 'DemoFiles/csv' folder
demo_files_dir = os.path.join(parent_dir, 'DemoFiles', 'csv')

print(demo_files_dir)

output_file = 'output.csv'
concatenate_csv_files(demo_files_dir, output_file)


D:\000 PICT Projects\BE project\GEPCS\DemoFiles\csv
Concatenation completed. Result saved to output.csv


In [10]:
# modified 3 WORKING

def concatenate_csv_files(input_folder, output_file):
    # Get a list of all CSV files in the input folder
    csv_files = [file for file in os.listdir(input_folder) if file.endswith('.csv')]

    # Check if there are any CSV files
    if not csv_files:
        print("No CSV files found in the input folder.")
        return

    # Read the first CSV file to get the column names and dtypes
    first_csv = pd.read_csv(os.path.join(input_folder, csv_files[0]))
    columns = list(first_csv.columns)
    dtypes = first_csv.dtypes

    # Create an empty DataFrame with the same column names and dtypes
    result_df = pd.DataFrame(columns=columns).astype(dtypes)

    # Concatenate all CSV files
    for csv_file in csv_files:
        current_csv = pd.read_csv(os.path.join(input_folder, csv_file))
        result_df = pd.concat([result_df, current_csv], ignore_index=True)

    # Remove rows with all values empty (horizontal empty rows)
    result_df = result_df.dropna(how='all')

    # Write the concatenated data to the output CSV file
    result_df.to_csv(output_file, index=False)
    print(f"Concatenation completed. Result saved to {output_file}")

# Get the current directory (should be 'csvConcat')
current_dir = os.getcwd()

# Get the parent directory
parent_dir = os.path.dirname(current_dir)

# Construct the path to the 'DemoFiles/csv' folder
demo_files_dir = os.path.join(parent_dir, 'DemoFiles', 'csv')

print(demo_files_dir)

output_file = 'output.csv'
concatenate_csv_files(demo_files_dir, output_file)


D:\000 PICT Projects\BE project\GEPCS\DemoFiles\csv
Concatenation completed. Result saved to output.csv


In [11]:
# works with concatinating

In [13]:
# modified 4 for deleting csv files and placing output.csv file there

import os
import pandas as pd

def concatenate_csv_files(input_folder, output_file):
    # Get a list of all CSV files in the input folder
    csv_files = [file for file in os.listdir(input_folder) if file.endswith('.csv')]

    # Check if there are any CSV files
    if not csv_files:
        print("No CSV files found in the input folder.")
        return

    # Read the first CSV file to get the column names and dtypes
    first_csv = pd.read_csv(os.path.join(input_folder, csv_files[0]))
    columns = list(first_csv.columns)
    dtypes = first_csv.dtypes

    # Create an empty DataFrame with the same column names and dtypes
    result_df = pd.DataFrame(columns=columns).astype(dtypes)

    # Concatenate all CSV files
    for csv_file in csv_files:
        current_csv = pd.read_csv(os.path.join(input_folder, csv_file))
        result_df = pd.concat([result_df, current_csv], ignore_index=True)

    # Remove rows with all values empty (horizontal empty rows)
    result_df = result_df.dropna(how='all')

    # Write the concatenated data to the output CSV file
    result_df.to_csv(output_file, index=False)
    print(f"Concatenation completed. Result saved to {output_file}")

    # Remove the original CSV files
    for csv_file in csv_files:
        os.remove(os.path.join(input_folder, csv_file))
        print(f"Deleted: {csv_file}")

    # Move the output CSV file to the input folder
    output_path = os.path.join(input_folder, output_file)
    os.replace(output_file, output_path)
    print(f"Moved {output_file} to {input_folder}")

# Get the current directory (should be 'csvConcat')
current_dir = os.getcwd()

# Get the parent directory
parent_dir = os.path.dirname(current_dir)

# Construct the path to the 'DemoFiles/csv' folder
demo_files_dir = os.path.join(parent_dir, 'DemoFiles', 'csv')

print(demo_files_dir)

output_file = 'output.csv'
concatenate_csv_files(demo_files_dir, output_file)

D:\000 PICT Projects\BE project\GEPCS\DemoFiles\csv
Concatenation completed. Result saved to output.csv
Deleted: test-367845.csv
Deleted: test-418137.csv
Deleted: test-537092.csv
Deleted: test-818971.csv
Deleted: test-998161.csv
Moved output.csv to D:\000 PICT Projects\BE project\GEPCS\DemoFiles\csv
