### CSV day output

In [1]:
import os
import json
import pandas as pd

# === CONFIGURATION ===
# Directory scanned for the CSV files to convert.
input_folder = r"D:\Desktop\SEM 7\Mini Project\csv_day_output"
# Directory that receives one JSON file per converted CSV.
output_folder = r"D:\SEM_8\Major-project\csv_day_2017_json"
# JSON file (relative to the current working directory) that lists the
# CSV file names already converted.
log_file = 'processed_files.json'

# === Columns to retain ===
# Only these columns are read from each CSV; every other column is dropped.
columns_to_keep = [
    'diffTimeStamp',
    'tokenAddress',
    'from',
    'to',
    'fromIsContract',
    'toIsContract',
]

# === Ensure output directory exists ===
# exist_ok=True makes this a no-op when the directory is already there.
os.makedirs(output_folder, exist_ok=True)

# === Load processed file log ===
# The log is a JSON array of CSV file names converted on earlier runs;
# those files are skipped below so the script can be re-run incrementally.
if os.path.exists(log_file):
    with open(log_file, 'r', encoding='utf-8') as f:
        processed_files = set(json.load(f))
else:
    processed_files = set()

# === Process each CSV file ===
# sorted() makes the processing order deterministic: os.listdir() returns
# directory entries in arbitrary order.
for file_name in sorted(os.listdir(input_folder)):
    # Guard clause: ignore non-CSV entries and files converted previously.
    if not file_name.endswith('.csv') or file_name in processed_files:
        continue

    input_path = os.path.join(input_folder, file_name)
    # Swap only the trailing extension. str.replace('.csv', '.json') would
    # rewrite every '.csv' occurring anywhere in the file name.
    output_name = os.path.splitext(file_name)[0] + '.json'
    output_path = os.path.join(output_folder, output_name)

    try:
        # Read just the retained columns and write them as JSON Lines
        # (one JSON object per row).
        df = pd.read_csv(input_path, usecols=columns_to_keep)
        df.to_json(output_path, orient='records', lines=True)
        print(f"Processed: {file_name}")
        processed_files.add(file_name)

        # Save updated log after every file so an interrupted run resumes
        # where it stopped. Writing to a temp file and renaming it over the
        # log keeps the log from being left half-written (and unparsable on
        # the next run) if the process dies mid-write.
        tmp_log_file = log_file + '.tmp'
        with open(tmp_log_file, 'w', encoding='utf-8') as f:
            # sorted() keeps the log's contents stable between runs.
            json.dump(sorted(processed_files), f, indent=2)
        os.replace(tmp_log_file, log_file)

    except Exception as e:
        # Deliberate best-effort batch: report the failure and move on to
        # the next file. The failed file is not added to the log, so it is
        # retried on the next run.
        print(f"Error processing {file_name}: {e}")


Processed: 2022--05--10.csv
Processed: 2022--05--11.csv
Processed: 2022--05--12.csv
Processed: 2022--05--13.csv
Processed: 2022--05--14.csv
Processed: 2022--05--15.csv
Processed: 2022--05--16.csv
Processed: 2022--05--17.csv
Processed: 2022--05--18.csv
Processed: 2022--05--19.csv
Processed: 2022--05--20.csv
Processed: 2022--05--21.csv
Processed: 2022--05--22.csv
Processed: 2022--05--23.csv
Processed: 2022--05--24.csv
Processed: 2022--05--25.csv
Processed: 2022--05--26.csv
Processed: 2022--05--27.csv
Processed: 2022--05--28.csv
Processed: 2022--05--29.csv
Processed: 2022--05--30.csv
Processed: 2022--05--31.csv
Processed: 2022--06--01.csv
Processed: 2022--06--02.csv
Processed: 2022--06--03.csv
Processed: 2022--06--04.csv
Processed: 2022--06--05.csv
Processed: 2022--06--06.csv
Processed: 2022--06--07.csv
Processed: 2022--06--08.csv
Processed: 2022--06--09.csv
Processed: 2022--06--10.csv
Processed: 2022--06--11.csv
Processed: 2022--06--12.csv
Processed: 2022--06--13.csv
Processed: 2022--06-