In [6]:
import os
import json
import pandas as pd

# Input directory holding the raw JSON archive, and the two CSV outputs
# produced by this script.
archive_dir = '../data/raw/archive'
output_prices_file = '../data/processed/all_data.csv'
output_sec_file = '../data/processed/securities.csv'

# Load securities.json and re-export it as CSV.
securities_path = os.path.join(archive_dir, 'securities.json')
# JSON is UTF-8 by specification; an explicit encoding avoids depending on
# the platform's locale default (which is not UTF-8 everywhere).
with open(securities_path, 'r', encoding='utf-8') as f:
    securities_data = json.load(f)
securities_df = pd.DataFrame(securities_data)

# Make sure the destination directory exists before writing; the guard keeps
# a bare filename (empty dirname) from being passed to makedirs.
securities_out_dir = os.path.dirname(output_sec_file)
if securities_out_dir:
    os.makedirs(securities_out_dir, exist_ok=True)
securities_df.to_csv(output_sec_file, index=False)
print(f"✅ securities.csv saved at {output_sec_file}")

# Load all other JSON files (excluding securities.json)
# Each file's top-level value is pooled into one flat list of records
# (presumably one dict per price row -- confirm against the archive format).
all_price_data = []

# sorted() makes the load order independent of the OS directory listing order.
for filename in sorted(os.listdir(archive_dir)):
    if not filename.endswith('.json') or filename == 'securities.json':
        continue

    file_path = os.path.join(archive_dir, filename)
    # JSON is UTF-8 by specification; do not rely on the locale default.
    with open(file_path, 'r', encoding='utf-8') as f:
        try:
            data = json.load(f)
        except json.JSONDecodeError as e:
            # Best effort: report the malformed file and keep going.
            print(f"⚠️ JSON decode error in {filename}: {e}")
            continue

    # list.extend() on a dict would silently add its *keys* as records, so
    # anything other than a top-level array is reported and skipped.
    if not isinstance(data, list):
        print(
            f"⚠️ Unexpected JSON structure in {filename}: "
            f"expected a list, got {type(data).__name__}"
        )
        continue

    all_price_data.extend(data)

# Create price DataFrame
prices_df = pd.DataFrame(all_price_data)

# With no loaded records (or records lacking the field) there is no 'date'
# column; fail with an explicit message instead of a bare KeyError: 'date'.
if 'date' not in prices_df.columns:
    raise KeyError(
        "No price records with a 'date' field were loaded; nothing to write"
    )

prices_df['date'] = pd.to_datetime(prices_df['date'])
# mergesort is stable, so rows sharing a date keep the order in which they
# were loaded; the default quicksort gives no such guarantee.
prices_df.sort_values('date', kind='mergesort', inplace=True)

# Make sure the destination directory exists before writing; the guard keeps
# a bare filename (empty dirname) from being passed to makedirs.
prices_out_dir = os.path.dirname(output_prices_file)
if prices_out_dir:
    os.makedirs(prices_out_dir, exist_ok=True)
prices_df.to_csv(output_prices_file, index=False)
print(f"✅ all_data.csv saved at {output_prices_file}")

✅ securities.csv saved at ../data/processed/securities.csv
✅ all_data.csv saved at ../data/processed/all_data.csv
