In [1]:
import os
import json

def process_receipts(input_folder, output_folder):
    """Write a trimmed copy of every receipt JSON file found in ``input_folder``.

    Each ``*.json`` file directly inside ``input_folder`` is expected to hold a
    JSON list of receipt objects. For every such file, a file with the same
    name is written to ``output_folder`` containing one record per receipt
    with exactly these keys:

    * ``merchant_name`` -- copied from the receipt, ``""`` if absent
    * ``receipt_type``  -- copied from the receipt, ``""`` if absent
    * ``total``         -- copied from the receipt, ``0.0`` if absent
    * ``date``          -- copied from the receipt's ``transaction_date``,
      ``""`` if absent
    * ``notes``         -- always ``""``
    * ``recurring``     -- always ``False``

    Files that cannot be decoded, or whose top-level value is not a list, are
    reported on stdout and skipped; no output file is written for them.
    List entries that are not JSON objects are dropped and the number dropped
    is reported.

    Args:
        input_folder: Directory to scan for ``.json`` files (not recursive).
        output_folder: Directory to write cleaned files into; created if it
            does not exist.

    Returns:
        None.
    """
    # exist_ok=True replaces the exists()/makedirs() pair, which could fail if
    # the folder appeared between the check and the creation.
    os.makedirs(output_folder, exist_ok=True)

    # Sorted so files are processed (and messages printed) in a stable order;
    # os.listdir() order is arbitrary.
    for filename in sorted(os.listdir(input_folder)):
        if not filename.endswith(".json"):
            continue

        input_path = os.path.join(input_folder, filename)
        output_path = os.path.join(output_folder, filename)

        # Read and close the input before touching the output file.
        try:
            with open(input_path, "r", encoding="utf-8") as file:
                data = json.load(file)
        except (json.JSONDecodeError, UnicodeDecodeError):
            # Invalid UTF-8 surfaces as UnicodeDecodeError rather than
            # JSONDecodeError; treat both as "this file is unreadable".
            print(f"Error decoding JSON in file: {filename}")
            continue

        if not isinstance(data, list):
            print(
                f"Skipping {filename}: expected a JSON list of receipts, "
                f"got {type(data).__name__}"
            )
            continue

        cleaned_data = []
        skipped_entries = 0
        for receipt in data:
            # Only JSON objects have .get(); anything else (string, number,
            # null, nested list) would otherwise abort the whole batch.
            if not isinstance(receipt, dict):
                skipped_entries += 1
                continue
            cleaned_data.append(
                {
                    "merchant_name": receipt.get("merchant_name", ""),
                    "receipt_type": receipt.get("receipt_type", ""),
                    "total": receipt.get("total", 0.0),
                    "date": receipt.get("transaction_date", ""),
                    "notes": "",
                    "recurring": False,
                }
            )

        if skipped_entries:
            print(f"Skipped {skipped_entries} non-object entries in file: {filename}")

        # Save cleaned data
        with open(output_path, "w", encoding="utf-8") as out_file:
            json.dump(cleaned_data, out_file, indent=4)

if __name__ == "__main__":
    # Relative folder names: both are resolved against the current working
    # directory of the kernel/process running this cell.
    input_folder = "processed_json_images"
    output_folder = "cleaned_json_images"
    process_receipts(input_folder, output_folder)
    # Build the message from output_folder so it cannot drift from the real
    # destination if the folder name above is changed.
    print(f"Processing complete. Cleaned JSON files are saved in '{output_folder}'.")

Processing complete. Cleaned JSON files are saved in 'cleaned_json_images'.
