In [1]:
import argparse
import pyreadr
import pandas as pd
from pathlib import Path

In [2]:
def convert_rdata_to_csv(input_path, output_dir):
    """
    Convert all data frames in an RData file to CSV format

    Every object returned by ``pyreadr.read_r`` that is a pandas DataFrame is
    written to ``<output_dir>/<object name>.csv`` without the index column.
    Objects whose name is empty or ``None`` are written as ``unnamed.csv``.
    Anything that is not a DataFrame is reported and skipped.

    Args:
        input_path (str): Path to input .RData file
        output_dir (str): Directory to save CSV files (created, including
            parents, if it does not exist)

    Returns:
        list[Path]: Paths of the CSV files that were written, in the order
        the objects were returned by the reader. Empty if nothing was saved.

    Note:
        Existing CSV files with the same name are overwritten.
    """
    # Read RData file; the result maps object names to loaded objects
    result = pyreadr.read_r(input_path)

    # Create output directory
    output_path = Path(output_dir)
    output_path.mkdir(parents=True, exist_ok=True)

    # Convert each object to CSV, remembering what was actually written
    written_paths = []
    for obj_name, data in result.items():
        # Use one fallback label for both the file name and the log messages
        # so an unnamed object is reported the same way it is stored.
        label = obj_name if obj_name else 'unnamed'
        if isinstance(data, pd.DataFrame):
            csv_path = output_path / f"{label}.csv"
            data.to_csv(csv_path, index=False)
            print(f"✅ Saved {len(data):,} rows to {csv_path}")
            written_paths.append(csv_path)
        else:
            print(f"⚠️  Skipped non-dataframe object: {label} ({type(data).__name__})")

    return written_paths

In [3]:
if __name__ == "__main__":
    # Conversion settings: adjust these two paths for your own data.
    # The CSV files are written into the output directory, one per data frame
    # found in the input file.
    output_directory = "data/"
    input_rdata = "data/TEP_Faulty_Testing.RData"

    # Run the RData -> CSV conversion with the settings above
    convert_rdata_to_csv(
        input_path=input_rdata,
        output_dir=output_directory,
    )

✅ Saved 9,600,000 rows to data/faulty_testing.csv
