# Analyze the data

# In [3]:
import os
import numpy as np
import pandas as pd

def read_and_analyze_data(directory='bin_data', output_csv='dataset_statistics.csv'):
    """Summarize every raw float32 file in a directory and save the table as CSV.

    Each regular file directly inside ``directory`` is loaded with
    ``np.fromfile(..., dtype=np.float32)`` and reduced to its peak-to-peak
    range, standard deviation and on-disk size.

    Parameters
    ----------
    directory : str
        Directory whose files are analyzed (sub-directories are skipped).
    output_csv : str or None
        Path the statistics table is written to. Pass ``None`` to skip
        writing the CSV.

    Returns
    -------
    pandas.DataFrame
        One row per file, sorted by file name, with the columns
        'Dataset Name', 'Range', 'Standard Deviation', 'File Size (bytes)'.
        Files that contain no complete float32 value get NaN statistics.

    Raises
    ------
    OSError
        If ``directory`` cannot be listed (e.g. it does not exist).
    """
    columns = ['Dataset Name', 'Range', 'Standard Deviation', 'File Size (bytes)']

    # os.listdir returns entries in arbitrary order; sort so the rows (and the
    # CSV) are reproducible from run to run.
    files = sorted(
        f for f in os.listdir(directory)
        if os.path.isfile(os.path.join(directory, f))
    )

    results = []
    for file in files:
        file_path = os.path.join(directory, file)

        # Interpret the file as a flat sequence of float32 values.
        data = np.fromfile(file_path, dtype=np.float32)

        if data.size:
            data_range = np.ptp(data)  # Peak to peak (max - min) range
            data_std = np.std(data)    # Standard deviation
        else:
            # np.ptp raises ValueError on an empty array; record NaN instead
            # of letting a single empty file abort the whole analysis.
            data_range = data_std = np.nan

        results.append({
            'Dataset Name': file,
            'Range': data_range,
            'Standard Deviation': data_std,
            'File Size (bytes)': os.path.getsize(file_path),
        })

    # Passing the columns explicitly keeps the header present even when the
    # directory contains no files.
    results_df = pd.DataFrame(results, columns=columns)

    if output_csv is not None:
        results_df.to_csv(output_csv, index=False)

    return results_df

# Run the analysis on the default 'bin_data' directory and keep the summary table
data_statistics = read_and_analyze_data(directory='bin_data')
