In [9]:
import numpy as np 
import pandas as pd

In [10]:
# Function to load and analyze the data
def load_and_analyze(file):
    """Load a ``.npy`` or ``.csv`` file and print summary statistics for it.

    The loader is chosen from the file extension (compared
    case-insensitively). The loaded object is then passed to
    ``print_stats``; for a CSV only the numeric columns are kept.

    Parameters
    ----------
    file : str or os.PathLike
        Path of the file to load.

    Raises
    ------
    ValueError
        If the extension is neither ``.npy`` nor ``.csv``.

    Notes
    -----
    For CSV input all numeric columns are pooled into a single 2-D array
    before the statistics are computed, so the printed max/min/mean/std are
    global values across every numeric column, not per-column figures.
    """
    # Normalise once so pathlib.Path inputs and upper-case extensions
    # (".CSV", ".NPY") are accepted; the original object is still what gets
    # handed to the loaders and echoed in the messages.
    name = str(file).lower()

    # Check file extension and load accordingly
    if name.endswith('.npy'):
        data = np.load(file)
        print(f"Loaded .npy file: {file}")
    elif name.endswith('.csv'):
        data = pd.read_csv(file)
        print(f"Loaded .csv file: {file}")
    else:
        raise ValueError("Unsupported file format. Only .npy and .csv are supported.")

    # Handle NumPy arrays directly
    if isinstance(data, np.ndarray):
        print("This is a NumPy array")
        print_stats(data)

    # Handle pandas DataFrames (for CSVs)
    elif isinstance(data, pd.DataFrame):
        print("This is a pandas DataFrame")

        # Drop non-numeric columns so the statistics below are well defined.
        numeric_data = data.select_dtypes(include=[np.number])

        if not numeric_data.empty:
            print_stats(numeric_data.to_numpy())
        else:
            print("No numeric data found in the CSV file")
    else:
        # np.load picks its return type from the file contents, not the
        # extension, so a mis-named file can produce something that is not
        # an ndarray.
        print("Unsupported data type.")

In [11]:
# Function to print statistics
def print_stats(data):
    """Print the shape and NaN-ignoring summary statistics of an array.

    Parameters
    ----------
    data : numpy.ndarray
        Array to summarise. Only ``shape``, ``dtype`` and ``size`` are read
        before the values are reduced.

    Prints
    ------
    Always the shape. For a non-empty numeric array also the max, min, mean
    and standard deviation over all elements, each computed with the
    ``nan*`` variant so NaN entries are ignored. A non-numeric dtype or an
    empty array gets a one-line notice instead.
    """
    print("Shape:", data.shape)

    if not np.issubdtype(data.dtype, np.number):
        print("Data is not numeric.")
        return

    if data.size == 0:
        # np.nanmax / np.nanmin raise ValueError on zero-size input, so
        # report the situation instead of crashing part-way through.
        print("Data is empty; no statistics to compute.")
        return

    # nan-aware reductions: missing values are skipped, not propagated.
    print("Max:", np.nanmax(data))
    print("Min:", np.nanmin(data))
    print("Mean:", np.nanmean(data))
    print("Std:", np.nanstd(data))

In [12]:
# Summarise one CSV from the mfcc_features directory (path is relative to the
# notebook's working directory). The file name appears to encode the
# extraction settings (n_mfcc, n_fft, hop_length, n_mels, fmax) — confirm
# against whatever produced the file.
file = 'mfcc_features/mfcc_n_mfcc=40_n_fft=4096_hop_length=512_n_mels=40_fmax=4000.csv'
load_and_analyze(file)

Loaded .csv file: mfcc_features/mfcc_n_mfcc=40_n_fft=4096_hop_length=512_n_mels=40_fmax=4000.csv
This is a pandas DataFrame
Shape: (125, 125161)
Max: 233.0
Min: -368.2053527832031
Mean: -1.6456110313816315
Std: 16.50251207091385
