In [1]:
import os
import pandas as pd

# Get the project directory path.
# NOTE(review): this is the kernel's current working directory, so the
# 'Data' paths built from it further down assume the notebook is run from
# the project root — confirm.
project_dir = os.getcwd()

# Function to load data and count values in 'onset' column
def load_data_and_count_values(data_dir):
    """Count the values of the 'onset' column in every CSV file of a directory.

    Args:
        data_dir: Path of the directory to scan (not recursively) for files
            whose name ends with '.csv'.

    Returns:
        dict mapping each CSV file's base name to the ``value_counts()``
        Series of its 'onset' column. Files that have no 'onset' column are
        left out. Entries are inserted in sorted file-name order.
    """
    onset_counts = {}
    # os.listdir returns entries in arbitrary order; sorting makes the result
    # (and anything printed from it) identical on every run and platform.
    for name in sorted(os.listdir(data_dir)):
        path = os.path.join(data_dir, name)
        # Skip non-CSV entries, and directories whose name merely ends in '.csv'.
        if not name.endswith('.csv') or not os.path.isfile(path):
            continue
        # Process one file at a time so only a single DataFrame is alive at once;
        # only the small value_counts() result is kept.
        df = pd.read_csv(path)
        if 'onset' in df.columns:
            onset_counts[name] = df['onset'].value_counts()
    return onset_counts

# Both splits live in sibling folders under <project_dir>/Data
train_data_dir, test_data_dir = (
    os.path.join(project_dir, 'Data', split_folder)
    for split_folder in ('train_data', 'test_data')
)

# Per-file 'onset' value counts for the training and the test split
train_onset_counts = load_data_and_count_values(train_data_dir)
test_onset_counts = load_data_and_count_values(test_data_dir)

In [2]:
# Print the per-file training counts and accumulate the class totals
sum_train_0 = 0
sum_train_1 = 0
# The test totals are reset here as well because the test-data cell adds to them.
sum_test_0 = 0
sum_test_1 = 0
print("Training Data Onset Counts:")
for file, counts in train_onset_counts.items():
    print(f"{file}:")
    print(counts)
    # value_counts() omits values that never occur, so a file containing only
    # one class would make counts[0] / counts[1] raise KeyError; default to 0.
    sum_train_0 += counts.get(0, 0)
    sum_train_1 += counts.get(1, 0)
    print()

Training Data Onset Counts:
Haslebuskane_angry_start_end_spect_target.csv:
onset
0    17129
1      532
Name: count, dtype: int64

Haslebuskane_happy_start_end_spect_target.csv:
onset
0    17358
1      539
Name: count, dtype: int64

Haslebuskane_original_start_end_spect_target.csv:
onset
0    18421
1      539
Name: count, dtype: int64

Haslebuskane_sad_start_end_spect_target.csv:
onset
0    20317
1      545
Name: count, dtype: int64

Haslebuskane_tender_start_end_spect_target.csv:
onset
0    18965
1      541
Name: count, dtype: int64

Havbrusen_angry_start_end_spect_target.csv:
onset
0    33525
1      747
Name: count, dtype: int64

Havbrusen_happy_start_end_spect_target.csv:
onset
0    33147
1      744
Name: count, dtype: int64

Havbrusen_original_start_end_spect_target.csv:
onset
0    35498
1      749
Name: count, dtype: int64

Havbrusen_sad_start_end_spect_target.csv:
onset
0    39111
1      769
Name: count, dtype: int64

Havbrusen_tender_start_end_spect_target.csv:
onset
0    37591
1

In [3]:
# Reset the test totals in this cell so that re-running it does not
# double-count the files.
sum_test_0 = 0
sum_test_1 = 0
print("Test Data Onset Counts:")
for file, counts in test_onset_counts.items():
    print(f"{file}:")
    print(counts)
    # value_counts() omits values that never occur, so a file containing only
    # one class would make counts[0] / counts[1] raise KeyError; default to 0.
    sum_test_0 += counts.get(0, 0)
    sum_test_1 += counts.get(1, 0)
    print()

Test Data Onset Counts:
Silkjegulen_angry_start_end_spect_target.csv:
onset
0    21626
1      539
Name: count, dtype: int64

Silkjegulen_happy_start_end_spect_target.csv:
onset
0    21492
1      536
Name: count, dtype: int64

Silkjegulen_original_start_end_spect_target.csv:
onset
0    23142
1      539
Name: count, dtype: int64

Silkjegulen_sad_start_end_spect_target.csv:
onset
0    24352
1      546
Name: count, dtype: int64

Silkjegulen_tender_start_end_spect_target.csv:
onset
0    23195
1      545
Name: count, dtype: int64

Valdresspringar_angry_start_end_spect_target.csv:
onset
0    15000
1      332
Name: count, dtype: int64

Valdresspringar_happy_start_end_spect_target.csv:
onset
0    15163
1      341
Name: count, dtype: int64

Valdresspringar_original_start_end_spect_target.csv:
onset
0    14840
1      320
Name: count, dtype: int64

Valdresspringar_sad_start_end_spect_target.csv:
onset
0    16212
1      326
Name: count, dtype: int64

Valdresspringar_tender_start_end_spect_target.cs

In [5]:
# Report the class totals accumulated over all training and test files.
# The values are interpolated directly; the original f-strings had no
# placeholders, so the f prefix did nothing.
print(f"Training Data Total Not Onset Counts: {sum_train_0}")
print(f"Training Data Total Onset Counts: {sum_train_1}")
print(f"Test Data Total Not Onset Counts: {sum_test_0}")
print(f"Test Data Total Onset Counts: {sum_test_1}")


Training Data Total Not Onset Counts: 538539
Training Data Total Onset Counts: 11897
Test Data Total Not Onset Counts: 324293
Test Data Total Onset Counts: 6732
