# 📁 03_create_csv_from_segments.ipynb

# 🎯 Step 3: Create Initial CSV File for Manual Labeling

"""
This notebook creates a CSV file listing all filtered audio segments,
preparing them for manual labeling.
Labels are left empty for the user to fill manually.
"""

In [None]:
# 📂 Mount Google Drive
# Mounts the user's Drive at /content/drive so that the
# /content/drive/MyDrive/... paths used later in this notebook resolve.
# NOTE(review): google.colab is presumably only importable inside a Colab
# runtime — confirm before running this notebook elsewhere.
from google.colab import drive
drive.mount('/content/drive')

In [None]:
# 📦 Libraries
import os
import pandas as pd

In [None]:
# 📂 Path to cleaned segments
# Folder on the mounted Drive that is scanned for .wav files when the
# labeling CSV is built; adjust it if the segments live elsewhere.
segments_folder = "/content/drive/MyDrive/audio_segments" 

In [None]:
# 📝 Create CSV with filenames (label column left empty)
# Collect every entry of segments_folder whose name ends in ".wav"
# (the match is case-sensitive, so e.g. "clip.WAV" is skipped).
# os.listdir() returns names in arbitrary order, so they are sorted to keep
# the CSV row order reproducible between runs and easy to follow while labeling.
filtered_files = sorted(
    filename
    for filename in os.listdir(segments_folder)
    if filename.endswith(".wav")
)

initial_df = pd.DataFrame({
    "filename": filtered_files,
    "label": [""] * len(filtered_files),  # ⚡ Leave labels empty for manual labeling
})

# 💬 Important: After generating this CSV, manually listen to each file and fill in the correct label.
# Example: 0 for Neutral, 1 for Happy, 2 for Sad, 3 for Angry

# 💾 Save CSV
# NOTE: the target path is fixed, so re-running this cell overwrites
# initial_labels.csv — including any labels that were already filled in.
initial_df.to_csv("/content/drive/MyDrive/initial_labels.csv", index=False)

print(f"✅ initial_labels.csv created with {len(initial_df)} files. Ready for manual labeling!")