In [None]:
# Cell 7: rename problematic .parquet files

import os
from pathlib import Path
import glob # Import glob

# --- Define the directories where the parquet files are located ---
# Use the same source directories as in the training loop (Cell 6)
sleep_edfx_processed_dir_source = Path('/content/drive/MyDrive/sleep_edfx_processed/')
shhs1_processed_dir_source = Path('/content/drive/MyDrive/shhs1_processed/')
shhs2_processed_dir_source = Path('/content/drive/MyDrive/shhs2_processed/')

# Each entry is (directory, search_recursively). The shhs directories are
# searched through all of their subdirectories; the edfx directory is only
# checked directly. The flag is explicit so the behaviour does not depend on
# whether the path string happens to contain "shhs".
_search_roots = [
    (sleep_edfx_processed_dir_source, False),
    (shhs1_processed_dir_source, True),
    (shhs2_processed_dir_source, True),
]

# --- IMPORTANT: Replace with the actual list of problematic filenames from your logs ---
problematic_filenames = [
    "shhs2-200820.parquet",
    "shhs2-200822.parquet",
    # Add other problematic filenames here as you identify them from the logs
]

prefix = "problematic_"


def find_parquet_file(filename: str, roots):
    """Return the path of the first file called *filename* under *roots*.

    *roots* is an iterable of ``(directory, recursive)`` pairs, tried in
    order. With ``recursive`` true the directory and all of its
    subdirectories are searched; otherwise only ``directory / filename`` is
    checked. Returns a ``Path``, or ``None`` when nothing matches.
    """
    for directory, recursive in roots:
        if recursive:
            # Escape both parts so characters such as '[', '?' or '*' in a
            # directory or file name are matched literally instead of being
            # interpreted as glob wildcards.
            pattern = os.path.join(
                glob.escape(str(directory)), '**', glob.escape(filename)
            )
            # glob returns matches in arbitrary order; sort so the same file
            # is picked on every run.
            matches = sorted(glob.glob(pattern, recursive=True))
            if not matches:
                continue
            if len(matches) > 1:
                print(
                    f"Warning: {len(matches)} files named '{filename}' found under "
                    f"'{directory}'; only '{matches[0]}' will be used."
                )
            return Path(matches[0])

        candidate = directory / filename
        if candidate.exists():
            return candidate
    return None


def rename_with_prefix(path: Path, name_prefix: str) -> Path:
    """Rename *path* to ``name_prefix + path.name`` in the same directory.

    Returns the new path. Raises ``FileExistsError`` when the destination
    already exists, and propagates any other ``OSError`` from ``os.rename``.
    """
    target = path.with_name(name_prefix + path.name)
    # os.rename silently replaces an existing destination file on POSIX, so
    # refuse explicitly rather than clobber a previously renamed file.
    if target.exists():
        raise FileExistsError(f"destination '{target}' already exists")
    os.rename(path, target)
    return target


print(f"Attempting to rename {len(problematic_filenames)} problematic files...")

renamed_count = 0
for filename in problematic_filenames:
    found_path = find_parquet_file(filename, _search_roots)
    if found_path is None:
        print(f"File '{filename}' not found in the specified source directories. Skipping rename.")
        continue

    try:
        new_path = rename_with_prefix(found_path, prefix)
    except OSError as e:
        # Best effort: report the failure and carry on with the other files.
        print(f"Error renaming file '{filename}': {e}")
    else:
        renamed_count += 1
        print(f"Successfully renamed '{filename}' to '{new_path.name}'")

print(f"Renamed {renamed_count} of {len(problematic_filenames)} files.")
print("Renaming process complete.")