In [5]:
import os
import shutil

# Folder containing XML files (absolute path, specific to one machine)
XML_FOLDER = "/Users/macbook/Desktop/data mining project/Data mining/data"
# CSV file whose existence is checked before any XML file is deleted.
# NOTE(review): this is a relative path, so it is resolved against the
# current working directory, not XML_FOLDER — confirm that is intended.
CSV_FILE = "flights_data.csv"

def delete_xml_files(folder_path, csv_path):
    """
    Delete all XML files from the folder while keeping the CSV file.

    The function refuses to do anything unless ``csv_path`` exists. It then
    collects the regular files located directly inside ``folder_path`` whose
    name ends in ``.xml`` (any letter case; sub-folders are not searched)
    and asks the user to type ``DELETE`` on standard input before removing
    them. Files that cannot be removed are reported, not raised.

    Args:
        folder_path: Directory whose XML files should be removed.
        csv_path: Path of the CSV file that must exist before deletion is
            allowed. It is only checked for existence, never modified.

    Returns:
        None. Progress, errors and the final summary are printed.
    """
    # First, verify the CSV file exists
    if not os.path.exists(csv_path):
        print(f"WARNING: CSV file '{csv_path}' not found!")
        print("Please ensure your merged data is saved before proceeding.")
        return

    # Collect candidates. Only regular files are considered so that a
    # directory named "something.xml" is neither counted nor "deleted",
    # and the extension check is case-insensitive so "*.XML" is not missed.
    try:
        with os.scandir(folder_path) as entries:
            xml_files = [
                entry.name
                for entry in entries
                if entry.is_file() and entry.name.lower().endswith('.xml')
            ]
    except OSError as e:
        # Missing folder, not a directory, permission denied, ...
        print(f"ERROR: Cannot read folder '{folder_path}': {e}")
        return

    xml_count = len(xml_files)

    if not xml_files:
        print("No XML files found to delete.")
        return

    # Confirm deletion
    print(f"Found {xml_count} XML files in: {folder_path}")
    print(f"CSV file location: {csv_path}")
    print(f"\nThis will DELETE all {xml_count} XML files permanently.")
    print("\nType 'DELETE' (in capital letters) to confirm:")

    try:
        response = input().strip()
    except EOFError:
        # No interactive stdin available: treat as "not confirmed".
        response = ''

    print(f"You typed: '{response}'")  # Debug line to see what was typed

    if response != 'DELETE':
        print("Operation cancelled. No files were deleted.")
        print(f"Expected: 'DELETE', but got: '{response}'")
        return

    # Delete XML files
    deleted_count = 0
    errors = []

    print("\nStarting deletion...")
    for filename in xml_files:
        file_path = os.path.join(folder_path, filename)
        try:
            os.remove(file_path)
        except OSError as e:
            # Keep going: one undeletable file should not abort the batch.
            errors.append(f"{filename}: {e}")
        else:
            deleted_count += 1
            if deleted_count % 500 == 0:
                print(f"Deleted {deleted_count}/{xml_count} files...")

    # Summary
    max_errors_shown = 10
    print(f"\n✓ Successfully deleted {deleted_count} XML files")
    if errors:
        print(f"\n⚠ Errors encountered ({len(errors)} files):")
        for error in errors[:max_errors_shown]:
            print(f"  - {error}")
        if len(errors) > max_errors_shown:
            # Make it explicit that the list above is truncated.
            print(f"  ... and {len(errors) - max_errors_shown} more")

    print(f"\n✓ Your merged data is safe in: {csv_path}")

# Entry point: start the interactive clean-up only when this code is run
# directly rather than imported.
if __name__ == "__main__":
    delete_xml_files(folder_path=XML_FOLDER, csv_path=CSV_FILE)


No XML files found to delete.
