In [10]:
import os

def create_folders(base_folder, last_name, fasta_file="sequences.fna"):
    """
    Create the folder structure for the assignment.

    The function is safe to re-run: directories that already exist are kept,
    and files that already exist are left untouched (missing ones are created
    empty), so earlier work is never wiped.

    Parameters:
    - base_folder: The root directory where the structure will be created.
    - last_name: The last name to be included in folder and report names.
    - fasta_file: Name of the FASTA file to create, resolved relative to the
      ``data`` directory of the assignment. An empty value falls back to
      ``"sequences.fna"``.

    Returns:
    - None. The location of the created structure is printed.
    """
    # Define the base directory
    root_dir = os.path.join(base_folder, f"assignment_1_{last_name}")

    # Define main directories
    subdirs = [
        "data/folded_proteins",
        "bin",
        "results/sequence_properties",
        "results/alignments",
        "results/phylogenetic_tree",
        "results/functional_prediction",
        "results/organism_origin",
        "results/predicted_structures",
        "results/structural_homology",
        "results/pair_homology/pair_comparisons",
        "docs",
    ]

    # Create directories
    for subdir in subdirs:
        os.makedirs(os.path.join(root_dir, subdir), exist_ok=True)

    # Honour the caller-supplied FASTA name instead of a hard-coded one.
    fasta_path = os.path.join(root_dir, "data", fasta_file or "sequences.fna")
    # fasta_file may contain its own sub-directory; make sure it exists.
    os.makedirs(os.path.dirname(fasta_path), exist_ok=True)

    # Placeholder files: readme, sequence data, pipeline notebooks, reports
    placeholder_files = [
        os.path.join(root_dir, "readme.md"),
        fasta_path,
        os.path.join(root_dir, "bin", "sequence_analysis_pipeline.ipynb"),
        os.path.join(root_dir, "bin", "structure_analysis_pipeline.ipynb"),
        os.path.join(root_dir, "docs", f"report_{last_name}.docx"),
        os.path.join(root_dir, "docs", f"report_{last_name}.pdf"),
    ]

    for file_path in placeholder_files:
        # Append mode creates a missing file but never truncates an existing
        # one, so re-running the setup cannot destroy content already written.
        with open(file_path, "a"):
            pass

    print(f"Folder structure created at {root_dir}")

# Usage example: build the assignment tree under the current working directory.
create_folders(base_folder=os.getcwd(), last_name="Li")  # Replace "Li" with the actual last name


Folder structure created at d:\Microsoft VS Code\assignment_1_Li
