In [4]:
import os
import csv
import json
from Bio import ExPASy
from Bio import SwissProt


In [5]:
# Define protein A as MAPLC3B
protein_A_uniprot = "Q9GZQ8"  # UniProt accession of MAPLC3B
protein_A_id = "A"  # chain id used for protein A in the generated JSON

# Output folder (created if missing; an existing folder is reused as-is)
folder_name = "MAPLC3B_protein_pairs"
os.makedirs(folder_name, exist_ok=True)

# Input CSV; the UniProt accessions are taken from its second column (index 1)
csv_file = "SL18_Live_pq_153 modified.csv"  # your actual CSV file name

# First, get MAPLC3B sequence
try:
    handle_A = ExPASy.get_sprot_raw(protein_A_uniprot)
    try:
        record_A = SwissProt.read(handle_A)
    finally:
        # Release the network handle whether or not parsing succeeded
        handle_A.close()
    seq_A = record_A.sequence
    entry_name_A = record_A.entry_name
    print(f"Successfully retrieved MAPLC3B sequence: {entry_name_A}")
except Exception as e:
    print(f"Failed to retrieve MAPLC3B sequence: {e}")
    # Nothing below can run without chain A. Raise SystemExit directly instead
    # of calling the interactive `exit` helper, which is not meant for use in
    # programs and is not a dependable way to stop a notebook cell.
    raise SystemExit(1)

# Process each protein target (chainB).
# For every data row of the CSV, fetch the Swiss-Prot record for the accession
# in the second column and write one JSON input file (dialect "alphafold3")
# pairing chain A with that protein as chain B.
with open(csv_file, "r", encoding="utf-8-sig") as file:
    reader = csv.reader(file)
    next(reader, None)  # Skip header line; the default avoids StopIteration on an empty file

    seen_ids = set()  # accessions already handled, so repeats are not downloaded again

    for row in reader:
        # Blank or one-column rows have no second field; skip them rather than
        # letting an IndexError abort the whole run.
        if len(row) < 2:
            continue

        chainB_id = row[1].strip()  # assumes the UniProt ID is in the second column
        if not chainB_id or chainB_id in seen_ids:
            continue
        seen_ids.add(chainB_id)

        try:
            # Fetch protein sequence for chainB
            handle_B = ExPASy.get_sprot_raw(chainB_id)
            try:
                record_B = SwissProt.read(handle_B)
            finally:
                # Release the network handle whether or not parsing succeeded
                handle_B.close()
            seq_B = record_B.sequence
            entry_name_B = record_B.entry_name

            # Build JSON structure for protein-protein interaction
            json_data = {
                "name": f"MAPLC3B_{entry_name_B}",
                "sequences": [
                    {
                        "protein": {
                            "id": protein_A_id,
                            "sequence": seq_A
                        }
                    },
                    {
                        "protein": {
                            "id": "B",
                            "sequence": seq_B
                        }
                    }
                ],
                "modelSeeds": [1],
                "dialect": "alphafold3",
                "version": 1
            }

            # Save JSON file (named after the Swiss-Prot entry name of chain B)
            output_filename = f"pair_MAPLC3B_{entry_name_B}.json"
            output_path = os.path.join(folder_name, output_filename)

            with open(output_path, "w") as json_file:
                json.dump(json_data, json_file, indent=2)

            print(f"Wrote: {output_path}")

        except Exception as e:
            # Best effort: report the failing accession and continue with the next row
            print(f"Failed to process {chainB_id}: {e}")

# Build the batch-submission list: one JSON file name per line, sorted so the
# ordering is the same on every run.
list_file_path = f"{folder_name}_list.txt"
json_files = sorted(
    entry for entry in os.listdir(folder_name) if entry.endswith('.json')
)

with open(list_file_path, 'w') as list_file:
    list_file.writelines(f"{name}\n" for name in json_files)

# Summary for the user, including the array size needed by the batch script
total_json = len(json_files)
print(f"Processing complete. Files saved in '{folder_name}' folder.")
print(f"Created file list: {list_file_path}")
print(f"Total JSON files: {total_json}")
print(f"Remember to update the job array size in your batch script to [1-{total_json}]")

Successfully retrieved MAPLC3B sequence: MLP3B_HUMAN
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_EPIPL_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PLEC_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_EF1G_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ICAL_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_OTUL_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_CH033_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_XPO2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_NEK7_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_MAP1B_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_COPB2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SRRM2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RED_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_DDX1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SPF45_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PTPRD_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_MYO1E_HUMAN.json
Wrote: MAPLC

Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_FUS_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_DDX17_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SC24C_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RAB7A_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SMG1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_GOGB1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_USP9X_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_LMNA_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ERBIN_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_WBP11_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_KANK2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PUF60_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_CPSF7_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TOM34_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_GSTP1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TR150_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_BCLF1_HUMAN.json
W

Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RACK1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_CAPZB_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TTL12_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TB182_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_G3BP1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_THUM3_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ANM3_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PRDX6_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_EI2BA_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PEPL_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_JIP4_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TCTP_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_YTHD2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_HNRH3_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_HNRH1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_EF1A1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SAFB2_HUMAN.json
W

Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_DEGS1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_KS6A6_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_GBF1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_FHL2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_FND3B_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_GOGA3_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_GSTO1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PIN1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_HNRL2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_FYCO1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SYIC_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_UBP7_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RIGI_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TRI16_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_GCN1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_DDX21_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_GPX4_HUMAN.json
Wrote

Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ADDA_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_GPN1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SKI8_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_DNJC8_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TCP4_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PIGU_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_NONO_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_EIF1B_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RAB1A_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RAB1B_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TB22A_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SEC13_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ILEU_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_DHB11_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_GTF2I_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_AAPK1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PRP16_HUMAN.json
Wrot

Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PKP2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_WIPI2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PA24A_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_MCP_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_CP51A_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_CDC5L_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SPT6H_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_NFX1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PRDX5_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_CRIP2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PCBP2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PCBP2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SRA1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_IDHC_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TPD52_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_IF2A_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_BAG3_HUMAN.json
Wrote

Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PCY1A_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_CKAP5_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RAN_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_EXOC3_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_GBP3_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_GBP1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TNPO1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_XPO7_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SEPT7_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ABCF2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RAB8B_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SON_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_EF1B_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_DDI2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ARFG2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_H0Y8G4_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PYR1_HUMAN.json
Wrote:

Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_LSM2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PRS8_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_AKA12_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SPAS2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_VATB2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_AP3B1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_AHSA1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ROBO1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TRIPB_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SMC4_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_NACAM_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RS6_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_NOLC1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PSB2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SYLC_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ZN622_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_STAT1_HUMAN.json
Wrot

Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_LAMP1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SRSF9_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_T22D1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_S38A2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_LYRIC_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TMF1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ATRN1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_REEP3_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_KAT3_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_EHD2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PKN2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_TBC13_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RAB6A_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ITA5_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_KINH_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_DDX6_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_CSN3_HUMAN.json
Wrote

Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_MD2L1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ZDH21_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_AKAP1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_MAP2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_BABA2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RL11_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_ACKR3_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_MCM6_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_VIP2_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_MCMBP_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_DPH6_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_SRP09_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PDLI1_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_OBRG_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_PUR9_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_NUCKS_HUMAN.json
Wrote: MAPLC3B_protein_pairs/pair_MAPLC3B_RAB35_HUMAN.json
Wrot