In [1]:
import pandas as pd
import numpy as np
import ampal
from dp_utils.pipeline_data import get_full_pipeline_df
from utils import useful_cols,useful_cols_non_csv,sharing_cols
import pandas

# Lift pandas' display caps so rendered frames show every row and every column.
pd.set_option("display.max_rows", None)
pd.set_option("display.max_columns", None)



In [2]:

def _selected_designs_with_pipeline_metrics(selected_csv_path, pipeline_dir):
    """Read a selected-designs CSV and left-join the full pipeline table onto it.

    Rows are matched on ``sequence_name`` and ``model_sequence``. Columns that
    exist in both tables keep the value from the selected-designs CSV: the
    pipeline copy receives the ``_whole_pipeline`` suffix and every column whose
    name contains that suffix is dropped from the result.
    """
    selected_df = pd.read_csv(selected_csv_path)
    pipeline_df = get_full_pipeline_df(pipeline_dir)
    merge_keys = ["sequence_name", "model_sequence"]
    merged_df = pd.merge(
        selected_df,
        pipeline_df,
        how="left",
        left_on=merge_keys,
        right_on=merge_keys,
        suffixes=("", "_whole_pipeline"),
    )
    duplicated_cols = [col for col in merged_df.columns if "_whole_pipeline" in col]
    return merged_df.drop(columns=duplicated_cols)


def generate_deltaprot_designs_data():
    """Build the per-well design table and pickle it.

    Steps, in order:
      1. Load the ``no_disulfide`` and ``variable_linkers`` selections, each
         enriched with the columns of its own full pipeline table.
      2. Give every design a ``name`` of the form ``<set>_<orientation_code>``.
      3. Stack both sets and left-join them onto the 96-well order sheet
         (order-sheet ``Name`` against design ``name``), so every well row is kept.
      4. Add properties of the construct with the fixed prefix prepended to
         ``model_sequence``: the prefixed sequence, its molecular weight and its
         280 nm extinction coefficient (both computed by ``ampal``), and the
         count of ``H`` characters in ``dssp_assignment`` divided by the
         prefixed sequence length.
      5. Write the result to ``deltaprot_designs_data.pkl``.

    All input and output locations are hard-coded absolute paths. Returns None.
    """
    no_disulfide_df = _selected_designs_with_pipeline_metrics(
        "/home/tadas/code/deltaproteinsBristol/selected_deltaprots/no_disulfide/no_disulfide_selected_deltaprots.csv",
        "/home/tadas/code/deltaproteinsBristol/pipeline_data/05_evaluation",
    )
    variable_linkers_df = _selected_designs_with_pipeline_metrics(
        "/home/tadas/code/deltaproteinsBristol/selected_deltaprots/variable_linkers/variable_linkers/variable_linkers_selected_deltaprots.csv",
        "/home/tadas/code/deltaproteinsBristol/pipeline_data/orientation_gap_length_optimisation_optimised",
    )

    # The order sheet identifies designs as "<set>_<orientation_code>".
    no_disulfide_df["name"] = "no_disulfide_" + no_disulfide_df["orientation_code"]
    variable_linkers_df["name"] = "variable_linkers_" + variable_linkers_df["orientation_code"]

    # Stack the two design sets, then attach them to the plate layout.
    all_designs_df = pd.concat([no_disulfide_df, variable_linkers_df], axis=0)
    well_df = pd.read_csv("/home/tadas/code/deltaproteinsBristol/order_optimised_codons_96_wp.csv")
    df = pd.merge(well_df, all_designs_df, how="left", left_on="Name", right_on="name")

    # The MGSSHHHHHHSSGENLYFQSGS addition adds some molecular weight, so the
    # sequence-derived properties are recomputed on the prefixed sequence.
    sequence_prefix = "MGSSHHHHHHSSGENLYFQSGS"
    df["model_sequence_w_prefix"] = sequence_prefix + df["model_sequence"]
    prefixed_sequences = df["model_sequence_w_prefix"]
    df["mass_w_prefix"] = prefixed_sequences.apply(ampal.analyse_protein.sequence_molecular_weight)
    df["sequence_molar_extinction_280_w_prefix"] = prefixed_sequences.apply(
        ampal.analyse_protein.sequence_molar_extinction_280
    )

    # Numerator counts 'H' in the DSSP string; denominator is the prefixed length.
    helix_residue_counts = df["dssp_assignment"].str.count("H")
    df["percent_helicity_with_prefix"] = helix_residue_counts / df["model_sequence_w_prefix"].str.len()

    df.to_pickle("/home/tadas/code/deltaproteinsBristol/deltaprot_designs_data.pkl")

def load_deltaprot_designs_data():
    """Load the design table from ``deltaprot_designs_data.pkl``.

    The path is the same hard-coded location that
    ``generate_deltaprot_designs_data`` writes to. Unpickling can execute
    arbitrary code, so this should only ever read a file produced locally.

    Returns:
        The unpickled object (the DataFrame saved by the generate step).
    """
    pickle_path = "/home/tadas/code/deltaproteinsBristol/deltaprot_designs_data.pkl"
    designs_df = pd.read_pickle(pickle_path)
    return designs_df

def calc_molar_conc(ext_coef, absorbance):
    """Convert an absorbance reading into a molar concentration.

    Uses the Beer-Lambert relation A = ext_coef * c * l with a path length of
    1, i.e. c = absorbance / ext_coef. This is the same ratio the rest of the
    notebook applies column-wise (A280 divided by the extinction coefficient).

    Args:
        ext_coef: Molar extinction coefficient (scalar or pandas Series).
        absorbance: Measured absorbance (scalar or pandas Series).

    Returns:
        absorbance / ext_coef, with the same scalar/Series shape as the inputs.

    Raises:
        ZeroDivisionError: for plain Python numbers when ``ext_coef`` is 0.
    """
    # The previous implementation returned ext_coef / absorbance, the inverse
    # of the concentration.
    return absorbance / ext_coef

def calc_mg_per_ml(molar_conc, mass):
    """Convert a molar concentration into a mass concentration.

    Args:
        molar_conc: Concentration (presumably mol/L -- confirm with callers).
        mass: Molecular weight (presumably g/mol -- confirm with callers).

    Returns:
        The product ``molar_conc * mass``; with the units assumed above that is
        g/L, which is numerically equal to mg/mL.
    """
    mass_concentration = molar_conc * mass
    return mass_concentration

In [3]:
# Rebuild the pickled design table from the source CSVs / pipeline tables,
# then load it as the working frame `df` used by every cell below.
generate_deltaprot_designs_data()
df = load_deltaprot_designs_data()


  df["model_sequence_w_prefix"] = "MGSSHHHHHHSSGENLYFQSGS" + df["model_sequence"]
  df["mass_w_prefix"] = df["model_sequence_w_prefix"].apply(ampal.analyse_protein.sequence_molecular_weight)
  df["sequence_molar_extinction_280_w_prefix"] = df["model_sequence_w_prefix"].apply(ampal.analyse_protein.sequence_molar_extinction_280)
  df["percent_helicity_with_prefix"] = df["dssp_assignment"].str.count("H") / df["model_sequence_w_prefix"].str.len()


In [None]:

# received_from_idt: everything arrived except C2, C4, D5, D6, F2, F3 and F6.
not_received = ['C2', 'C4', 'D5', 'D6', 'F2', 'F3', 'F6']
df['received_from_idt'] = ~df["Well Position"].isin(not_received)

# transformation_attempted: all of rows A and B (columns 1-12) plus C1, C3, F4, C5 and C6.
transformation_attempted_ids = {f"{row}{column}" for row in "AB" for column in range(1, 13)}
transformation_attempted_ids |= {'C1', 'C3', 'F4', 'C5', 'C6'}
df['transformation_attempted'] = df["Well Position"].isin(transformation_attempted_ids)

# transformation_successful: all transformations worked (C6 failed initially),
# so the successful set is the attempted set.
df['transformation_successful'] = df["Well Position"].isin(transformation_attempted_ids)

# expression_levels: one of 'none', 'low', 'medium', 'high' or 'super_high' per well.
# Wells that appear in no list below are absent from expr_map and therefore come
# out of .map() as NaN; the string 'none' is itself one of the mapped levels.
# TODO , 'C6' was transformed later, but not yet tested
wells_by_expression_level = {
    'none': ['A2', 'A4', 'B5', 'B6', 'B7', 'B9', 'B11', 'C5'],
    'low': ['A1', 'A3', 'A6', 'A8', 'B1', 'B4', 'B10', 'C3'],
    'medium': ['A7', 'A10', 'B12', 'C1', 'F4'],
    'high': ['A11', 'B2', 'B3', 'A5'],
    'super_high': ['A9', 'A12', 'B8'],
}
# Flatten level -> wells into the well -> level lookup that .map() needs.
expr_map = {
    well: level
    for level, wells in wells_by_expression_level.items()
    for well in wells
}
df['expression_levels'] = df["Well Position"].map(expr_map)

# populate sds_page_size_appearance for every visible band?
# TODO

# populate large_scale_expressed: True for the nine wells listed in scaled_expressed_ids
# (A12, A9, B8, A1, B12, F4, A11, B3, B10), False for every other well
scaled_expressed_ids = ['A12','A9','B8','A1','B12','F4',"A11","B3","B10"]
df['large_scale_expressed'] = df["Well Position"].isin(scaled_expressed_ids)

# TODO: populate scaled_purified -- so far A12, A9, B8; still to add 'A1', 'B12', 'F4'.
#       (planned list: scaled_purified_ids = ['A12','A9','B8'])
# Note: A9 and B8 had some aggregation (small pellet after spinning down). A12 did not.

# A280 readings after Ni-NTA IMAC. A1, B12 and F4 were not measured at this
# stage, so they are absent here and end up as NaN in the derived columns.
A280_after_NI_NTA_IMAC = dict(
    A12=13.41,
    A9=6.2,
    B8=16.11,
    A11=6.565,
    B3=9.067,
    B10=5.780,
)
df['A280_after_NI_NTA_IMAC'] = df["Well Position"].map(A280_after_NI_NTA_IMAC)

# One shared sample volume for every well at this stage (presumably mL -- confirm).
volume_after_NI_NTA_IMAC = 3.2

# Molar concentration assuming the sample is entirely the protein of interest:
# A280 divided by the extinction coefficient of the prefixed sequence.
df['molar_conc_after_NI_NTA_IMAC'] = (
    df['A280_after_NI_NTA_IMAC'] / df['sequence_molar_extinction_280_w_prefix']
)
# Mass concentration = molecular weight x molar concentration.
df['mg_per_ml_after_NI_NTA_IMAC'] = df['mass_w_prefix'] * df['molar_conc_after_NI_NTA_IMAC']
# Total amount = sample volume x mass concentration.
df['mg_after_NI_NTA_IMAC'] = volume_after_NI_NTA_IMAC * df['mg_per_ml_after_NI_NTA_IMAC']

# After SEC (central fractions): A280 reading and pooled volume per well.
A280_after_SEC = dict(
    A12=4.93,
    A9=2.18,
    B8=6.758,
    A1=0.820,
    B12=2.510,
    F4=2.427,
    A11=2.478,
    B3=2.939,
    B10=2.556,
)
# Per-well volume (presumably mL -- confirm); unlike the IMAC step it differs between wells.
volume_after_sec = dict(
    A12=5.1,
    A9=5.1,
    B8=3.4,
    A1=3.4,
    B12=5.1,
    F4=5.1,
    A11=5.1,
    B3=3.4,
    B10=3.4,
)
df["volume_after_sec"] = df["Well Position"].map(volume_after_sec)
df['A280_after_SEC'] = df["Well Position"].map(A280_after_SEC)

# Same conversion chain as for the IMAC step: A280 -> molar -> mg/mL -> total mg.
df['molar_conc_after_SEC'] = (
    df['A280_after_SEC'] / df['sequence_molar_extinction_280_w_prefix']
)
df['mg_per_ml_after_SEC'] = df['mass_w_prefix'] * df['molar_conc_after_SEC']
df['mg_after_SEC'] = df['volume_after_sec'] * df['mg_per_ml_after_SEC']


# Biophysical characterisation: CD and the biophysical SEC run used the same
# sample. It was assumed to be 20 uM; the measured A280 shows it was a bit less.
cd_sample_A280 = dict(
    A12=0.395,  # later measure: 0.406
    A9=0.168,   # later measure: 0.190
    B8=0.517,   # later measure: 0.537
    A1=0.173,
    B12=0.210,
    F4=0.211,
    A11=0.569,
    B3=0.764,
    B10=0.175,
)
df["cd_sample_A280"] = df["Well Position"].map(cd_sample_A280)
# Actual molar concentration of the CD sample, from its own A280 reading.
df["cd_sample_molar_conc"] = (
    df["cd_sample_A280"] / df["sequence_molar_extinction_280_w_prefix"]
)
# The same path length value (in mm, per the column name) is recorded for every row.
df["cd_path_length_mm"] = 1

# Wells whose samples were submitted for SAXS.
saxs_submitted_samples = ["A1", "A9", "A12", "B8", "B12", "F4"]
df["saxs_submitted"] = df["Well Position"].isin(saxs_submitted_samples)

# crystal screens set up with 3+3 uL
# One record per screened well: plate number, position on that plate, set-up
# date and the A280 of the sample that went into the screen.
crystal_screens_info = {
    "A9": {
        "plate": 1,
        "position": 1,
        "date": "2025-04-11",
        "A280": 19.40
    },
    "B12": {
        "plate": 1,
        "position": 2,
        "date": "2025-04-11",
        "A280": 19.19
    },
    "A12": {
        "plate": 2,
        "position": 1,
        "date": "2025-04-14",
        "A280": 36.56
    },
    "B8": {
        "plate": 2,
        "position": 2,
        "date": "2025-04-14",
        "A280": 43.35
    },
    "A1": {
        "plate": 3,
        "position": 1,
        "date": "2025-04-17",
        "A280": 13.82
    },
    "B3": {
        "plate": 3,
        "position": 2,
        "date": "2025-04-17",
        "A280": 37.62
    }
}

# Look up each well's record once and keep it in a local Series. Writing the
# dict-valued lookup into df as a scratch column and dropping it in place
# afterwards is unnecessary, and that assignment is the line the recorded
# warning for this cell points at.
crystal_info_by_well = df["Well Position"].map(crystal_screens_info)

# Unpack every record field into its own crystal_<field> column; wells without
# a record (NaN in the lookup, not a dict) get None.
crystal_keys = ["plate", "position", "date", "A280"]
for key in crystal_keys:
    df[f"crystal_{key}"] = crystal_info_by_well.map(
        lambda info: info.get(key) if isinstance(info, dict) else None
    )

# Same A280 -> molar -> mg/mL conversion used for the IMAC and SEC samples.
df["crystal_molar_conc"] = df["crystal_A280"] / df["sequence_molar_extinction_280_w_prefix"]
df["crystal_mg_per_ml"] = df["crystal_molar_conc"] * df["mass_w_prefix"]
    
                 
# Names of the columns added on top of the design data; the export cell appends
# this list to useful_cols / sharing_cols when writing the result CSVs.
# NOTE(review): "percent_helicity_with_prefix" is computed by
# generate_deltaprot_designs_data but is not listed here -- confirm whether it
# should be exported as well.
experimental_cols = [
    # properties of the construct including the sequence prefix
    "model_sequence_w_prefix",
    "mass_w_prefix",
    "sequence_molar_extinction_280_w_prefix",
    # delivery, transformation and expression status
    "received_from_idt",
    "transformation_attempted",
    "transformation_successful",
    "expression_levels",
    "large_scale_expressed",
    # after Ni-NTA IMAC
    "A280_after_NI_NTA_IMAC",
    "molar_conc_after_NI_NTA_IMAC",
    "mg_per_ml_after_NI_NTA_IMAC",
    "mg_after_NI_NTA_IMAC",
    # after SEC
    "volume_after_sec",
    "A280_after_SEC",
    "molar_conc_after_SEC",
    "mg_per_ml_after_SEC",
    "mg_after_SEC",
    # CD sample and SAXS submission
    "cd_sample_A280",
    "cd_sample_molar_conc",
    "cd_path_length_mm",
    "saxs_submitted",
    # crystal screens
    "crystal_plate", "crystal_position", "crystal_date", "crystal_A280","crystal_molar_conc","crystal_mg_per_ml"
    # "scaled_purified" is mentioned but not actually created
]


  df["crystal_screens_info"] = df["Well Position"].map(crystal_screens_info)


In [7]:
# Write two CSV views of the annotated table (each base column list followed by
# the experimental columns, no index column), then pickle the complete frame.
for base_cols, csv_path in (
    (useful_cols, "/home/tadas/code/deltaproteinsBristol/experimental_results/deltaprot_designs_data_with_results.csv"),
    (sharing_cols, "/home/tadas/code/deltaproteinsBristol/experimental_results/deltaprot_designs_data_with_results_minimised.csv"),
):
    df[base_cols + experimental_cols].to_csv(csv_path, index=False)

df.to_pickle("/home/tadas/code/deltaproteinsBristol/deltaprot_designs_all_data_with_results.pkl")

In [10]:
# Crystal plate of each large-scale-expressed well (NaN = no crystal-screen record).
df.loc[df["large_scale_expressed"], ["Well Position", "crystal_plate"]]

Unnamed: 0,Well Position,crystal_plate
0,A1,3.0
8,A9,1.0
10,A11,
11,A12,2.0
14,B3,3.0
19,B8,2.0
21,B10,
23,B12,1.0
57,F4,


In [None]:
# Post-SEC yield and CD-sample concentration for the large-scale-expressed wells.
df.loc[
    df['large_scale_expressed'],
    [
        "Well Position",
        "Name",
        "mass_w_prefix",
        "expression_levels",
        "mg_per_ml_after_SEC",
        "mg_after_SEC",
        "molar_conc_after_SEC",
        "cd_sample_molar_conc",
    ],
]

In [3]:
# Preview only the first rows: the display options set in the first cell remove
# the row and column caps, so a bare `df` would render the entire table.
# This cell needs `df` to exist; the recorded NameError came from running it
# before the cell that builds and loads `df`.
df.head()

NameError: name 'df' is not defined

In [None]:
# set limit to column width: caps the number of characters shown per cell when a frame is rendered
# NOTE(review): a cap of 1 truncates almost every text value -- confirm this is intended.
pd.set_option('display.max_colwidth', 1)

In [None]:
# CD sample concentration next to the small-scale expression level, for every well.
df[["Well Position","cd_sample_molar_conc","Name","expression_levels"]]

In [None]:
# Inputs (A280, volume, extinction coefficient) and outputs of the post-SEC yield calculation, for every well.
df[["Well Position","cd_sample_molar_conc","Name","A280_after_SEC","volume_after_sec","sequence_molar_extinction_280_w_prefix","molar_conc_after_SEC","mg_per_ml_after_SEC","mg_after_SEC"]]

In [None]:
# Mass with and without the prefix, charge, and the IMAC / SEC concentrations side by side, for every well.
df[["Well Position","Name","mass","mass_w_prefix","charge","A280_after_SEC","volume_after_sec","sequence_molar_extinction_280_w_prefix","molar_conc_after_NI_NTA_IMAC","molar_conc_after_SEC","mg_per_ml_after_SEC","mg_after_SEC"]]

In [None]:
# mass correct: A9, A11, B2, C1, F4, B12
# mass questionable: A12 (has 2 bands), B3 (2 bands)
# mass wrong: 

In [None]:
# Remove the limit on how many columns pandas displays
# (the first cell of the notebook already sets this option to None).
pd.set_option('display.max_columns', None)

In [15]:
# Successfully transformed wells that showed expression but were not yet
# expressed at large scale.
# NOTE(review): np.nan is in the isin() list, presumably to also keep wells
# whose expression level is still missing -- verify it matches NaN as intended.
df.loc[
    (
        df["transformation_successful"]
        & df["expression_levels"].isin(["low","medium","high","super_high", np.nan])
        & ~df["large_scale_expressed"]
    ),
    ["Well Position", "Name", "expression_levels"],
]

Unnamed: 0,Well Position,Name,expression_levels
2,A3,no_disulfide_b4iiiix,low
4,A5,no_disulfide_b4iiin,high
5,A6,no_disulfide_b4inin,low
6,A7,no_disulfide_b4innn,medium
7,A8,no_disulfide_b4nnnnx,low
9,A10,no_disulfide_b5iiiin,medium
12,B1,no_disulfide_b5innnn,low
13,B2,no_disulfide_b6iiniin,high
15,B4,no_disulfide_b6inninn,low
24,C1,no_disulfide_l5inni,medium


In [12]:
# Expressing wells, large-scale-expressed ones first, then ordered by the expression level string (alphabetical, not by strength).
df[df["expression_levels"].isin(["low","medium","high","super_high"])].sort_values(["large_scale_expressed","expression_levels"],ascending=[False,True])[["Well Position","Name","mass_w_prefix","expression_levels","large_scale_expressed"]]

Unnamed: 0,Well Position,Name,mass_w_prefix,expression_levels,large_scale_expressed
10,A11,no_disulfide_b5iinin,14240.78108,high,True
14,B3,no_disulfide_b6ininin,15691.18198,high,True
0,A1,no_disulfide_b3iii,9661.41738,low,True
21,B10,no_disulfide_l4iin,10960.05638,low,True
23,B12,no_disulfide_l5iiin,12669.91628,medium,True
57,F4,variable_linkers_l6innni,11020.77008,medium,True
8,A9,no_disulfide_b4nnnny,11094.27778,super_high,True
11,A12,no_disulfide_b5ininn,14092.83838,super_high,True
19,B8,no_disulfide_h6i_i_i,16168.21468,super_high,True
4,A5,no_disulfide_b4iiin,9348.14028,high,False


In [23]:
# Wells with detectable expression that have not been expressed at large scale.
df.loc[
    (
        df["expression_levels"].isin(["low","medium","high","super_high"])
        & ~df["large_scale_expressed"]
    ),
    ["Well Position", "expression_levels"],
]

Unnamed: 0,Well Position,expression_levels
2,A3,low
4,A5,high
5,A6,low
6,A7,medium
7,A8,low
9,A10,medium
12,B1,low
13,B2,high
15,B4,low
24,C1,medium


In [17]:
# Every column for the wells with detectable expression (a very wide output: no column subset is applied).
df[df["expression_levels"].isin(["low","medium","high","super_high"])]

Unnamed: 0,Well Position,Name,Sequence,orientation_code,atp_cost_per_aa,dna_complexity_per_aa,pll,pll_per_aa,isoelectric_point,charge,sequence_charge,mass,sequence_length,mean_plddt,mean_pae,ptm,tm_rmsd,tm_score_assembly,tm_score_design,tm_rmsd100,dp_finder_total_cost_norm,predicted_usability,combined_score,path_score_version,residues_per_helix,deltahedron_edge_length,diffuse_termini,avoid_amino_acids,increase_amino_acid_likelihood,energy_minimization,algorithms_sequence_prediction,algorithms_structure_prediction,rf_file_num,rib_num,aa_count_per_gap,model_sequence,sequence_molar_extinction_280,sequence_molecular_weight,backbone_loop_mask_string,aligned_length,seq_id,sequence_name,dssp_assignment,aggrescan3d_avg_value,hydrophobic_fitness,packing_density,rosetta_total_per_aa,name,structure_prediction_file_name,structure_prediction_file_path,deltaprot_score,loop_lengths,designs_per_orientation,rf_diffusion_mask_input_seq_bool,directories_assembly_inputs,directories_rf_diffusion_outputs,directories_seq_pred_inputs,directories_seq_pred_outputs,directories_structure_prediction,directories_evaluation,composition_ALA,composition_CYS,composition_ASP,composition_GLU,composition_PHE,composition_GLY,composition_HIS,composition_ILE,composition_LYS,composition_LEU,composition_MET,composition_ASN,composition_PRO,composition_GLN,composition_ARG,composition_SER,composition_THR,composition_VAL,composition_TRP,composition_TYR,atp_cost,dna_complexity,aa_count_per_gap_list,index_helix1_n,index_helix1_c,index_helix2_n,index_helix2_c,index_helix3_n,index_helix3_c,index_helix4_n,index_helix4_c,index_helix5_n,index_helix5_c,index_helix6_n,index_helix6_c,linker1_length,linker2_length,linker3_length,linker4_length,linker5_length,deltahedron_name,taylor_letter_packing_descriptors,chothia_omega_angles,overall_distance_score_v2,overall_path_distance_score_v2,overall_linker_length_score,overall_contact_order_score,overall_linker_convenience_score,overall_linker_convenience_v2_score,path_score_v2,
path_score_v3,angle_helix1,hydrophobic_count_helix1,residue_count_helix1,angle_helix2,hydrophobic_count_helix2,residue_count_helix2,angle_helix3,hydrophobic_count_helix3,residue_count_helix3,angle_helix4,hydrophobic_count_helix4,residue_count_helix4,angle_helix5,hydrophobic_count_helix5,residue_count_helix5,angle_helix6,hydrophobic_count_helix6,residue_count_helix6,angle_resolution,path,design_name,file_name,full_sequence,composition_UNK,ss_prop_alpha_helix,ss_prop_beta_bridge,ss_prop_beta_strand,ss_prop_3_10_helix,ss_prop_pi_helix,ss_prop_hbonded_turn,ss_prop_bend,ss_prop_loop,num_residues,budeff_total,budeff_steric,budeff_desolvation,budeff_charge,evoef2_total,evoef2_ref_total,evoef2_intraR_total,evoef2_interS_total,evoef2_interD_total,dfire2_total,rosetta_total,rosetta_fa_atr,rosetta_fa_rep,rosetta_fa_intra_rep,rosetta_fa_elec,rosetta_fa_sol,rosetta_lk_ball_wtd,rosetta_fa_intra_sol_xover4,rosetta_hbond_lr_bb,rosetta_hbond_sr_bb,rosetta_hbond_bb_sc,rosetta_hbond_sc,rosetta_dslf_fa13,rosetta_rama_prepro,rosetta_p_aa_pp,rosetta_fa_dun,rosetta_omega,rosetta_pro_close,rosetta_yhh_planarity,aggrescan3d_total_value,aggrescan3d_min_value,aggrescan3d_max_value,hydrophobic_fitness_per_aa,budeff_total_per_aa,budeff_steric_per_aa,budeff_desolvation_per_aa,budeff_charge_per_aa,evoef2_total_per_aa,evoef2_ref_total_per_aa,evoef2_intraR_total_per_aa,evoef2_interS_total_per_aa,evoef2_interD_total_per_aa,dfire2_total_per_aa,rosetta_fa_atr_per_aa,rosetta_fa_rep_per_aa,rosetta_fa_intra_rep_per_aa,rosetta_fa_elec_per_aa,rosetta_fa_sol_per_aa,rosetta_lk_ball_wtd_per_aa,rosetta_fa_intra_sol_xover4_per_aa,rosetta_hbond_lr_bb_per_aa,rosetta_hbond_sr_bb_per_aa,rosetta_hbond_bb_sc_per_aa,rosetta_hbond_sc_per_aa,rosetta_dslf_fa13_per_aa,rosetta_rama_prepro_per_aa,rosetta_p_aa_pp_per_aa,rosetta_fa_dun_per_aa,rosetta_omega_per_aa,rosetta_pro_close_per_aa,rosetta_yhh_planarity_per_aa,dp_finder_filename,dp_finder_helix_axes,dp_finder_orientation_code,dp_finder_rotation_matrix,dp_finder_scale,dp
_finder_translation_matrix,dp_finder_sliding_rmsd,dp_finder_rmsd,dp_finder_best_angle_error,dp_finder_assignment_indices,dp_finder_transformed_orientation_data,dp_finder_total_unassigned_axes,dp_finder_total_cost,dp_finder_correct_deltaprot,sid,round,settings_deltaprot_score,settings_loop_lengths,settings_designs_per_orientation,settings_rf_diffusion_mask_input_seq_bool,settings_energy_minimization,directories_rf_diffusion_inference_py,aa,model_sequence_w_prefix,mass_w_prefix,sequence_molar_extinction_280_w_prefix,percent_helicity_with_prefix,received_from_idt,transformation_attempted,transformation_successful,expression_levels,large_scale_expressed,A280_after_NI_NTA_IMAC,molar_conc_after_NI_NTA_IMAC,mg_per_ml_after_NI_NTA_IMAC,mg_after_NI_NTA_IMAC,volume_after_sec,A280_after_SEC,molar_conc_after_SEC,mg_per_ml_after_SEC,mg_after_SEC,cd_sample_A280,cd_sample_molar_conc,cd_path_length_mm,saxs_submitted,crystal_plate,crystal_position,crystal_date,crystal_A280
0,A1,no_disulfide_b3iii,ATGGGCAGCAGCCATCATCATCATCATCACAGCAGCGGCGAGAACT...,b3iii,23.098276,3.586207,-98.798406,-1.703421,4.5,-7.195539,-7.195539,7218.91718,58,85.567931,4.15338,0.6,1.05,0.53697,0.36119,1.443028,0.911146,0.566661,0.679661,3.0,8.0,12.0,True,X,WY,oxygenMathFix,solublempnn,alphafold2,2,3,13.0,KKEEIRRYLREVRRRLEAGEPLSEEQLRAIEEAREWLEENREEYPE...,9530,7218.91718,----GGGGGGGG-------------GGGGGGGG-------------...,24.0,0.0,b3iii_gap_13_2,-HHHHHHHHHHHHHHHHHT----HHHHHHHHHHHHHHHHTTTT-HH...,-2.8968,-24.301692,49.807087,2.483311,no_disulfide_b3iii,b3iii_gap_13_2_unrelaxed_rank_001_alphafold2_p...,/home/tadas/code/single_chain_deltaprots/outpu...,best,"[8, 9, 10, 11, 12, 13]",120.0,True,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,0.069,0.0,0.0,0.3276,0.0,0.0172,0.0,0.0517,0.0517,0.1207,0.0,0.0172,0.0345,0.0172,0.1552,0.0345,0.0,0.0345,0.0172,0.0517,1339.7,208.0,"[13, 13]",0.0,1.0,2.0,3.0,4.0,5.0,,,,,,,1.0,1.0,,,,octahedron,"(a, c, b)","(60.0, 60.0, 60.0)",1.0,1.0,1.0,1.33,1.25,0.93,3.5,1.24,330.0,2.0,10.0,330.0,2.0,10.0,330.0,2.0,10.0,,,,,,,,,,1.0,"[(0, 1), (2, 3), (4, 
5)]",b3iii_gap_13_2_unrelaxed_rank_001_alphafold2_p...,b3iii_gap_13_2_unrelaxed_rank_001_alphafold2_p...,KKEEIRRYLREVRRRLEAGEPLSEEQLRAIEEAREWLEENREEYPE...,0,0.775862,0.0,0.0,0.0,0.0,0.103448,0.0,0.12069,58,-903.028963,31.302666,-530.358748,-403.972881,-243.86,-26.21,123.44,-341.11,0.0,-101.0,144.032052,-320.679579,237.089433,0.555761,-71.584878,219.743918,-5.908246,11.5507,-0.731174,-35.094499,-1.671817,0.0,0.0,-15.403506,-10.25387,158.090638,3.742577,2.074623,0.0,-168.0172,-5.4391,0.7694,-0.418995,-15.569465,0.539701,-9.144116,-6.96505,-4.204483,-0.451897,2.128276,-5.881207,0.0,-1.741379,-5.528958,4.087749,0.009582,-1.234222,3.788688,-0.101866,0.19915,-0.012606,-0.605078,-0.028824,0.0,0.0,-0.265578,-0.176791,2.725701,0.064527,0.035769,0.0,b3iii_gap_13_2_unrelaxed_rank_001_alphafold2_p...,"[{'center': [-4.73020619410339, -3.27492316765...",b3iii,"[[-0.29569374811807303, 0.9454984075066322, 0....",11.966493,"[-80.37972200393837, 56.38709838407229, 112.14...",0.751556,1.664792,0.034245,"[(0, 0), (1, 1), (2, 2)]","[{'center': [-3.72171751744564, -3.78559186116...",0.0,1.572829,True,b3iii_gap_13_2,,,,,,,,,MGSSHHHHHHSSGENLYFQSGSKKEEIRRYLREVRRRLEAGEPLSE...,9661.41738,10810,0.5625,True,True,True,low,True,,,,,3.4,0.82,7.6e-05,0.732873,2.49177,0.173,1.6e-05,1,True,3.0,1.0,2025-04-17,13.82
2,A3,no_disulfide_b4iiiix,ATGGGCAGCAGCCATCATCATCATCATCACAGCAGCGGCGAGAACT...,b4iiiix,22.808861,3.987342,-168.607116,-2.134267,4.4,-8.306272,-8.306272,9399.48898,79,85.295316,4.178289,0.71,1.02,0.7512,0.37117,1.156281,0.935027,0.591358,0.663041,3.0,8.0,12.0,True,X,WY,oxygenMathFix,solublempnn,alphafold2,0,4,13.0,GEWVERYRELLEYAVEYLGEPRYEELRETCIRLGGIDPSLSEEELR...,10810,9399.48898,----GGGGGGGG-------------GGGGGGGG-------------...,32.0,0.0,b4iiiix_gap_13_0,-HHHHHHHHHHHHHHHTTTSGGGHHHHHHHHHHHT--TTS-HHHHH...,-1.9354,-27.670283,53.068079,5.941159,no_disulfide_b4iiiix,b4iiiix_gap_13_0_unrelaxed_rank_001_alphafold2...,/home/tadas/code/single_chain_deltaprots/outpu...,best,"[8, 9, 10, 11, 12, 13]",120.0,True,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,0.0633,0.0127,0.0127,0.2532,0.0,0.0633,0.0,0.0506,0.0,0.1646,0.0,0.0,0.0506,0.0,0.1646,0.038,0.0127,0.0506,0.0127,0.0506,1801.9,315.0,"[13, 13, 13]",0.0,5.0,2.0,7.0,6.0,4.0,3.0,1.0,,,,,1.0,1.0,1.0,,,snub_disphenoid,"(x, b, d, c, a, x)","(71.9, 11.7, 70.7, 70.7, 11.7, 71.9)",0.91,0.82,1.0,1.51,1.05,0.9,5.18,1.24,272.0,2.0,10.0,130.0,2.0,10.0,272.0,2.0,10.0,130.0,2.0,10.0,,,,,,,1.0,"[(0, 5), (2, 7), (6, 4), (3, 
1)]",b4iiiix_gap_13_0_unrelaxed_rank_001_alphafold2...,b4iiiix_gap_13_0_unrelaxed_rank_001_alphafold2...,GEWVERYRELLEYAVEYLGEPRYEELRETCIRLGGIDPSLSEEELR...,0,0.746835,0.0,0.0,0.037975,0.0,0.101266,0.037975,0.075949,79,-1256.102862,124.431915,-746.900178,-633.634598,-204.31,-22.15,214.48,-396.63,0.0,-145.8,469.351525,-461.966297,605.09985,0.815734,-104.189637,299.174043,-8.740889,13.1176,-0.83311,-43.940726,-3.33998,-0.829704,0.0,2.306326,-13.223682,171.976802,7.859605,10.379979,0.0,-152.8993,-4.7415,0.0,-0.350257,-15.900036,1.575088,-9.454433,-8.020691,-2.586203,-0.28038,2.714937,-5.020633,0.0,-1.84557,-5.847675,7.659492,0.010326,-1.318856,3.787013,-0.110644,0.166046,-0.010546,-0.556212,-0.042278,-0.010503,0.0,0.029194,-0.167388,2.176922,0.099489,0.131392,0.0,b4iiiix_gap_13_0_unrelaxed_rank_001_alphafold2...,"[{'center': [-4.435322309410603, 5.10876543301...",b4iiiix,"[[-0.4716642771938947, 0.4338930791905715, -0....",12.777187,"[-94.57420283481724, -116.96125451399031, -42....",0.635425,1.714278,0.047829,"[(1, 0), (3, 1), (2, 2), (0, 4)]","[{'center': [1.4035227519612192, -1.0145312885...",0.0,1.23329,True,b4iiiix_gap_13_0,,,,,,,,,MGSSHHHHHHSSGENLYFQSGSGEWVERYRELLEYAVEYLGEPRYE...,11841.98918,12090,0.584158,True,True,True,low,False,,,,,,,,,,,,1,False,,,,
4,A5,no_disulfide_b4iiin,ATGGGCAGCAGCCATCATCATCATCATCACAGCAGCGGCGAGAACT...,b4iiin,22.315873,3.777778,-116.430898,-1.848109,3.9,-9.196622,-9.196622,6905.64008,63,89.29873,3.126344,0.7,0.97,0.71746,0.45252,1.261407,0.954729,0.695207,0.690276,3.0,8.0,12.0,True,X,WY,oxygenMathFix,solublempnn,alphafold2,0,4,9.0,SRYAEALELIRAKLPDTPEGRELLAALEAGTFDPEWAIAWLREAGF...,13940,6905.64008,--GGGGGGGG---------GGGGGGGG---------GGGGGGGG--...,32.0,0.062,b4iiin_gap_9_0,-HHHHHHHHHHHHS-SSHHHHHHHHHHHHT---HHHHHHHHHHTT-...,-1.5753,-29.741803,51.508197,0.972441,no_disulfide_b4iiin,b4iiin_gap_9_0_unrelaxed_rank_001_alphafold2_p...,/home/tadas/code/single_chain_deltaprots/outpu...,best,"[8, 9, 10, 11, 12, 13]",120.0,True,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,0.1905,0.0,0.0317,0.1905,0.0317,0.0794,0.0,0.0317,0.0159,0.1587,0.0,0.0,0.0476,0.0,0.0635,0.0317,0.0317,0.0317,0.0317,0.0317,1405.9,238.0,"[9, 9, 9]",0.0,4.0,7.0,3.0,2.0,6.0,5.0,1.0,,,,,1.0,1.0,1.0,,,snub_disphenoid,"(b, x, a, a, x, A)","(11.7, 48.3, 49.9, 49.9, 48.3, -11.7)",0.93,1.0,1.0,1.42,1.43,0.99,6.62,1.31,278.0,2.0,10.0,278.0,2.0,10.0,55.0,2.0,10.0,55.0,2.0,10.0,,,,,,,1.0,"[(0, 4), (7, 3), (2, 6), (5, 
1)]",b4iiin_gap_9_0_unrelaxed_rank_001_alphafold2_p...,b4iiin_gap_9_0_unrelaxed_rank_001_alphafold2_p...,SRYAEALELIRAKLPDTPEGRELLAALEAGTFDPEWAIAWLREAGF...,0,0.777778,0.0,0.0,0.0,0.0,0.047619,0.047619,0.126984,63,-941.568458,43.041104,-540.735219,-443.874343,-281.04,-13.97,105.72,-372.83,0.0,-108.6,61.263788,-336.75168,198.124608,0.546103,-79.525068,205.72256,-6.996983,10.092563,-1.694295,-36.836244,-5.618005,-0.272046,0.0,-12.245417,-12.98973,114.680441,4.917127,6.877201,0.0,-99.2436,-3.7793,0.0,-0.472092,-14.945531,0.683192,-8.583099,-7.045624,-4.460952,-0.221746,1.678095,-5.917937,0.0,-1.72381,-5.345265,3.144835,0.008668,-1.262303,3.265437,-0.111063,0.160199,-0.026894,-0.584702,-0.089175,-0.004318,0.0,-0.194372,-0.206186,1.820324,0.07805,0.109162,0.0,b4iiin_gap_9_0_unrelaxed_rank_001_alphafold2_p...,"[{'center': [4.274912573334547, -9.26731120402...",b4iiin,"[[-0.1294624800692348, 0.9318380223655469, -0....",11.828015,"[80.36439215052413, -14.580542101860303, -119....",0.82805,1.641102,0.010009,"[(0, 0), (3, 1), (2, 2), (1, 3)]","[{'center': [2.7530892302877277, -9.8764609675...",0.0,0.953168,True,b4iiin_gap_9_0,,,,,,,,,MGSSHHHHHHSSGENLYFQSGSSRYAEALELIRAKLPDTPEGRELL...,9348.14028,15220,0.576471,True,True,True,high,False,,,,,,,,,,,,1,False,,,,
5,A6,no_disulfide_b4inin,ATGGGCAGCAGCCATCATCATCATCATCACAGCAGCGGCGAGAACT...,b4inin,23.674684,3.063291,-127.335028,-1.611836,4.0,-20.303951,-20.303951,9720.64698,79,91.401139,3.190729,0.75,0.59,0.85643,0.39168,0.668829,0.96254,0.787491,0.708648,3.0,8.0,12.0,True,X,WY,oxygenMathFix,solublempnn,alphafold2,6,4,13.0,SLEELIEKIEKFNNLENPTEEELEELIELLKEWCEELGVEEEKKEE...,15220,9720.64698,----GGGGGGGG-------------GGGGGGGG-------------...,32.0,0.0,b4inin_gap_13_6,-HHHHHHHHHHHHTSSS--HHHHHHHHHHHHHHHHHHT--HHHHHH...,-2.4303,-41.131171,54.471449,3.939049,no_disulfide_b4inin,b4inin_gap_13_6_unrelaxed_rank_001_alphafold2_...,/home/tadas/code/single_chain_deltaprots/outpu...,best,"[8, 9, 10, 11, 12, 13]",120.0,True,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,0.0127,0.0127,0.0,0.3797,0.0127,0.0127,0.0,0.0506,0.1139,0.1772,0.0,0.0633,0.0127,0.0,0.0127,0.0253,0.0253,0.0253,0.0253,0.038,1870.3,242.0,"[13, 13, 13]",4.0,0.0,3.0,7.0,2.0,1.0,5.0,6.0,,,,,1.0,1.0,1.0,,,snub_disphenoid,"(a, x, A, A, x, a)","(11.7, 16.6, -11.7, -11.7, 16.6, 11.7)",0.96,1.0,1.0,1.51,1.49,1.0,7.03,1.45,119.0,2.0,10.0,119.0,2.0,10.0,119.0,2.0,10.0,119.0,2.0,10.0,,,,,,,1.0,"[(4, 0), (3, 7), (2, 1), (5, 
6)]",b4inin_gap_13_6_unrelaxed_rank_001_alphafold2_...,b4inin_gap_13_6_unrelaxed_rank_001_alphafold2_...,SLEELIEKIEKFNNLENPTEEELEELIELLKEWCEELGVEEEKKEE...,0,0.810127,0.0,0.0,0.0,0.0,0.050633,0.050633,0.088608,79,-1358.905765,74.764154,-809.524236,-624.145683,-354.64,-26.05,149.05,-477.63,0.0,-158.9,311.184906,-484.692898,500.572156,0.816175,-105.978859,334.477131,-7.280146,15.527712,-1.241451,-57.810557,-3.395402,-1.898945,0.0,-13.955278,-13.392943,187.262691,4.246024,2.186235,0.0,-191.9902,-4.7561,0.0,-0.520648,-17.201339,0.946382,-10.247142,-7.900578,-4.489114,-0.329747,1.886709,-6.045949,0.0,-2.011392,-6.135353,6.336356,0.010331,-1.341505,4.233888,-0.092154,0.196553,-0.015715,-0.731779,-0.04298,-0.024037,0.0,-0.176649,-0.169531,2.370414,0.053747,0.027674,0.0,b4inin_gap_13_6_unrelaxed_rank_001_alphafold2_...,"[{'center': [-1.0928267079027385, -4.037293867...",b4inin,"[[-0.6557510888188983, -0.7404070723702155, -0...",11.361241,"[3.7338436494787244, -34.64067691880748, 71.35...",0.790176,2.338301,0.004156,"[(0, 0), (2, 1), (1, 2), (3, 3)]","[{'center': [0.258659014867042, -4.05055302999...",0.0,0.842124,True,b4inin_gap_13_6,,,,,,,,,MGSSHHHHHHSSGENLYFQSGSSLEELIEKIEKFNNLENPTEEELE...,12163.14718,16500,0.633663,True,True,True,low,False,,,,,,,,,,,,1,False,,,,
6,A7,no_disulfide_b4innn,ATGGGCAGCAGCCATCATCATCATCATCACAGCAGCGGCGAGAACT...,b4innn,20.311392,3.962025,-143.267369,-1.813511,4.1,-8.256534,-8.256534,8302.30618,79,91.910886,2.788188,0.79,1.34,0.62928,0.35019,1.519035,0.914906,0.675381,0.705306,3.0,8.0,12.0,True,X,WY,oxygenMathFix,solublempnn,alphafold2,8,4,13.0,PLDPEAVRAWLRRALAELQAEGLATPALVAAVEAHADEIAGADAEG...,11380,8302.30618,----GGGGGGGG-------------GGGGGGGG-------------...,32.0,0.0,b4innn_gap_13_8,---HHHHHHHHHHHHHHHHHTT---HHHHHHHHHTHHHHHHS-HHH...,-1.4508,-39.574988,52.35274,1.08603,no_disulfide_b4innn,b4innn_gap_13_8_unrelaxed_rank_001_alphafold2_...,/home/tadas/code/single_chain_deltaprots/outpu...,best,"[8, 9, 10, 11, 12, 13]",120.0,True,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,0.2658,0.0127,0.038,0.1392,0.0127,0.0506,0.0127,0.0127,0.0,0.1646,0.0,0.0,0.0506,0.0253,0.0759,0.0253,0.0253,0.0633,0.0253,0.0,1604.6,313.0,"[13, 13, 13]",0.0,5.0,6.0,4.0,3.0,7.0,2.0,1.0,,,,,1.0,1.0,1.0,,,snub_disphenoid,"(b, X, B, B, X, A)","(11.7, -48.3, -49.9, -49.9, -48.3, -11.7)",0.93,1.0,1.0,1.42,1.43,0.99,6.62,1.31,272.0,2.0,10.0,272.0,2.0,10.0,119.0,2.0,10.0,119.0,2.0,10.0,,,,,,,1.0,"[(0, 5), (6, 4), (3, 7), (2, 
1)]",b4innn_gap_13_8_unrelaxed_rank_001_alphafold2_...,b4innn_gap_13_8_unrelaxed_rank_001_alphafold2_...,PLDPEAVRAWLRRALAELQAEGLATPALVAAVEAHADEIAGADAEG...,0,0.797468,0.0,0.0,0.0,0.0,0.063291,0.012658,0.126582,79,-1193.890078,52.16468,-640.446689,-605.608069,-339.01,-15.92,128.43,-451.51,0.0,-137.5,85.796389,-428.07677,298.871372,0.647023,-108.887467,257.664251,-10.607937,12.686901,-2.272111,-51.741183,-3.54567,-0.896917,0.0,-14.761819,-10.96247,99.849348,4.958428,10.77589,0.0,-114.6134,-3.3313,0.0,-0.500949,-15.112533,0.660312,-8.10692,-7.665925,-4.291266,-0.201519,1.625696,-5.715316,0.0,-1.740506,-5.418693,3.783182,0.00819,-1.378322,3.261573,-0.134278,0.160594,-0.028761,-0.654952,-0.044882,-0.011353,0.0,-0.186858,-0.138765,1.263916,0.062765,0.136404,0.0,b4innn_gap_13_8_unrelaxed_rank_001_alphafold2_...,"[{'center': [-3.181212539340748, 4.12834057350...",b4innn,"[[-0.8027873906215266, 0.5962651908824997, -0....",11.732763,"[64.1180155664314, -114.43015749180279, 27.845...",1.047217,2.199629,0.037772,"[(0, 0), (3, 1), (2, 3), (1, 4)]","[{'center': [-2.3812155933308787, 4.0465745631...",0.0,1.519368,True,b4innn_gap_13_8,,,,,,,,,MGSSHHHHHHSSGENLYFQSGSPLDPEAVRAWLRRALAELQAEGLA...,10744.80638,12660,0.623762,True,True,True,medium,False,,,,,,,,,,,,1,False,,,,
7,A8,no_disulfide_b4nnnnx,ATGGGCAGCAGCCATCATCATCATCATCACAGCAGCGGCGAGAACT...,b4nnnnx,24.284507,3.605634,-129.296705,-1.82108,4.2,-12.148349,-12.148349,8860.65328,71,90.073239,3.399583,0.72,0.73,0.79779,0.42538,0.880839,0.940639,0.745587,0.694855,3.0,8.0,12.0,True,X,WY,oxygenMathFix,solublempnn,alphafold2,4,4,11.0,WEELEEAVRWLRERLPDLTEEQHIEYIRRYAEEGPDDLSPEVREAL...,17780,8860.65328,---GGGGGGGG-----------GGGGGGGG-----------GGGGG...,32.0,0.0,b4nnnnx_gap_11_4,-HHHHHHHHHHHHH-TT--HHHHHHHHHHHHHH-GGGS-HHHHHHH...,-2.129,-24.650449,53.345048,1.334067,no_disulfide_b4nnnnx,b4nnnnx_gap_11_4_unrelaxed_rank_001_alphafold2...,/home/tadas/code/single_chain_deltaprots/outpu...,best,"[8, 9, 10, 11, 12, 13]",120.0,True,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,0.0563,0.0,0.0423,0.2817,0.0,0.0282,0.0141,0.0563,0.0,0.1268,0.0,0.0,0.0563,0.0141,0.1549,0.0141,0.0141,0.0423,0.0282,0.0704,1724.2,256.0,"[11, 11, 11]",0.0,3.0,2.0,6.0,7.0,4.0,5.0,1.0,,,,,1.0,1.0,1.0,,,snub_disphenoid,"(X, B, D, C, A, X)","(-71.9, -11.7, -70.7, -70.7, -11.7, -71.9)",0.91,0.82,1.0,1.51,1.05,0.9,5.18,1.24,238.0,2.0,10.0,55.0,2.0,10.0,238.0,2.0,10.0,55.0,2.0,10.0,,,,,,,1.0,"[(0, 3), (2, 6), (7, 4), (5, 
1)]",b4nnnnx_gap_11_4_unrelaxed_rank_001_alphafold2...,b4nnnnx_gap_11_4_unrelaxed_rank_001_alphafold2...,WEELEEAVRWLRERLPDLTEEQHIEYIRRYAEEGPDDLSPEVREAL...,0,0.802817,0.0,0.0,0.042254,0.0,0.028169,0.014085,0.112676,71,-1125.2451,64.553678,-720.360623,-469.438155,-300.69,-18.04,158.73,-441.38,0.0,-133.6,94.718734,-420.944075,218.938481,0.736818,-86.819102,267.216628,-10.449288,14.543467,0.0,-41.776484,-3.579936,-1.146395,0.0,-1.204131,-13.61583,183.192164,5.86366,6.770667,0.0,-151.1597,-4.1245,0.0,-0.347189,-15.848523,0.909207,-10.145924,-6.611805,-4.23507,-0.254085,2.235634,-6.21662,0.0,-1.88169,-5.92879,3.083641,0.010378,-1.222804,3.763614,-0.147173,0.204838,0.0,-0.588401,-0.050422,-0.016146,0.0,-0.01696,-0.191772,2.580171,0.082587,0.095362,0.0,b4nnnnx_gap_11_4_unrelaxed_rank_001_alphafold2...,"[{'center': [-5.287766965590257, -2.0788163531...",b4nnnnx,"[[-0.8464541804725815, -0.4575214713946152, 0....",11.99408,"[-2.2058461249126053, -73.76715607946068, 76.0...",1.10664,1.609215,0.003749,"[(3, 0), (1, 1), (0, 2), (2, 4)]","[{'center': [3.627479251494083, 3.565589420445...",0.0,1.153497,True,b4nnnnx_gap_11_4,,,,,,,,,MGSSHHHHHHSSGENLYFQSGSWEELEEAVRWLRERLPDLTEEQHI...,11303.15348,19060,0.612903,True,True,True,low,False,,,,,,,,,,,,1,False,,,,
8,A9,no_disulfide_b4nnnny,ATGGGCAGCAGCCATCATCATCATCATCACAGCAGCGGCGAGAACT...,b4nnnny,24.277465,3.352113,-120.195202,-1.69289,4.5,-7.202815,-7.202815,8651.77758,71,89.287746,3.763206,0.69,0.99,0.72932,0.40897,1.194563,0.977125,0.768718,0.694436,3.0,8.0,12.0,True,X,WY,oxygenMathFix,solublempnn,alphafold2,19,4,11.0,MSREEKIKLLKEKGYNLSREELIKLILEEYGYDTEETKELREKAYE...,10810,8651.77758,---GGGGGGGG-----------GGGGGGGG-----------GGGGG...,32.0,0.0,b4nnnny_gap_11_19,--HHHHHHHHHHHHTTS-HHHHHHHHHHHTT--SGGGHHHHHHHHH...,-2.2877,-25.448277,53.184818,4.388,no_disulfide_b4nnnny,b4nnnny_gap_11_19_unrelaxed_rank_001_alphafold...,/home/tadas/code/single_chain_deltaprots/outpu...,best,"[8, 9, 10, 11, 12, 13]",120.0,True,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,0.0141,0.0,0.0423,0.2394,0.0,0.0282,0.0,0.0704,0.1268,0.169,0.0282,0.0282,0.0,0.0141,0.0563,0.0563,0.0282,0.0282,0.0141,0.0563,1723.7,238.0,"[11, 11, 11]",0.0,1.0,2.0,3.0,7.0,6.0,5.0,4.0,,,,,1.0,1.0,1.0,,,snub_disphenoid,"(B, X, A, A, F, B)","(-49.9, -90.0, -49.9, -49.9, -48.6, -49.9)",0.93,1.0,1.0,1.45,1.32,0.96,6.37,1.29,24.0,2.0,10.0,251.0,3.0,10.0,24.0,2.0,10.0,251.0,3.0,10.0,,,,,,,1.0,"[(0, 1), (2, 3), (7, 6), (5, 
4)]",b4nnnny_gap_11_19_unrelaxed_rank_001_alphafold...,b4nnnny_gap_11_19_unrelaxed_rank_001_alphafold...,MSREEKIKLLKEKGYNLSREELIKLILEEYGYDTEETKELREKAYE...,0,0.690141,0.0,0.0,0.042254,0.0,0.098592,0.056338,0.112676,71,-1154.61908,47.728037,-691.594988,-510.752129,-293.61,-18.64,150.86,-425.84,0.0,-129.5,311.547979,-429.718016,471.732887,0.738913,-88.018843,278.84962,-10.2274,13.644285,-0.167154,-38.769419,-2.303038,-1.515459,0.0,-17.139443,-14.244454,161.041635,2.627676,0.0,0.0,-162.4291,-4.4665,0.0,-0.358426,-16.262241,0.672226,-9.740774,-7.193692,-4.135352,-0.262535,2.124789,-5.997746,0.0,-1.823944,-6.052366,6.644125,0.010407,-1.239702,3.927459,-0.144048,0.192173,-0.002354,-0.546048,-0.032437,-0.021344,0.0,-0.241401,-0.200626,2.268192,0.03701,0.0,0.0,b4nnnny_gap_11_19_unrelaxed_rank_001_alphafold...,"[{'center': [-5.3590771160303134, 5.4315571739...",b4nnnny,"[[-0.4179872945190504, -0.3243719560654371, 0....",11.928266,"[40.17424408645632, 10.658605271260061, 151.32...",0.330799,1.54307,0.024317,"[(3, 0), (1, 1), (0, 2), (2, 3)]","[{'center': [7.418586329004796, -8.36555960435...",0.0,0.634758,True,b4nnnny_gap_11_19,,,,,,,,,MGSSHHHHHHSSGENLYFQSGSMSREEKIKLLKEKGYNLSREELIK...,11094.27778,12090,0.526882,True,True,True,super_high,True,6.2,0.000513,5.689373,18.205994,5.1,2.18,0.00018,2.000457,10.202331,0.168,1.4e-05,1,True,1.0,1.0,2025-04-11,19.4
9,A10,no_disulfide_b5iiiin,ATGGGCAGCAGCCATCATCATCATCATCACAGCAGCGGCGAGAACT...,b5iiiin,24.275,3.0375,-136.490614,-1.706133,4.9,-4.200798,-4.200798,9471.93758,80,88.10325,4.046527,0.69,0.97,0.7962,0.45912,1.091816,0.948716,0.767717,0.687914,3.0,8.0,12.0,True,X,WY,oxygenMathFix,solublempnn,alphafold2,15,5,9.0,MDLDKGLEELIERIKKGEALEELKKFGKEAKNLPKEVKEILEKLEK...,12660,9471.93758,--GGGGGGGG---------GGGGGGGG---------GGGGGGGG--...,40.0,0.05,b5iiiin_gap_9_15,--HHHHHHHHHHHHHTTSSHHHHHHHHHH-SS--HHHHHHHHHHHT...,-2.3249,-49.488881,53.716867,7.510148,no_disulfide_b5iiiin,b5iiiin_gap_9_15_unrelaxed_rank_001_alphafold2...,/home/tadas/code/single_chain_deltaprots/outpu...,best,"[8, 9, 10, 11, 12, 13]",120.0,True,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,0.0375,0.0,0.025,0.25,0.0125,0.0625,0.0,0.0625,0.2125,0.15,0.025,0.025,0.0125,0.0125,0.0125,0.0125,0.0125,0.0375,0.025,0.0125,1942.0,243.0,"[9, 9, 9, 9]",0.0,4.0,5.0,6.0,7.0,9.0,8.0,3.0,2.0,1.0,,,1.0,1.0,1.0,1.0,,gyro_square_bipyramid,"(x, x, b, d, b, x, B, a, x, x)","(45.0, 31.4, 18.5, 60.0, 60.0, 60.0, -45.0, 18...",0.86,0.88,1.0,1.62,1.33,0.95,8.97,1.32,278.0,2.0,10.0,261.0,3.0,10.0,14.0,2.0,10.0,274.0,2.0,10.0,261.0,3.0,10.0,,,,1.0,"[(0, 4), (5, 6), (7, 9), (8, 3), (2, 
1)]",b5iiiin_gap_9_15_unrelaxed_rank_001_alphafold2...,b5iiiin_gap_9_15_unrelaxed_rank_001_alphafold2...,MDLDKGLEELIERIKKGEALEELKKFGKEAKNLPKEVKEILEKLEK...,0,0.7625,0.0,0.0,0.0,0.0,0.0625,0.0625,0.1125,80,-1344.875028,71.357046,-798.970977,-617.261097,-313.31,-26.63,163.63,-450.29,0.0,-153.0,600.811826,-482.069138,756.602341,0.7488,-101.257426,294.543662,-12.626391,12.870107,-2.566982,-44.201104,-2.69459,-0.134327,0.0,-16.131538,-12.312565,222.541111,4.063744,2.386971,0.0,-185.9889,-4.7352,0.0,-0.618611,-16.810938,0.891963,-9.987137,-7.715764,-3.916375,-0.332875,2.045375,-5.628625,0.0,-1.9125,-6.025864,9.457529,0.00936,-1.265718,3.681796,-0.15783,0.160876,-0.032087,-0.552514,-0.033682,-0.001679,0.0,-0.201644,-0.153907,2.781764,0.050797,0.029837,0.0,b5iiiin_gap_9_15_unrelaxed_rank_001_alphafold2...,"[{'center': [2.317663159827137, 7.866123741513...",b5iiiin,"[[0.09078123890288034, -0.5689637171675826, 0....",11.581539,"[-16.860188421192817, 56.69902989118972, 38.77...",0.979916,1.614591,0.025473,"[(0, 0), (3, 1), (4, 2), (2, 3), (1, 4)]","[{'center': [3.081716306286964, 8.073889861402...",0.0,1.038667,True,b5iiiin_gap_9_15,,,,,,,,,MGSSHHHHHHSSGENLYFQSGSMDLDKGLEELIERIKKGEALEELK...,11914.43778,13940,0.598039,True,True,True,medium,False,,,,,,,,,,,,1,False,,,,
10,A11,no_disulfide_b5iinin,ATGGGCAGCAGCCATCATCATCATCATCACAGCAGCGGCGAGAACT...,b5iinin,24.25,3.541667,-151.663192,-1.579825,4.3,-15.1868,-15.1868,11798.28088,96,89.485417,3.621901,0.74,0.89,0.81853,0.39284,0.908544,0.967086,0.627793,0.690057,3.0,8.0,12.0,True,X,WY,oxygenMathFix,solublempnn,alphafold2,19,5,12.0,SREELLELAKKLLEAIKSEELKEEWKELLEEILENGLNEELLKRWE...,28450,11798.28088,----GGGGGGGG------------GGGGGGGG------------GG...,40.0,0.0,b5iinin_gap_12_19,-HHHHHHHHHHHHHH---HHHHHHHHHHHHHHHHH-S-HHHHHHHH...,-2.3183,-43.869211,54.613718,2.064086,no_disulfide_b5iinin,b5iinin_gap_12_19_unrelaxed_rank_001_alphafold...,/home/tadas/code/single_chain_deltaprots/outpu...,best,"[8, 9, 10, 11, 12, 13]",120.0,True,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,0.0312,0.0,0.0104,0.3229,0.0,0.0208,0.0,0.0521,0.1146,0.2396,0.0,0.0208,0.0104,0.0104,0.0625,0.0521,0.0,0.0,0.0521,0.0,2328.0,340.0,"[12, 12, 12, 12]",1.0,5.0,8.0,3.0,7.0,9.0,6.0,2.0,0.0,4.0,,,1.0,1.0,1.0,1.0,,gyro_square_bipyramid,"(X, x, a, D, a, x, b, A, x, x)","(-23.9, 42.2, 45.0, -18.5, 18.5, 23.9, 18.5, -...",0.88,0.9,1.0,1.66,1.44,0.98,9.62,1.43,24.0,2.0,10.0,274.0,2.0,10.0,14.0,2.0,10.0,24.0,2.0,10.0,278.0,2.0,10.0,,,,1.0,"[(1, 5), (8, 3), (7, 9), (6, 2), (0, 
4)]",b5iinin_gap_12_19_unrelaxed_rank_001_alphafold...,b5iinin_gap_12_19_unrelaxed_rank_001_alphafold...,SREELLELAKKLLEAIKSEELKEEWKELLEEILENGLNEELLKRWE...,0,0.854167,0.0,0.0,0.0,0.0,0.03125,0.010417,0.104167,96,-1695.16243,46.434393,-999.8516,-741.745223,-503.83,-23.89,169.84,-649.79,0.0,-210.4,198.152236,-598.212518,463.793109,0.979359,-144.621608,404.667888,-13.092597,19.153792,-1.152761,-69.935546,-3.996659,-0.880125,0.0,-20.065592,-17.093844,207.604743,6.323909,0.330986,0.0,-222.5556,-4.643,0.2087,-0.456971,-17.657942,0.483692,-10.415121,-7.726513,-5.248229,-0.248854,1.769167,-6.768646,0.0,-2.191667,-6.23138,4.831178,0.010202,-1.506475,4.215291,-0.136381,0.199519,-0.012008,-0.728495,-0.041632,-0.009168,0.0,-0.209017,-0.178061,2.162549,0.065874,0.003448,0.0,b5iinin_gap_12_19_unrelaxed_rank_001_alphafold...,"[{'center': [-1.3835912793347955, -11.01719925...",b5iinin,"[[0.1887266418148749, -0.9786573267973812, 0.0...",12.091937,"[81.89205381954399, -135.02194867853137, -6.38...",0.931976,1.72541,0.00319,"[(1, 0), (3, 1), (4, 2), (2, 3), (0, 4)]","[{'center': [2.9262565131167833, -3.6689887869...",0.0,0.777486,True,b5iinin_gap_12_19,,,,,,,,,MGSSHHHHHHSSGENLYFQSGSSREELLELAKKLLEAIKSEELKEE...,14240.78108,29730,0.694915,True,True,True,high,True,6.565,0.000221,3.14466,10.06291,5.1,2.478,8.3e-05,1.186971,6.053553,0.569,1.9e-05,1,False,,,,
11,A12,no_disulfide_b5ininn,ATGGGCAGCAGCCATCATCATCATCATCACAGCAGCGGCGAGAACT...,b5ininn,25.084375,3.03125,-183.494775,-1.911404,5.0,-5.156637,-5.156637,11650.33818,96,90.599688,3.312275,0.77,0.82,0.85373,0.3968,0.837086,0.982297,0.800557,0.669485,3.0,8.0,12.0,True,X,WY,oxygenMathFix,solublempnn,alphafold2,4,5,12.0,IKELVYKTIEKLLENIDKKETAEKWKEYIKWLEEKGLSKEIRDEWI...,20910,11650.33818,----GGGGGGGG------------GGGGGGGG------------GG...,40.0,0.0,b5ininn_gap_12_4,-HHHHHHHHHHHHHTTTSHHHHHHHHHHHHHHHHTT--HHHHHHHH...,-2.3052,-30.173146,55.603912,1.08692,no_disulfide_b5ininn,b5ininn_gap_12_4_unrelaxed_rank_001_alphafold2...,/home/tadas/code/single_chain_deltaprots/outpu...,best,"[8, 9, 10, 11, 12, 13]",120.0,True,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,/home/tadas/code/single_chain_deltaprots/outpu...,0.0521,0.0,0.0521,0.2396,0.0,0.0208,0.0104,0.0833,0.2083,0.125,0.0208,0.0104,0.0,0.0,0.0312,0.0312,0.0208,0.0312,0.0312,0.0312,2408.1,291.0,"[12, 12, 12, 12]",8.0,3.0,2.0,6.0,1.0,0.0,4.0,5.0,9.0,7.0,,,1.0,1.0,1.0,1.0,,gyro_square_bipyramid,"(X, X, A, d, A, x, B, a, X, X)","(-23.9, -42.2, -45.0, 18.5, -18.5, 23.9, -18.5...",0.88,0.9,1.0,1.66,1.44,0.98,9.62,1.43,274.0,2.0,10.0,24.0,2.0,10.0,14.0,2.0,10.0,274.0,2.0,10.0,278.0,2.0,10.0,,,,1.0,"[(8, 3), (2, 6), (1, 0), (4, 5), (9, 
7)]",b5ininn_gap_12_4_unrelaxed_rank_001_alphafold2...,b5ininn_gap_12_4_unrelaxed_rank_001_alphafold2...,IKELVYKTIEKLLENIDKKETAEKWKEYIKWLEEKGLSKEIRDEWI...,0,0.833333,0.0,0.0,0.0,0.0,0.072917,0.020833,0.072917,96,-1707.153417,87.306682,-982.601613,-811.858486,-488.7,-23.86,176.25,-641.09,0.0,-193.3,104.344291,-616.181361,373.499503,1.054175,-150.580468,428.902013,-9.919014,17.410451,-2.678854,-70.263984,-6.836512,-0.884414,0.0,-21.041787,-13.630222,190.134595,7.175648,0.0,0.0,-221.3037,-4.9172,0.0,-0.314304,-17.782848,0.909445,-10.235433,-8.456859,-5.090625,-0.248542,1.835938,-6.678021,0.0,-2.013542,-6.418556,3.89062,0.010981,-1.568547,4.467729,-0.103323,0.181359,-0.027905,-0.731917,-0.071214,-0.009213,0.0,-0.219185,-0.141981,1.980569,0.074746,0.0,0.0,b5ininn_gap_12_4_unrelaxed_rank_001_alphafold2...,"[{'center': [-2.1078966424201067, -5.273012765...",b5ininn,"[[0.9288943063451415, -0.08250362199991125, -0...",11.647762,"[-31.45560482327593, -11.586676983305319, 46.8...",0.578401,1.797818,0.00985,"[(3, 0), (1, 1), (4, 2), (2, 3), (0, 4)]","[{'center': [-6.847071433179565, 2.46609901821...",0.0,0.561221,True,b5ininn_gap_12_4,,,,,,,,,MGSSHHHHHHSSGENLYFQSGSIKELVYKTIEKLLENIDKKETAEK...,14092.83838,22190,0.677966,True,True,True,super_high,True,13.41,0.000604,8.516672,27.253352,5.1,4.93,0.000222,3.131036,15.968285,0.395,1.8e-05,1,True,2.0,1.0,2025-04-14,36.56


In [23]:
# Well positions of every design whose expression level is recorded as "low".
# Single .loc lookup (row mask + column label) instead of chained indexing.
df.loc[df["expression_levels"].isin(["low"]), "Well Position"]


0      A1
2      A3
5      A6
7      A8
12     B1
15     B4
21    B10
26     C3
Name: Well Position, dtype: object

In [None]:
# Choices for large-scale expression

# A12	no_disulfide_b5ininn (super_high)
# A9	no_disulfide_b4nnnny (super_high)
# B8	no_disulfide_h6i_i_i

# A1 no_disulfide_b3iii (low-medium)
# B12	no_disulfide_l5iiin (medium)
# F4	variable_linkers_l6innni	(medium)


In [None]:
p  # NOTE(review): bare name in a never-executed cell; raises NameError on a fresh kernel unless `p` is defined in an earlier cell — looks like a stray keystroke, confirm and delete this cell