# Data Generation for Plots Notebook

This notebook generates the data used to construct the `binding peak` tables and `venn diagrams` for ChIP-pro, as well as other visuals. Before you run the notebook, make sure of the following:

> Make sure to rename the TF in the gff file so that it follows the TF naming convention and not the gene naming convention.

In [30]:
import numpy as np 
import pandas as pd
import glob
import urllib                      
import gzip
from collections import defaultdict

# Show up to 500 columns when a DataFrame is displayed.
pd.set_option('display.max_columns', 500)

# Functions

## Generate Binding peaks 

This function assigns binding peaks to each TF and finds the corresponding gene targets using the `gene_info.csv` table.

In [2]:
def annotate_peaks(TF_name, TF_condition, peak_df,margin,gene_info):
    """Annotate every binding peak with the operons and genes next to it.

    For each row of ``peak_df`` the genes whose ``start_codon_pos`` lies
    strictly within ``margin`` nt of ``binding_peak_start`` are selected and
    grouped by strand.  Within each strand group, genes that are completely
    transcribed before the peak are dropped ('+': ``stop`` must exceed the
    peak position, any other strand: ``start`` must be below it).  The
    operons of the remaining genes, and all genes of ``gene_info`` belonging
    to those operons, are stored as comma-separated strings.

    Parameters
    ----------
    TF_name : str
        Used as prefix of the generated peak ids (``<TF_name>-<n>``) and,
        lower-cased, in the ``condition`` label.
    TF_condition : str
        Appended to the ``condition`` label (``<tf_name> + <TF_condition>``).
    peak_df : pandas.DataFrame
        Peak table; ``binding_peak_start`` and ``condition_name`` are read.
    margin : number
        Half-width of the search window around the peak start.
    gene_info : pandas.DataFrame
        Gene table indexed by locus tag; the columns ``start``, ``stop``,
        ``strand``, ``operon`` and ``start_codon_pos`` are read.

    Returns
    -------
    pandas.DataFrame
        Copy of ``peak_df`` restricted to the columns ``index``,
        ``condition``, ``binding_peak_start``, ``binding_peak_end``,
        ``binding_peak_strength``, ``TU_p``, ``genes_p``, ``TU_m`` and
        ``genes_m`` (``*_p`` for the '+' strand, ``*_m`` otherwise).
    """
    annotated = peak_df.copy()

    for peak_id, peak in annotated.iterrows():
        site = peak['binding_peak_start']

        # Genes whose start codon is strictly closer than `margin` to the peak.
        distance = (gene_info.start_codon_pos - site).abs()
        nearby = gene_info[distance < margin]

        for strand, members in nearby.groupby('strand'):
            on_plus = strand == '+'

            # Discard genes that are completely transcribed before the peak.
            if on_plus:
                members = members[members.stop > site]
            else:
                members = members[members.start < site]

            # Operons still in play, and every gene that belongs to them.
            units = members.operon.unique()
            loci = gene_info[gene_info.operon.isin(units)].index

            suffix = 'p' if on_plus else 'm'
            annotated.loc[peak_id, 'TU_' + suffix] = ','.join(units)
            annotated.loc[peak_id, 'genes_' + suffix] = ','.join(loci)

    # 1-based peak identifiers and one shared condition label per peak.
    n_peaks = peak_df.shape[0]
    annotated['index'] = [TF_name + '-' + str(number)
                          for number in range(1, n_peaks + 1)]
    annotated['condition'] = [TF_name.lower() + " + " + TF_condition
                              for _ in peak_df.condition_name]

    wanted = ['index', 'condition',
              'binding_peak_start', 'binding_peak_end', 'binding_peak_strength',
              'TU_p', 'genes_p', 'TU_m', 'genes_m']
    return annotated.reindex(columns=wanted)

## Validate Binding Peaks 

This function validates every gene target in the gene list already identified for each binding site by the previous function.

In [85]:
def validate_peak_info(df,gene_info):
    """Keep only the candidate target genes that are consistent with a peak.

    For every row of ``df`` the comma-separated locus tags in ``genes_p`` and
    ``genes_m`` are looked up in ``gene_info``.  A gene is kept when

    * it is on the '+' strand and both ``start`` and ``stop`` are greater
      than ``binding_peak_start``, or
    * it is on the '-' strand and both ``start`` and ``stop`` are smaller
      than ``binding_peak_start``, or
    * ``binding_peak_start`` lies strictly between ``start`` and ``stop``.

    Parameters
    ----------
    df : pandas.DataFrame
        Peak table with the columns ``index``, ``condition``,
        ``binding_peak_start``, ``binding_peak_end``,
        ``binding_peak_strength``, ``genes_p`` and ``genes_m``.
    gene_info : pandas.DataFrame
        Gene table indexed by locus tag with the columns ``start``, ``stop``,
        ``strand`` and ``gene_name``.

    Returns
    -------
    pandas.DataFrame
        The five descriptive peak columns plus ``target_locus`` and
        ``target_genes``; both are comma-separated strings and are ``''``
        when a peak has no validated target.

    Raises
    ------
    KeyError
        If a listed locus tag is not present in ``gene_info``.
    """
    def _is_blank(value):
        # Missing cells show up as NaN, as '' or as the literal text 'nan'.
        return pd.isna(value) or value == '' or str(value) == 'nan'

    target_locus = []
    target_genes = []
    # One output entry is produced per input row, so the new columns always
    # line up with the frame even when none of a peak's candidates survives.
    for _, row in df.iterrows():
        peak = row['binding_peak_start']
        loci = []
        names = []
        for gene_field in (row['genes_p'], row['genes_m']):
            if _is_blank(gene_field):
                continue
            for locus in gene_field.split(','):
                # Use the table passed by the caller, not a notebook global.
                gene = gene_info.loc[locus]
                start = gene['start']
                stop = gene['stop']
                strand = gene['strand']
                beyond_peak = ((strand == '+' and start > peak and stop > peak)
                               or (strand == '-' and start < peak and stop < peak))
                spans_peak = ((start < peak and stop > peak)
                              or (start > peak and stop < peak))
                if beyond_peak or spans_peak:
                    loci.append(locus)
                    names.append(gene['gene_name'])
        target_locus.append(','.join(loci))
        target_genes.append(','.join(names))

    # Work on an explicit copy so the caller's frame is never modified.
    df_complete = df.loc[:, ['index', 'condition', 'binding_peak_start',
                             'binding_peak_end', 'binding_peak_strength']].copy()
    df_complete['target_locus'] = target_locus
    df_complete['target_genes'] = target_genes
    return df_complete

# Venn Diagrams

Make sure to update the list of `TF_names` as Ye adds more gff files into the dropbox

In [76]:
def Venn_data_gen(Peak_DF): 
    """Build the Venn-diagram table comparing ChIP targets with known targets.

    The TF name is recovered from the first peak id in ``Peak_DF['index']``
    and used to look up the known targets in the notebook-level ``TRN_data``
    and the evidence sources in ``precise2_TRN``.

    Parameters
    ----------
    Peak_DF : pandas.DataFrame
        Validated peak table; the columns ``index`` and ``target_genes``
        (comma-separated gene names, ``''`` when empty) are read.

    Returns
    -------
    pandas.DataFrame
        Indexed by ``TF``, ``reg_genes``, ``reg_only``, ``chip_genes``,
        ``chip_only``, ``shared_genes`` and ``all_genes`` with two columns:
        ``value`` (the TF name, then the size of each gene list) and ``list``
        (the joined sources, then the gene lists; ``''`` for empty lists).
    """
    # Peak ids have the form "<TF>-<n>"; drop the trailing counter instead of
    # slicing a fixed four characters, which breaks for names such as "Cra".
    # NOTE(review): assumes the ids follow that "<TF>-<n>" pattern and that
    # TRN_data / precise2_TRN are keyed by the same TF spelling - confirm.
    TF_name = str(Peak_DF['index'].iloc[0]).rsplit('-', 1)[0]

    # Flatten the per-peak target strings; blank entries are dropped so that a
    # table without any target does not yield a phantom '' gene.
    # NOTE(review): a gene targeted by several peaks is still listed once per
    # peak, as before - confirm whether the counts should be unique.
    chip_data = [gene
                 for targets in Peak_DF.target_genes
                 if isinstance(targets, str)
                 for gene in targets.split(',')
                 if gene]
    reg_data = TRN_data[TF_name]

    # Sets are only used for fast membership tests; order comes from the lists.
    chip_set = set(chip_data)
    reg_set = set(reg_data)

    all_genes = [gene for gene in chip_data if gene not in reg_set] + reg_data
    reg_only = [gene for gene in all_genes
                if gene in reg_set and gene not in chip_set]
    chip_only = [gene for gene in all_genes
                 if gene in chip_set and gene not in reg_set]
    shared_genes = [gene for gene in all_genes
                    if gene in chip_set and gene in reg_set]

    index_name = ['TF',
                  'reg_genes',
                  'reg_only',
                  'chip_genes',
                  'chip_only',
                  'shared_genes',
                  'all_genes']
    gene_lists = [reg_data, reg_only, chip_data, chip_only, shared_genes, all_genes]

    sources = '; '.join(precise2_TRN.source[precise2_TRN.index == TF_name].unique())
    values = [TF_name] + [len(genes) for genes in gene_lists]
    # Empty gene lists are shown as '' in the output table.
    lists = [sources] + [genes if len(genes) else '' for genes in gene_lists]

    finall = pd.DataFrame({'value': values}, index=index_name)
    finall['list'] = pd.Series(lists, index=index_name, dtype=object)
    return finall

# Binding Width Histograms

In [77]:
def binding_width_gen(TF, peak_df,out_dir): 
    """Save the width of every binding peak as ``<out_dir><TF>_widths.csv``.

    The width is ``binding_peak_end - binding_peak_start + 1``; the CSV has a
    single data column ``binding_width`` and keeps the index of ``peak_df``.
    ``out_dir`` is used as a plain string prefix of the file name.
    """
    span = peak_df.binding_peak_end - peak_df.binding_peak_start + 1
    table = span.to_frame("binding_width")
    destination = "".join([out_dir, TF, '_widths.csv'])
    table.to_csv(destination)

# Peak Position Scatter

In [78]:
def peak_position_gen(TF, final_annot_DF,out_dir, gene_info=None): 
    """Write the position of each peak relative to its target genes.

    Every (peak, target gene) pair becomes one row of
    ``<out_dir><TF>_positions.csv``.  The row holds all columns of the peak
    plus ``gene``, ``normalized_dist`` and ``binding_peak_center``.  With the
    peak center taken as the mean of ``binding_peak_start`` and
    ``binding_peak_end``, ``normalized_dist`` is

    * ``(stop - center) / length`` for genes on the '-' strand,
    * ``(center - start) / length`` otherwise.

    Target names that do not match exactly one row of the gene table
    (including the empty name of a peak without targets) are skipped.

    Parameters
    ----------
    TF : str
        Used in the output file name.
    final_annot_DF : pandas.DataFrame
        Validated peak table; ``binding_peak_start``, ``binding_peak_end``
        and ``target_genes`` (comma-separated gene names) are read.
    out_dir : str
        Plain string prefix of the output file name.
    gene_info : pandas.DataFrame, optional
        Gene table with the columns ``gene_name``, ``strand``, ``start``,
        ``stop`` and ``length``.  Defaults to the notebook-level
        ``DF_gene_info``.
    """
    if gene_info is None:
        gene_info = DF_gene_info

    columns = final_annot_DF.columns.to_list() + ['gene', 'normalized_dist']
    records = []

    # Iterate the rows directly instead of assuming index labels 1..n.
    for _, peak in final_annot_DF.iterrows():
        targets = peak['target_genes']
        if not isinstance(targets, str):
            # Missing value: this peak has no target genes to place.
            continue
        peak_center = np.mean([peak['binding_peak_start'], peak['binding_peak_end']])

        for gene in targets.split(","):
            match = gene_info[gene_info.gene_name == gene]
            if len(match) != 1:
                # Unknown or ambiguous gene name.
                continue
            # Positional access: the gene table is indexed by locus tag.
            if match['strand'].iloc[0] == "-":
                offset = match['stop'].iloc[0] - peak_center
            else:
                offset = peak_center - match['start'].iloc[0]
            # numpy floats keep a zero gene length from raising.
            dist = float(np.float64(offset) / np.float64(match['length'].iloc[0]))
            records.append(peak.to_list() + [gene, dist])

    # Build the frame once rather than growing it row by row.
    peak_scatter_df = pd.DataFrame(records, columns=columns)
    peak_scatter_df['binding_peak_center'] = (peak_scatter_df.binding_peak_start/2
                                              + peak_scatter_df.binding_peak_end/2)
    peak_scatter_df.to_csv(out_dir+TF+'_positions.csv')

# E. coli

In [79]:
# Root folder of the E. coli data; the paths built in the cells below start here.
org_folder = "../data/e_coli/"

In [80]:
# Load the per-TF metadata table; the first CSV column becomes the index.
TF_list = pd.read_csv(org_folder+'TF_list.csv', index_col=0)

# Display the table.
TF_list

Unnamed: 0_level_0,TF,Organism,Strain,Media,Supplement,genome_id,organism_id,num_binding_sites,num_samples,num_cond,project,binding tables,BWcond1_1_name,BWcond1_1,BWcond1_2_name,BWcond1_2,BWcond2_1_name,BWcond2_1,BWcond2_2_name,BWcond2_2,BWcond3_1_name,BWcond3_1,BWcond3_2_name,BWcond3_2,BWcond4_1_name,BWcond4_1,BWcond4_2_name,BWcond4_2
index,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1
0,BaeR,Escherichia coli,K-12 MG1655,LB,EtOH,NC_000913_3,e_coli,,4,1,TCS,EtOH|baer_EtOH_binding_table.json,bio-rep1 – R1,BaeR_R1_S31_R1.bw,bio-rep1 – R2,BaeR_R1_S31_R2.bw,bio-rep2 – R1,BaerR_R2_S32_R1.bw,bio-rep2 – R2,BaerR_R2_S32_R2.bw,,,,,,,,
1,CpxR,Escherichia coli,K-12 MG1655,LB,EtOH,NC_000913_3,e_coli,,2,1,TCS,EtOH|cpxr_EtOH_binding_table.json,R1,CpxRR1_S1_R1.bw,R2,CpxRR2_S2_R2.bw,,,,,,,,,,,,
2,Cra,Escherichia coli,K-12 MG1655,M9,"Fructose, Galactose, or Acetate",NC_000913_3,e_coli,,8,4,known_TF,acetate|cra_acetate_binding_table.json;M9|cra_...,Glu – R1,cra_glu_1.bw,Glu – R2,cra_glu_2.bw,Fru – R1,cra_fru_1.bw,Fru – R2,cra_fru_2.bw,Gal – R1,cra_gal_1.bw,Gal – R2,cra_gal_2.bw,Ace – R1,cra_ace_1.bw,Ace – R2,cra_ace_2.bw
3,Fur,Escherichia coli,K-12 MG1655,M9,Fe or DPD,NC_000913_3,e_coli,,4,2,known_TF,fe|fur_fe_binding_table.json;dpd|fur_dpd_bindi...,Fe – R1,fur_fe_1.bw,Fe – R2,fur_fe_2.bw,DPD – R1,fur_dpd_1.bw,DPD – R2,fur_dpd_2.bw,,,,,,,,
4,GadE,Escherichia coli,K-12 MG1655,M9,,NC_000913_3,e_coli,,2,1,known_TF,M9|gade_M9_binding_table.json,R1,gade_1.bw,R2,gade_2.bw,,,,,,,,,,,,
5,GadW,Escherichia coli,K-12 MG1655,M9,,NC_000913_3,e_coli,,2,1,known_TF,M9|gadw_M9_binding_table.json,R1,gadw_1.bw,R2,gadw_2.bw,,,,,,,,,,,,
6,GadX,Escherichia coli,K-12 MG1655,M9,,NC_000913_3,e_coli,,2,1,known_TF,M9|gadx_M9_binding_table.json,R1,gadx_1.bw,R2,gadx_2.bw,,,,,,,,,,,,
7,KdpE,Escherichia coli,K-12 MG1655,TMA,KCl,NC_000913_3,e_coli,,2,1,TCS,KCl|kdpe_KCl_binding_table.json,R1,KdpeE_R2_S34_R1.bw,R2,KdpeE_R2_S34_R2.bw,,,,,,,,,,,,
8,PhoB,Escherichia coli,K-12 MG1655,M9P,,NC_000913_3,e_coli,,4,1,TCS,M9P|phob_M9P_binding_table.json,bio-rep1 – R1,PhoB_1_S16_R1.bw,bio-rep1 – R2,PhoB_1_S16_R2.bw,bio-rep2 – R1,PhoB_2_S6_R1.bw,bio-rep2 – R2,PhoB_2_S6_R2.bw,,,,,,,,
9,RpoB,Escherichia coli,K-12 MG1655,M9,Fe or DPD,NC_000913_3,e_coli,,4,2,known_TF,fe|rpob_fe_binding_table.json;dpd|rpob_dpd_bin...,Fe – R1,rpob_fe1.bw,Fe – R2,rpob_fe2.bw,DPD – R1,rpob_dpd1.bw,DPD – R2,rpob_dpd2.bw,,,,,,,,


In [81]:
# Reference genome whose annotation tables are loaded below.
strain = 'NC_000913_3'

# Gene table; the first CSV column becomes the index.
DF_gene_info = pd.read_csv(org_folder+strain+'/annotation/gene_info.csv',index_col=0)

# The start codon sits at `start` for '+' strand genes and at `stop` otherwise.
DF_gene_info['start_codon_pos'] = DF_gene_info['start'].where(
    DF_gene_info['strand'] == '+', DF_gene_info['stop'])

# Regulatory network table from the same annotation folder.
TRN = pd.read_csv(org_folder+strain+'/annotation/trn.csv',index_col=0)

# Display the gene table.
DF_gene_info

Unnamed: 0,start,stop,strand,gene_name,length,operon,cog,start_codon_pos
b0001,189,255,+,thrL,66,thrLABC,No COG Annotation,189
b0002,336,2799,+,thrA,2463,thrLABC,No COG Annotation,336
b0003,2800,3733,+,thrB,933,thrLABC,Amino acid transport and metabolism,2800
b0004,3733,5020,+,thrC,1287,thrLABC,Amino acid transport and metabolism,3733
b0005,5233,5530,+,yaaX,297,yaaX,Function unknown,5233
...,...,...,...,...,...,...,...,...
b4399,4636695,4638120,+,creC,1425,creABCD,Signal transduction mechanisms,4636695
b4400,4638177,4639530,+,creD,1353,creABCD,Defense mechanisms,4638177
b4401,4639589,4640306,-,arcA,717,arcA,Signal transduction mechanisms,4640306
b4402,4640401,4640542,+,yjjY,141,yjjY,Function unknown,4640401


In [84]:
# For every TF in TF_list: find its curated .gff peak files, record the
# resulting binding-table names in TF_list, and write the binding table,
# binding-width and peak-position files for each curated file.
for TF_index in range(len(TF_list)):

    TF_name= TF_list.TF[TF_index].lower()
    strain = TF_list.genome_id[TF_index]

    #find files and format
    curated_loc = glob.glob(org_folder+strain+"/curated_input/"+TF_name+"_*.gff")
    curated_files = [i.split("/")[-1] for i in curated_loc]
    # The condition is the second "_"-separated token of the file name.
    curated_cond = [i.split("_")[1] for i in curated_files]
    table_string =";".join([cond+"|"+TF_name+"_"+cond+'_binding_table.json' for cond in curated_cond])
    TF_list.loc[TF_index, 'binding tables'] = table_string
    TF_list.loc[TF_index, 'num_cond'] = len(curated_loc)
    
    #write plot data files to folders
    # NOTE(review): the width and position files are named after the TF only,
    # so a TF with several conditions keeps just the last one - confirm.
    for file_index, file in enumerate(curated_files):
        try:
            df = pd.read_csv(org_folder+strain+"/curated_input/"+file,index_col=0, 
                                     delimiter='\t', header=None, 
                                     names = ['ref','condition', 'condition_name', 
                                              "binding_peak_start",'binding_peak_end', 
                                              'binding_peak_strength', 'direction', '.','ID'])
            # Number the peaks 1..n.
            df = df.set_index(pd.Series(range(1,len(df)+1)))
            peak_annot_DF = annotate_peaks(TF_list.TF[TF_index], curated_cond[file_index], df, 500, DF_gene_info)
            final_annot_DF = validate_peak_info(peak_annot_DF,DF_gene_info)
            final_annot_DF.to_json(org_folder+strain+"/table/"+TF_name+"_"+curated_cond[file_index]+'_binding_table.json',orient='records')
            binding_width_gen(TF_list.TF[TF_index], df, org_folder+strain+"/binding_widths/")
            peak_position_gen(TF_list.TF[TF_index], final_annot_DF, org_folder+strain+"/positions/")
        except Exception as err:
            # Keep processing the remaining files, but say which one failed
            # and why instead of dropping the error silently.
            print("Skipping {}: {}: {}".format(file, type(err).__name__, err))
            continue

['raiA' 'pheLA']
['raiA' 'pheLA']
['arfA' 'yhdN-zntR']
['rpsLG-fusA-tufA' 'yheO-tusDCB']
['yiaG' 'cspA']
['yjfN' 'bsmA']
['yjfN' 'bsmA']
['topAI-yjhQ' 'yjhX']
[nan, 'b0071,b0072,b0073,b0074,b0075']
[nan, 'b0071,b0072,b0073,b0074,b0075']
['b0150,b0151,b0152,b0153', nan]
[nan, nan]
[nan, nan]
[nan, 'b0281']
[nan, 'b0610']
[nan, 'b0610']
[nan, 'b0613,b0614,b0615,b0616,b0617,b0618']
['b0623', nan]
['b0623', nan]
['b0681,b0682', nan]
[nan, 'b0683,b4637,b0684']
[nan, 'b0720']
['b0733,b0734', nan]
['b0972,b0973,b0974,b0975,b0976,b0977', 'b0970']
[nan, 'b1521']
[nan, 'b1521']
['b1655', 'b1654']
['b1661', nan]
['b1677', nan]
[nan, 'b1743']
[nan, 'b1743']
[nan, 'b1743']
[nan, 'b1838']
[nan, nan]
[nan, 'b1908']
[nan, 'b1908']
[nan, 'b1908']
[nan, 'b1908']
[nan, nan]
['b1982', nan]
['b1982', nan]
['b2074,b2075,b2076,b2077,b2078,b2079', 'b4668']
['b2074,b2075,b2076,b2077,b2078,b2079', 'b4668']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b209

['b0150,b0151,b0152,b0153', nan]
[nan, nan]
['b1242', 'b1241']
['b1676', 'b1675']
[nan, 'b1777']
['b1779,b1780', 'b1778']
['b1817,b1818,b1819', 'b1816']
[nan, 'b1908']
['b2170', 'b2167,b2168,b2169']
[nan, 'b2181']
[nan, 'b2181']
[nan, 'b2276,b2277,b2278,b2279,b2280,b2281,b2282,b2283,b2284,b2285,b2286,b2287,b2288']
['b2389', 'b2388']
['b2415,b2416,b2417', nan]
['b2448,b2449', nan]
[nan, 'b2556']
[nan, nan]
[nan, 'b2787,b2788,b2789']
[nan, 'b2925,b2926,b2927']
['b3710', nan]
['b3800', nan]
[nan, nan]
['b3916', nan]
[nan, 'b3919']
[nan, nan]
['b0150,b0151,b0152,b0153', nan]
['b0217', nan]
[nan, '']
[nan, 'b0281']
[nan, nan]
[nan, 'b0930']
['b1242', 'b1241']
[nan, 'b1521']
['b1667', 'b1664']
[nan, 'b1777']
[nan, 'b1908']
['b1978', nan]
[nan, 'b1985']
[nan, 'b1988']
['b2170', 'b2167,b2168,b2169']
['b2398,b2399', 'b2395']
[nan, nan]
['b2415,b2416,b2417', nan]
['b2448,b2449', nan]
[nan, 'b2556']
[nan, 'b2790,b2791,b2792']
[nan, 'b2813']
[nan, 'b2925,b2926,b2927']
['b3093', 'b3091,b3092']
['b3

['b2912', nan]
['b2912', nan]
['b3008', 'b3005,b3006']
['b3065,b3066,b3067', 'b3064']
['b3093', 'b3091,b3092']
['b3094', nan]
[nan, 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
[nan, 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
['b3172', 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
['b3172', 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
[nan, 'b3230,b3231']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3339,b3340,b3341,b3342']
[nan, 'b3376,b3377,b3378,b3379,b3380,b3381']
[nan, nan]
[nan, nan]
[nan, nan]
['b3441', 'b3440']
['b3501,b3502,b3503', 'b4613']
['b3536,b3537,b3538', nan]
['b3555,b3556', nan]
['b3556', nan]
['b3556', nan]
[nan, 'b3635,b3636,b3637,b3638']
['b3703,b3704', nan]
['b3710', nan]
['b3715', 'b3714']
[nan, 'b3754,b3755']
['b3766,b4669,b4488_1,b4488_2,b3769,b3770,b3771,b3772', 'b3765']
['b3829', 'b3828']
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
[nan, 'b4005,b4006']
['b4050', nan]
['

['b0910,b0911,b0912,b0913,b0914,b0915,b0916', nan]
['b0917,b0918', nan]
['b0925', nan]
['b0926,b0927', nan]
[nan, 'b0928']
[nan, 'b0929']
[nan, 'b0929']
[nan, 'b0929']
[nan, 'b0929']
[nan, 'b0929']
[nan, 'b0930']
['b0932', 'b0931']
['b0932', 'b0931']
['b0945', nan]
['b0945', nan]
['b0946', nan]
['b0946', nan]
['b0950,b0951,b0952', nan]
['b0953', nan]
[nan, 'b0954']
[nan, nan]
['b0956', 'b0955']
[nan, 'b0957']
[nan, 'b0957']
[nan, 'b0957']
[nan, 'b0957']
[nan, 'b0957']
[nan, 'b0957']
['b0959', 'b0958']
['b0959', 'b0958']
[nan, 'b0966']
[nan, 'b0966']
[nan, 'b0966']
[nan, 'b0970']
['b0972,b0973,b0974,b0975,b0976,b0977', 'b0970']
['b4516,b0988', 'b0984,b0985,b0986,b0987']
[nan, nan]
[nan, '']
[nan, '']
['b0990', 'b0989']
['b0996,b0997,b0998', 'b0995']
['b0996,b0997,b0998', 'b0995']
['b1001', 'b0999,b1000']
['b1001', 'b0999,b1000']
['b1001', 'b0999,b1000']
['b1001', nan]
['b1001', nan]
['b4518', 'b1003,b1004']
['b1020', nan]
['b1020', nan]
[nan, 'b1021,b1022,b1023,b1024']
['b1025', 'b1021,

[nan, 'b1891,b1892']
[nan, nan]
[nan, 'b1896,b1897']
[nan, 'b1896,b1897']
[nan, 'b4460,b1900,b1901']
['b1902', nan]
['b1902', nan]
['b1902', nan]
['b1904', 'b4537']
['b1904', 'b4537,b4663']
['b1905', nan]
['b1905', nan]
['b1907', 'b1906']
[nan, 'b1908']
[nan, nan]
[nan, 'b1912']
['b1915', 'b1913,b1914']
['b1915', 'b1913,b1914']
[nan, 'b1916']
[nan, 'b1920,b1921,b1922']
[nan, nan]
[nan, nan]
[nan, nan]
['b1929,b1930', 'b1928']
['b1932', nan]
['b1936', 'b4495_3,b4495_2']
['b1936', 'b4495_3,b4495_2,b4495_1']
['b1953', 'b1952']
['b1955', 'b1952']
['b1955', 'b1952']
['b1955', nan]
[nan, 'b1956']
[nan, 'b1956']
[nan, 'b1956,b1957']
['b1959', 'b1958']
['b1959', 'b1958']
[nan, 'b1962,b1963']
['b1967', nan]
['b1967', nan]
['b1967', nan]
['b1971,b1972', nan]
['b1973', nan]
['b1973', nan]
['b1974', nan]
['b1974', nan]
['b1976', nan]
[nan, nan]
['b1978', nan]
['b1978', nan]
[nan, nan]
[nan, nan]
['b1981', 'b4497']
['b1981', 'b4497']
['b1982', nan]
['b1983', nan]
[nan, nan]
[nan, 'b1985']
[nan, 'b1

['b2837', 'b2835,b2836']
['b2846', nan]
['b2847,b2848', '']
['b2850_1,b2850_2', 'b4683,b2849']
['b2851', nan]
['b2851', nan]
['b2853,b2854_1,b2854_2', nan]
[nan, 'b2858_2,b2858_1,b2859,b2860,b2861']
[nan, 'b2863']
[nan, 'b2863']
['b2866,b2867,b2868', 'b2865']
['b2866,b2867,b2868', 'b2865']
['b2877', 'b2876']
['b2877', 'b2876']
['b2889', nan]
[nan, 'b2890,b2891_2,b2891_1,b2892,b2893,b2894']
['b2895', 'b2890,b2891_2,b2891_1,b2892,b2893,b2894']
['b2898', 'b2896,b2897']
['b2898', 'b2896,b2897']
[nan, 'b2903,b2904,b2905']
['b2910', 'b2906,b2907,b2908,b2909']
['b2910', 'b2906,b2907,b2908,b2909']
['b2912', 'b2906,b2907,b2908,b2909']
[nan, '']
[nan, 'b2913']
['b2916', 'b2914']
[nan, 'b2922']
[nan, 'b2924']
[nan, 'b2925,b2926,b2927']
[nan, 'b2925,b2926,b2927']
[nan, 'b2925,b2926,b2927']
[nan, 'b2928,b2929,b2930,b4465,b2933,b2934']
['b2936', 'b2935']
[nan, 'b2937,b2938']
['b2940', 'b2937,b2938']
['b2942', nan]
['b2942', nan]
['b2943', nan]
[nan, nan]
[nan, 'b2958']
[nan, 'b2958']
[nan, nan]
[nan

['b3660', nan]
['b4555', 'b3661']
['b4555', 'b3661']
[nan, 'b3662']
['b4618', 'b3667,b3668,b3669,b3670,b3671,b3672']
['b4618', 'b3667,b3668,b3669,b3670,b3671,b3672']
['b3677', 'b3674,b3675,b3676']
['b3680', 'b3678,b3679']
['b3688', 'b3686,b3687']
['b3688', 'b3686,b3687']
['b3688', 'b3686,b3687']
['b3696', 'b3691,b4478,b4477,b3693,b4479']
[nan, nan]
[nan, 'b3698']
[nan, 'b3699']
[nan, 'b3700,b3701,b3702']
['b3703,b3704', 'b3700,b3701,b3702']
['b3703,b3704', 'b3700,b3701,b3702']
['b3703,b3704', 'b3700,b3701,b3702']
['b3703,b3704', 'b3700,b3701,b3702']
['b3703,b3704', nan]
['b3707,b3708,b3709', nan]
['b3712,b3713', nan]
['b3715', 'b3714']
['b3716,b3717', nan]
['b3716,b3717', nan]
[nan, nan]
[nan, 'b3729,b3730']
[nan, 'b3731,b3732,b3733,b3734,b3735,b3736,b3737,b3738,b3739']
[nan, 'b3740,b3741,b3742,b3743']
[nan, 'b3740,b3741,b3742,b3743']
['b3747', 'b3745,b3746']
['b3748,b3749,b3750,b3751,b3752,b3753', nan]
[nan, 'b3754,b3755']
[nan, 'b3754,b3755']
[nan, nan]
['b3764', 'b4480']
['b3766,b46

['hokB' 'mokB']
['hokB' 'mokB']
['ydcH' 'rimL']
['ortT' 'ydcY']
['ortT' 'ydcY']
['maeA' 'bdm-sra']
['rspAB' 'ynfA']
['blr' 'cnu']
['cnu' 'ydgK-rsxABCDGE-nth']
['cnu' 'ydgK-rsxABCDGE-nth']
['ydhF' 'ydhL']
['ydhP' 'ynhF']
['ydhP' 'ynhF']
['ydhR' 'ydhS']
['ydiZ' 'yniA']
['yebO' 'mgrB']
['yebO' 'mgrB']
['yebV' 'yebW']
['holE' 'yobB-exoX']
['holE' 'yobB-exoX']
['yebF' 'yebG']
['ruvAB' 'yobI']
['yecJ' 'azuC']
['yedMN_2N_3' 'yedN_1']
['dgcQ' 'yodC']
['insH-8' 'yejO']
['menFDHBCE' 'elaB']
['bamB-der' 'yfgM']
['bamB-der' 'yfgM']
['trxC' 'yfiP-patZ']
['yfiL' 'yfiR-dgcN-yfiB']
['gshA' 'yqaBA']
['ispDF' 'ftsB']
['yqcG' 'ygcG']
['yqcG' 'ygcG']
['ygdR' 'tas']
['yqeL' 'yqeK']
['ygeI' 'pbl']
['yqjF' 'yqjG']
['yraH' 'yraIJK']
['yhdE' 'mreBCD']
['yhdE' 'mreBCD']
['rpsLG-fusA-tufA' 'yheO-tusDCB']
['rpsLG-fusA-tufA' 'yheO-tusDCB']
['greB' 'yhgF']
['yhiS_1' 'slp-dctR']
['yhiS_1' 'slp-dctR']
['bcsQ' 'yhjR']
['bcsQ' 'yhjR']
['bcsQ' 'yhjR']
['yiaG' 'cspA']
['glyQS' 'ysaB']
['yihI' 'hemN']
['cpxPQ' 'fieF']
['h

['b0828,b0829,b0830,b0831,b0832', 'b0826,b0827']
['b0833,b0834', nan]
['b0836', 'b0835']
['b0839', 'b0838']
['b0842', 'b0841']
[nan, nan]
[nan, nan]
['b0848', 'b0847']
['b0848', 'b0847']
['b0848', 'b0847']
['b0850,b0851,b0852,b0853', 'b0849']
['b0854,b0855,b0856,b0857', nan]
[nan, 'b0861,b0862,b0863,b0864']
['b0866,b0867', 'b0865']
['b0876', 'b0875']
['b0876', 'b0875']
['b0876', 'b0875']
['b0878,b0879', 'b0877']
[nan, nan]
[nan, '']
['b0881,b0882', 'b0880']
[nan, '']
[nan, '']
[nan, 'b0884']
[nan, 'b0884']
[nan, 'b0885']
['b0889', nan]
['b0890', nan]
['b0890', nan]
['b0898', 'b0897']
['b0899', nan]
[nan, 'b0902']
[nan, 'b0903,b0904']
[nan, 'b0903,b0904']
[nan, 'b0903,b0904']
['b0906', 'b0905']
['b0910,b0911,b0912', nan]
['b0910,b0911,b0912', nan]
['b0910,b0911,b0912', nan]
['b0917,b0918', nan]
['b0925', nan]
['b0926,b0927', nan]
[nan, 'b0928']
[nan, 'b0928']
[nan, 'b0929']
[nan, 'b0929']
[nan, 'b0929']
[nan, 'b0930']
['b0932', 'b0931']
['b0932', 'b0931']
['b0945', nan]
['b0946', nan]
[

[nan, nan]
[nan, 'b1860,b1861']
['b1862', 'b1860,b1861,b4677']
['b1867,b1868', 'b1866']
['b1867,b1868', 'b1866']
['b1869,b1870,b1871', nan]
[nan, 'b1872,b1873']
[nan, nan]
['b1876', 'b1874,b1875']
['b1877', nan]
[nan, 'b1891,b1892']
[nan, nan]
[nan, 'b1896,b1897']
[nan, 'b1896,b1897']
[nan, 'b4460,b1900,b1901']
['b1902', nan]
['b1902', nan]
['b1904', 'b4537,b4663']
['b1907', 'b1906']
[nan, nan]
['b1915', 'b1913,b1914']
[nan, 'b1916']
[nan, 'b1916']
[nan, 'b1920,b1921,b1922']
[nan, nan]
[nan, nan]
[nan, nan]
['b1929,b1930', 'b1928']
['b1931', nan]
['b1932', nan]
['b1936', 'b4495_3,b4495_2,b4495_1']
['b1953', 'b1952']
['b1955', 'b1952']
['b1955', nan]
[nan, 'b1956']
[nan, 'b1956,b1957']
['b1959', 'b1958']
[nan, 'b1962,b1963']
[nan, 'b1962,b1963']
['b1967', nan]
['b1967', nan]
['b1971,b1972', nan]
['b1976', nan]
['b1978', nan]
[nan, nan]
['b1982', nan]
['b1983', nan]
[nan, nan]
[nan, nan]
[nan, 'b1985']
[nan, 'b1985']
[nan, 'b1985']
[nan, 'b1988']
[nan, 'b1990']
[nan, 'b4640_1']
['b4582_1

['b3073', 'b3072']
['b3088', nan]
['b3089', nan]
['b3094', nan]
['b3095,b3096', nan]
['b3095,b3096', nan]
['b3097,b3098,b3099,b3100', nan]
['b3101,b3102', nan]
['b3103', nan]
['b3103', nan]
['b3104', nan]
['b3106,b3107', 'b3105']
['b3120,b3121', nan]
[nan, nan]
['b3142,b3143,b3144,b3145', nan]
[nan, nan]
['b3153', 'b3152']
[nan, 'b3163']
[nan, 'b3163']
[nan, 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
[nan, 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
['b3172', 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
['b3172', 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
[nan, 'b3175']
[nan, 'b3175']
[nan, 'b3178,b3179']
['b3180', 'b3178,b3179']
['b3180', 'b3178,b3179']
['b3180', 'b3178,b3179']
['b3180', 'b3178,b3179']
['b3180', 'b3178,b3179']
['', nan]
['b3182', 'b3181']
['b3182', 'b3181']
['b3187', 'b3183,b3184,b3185,b3186']
['b3187', 'b3183,b3184,b3185,b3186']
['b3196,b3197,b3198,b3199,b3200,b3201,b3202,b3203,b3204,b3205,b3206', 'b3191,b3192,b3193,b3194,b3195']
['b3196,b3197,b3198,b3199,b3200,

[nan, 'b3919']
[nan, 'b3925,b3926,b3927']
['b3928', 'b3925,b3926,b3927']
[nan, 'b3929,b3930']
[nan, 'b3931,b3932']
['b3936', 'b3935']
['b3939,b3940', 'b3938']
['b3942', nan]
[nan, 'b3955']
['b3963,b3964', 'b3962']
['b3963,b3964', 'b3962']
['b3963,b3964', 'b3962']
['b3963,b3964', 'b3962']
[nan, 'b3965']
['b3966,b3967', nan]
[nan, nan]
[nan, nan]
['b3972,b3973', nan]
[nan, 'b3974']
[nan, 'b3974']
['b3981,b3982', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
[nan, nan]
[nan, 'b3990,b3991,b4407,b3992,b3993,b3994']
['b3996,b3997,b3998', nan]
['b4000,b4001', nan]
[nan, 'b4005,b4006']
[nan, 'b4005,b4006']
[nan, nan]
['b4013', 'b4012']
['b4014,b4015,b4016', nan]
[nan, 'b4023']
['b4025', 'b4024']
['b4025', 'b4024']
['b4039,b4040', nan]
['b4042', 'b4041']
['b4045', nan]
['b4047,b4048', 'b4046']
['b4049', nan]
['b4050', nan]
['b4056,b4057', nan]
['b4059', 'b4058']
['b4059', 'b4058']
['b4061', 'b4060']
['

[nan, 'b3292,b3293,b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298,b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, nan]
[nan, nan]
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300

['yaaY' 'ribF-ileS-lspA-fkpB-ispH']
['yaaY' 'ribF-ileS-lspA-fkpB-ispH']
['ybaN' 'apt']
['ybaN' 'apt']
['yceQ' 'rluC']
['proQ-prc' 'msrC']
['ypjD' 'yfjD']
['zapA' 'ssrS-fau']
['ibsD' 'ibsE']
['sspAB' 'rplM-rpsI']
['yhdN-zntR' 'rpsMKD-rpoA-rplQ']
['rpsMKD-rpoA-rplQ' 'rplNXE-rpsNH-rplFR-rpsE-rpmD-rplO-secY-rpmJ']
['rplNXE-rpsNH-rplFR-rpsE-rpmD-rplO-secY-rpmJ'
 'rpsJ-rplCDWB-rpsS-rplV-rpsC-rplP-rpmC-rpsQ']
['rplNXE-rpsNH-rplFR-rpsE-rpmD-rplO-secY-rpmJ'
 'rpsJ-rplCDWB-rpsS-rplV-rpsC-rplP-rpmC-rpsQ']
['rpsLG-fusA-tufA' 'yheO-tusDCB']
['rpsLG-fusA-tufA' 'yheO-tusDCB']
['bcsQ' 'yhjR']
['yiaG' 'cspA']
['cspA' 'insJ']
['glmUS' 'atpIBEFHAGDC']
['trxA' 'rhoL-rho']
['thiCEFSGH' 'rsd']
['yjdQ_2' 'yjdQ_1']
['yjdQ_2' 'yjdQ_1']
['ecnAB' 'sugE']
['b0001,b0002,b0003,b0004', nan]
['b0001,b0002,b0003,b0004', nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b0001,b0002,b0003,b0004', nan]
['b0001,b0002,b0003,b0004', nan]
['b0001,b0002,b0003,b0004', nan]
[nan, nan]
[nan, nan]
['b0024,b0025,b0026,b0027,b0028,b0029', 'b

[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298,b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b33

['b0081,b0082,b0083,b0084,b0085,b0086,b0087,b0088,b0089,b0090,b0091,b0092,b0093,b0094,b0095,b0096', nan]
['b0104', 'b0101,b0102,b0103']
[nan, 'b0281']
[nan, 'b0428,b0429,b0430,b0431,b0432']
['b1201', 'b1198,b1199,b1200']
['b1343', nan]
[nan, 'b1521']
[nan, 'b1908']
[nan, 'b1985']
['b2172', nan]
['b2175', nan]
[nan, 'b2400']
['b2448,b2449', nan]
[nan, 'b2579']
['b2673,b2674,b2675,b2676', nan]
[nan, 'b2790,b2791,b2792']
[nan, 'b2813']
[nan, 'b2863']
['b3011,b3012', 'b3010']
['b3093', 'b3091,b3092']
['b3172', 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
[nan, 'b3211']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3311,b3312,b3313,b3314,b3315,b3316,b3317,b3318,b3319,b3320,b3321']
[nan, 'b3339,b3340,b3341,b3342']
['b3364', 'b3363']
['b3364', 'b3363']
[nan, 'b3376,b3377,b3378,b3379,b3380,b3381']
['b3441', 'b3440']
['b3521', 'b3520']
['b3556', nan]
['b3800', nan]
[nan, nan]
['b4271', 'b4269']
['b4322,b4323', 'b4321']
['b4381,b4382,b4383,b4384', nan]


['ilvIH' 'cra']
['ilvIH' 'cra']
['sfsA-dksA-gluQ' 'thpR']
['gpt' 'frsA']
['ecpBCDE' 'ecpA']
['yahB' 'yahC']
['yahB' 'yahC']
['ppnP' 'ykiA']
['maa' 'tomB-hha']
['hokE' 'insL-2']
['hokE' 'insL-2']
['fldA-uof-fur' 'ybfE']
['ybfQ' 'ybfL']
['fiu' 'mcbA']
['fiu' 'mcbA']
['opgE' 'rybA-mntS']
['bssR' 'yliI']
['bssR' 'yliI']
['deoR' 'ybjG']
['potFGHI' 'ybjO-rlmC']
['potFGHI' 'ybjO-rlmC']
['csgBAC' 'ymdAB-clsC']
['csgBAC' 'ymdAB-clsC']
['solA-yceO' 'bssS']
['yceQ' 'rluC']
['yceQ' 'rluC']
['pinE' 'mcrA']
['ymgJ' 'ycgI_1' 'ycgI_2']
['ymgGD' 'ymgI']
['ycgI_1' 'ycgI_2']
['ycgL' 'ycgM']
['ymgE' 'ycgY']
['purU' 'ychJ']
['cybB' 'ydcA']
['ortT' 'ydcY']
['ortT' 'ydcY']
['yncM' 'ydcC']
['gnsB' 'ynfN']
['cspI' 'essQ-ydfR-rrrQ-rzpQ' 'rzoQ']
['asr' 'ydgU' 'ydgD']
['ydhF' 'ydhL']
['ydhR' 'ydhS']
['ydhR' 'ydhS']
['ydiU' 'ydiV']
['ydiZ' 'yniA']
['ydiZ' 'yniA']
['yeaK' 'yeaL']
['yeaK' 'yeaL']
['yoaK' 'yoaJ']
['yoaK' 'yoaJ']
['yeaR-yoaG' 'leuE']
['fadD-sroD' 'tsaB-yeaY']
['yebO' 'mgrB']
['yebO' 'mgrB']
['yebO' 'm

['b0950,b0951,b0952', nan]
['b0950,b0951,b0952', nan]
[nan, nan]
['b0953', nan]
['b0953', nan]
[nan, 'b0957']
[nan, 'b0963']
[nan, 'b0966']
['b0972,b0973,b0974,b0975,b0976,b0977', 'b0970']
[nan, 'b0981,b0982,b0983']
[nan, nan]
[nan, 'b0984,b0985,b0986']
['b0991,b4517', nan]
['b0991,b4517', nan]
['', nan]
['', nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b0996,b0997,b0998', nan]
[nan, 'b0999,b1000']
['b1001', 'b0999,b1000']
['b1001', 'b0999,b1000']
['b1001', 'b0999,b1000']
['b1001', 'b0999,b1000']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b1002', nan]
['b1002', nan]
['b1002', nan]
[nan, nan]
['b1013', 'b1006,b1007,b1008,b1009,b1010,b1011,b1012']
[nan, nan]
[nan, nan]
['b1020', nan]
[nan, 'b1021,b1022,b1023,b1024']
[nan, 'b1021,b1022,b1023,b1024']
[nan, nan]
[nan, nan]
['b1033', nan]
['b1033', nan]
['b1033', nan]
['b1041,b1042,b1043', nan]
['b1041,b1042,b1043,b1044,b1045,b1046', nan]
['b1041,b1042,b1043,b1044,b1045,b1046', nan]
['b1044,b1045,b1046', nan]
['b1044,b1045,b1046', nan]
[nan, n

[nan, 'b1874,b1875']
[nan, 'b1874,b1875']
['b1876', 'b1874,b1875']
[nan, 'b1881,b1882,b1883,b1884,b1885,b1886']
[nan, nan]
[nan, 'b1881,b1882,b1883,b1884,b1885,b1886']
[nan, nan]
[nan, 'b1887,b1888,b1889,b1890']
[nan, 'b1887,b1888,b1889,b1890']
[nan, 'b1887,b1888,b1889,b1890']
[nan, nan]
[nan, 'b1896,b1897']
[nan, 'b1896,b1897']
[nan, 'b1896,b1897']
[nan, 'b4460,b1900,b1901']
[nan, 'b4460,b1900,b1901']
['b1902', 'b4460,b1900,b1901']
['b1902', nan]
['b1902', nan]
['b1904', 'b4537,b4663']
['b1904', 'b4537,b4663']
['b1904,b1905', 'b4663']
['b1905', nan]
['b1905', '']
['b1907', 'b1906']
[nan, nan]
[nan, 'b1908']
[nan, 'b1908']
[nan, nan]
[nan, 'b1912']
[nan, 'b1913,b1914']
['b1915', 'b1913,b1914']
['b1915', 'b1913,b1914']
['b1915', 'b1913,b1914']
['', nan]
[nan, 'b1916']
[nan, 'b1916']
[nan, 'b1917,b1918,b1919']
[nan, 'b1917,b1918,b1919']
[nan, 'b1920,b1921,b1922']
[nan, 'b1920,b1921,b1922']
[nan, 'b1920,b1921,b1922']
[nan, nan]
['b1929,b1930', 'b1928']
['b1929,b1930', 'b1928']
['b1931,b19

['b2603,b2604,b2605', nan]
[nan, 'b2606,b2607,b2608,b2609']
[nan, 'b2606,b2607,b2608,b2609']
[nan, 'b2610']
['b2611', 'b2610']
['b2611', 'b2610']
[nan, nan]
['', '']
['b2620', nan]
['', nan]
[nan, nan]
['b2626', nan]
[nan, 'b2627,b2628']
['b2630,b2631', nan]
['b2632,b2633', nan]
[nan, '']
['b2642', 'b2641_2,b2641_1']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b2659,b2660,b2661,b2662,b2663', nan]
['b2659,b2660,b2661,b2662,b2663', nan]
[nan, 'b2665,b2666']
['b2667,b2668', nan]
['b2667,b2668', nan]
['b2667,b2668', nan]
[nan, 'b2669']
['b2670', 'b2669']
['b2670', 'b2669']
['b2670', nan]
['b2673,b2674,b2675,b2676', nan]
['b2677,b2678,b2679', nan]
['b2682,b2683,b2684,b2685,b2686', nan]
[nan, 'b2687']
[nan, '']
[nan, '']
[nan, nan]
[nan, 'b2697,b2698,b2699']
['b2715,b2716', 'b2714']
[nan, 'b2717,b2718,b2719,b2720,b2721,b2722,b2723,b2724,b2725']
[nan, nan]
['b2736,b2737', 'b2735']
[nan, nan]
[nan, nan]
[nan, 'b2745']
[nan, 'b2746,b2747,b2748']
[nan, nan]
[nan, 'b2750,b

['b3459', 'b3454,b3455,b3456,b3457,b3458']
['b3459', 'b3454,b3455,b3456,b3457,b3458']
[nan, 'b3461']
['b3471', 'b3470']
['b3471', 'b3470']
['b3471', 'b3470']
['b3471', 'b3470']
[nan, nan]
['b3474', 'b3473']
['b3476,b3477,b3478,b3479,b3480,b3481', nan]
['b3476,b3477,b3478,b3479,b3480,b3481', nan]
['b3476,b3477,b3478,b3479,b3480,b3481', nan]
['b3476,b3477,b3478,b3479,b3480,b3481', nan]
['b3476,b3477,b3478,b3479,b3480,b3481', nan]
['b3482', nan]
['b3483,b4552', nan]
['b3483,b4552', nan]
['b4552,b3484', nan]
['b3484', nan]
['b3484', nan]
['b3484', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b3485,b3486,b3487']
[nan, 'b3485,b3486,b3487']
[nan, nan]
[nan, nan]
[nan, nan]
['b3491', nan]
[nan, nan]
['b3493', 'b3492']
['b3496', nan]
[nan, 'b4613']
['b3501,b3502,b3503', nan]
[nan, nan]
['b3506,b3507', nan]
['b3506,b3507', nan]
['b3511', 'b3508,b3509,b3510']
['b3511', 'b3508,b3509,b3510']
['b3511', nan]
[nan, nan]
[nan, 'b3515,b3516,b3517']
[nan, 'b3515,b3516,b3517']
[nan, 'b3515,b351

[nan, nan]
['b4128,b4559', nan]
[nan, 'b4130']
[nan, 'b4131,b4132']
[nan, 'b4131,b4132']
[nan, 'b4133']
[nan, 'b4654_2,b4654_1']
[nan, 'b4135,b4136']
[nan, 'b4135,b4136']
[nan, 'b4135,b4136']
[nan, nan]
[nan, 'b4138,b4139']
[nan, 'b4138,b4139']
[nan, 'b4138,b4139']
[nan, 'b4138,b4139']
[nan, 'b4138,b4139']
['b4140', 'b4138,b4139']
['b4140', 'b4138,b4139']
['b4140', 'b4138,b4139']
['b4142,b4143', 'b4141']
['b4147', 'b4146']
['b4147,b4410,b4411', 'b4146']
['b4148', nan]
['b4155', 'b4151,b4152,b4153,b4154']
[nan, nan]
[nan, nan]
[nan, nan]
['b4167,b4168,b4169,b4170,b4171,b4172,b4173,b4174,b4175', 'b4166']
['b4167,b4168,b4169,b4170,b4171,b4172,b4173,b4174,b4175', nan]
['b4176', nan]
['b4176,b4177', nan]
['b4177', nan]
['b4178,b4179,b4180,b4181,b4182', nan]
['b4178,b4179,b4180,b4181,b4182', nan]
['b4193,b4194,b4195,b4196,b4197,b4198', nan]
['b4200,b4201,b4202,b4203', 'b4199']
['b4200,b4201,b4202,b4203', 'b4199']
['b4200,b4201,b4202,b4203', 'b4199']
['b4200,b4201,b4202,b4203', 'b4199']
['b42

[nan, 'b0535']
[nan, nan]
[nan, nan]
['b0545,b0546', nan]
['b0545,b0546', nan]
['b0545,b0546', nan]
[nan, 'b0553_2,b0553_1']
['b0559', 'b0558']
['b0559', 'b0558']
['b0560', 'b4589']
['b0564', nan]
[nan, 'b0568,b0569']
['b0572,b0573,b0574,b0575', 'b0570,b0571']
['b4415,b0582', 'b0581']
['b4415,b0582', 'b0581']
[nan, nan]
['b0585,b4511,b0586,b0587', 'b0583,b0584']
['b0585,b4511,b0586,b0587', 'b0583,b0584']
[nan, 'b0588,b0589,b0590']
['b0598', nan]
['b0600', nan]
[nan, 'b0601']
[nan, 'b0603']
[nan, 'b0604']
[nan, nan]
['b0608', 'b0607']
[nan, nan]
[nan, 'b0610']
[nan, 'b0610']
[nan, 'b0610']
[nan, 'b0610']
[nan, 'b0611']
[nan, 'b0611']
[nan, 'b0613,b0614,b0615,b0616,b0617,b0618']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b0621']
[nan, 'b0621']
['b0622', 'b0621']
['b0622', 'b0621']
['b0622', 'b0621']
['b0623', '']
['b0627', nan]
[nan, 'b0628']
[nan, 'b0628']
[nan, 'b0628']
[nan, 'b0628']
[nan, 'b0630,b0631']
[nan, 'b0630,b0631']
[nan, nan]
[nan, nan]
[nan, 'b0633,b0634,b0635,b0636,b0637']
['

['b1604', nan]
['b1605,b1606', nan]
['b1605,b1606', nan]
[nan, nan]
[nan, nan]
[nan, 'b1615,b1616,b1617']
[nan, 'b1615,b1616,b1617']
[nan, 'b1615,b1616,b1617']
[nan, 'b1615,b1616,b1617']
[nan, 'b1615,b1616,b1617']
[nan, 'b1615,b1616,b1617']
[nan, 'b1618']
[nan, 'b1618']
[nan, 'b1618']
[nan, 'b1619']
[nan, 'b1619']
['b1626,b1627,b1628,b1629,b1630,b1631,b1632,b1633', nan]
['b1626,b1627,b1628,b1629,b1630,b1631,b1632,b1633', nan]
['b1626,b1627,b1628,b1629,b1630,b1631,b1632,b1633', nan]
['b1634', nan]
['b1634', nan]
['b1634', nan]
['b1643,b1644,b1645', 'b1642']
['b1643,b1644,b1645', 'b1642']
[nan, nan]
[nan, nan]
[nan, 'b1646']
['b1649,b1650,b1651', 'b1647,b1648']
['b1655', 'b1654']
['b1655', 'b1654']
['b1658', 'b4602']
[nan, nan]
[nan, 'b1662']
['b1663', 'b1662']
[nan, 'b1664']
['b1667', 'b1664']
['b1667', 'b1664']
['b1667', 'b1664']
['b1667', 'b1664']
['b1667,b1668', nan]
['b1667,b1668', nan]
['b1668', nan]
[nan, 'b1669,b1670,b1671,b1672,b1673,b1674']
['b1677', nan]
[nan, 'b1678']
[nan, '

[nan, 'b2827,b2828']
[nan, 'b2829,b2830']
[nan, 'b2829,b2830']
['b2831', 'b2829,b2830']
['b2831', nan]
['b2831', nan]
['b2831', nan]
['b2831,b2832', nan]
['b2833,b2834', nan]
[nan, nan]
[nan, 'b2840,b2841']
['b2845', 'b2844']
['b2845', 'b2844']
['b2845', 'b2844']
['b2846', nan]
['b2846', nan]
['b2847,b2848', '']
['', nan]
[nan, 'b2863']
[nan, 'b2863']
[nan, 'b2863']
[nan, 'b2865']
[nan, 'b2869']
[nan, 'b2875']
[nan, nan]
['b2901', 'b2899,b2900']
[nan, 'b2902']
[nan, 'b2902']
[nan, nan]
[nan, 'b2903,b2904,b2905']
[nan, 'b2903,b2904,b2905']
[nan, 'b2906,b2907,b2908,b2909']
[nan, '']
['b2917,b2918,b2919,b2920', nan]
[nan, 'b2924']
[nan, 'b2924']
[nan, 'b2924']
[nan, 'b2924']
[nan, 'b2925,b2926,b2927']
[nan, 'b2925,b2926,b2927']
[nan, 'b2925,b2926,b2927']
[nan, 'b2925,b2926,b2927']
[nan, 'b2925,b2926,b2927']
[nan, nan]
[nan, nan]
['b2942', 'b2939']
['b2944,b2945', nan]
['b2948,b2949', nan]
['b2951,b2952,b2953,b2954,b2955', nan]
[nan, 'b2956']
['b2961,b2962,b2963,b2964', nan]
[nan, 'b2965']

['b3766,b4669,b4488_1,b4488_2,b3769,b3770,b3771,b3772', 'b3765']
[nan, 'b3775']
[nan, 'b3775']
['b3778', 'b3777_2,b3777_1']
['b3781', 'b3780']
['b3781', 'b3780']
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794,b3795', nan]
['b3795', nan]
['b3795', nan]
[nan, nan]
[nan, nan]
['b3800', nan]
[nan, nan]
['b3806', 'b3802,b3803,b3804,b3805']
['b4558,b3809,b3810,b3811,b3812,b3813', nan]
['b3825,b3826', nan]
['b3827', nan]
['b3831', 'b3830']
[nan, nan]
['b3833,b3834,b3835', nan]
['b3833,b383

[nan, 'b1144']
[nan, nan]
[nan, 'b1185']
[nan, 'b1185']
[nan, nan]
['b1236', nan]
['b1238', 'b1237']
[nan, nan]
[nan, nan]
[nan, 'b1270,b1271']
['b1279,b1280,b1281,b1282', nan]
['b1279,b1280,b1281,b1282', nan]
['b1279,b1280,b1281,b1282', nan]
['b1279,b1280,b1281,b1282', nan]
['b1279,b1280,b1281,b1282', nan]
[nan, nan]
[nan, nan]
['b1304,b1305,b1306,b1307,b1308', nan]
['b1309,b1310,b1311,b1312,b1313,b1314,b1315,b1316,b1317', nan]
['b1309,b1310,b1311,b1312,b1313,b1314,b1315,b1316,b1317', nan]
['b1309,b1310,b1311,b1312,b1313,b1314,b1315,b1316,b1317', nan]
['b1321,b1322,b1323', nan]
['b1328', 'b1326,b4525,b4673,b1327']
['b1331', 'b1330']
['b4570_2,b1372,b1373', nan]
['b1388,b1389,b1390,b1391,b1392,b1393,b1394,b1395,b1396,b1397,b1398', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b1478']
[nan, 'b1478']
[nan, 'b1483,b1484,b1485,b1486,b1487,b1488']
[nan, nan]
[nan, nan]
[nan, 'b1507,b1508']
[nan, nan]
[nan, 'b4696_2,b4696_1']
[nan, 'b4696_2,b4696_1']
[nan, 'b4696_2,b4696_1']
[nan, 

['ybaV' 'fadM']
['ylaC' 'maa']
['insE-3EF-3F-3' 'renD-emrE']
['pqiABC' 'rmf']
['rplNXE-rpsNH-rplFR-rpsE-rpmD-rplO-secY-rpmJ'
 'rpsJ-rplCDWB-rpsS-rplV-rpsC-rplP-rpmC-rpsQ']
['insJ' 'insK']
['mokA' 'hokA']
['nepI' 'yicN']
['tamAB-ytfP' 'chpSB']
['tamAB-ytfP' 'chpSB']
['insO_3' 'insO-2-yjhWV']
[nan, nan]
[nan, 'b0010']
[nan, 'b0010']
[nan, 'b0010']
[nan, 'b0011']
['b0016', nan]
[nan, 'b0021,b0022']
['b0032,b0033', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b0035,b0036,b0037,b0038,b0039,b0040']
[nan, 'b0035,b0036,b0037,b0038,b0039,b0040']
['b0046,b0047', nan]
[nan, nan]
[nan, 'b0061,b0062,b0063']
[nan, 'b0066,b0067,b0068,b0069']
['b4662,b0070', nan]
[nan, nan]
['b0097,b0098,b0099', nan]
[nan, nan]
['b0097,b0098,b0099', nan]
['b0097,b0098,b0099', nan]
['', '']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b0119', nan]
['b0125', 'b0124']
['b0125', 'b0124']
['b0130', nan]
[nan, nan]
[nan, 'b0164']
[nan, 'b0166,b0167,b0168']
['b0169,b0170', nan]
[nan, nan]
['b0186', nan]
[nan, nan

['b4576', nan]
[nan, nan]
['b4322,b4323', 'b4321']
[nan, 'b4327']
[nan, nan]
[nan, nan]
[nan, nan]
['b4388,b4389,b4390', nan]
['b4393', nan]
['b4395', 'b4394']
['ybaV' 'fadM']
['ycgI_1' 'ycgI_2']
['yebF' 'yebG']
['rlmM' 'ygdD']
['insJ' 'insK']
['tamAB-ytfP' 'chpSB']
['b0031', nan]
['b0041,b0042,b0043,b0044', nan]
['b0046,b0047', nan]
[nan, nan]
[nan, nan]
[nan, 'b0106,b0107,b0108']
['b0110,b0111', nan]
[nan, 'b0120,b0121,b0122']
['b0123', 'b0120,b0121,b0122']
['b0209,b0210', nan]
['b0209,b0210', nan]
[nan, nan]
[nan, nan]
['b0213', 'b0212']
[nan, 'b0245,b0246,b4504,b0247,b0248,b0249,b0250,b0251']
[nan, 'b0245,b0246,b4504,b0247,b0248,b0249,b0250,b0251']
[nan, 'b0245,b0246,b4504,b0247,b0248,b0249,b0250,b0251']
['b0413,b0414,b0415,b0416,b0417,b0418', 'b0412']
[nan, 'b0419,b0420,b0421,b0422']
['b0442,b0443', nan]
['b0448,b0449', nan]
[nan, nan]
[nan, nan]
['b0456', 'b0454']
['b0473', nan]
['b0475', nan]
['b0475', nan]
['b0518,b4572,b0520,b0521', nan]
[nan, 'b0612']
[nan, 'b0612']
[nan, nan

[nan, 'b2194,b2195,b2196,b2197,b2198,b2199,b2200,b2201,b2202,b2203,b2204,b2205,b2206,b2207,b2208']
[nan, 'b2194,b2195,b2196,b2197,b2198,b2199,b2200,b2201,b2202,b2203,b2204,b2205,b2206,b2207,b2208']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b2225,b2226,b2229,b2230']
[nan, 'b2225,b2226,b2229,b2230']
[nan, nan]
[nan, 'b2225,b2226,b2229,b2230']
[nan, nan]
['b2241,b2242,b2243', nan]
[nan, nan]
[nan, 'b2259']
[nan, 'b2260,b2261,b2262,b2263,b2264,b2265']
['b2269', nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b2274,b2275', nan]
[nan, nan]
[nan, 'b2276,b2277,b2278,b2279,b2280,b2281,b2282,b2283,b2284,b2285,b2286,b2287,b2288']
[nan, 'b2306,b2307,b2308,b2309,b2310']
[nan, 'b2306,b2307,b2308,b2309,b2310']
[nan, 'b2306,b2307,b2308,b2309,b2310']
[nan, 'b2311,b2312,b2313']
[nan, 'b2354,b2355,b2356,b2357,b2358']
['b2365,b2366', nan]
['b2365,b2366', nan]
[nan, nan]
[nan, nan]
[nan, 'b2383,b2384,b2385,b2386,b2387']
[nan, nan]
['b2390', nan]
['b2390', nan]
['b2390', nan]
['b2390', nan]
['b2394', nan]


[nan, 'b3925,b3926,b3927']
[nan, 'b3925,b3926,b3927']
[nan, 'b3925,b3926,b3927']
[nan, 'b3925,b3926,b3927']
['b3943', nan]
[nan, 'b3945,b3946,b3947']
[nan, 'b3945,b3946,b3947']
[nan, 'b3945,b3946,b3947']
[nan, 'b3945,b3946,b3947']
[nan, nan]
['b3949,b3950', nan]
['b3951,b3952', nan]
['b3953', nan]
[nan, nan]
['b3972,b3973', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b3989', nan]
['b3989', nan]
[nan, 'b3990,b3991,b4407,b3992,b3993,b3994']
[nan, 'b3990,b3991,b4407,b3992,b3993,b3994']
[nan, 'b3990,b3991,b4407,b3992,b3993,b3994']
[nan, 'b3990,b3991,b4407,b3992,b3993,b3994']
['b4000,b4001', nan]
['b4001', nan]
[nan, nan]
['b4003,b4004', nan]
[nan, nan]
[nan, nan]
['b4026,b4027,b4028,b4029', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b4032,b4033,b4034']
['b4035,b4036,b4037', 'b4032,b4033,b4034']
['b4035,b4036,b4037', 'b4032,b4033,b4034']
['b4035,b4036,b4037', nan]
['b4035,b4036,b4037', nan]
[nan, nan]
[nan, 'b4051']
['b4052', 'b4051']
['b4055', 'b4621']
[nan, nan]
[nan, 'b4067,b406

['b4519', '']
['', '']
['', 'b1160']
['', 'b1160']
[nan, 'b1160']
[nan, 'b1160']
[nan, 'b1160']
[nan, 'b1160']
[nan, 'b1160']
[nan, 'b1160']
[nan, 'b1160']
[nan, nan]
[nan, 'b1161']
[nan, 'b1161']
['b1164,b1165,b1166,b1167', nan]
['b1164,b1165,b1166,b1167', nan]
['b1164,b1165,b1166,b1167', nan]
['b1164,b1165,b1166,b1167', nan]
['b1164,b1165,b1166,b1167', nan]
['b4491_1,b4491_2', nan]
['b4491_1,b4491_2', nan]
['b4491_1,b4491_2', nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b4594,b4521_1', 'b1171,b1172,b4593']
['b4594,b4521_1', 'b1171,b1172,b4593']
['b1183,b1184', 'b1182']
[nan, 'b1202']
[nan, 'b1202']
[nan, 'b1202']
[nan, 'b1257,b1258,b1259']
[nan, 'b1257,b1258,b1259']
['b1309,b1310,b1311,b1312,b1313,b1314,b1315,b1316,b1317', nan]
['b1309,b1310,b1311,b1312,b1313,b1314,b1315,b1316,b1317', nan]
['b1363', nan]
['b1365,b1366', nan]
[nan, 'b1374']
[nan, 'b1374']
[nan, 'b1374,b1375']
[nan, 'b1374,b1375']
[nan, 'b1375']
[nan, 'b1377,b1378']
[nan, 'b1377,b1378']
[nan, 'b1377,b1378']
['b4492_1', '']


[nan, 'b3338']
[nan, 'b3338']
[nan, 'b3338']
['b3369', nan]
['b3369', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2,b3446', nan]
['b3446', nan]
['b3446', nan]
['b3446', nan]
['b3446', nan]
['b3483', nan]
['b3483', nan]
['b3483', nan]
['b3483,b4552', nan]
['b3483,b4552', nan]
['b3483,b4552', nan]
['b3483,b4552', nan]

[nan, nan]
[nan, nan]
[nan, nan]
['b4279,b4280', nan]
['b4279,b4280', nan]
['b4279,b4280', nan]
['b4279,b4280', nan]
['b4279,b4280', nan]
['b4279,b4280', nan]
['b4279,b4280', nan]
['b4279,b4280', nan]
['b4279,b4280', nan]
['b4279,b4280', nan]
['b4279,b4280', nan]
['b4279,b4280', nan]
[nan, 'b4309,b4310,b4311']
[nan, 'b4309,b4310,b4311']
[nan, 'b4309,b4310,b4311']
['b4312', nan]
['b4312', nan]
['b4312', nan]
['b4312', nan]
['b4313', nan]
['b4313', nan]
['b4313', nan]
[nan, nan]
[nan, 'b4325']
[nan, 'b4325']
[nan, 'b4325']
['b4326', 'b4325']
['b4326', 'b4325']
['b4326', 'b4325']
[nan, nan]
[nan, 'b4345,b4346']
[nan, 'b4345,b4346']
['b4365,b4366', 'b4364']
['b4365,b4366', 'b4364']
['b4365,b4366', 'b4364']
['b4365,b4366', nan]
['yadGH' 'yadI']
['mltD' 'gloB']
['ykfM' 'yafU']
['yafK' 'dinJ-yafQ']
['yafK' 'dinJ-yafQ']
['gpt' 'frsA']
['yafY-ykfBF-yafX-ykfGH-yafW-ykfI' 'ykfL' 'ykfK']
['intF' 'yagP']
['aroL-yaiA-aroM' 'ppnP']
['tsx' 'yajI']
['ybaV' 'fadM']
['allA' 'allR']
['allA' 'allR']
['nfsB

['b0507,b0508,b0509,b0511,b0512,b0513,b0514', nan]
['b0507,b0508,b0509,b0511,b0512,b0513,b0514', nan]
[nan, 'b0515,b0516,b0517']
['b0526', 'b0524,b0525']
[nan, nan]
['b0533,b0534', nan]
['b0545,b0546', nan]
['b0545,b0546', nan]
['b0545,b0546', nan]
['b0561', nan]
['b0564', nan]
[nan, 'b0565,b0566']
[nan, 'b0565,b0566']
[nan, 'b0565,b0566']
[nan, nan]
[nan, nan]
[nan, 'b0565,b0566']
[nan, 'b0565,b0566']
[nan, 'b0565,b0566']
[nan, nan]
[nan, 'b0568,b0569']
[nan, 'b0568,b0569']
[nan, 'b0568,b0569']
[nan, nan]
[nan, 'b0570,b0571']
['b0572,b0573,b0574,b0575', 'b0570,b0571']
['b0572,b0573,b0574,b0575', nan]
['b0572,b0573,b0574,b0575', nan]
['b0572,b0573,b0574,b0575', nan]
['b0576', nan]
[nan, nan]
[nan, 'b0578,b0579']
[nan, 'b0579,b0580']
[nan, 'b0580']
['b4415', 'b0581']
[nan, nan]
[nan, nan]
[nan, 'b0583,b0584']
[nan, 'b0583,b0584']
[nan, nan]
['b0585,b4511,b0586,b0587', 'b0583,b0584']
['b0585,b4511,b0586,b0587', 'b0583,b0584']
['b0585,b4511,b0586,b0587', 'b0583,b0584']
[nan, nan]
['b0585,

[nan, nan]
['b1278', 'b1277']
['b1279,b1280,b1281,b1282', nan]
[nan, 'b1283']
[nan, 'b1284,b4596']
[nan, 'b1284,b4596']
[nan, nan]
[nan, nan]
[nan, 'b1289']
[nan, 'b1290,b1291,b1292,b1293,b1294']
[nan, 'b1290,b1291,b1292,b1293,b1294']
[nan, 'b1290,b1291,b1292,b1293,b1294']
[nan, 'b1290,b1291,b1292,b1293,b1294']
['b1298,b1299,b1300,b1301,b1302', 'b1296,b1297']
['b1298,b1299,b1300,b1301,b1302', nan]
['b1298,b1299,b1300,b1301,b1302', nan]
[nan, nan]
['b1304,b1305,b1306,b1307,b1308', nan]
['b1309,b1310,b1311,b1312,b1313,b1314,b1315,b1316,b1317', nan]
[nan, nan]
[nan, nan]
[nan, 'b1326,b4525,b4673,b1327']
['b1328', 'b1326,b4525,b4673,b1327']
['b1340', nan]
['b1342', 'b1341']
[nan, nan]
[nan, nan]
['b1343', nan]
['b1343', nan]
['b1343', nan]
[nan, 'b1344']
[nan, 'b1344']
[nan, 'b1344']
[nan, 'b4527,b1355']
[nan, 'b4527,b1355,b1356']
['b1357,b1358,b1359,b1360,b1361,b1362', 'b4527,b1355,b1356']
['b1357,b1358,b1359,b1360,b1361,b1362', 'b1356']
['b4570_2,b1372,b1373', nan]
[nan, 'b1375']
[nan, '

[nan, 'b2072,b2073,b4667']
[nan, nan]
[nan, nan]
[nan, nan]
['b2074,b2075,b2076,b2077,b2078,b2079', nan]
[nan, '']
[nan, 'b2082']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2101']
[nan, 'b2101']
[nan, 'b2103,b2104']
[nan, 'b2108,b2109,b2110,b2111']
['b2114', 'b2113']
['b4499_1', nan]
['b4499_2', nan]
['b4541', nan]
['b2119,b2120,b2121,b2122', nan]
[nan, 'b2128,b2129,b2130,b2131']
['b2133', 'b2132']
['b2136', 'b2135']
['b2136', nan]
['b2144,b2145', nan]
['b2144,b2145,b2146,b2147', nan]
['b2146,b2147', nan]
[nan, nan]
[nan, 'b2148,b2149,b2150']
[nan, 'b2148,b2149,b2150']
[nan, nan]
[nan, nan]
[nan, 'b2151']
[nan, 'b2151']
[nan, 'b2155']
[nan, 'b2155']
['b2158', 'b2157']
[nan, nan]
['b2160', nan]
[nan, 'b2161']
[nan, 'b2161']
[nan, 'b2164']
[nan, 'b2165,b2166']
['b2170', 'b2167,b2168,b2169']
['b2171', 'b4502']
['b2176', nan]
['b2177,b2178,b2179,b2180', nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b2185', nan]
['b2185', nan]
[nan, 'b2186']
[nan, nan]
[nan, 'b2190_2,b2190_1']

[nan, 'b2928,b2929,b2930,b4465,b2933,b2934']
[nan, 'b2928,b2929,b2930,b4465,b2933,b2934']
[nan, 'b2928,b2929,b2930,b4465,b2933,b2934']
[nan, 'b2928,b2929,b2930,b4465,b2933,b2934']
[nan, nan]
['b2940', 'b2937,b2938,b2939']
['b2943', nan]
['b2943', nan]
['b2943', nan]
['b2945', nan]
['b2948,b2949', nan]
['b2951,b2952,b2953,b2954,b2955', 'b2950']
['b2951,b2952,b2953,b2954,b2955', nan]
['b2951,b2952,b2953,b2954,b2955', nan]
['b2951,b2952,b2953,b2954,b2955', nan]
[nan, 'b2957']
[nan, 'b2957']
[nan, 'b2957']
['b2961,b2962,b2963,b2964', 'b2959,b2960']
[nan, nan]
[nan, 'b2968,b2969']
[nan, 'b2968,b2969']
[nan, nan]
[nan, 'b4466']
[nan, 'b4466']
[nan, 'b4466']
[nan, 'b2975,b2976,b2977,b4467,b4468,b2979']
[nan, 'b2975,b2976,b2977,b4467,b4468,b2979']
[nan, nan]
[nan, nan]
[nan, 'b2975,b2976,b2977,b4467,b4468,b2979']
[nan, 'b2975,b2976,b2977,b4467,b4468,b2979']
[nan, nan]
['b2982', 'b2981']
[nan, nan]
[nan, nan]
['b2989', 'b2988']
[nan, 'b2990,b2991,b2992,b2993,b2994,b2995,b2996,b2997']
[nan, 'b29

[nan, nan]
[nan, nan]
[nan, 'b3524']
[nan, nan]
[nan, nan]
[nan, 'b3529']
[nan, nan]
[nan, 'b3530,b3531,b3532,b3533']
[nan, 'b3530,b3531,b3532,b3533']
['b3536,b3537,b3538', nan]
[nan, nan]
[nan, nan]
[nan, 'b3540,b3541,b3542,b3543,b3544']
[nan, 'b3540,b3541,b3542,b3543,b3544']
[nan, 'b3540,b3541,b3542,b3543,b3544']
[nan, 'b3540,b3541,b3542,b3543,b3544']
[nan, nan]
[nan, nan]
['b3549,b3550', 'b3548']
['b3549,b3550', 'b3548']
['b3549,b3550', nan]
[nan, nan]
['b3553', nan]
['b3555', 'b3554']
['b3555', 'b3554']
['b3555,b3556', nan]
['b3555,b3556', nan]
['b3558', nan]
['b3558', nan]
[nan, nan]
[nan, 'b3562,b3563']
['b3566,b3567,b3568,b3569', 'b3564,b3565']
['b3566,b3567,b3568,b3569', nan]
['b3566,b3567,b3568,b3569', nan]
['b3566,b3567,b3568,b3569', nan]
[nan, nan]
['b3571', 'b3570']
[nan, nan]
['b3572', nan]
[nan, nan]
['b3575,b3576,b3577,b3578,b3579,b3580,b3581,b3582,b3583', 'b3574']
['b3575,b3576,b3577,b3578,b3579,b3580,b3581,b3582,b3583', 'b3574']
['b3575,b3576,b3577,b3578,b3579,b3580,b3

['b4050', nan]
['b4050', nan]
['b4050', nan]
['b4053', nan]
['b4054', nan]
[nan, '']
[nan, nan]
['b4063', 'b4062']
[nan, 'b4067,b4068,b4069']
['b4070,b4071,b4072,b4073,b4074,b4075,b4076', 'b4067,b4068,b4069']
['b4070,b4071,b4072,b4073,b4074,b4075,b4076', 'b4067,b4068,b4069']
['b4070,b4071,b4072,b4073,b4074,b4075,b4076', 'b4067,b4068,b4069']
['b4070,b4071,b4072,b4073,b4074,b4075,b4076', nan]
['b4070,b4071,b4072,b4073,b4074,b4075,b4076', nan]
['b4070,b4071,b4072,b4073,b4074,b4075,b4076', nan]
['b4070,b4071,b4072,b4073,b4074,b4075,b4076', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b4084']
[nan, nan]
[nan, 'b4085,b4086,b4087,b4088,b4089']
[nan, 'b4085,b4086,b4087,b4088,b4089']
[nan, 'b4085,b4086,b4087,b4088,b4089']
['b4090', 'b4085,b4086,b4087,b4088,b4089']
['b4090', 'b4085,b4086,b4087,b4088,b4089']
['b4090', 'b4085,b4086,b4087,b4088,b4089']
['b4090', 'b4085,b4086,b4087,b4088,b4089']
['b4090,b4487', nan]
['b4090

['b1625', 'b1624']
['b1667', 'b1664']
[nan, 'b1669,b1670,b1671,b1672,b1673,b1674,b1675']
[nan, 'b1696']
[nan, 'b1707']
[nan, nan]
[nan, 'b1726']
[nan, nan]
[nan, 'b1762']
[nan, 'b1771,b1772,b1773,b1774,b1775,b1776']
[nan, 'b1771,b1772,b1773,b1774,b1775,b1776']
[nan, 'b1805']
['b1817,b1818,b1819', nan]
[nan, 'b1850,b1851']
['b1853', 'b1852']
['b1858,b1859', 'b1857']
['b1862', 'b1860,b1861,b4677']
[nan, 'b1872,b1873']
[nan, 'b1874,b1875']
[nan, 'b1881,b1882,b1883,b1884,b1885,b1886']
[nan, 'b1896,b1897']
['b1905', nan]
[nan, 'b1908']
['b1915', nan]
['b1924,b1925,b1926', 'b1923']
['b1924,b1925,b1926', 'b1923']
['b1973', nan]
['b1973', nan]
['b1973', nan]
['b1974', nan]
['b1974', nan]
['b1976', nan]
['b1978', nan]
['b1983', nan]
[nan, nan]
[nan, 'b1988']
[nan, 'b1991,b1992,b1993']
[nan, 'b2037,b2038,b2039,b2040,b2041']
[nan, 'b2037,b2038,b2039,b2040,b2041']
['b2071', 'b2070']
['b2098,b2099,b2100', nan]
['b2098,b2099,b2100', nan]
['b2106,b2107', nan]
['b2114', 'b2113']
[nan, nan]
[nan, nan]


['mltD' 'gloB']
['gpt' 'frsA']
['yaiP' 'yaiS']
['sfmA' 'sfmCD']
['ylcH' 'ybcN-ninE-ybcO-rusA-ylcG']
['ylcH' 'ybcN-ninE-ybcO-rusA-ylcG']
['ybfA' 'rhsC-ybfB']
['ybgQPO' 'ybgD']
['elfA' 'elfDCG-ycbUVF']
['cspG' 'ymcE-gnsA']
['yceQ' 'rluC']
['pinR' 'ynaE']
['paaXY' 'ydbA_1']
['ortT' 'ydcY']
['gnsB' 'ynfN']
['dicA' 'ydfABC']
['ruvAB' 'yobI']
['yedX' 'msrPQ']
['sanA-yeiS' 'preTA']
['yfcD' 'yfcE']
['fadIJ' 'yfcZ']
['fadIJ' 'yfcZ']
['yfeYX' 'ypeA-yfeZ']
['gcvR' 'bcp']
['bamB-der' 'yfgM']
['ypjD' 'yfjD']
['ygaM' 'nrdHIEF']
['ygaZH' 'mprA-emrAB']
['alaS' 'recAX']
['ftsB' 'ygbE']
['yqeL' 'yqeK']
['ygeG' 'ygeH']
['ygeG' 'ygeH']
['ygeLK' 'insCD-4C-4D-4-ygeONM']
['yghF' 'yghG']
['mqsRA' 'ygiV']
['ygiL' 'insC-5CD-5D-5-yqiGHI']
['bacA' 'folB']
['yhaH' 'yhaI']
['yhcB' 'degQS']
['yhfXW-php-yhfUTS' 'yhfZY']
['yhhH' 'yrhC']
['yrhC' 'yhhI']
['yiaG' 'cspA']
['yibS' 'yibW_1' 'yibW_2']
['yibW_2' 'yibV_1']
['yibV_1' 'yibV_2']
['tisB' 'emrD']
['yidE' 'ibpAB']
['yiiE' 'yiiF']
['thiCEFSGH' 'rsd']
['mdtNOP' 'ytcA'

['b3093', 'b3091,b3092']
['b3095,b3096', nan]
['b3101', nan]
['b3103,b3104', nan]
['b3104', nan]
[nan, 'b4470,b3110']
[nan, 'b4471,b3113,b3114,b3115,b3116,b3117,b3118']
['b3119', 'b4471,b3113,b3114,b3115,b3116,b3117,b3118']
['b3120,b3121', nan]
[nan, nan]
['b3128', 'b3124,b3125,b3126,b3127']
['b3128', 'b3124,b3125,b3126,b3127']
['b3132,b3133,b3134,b3135', nan]
['b3142', nan]
[nan, 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
[nan, 'b3173']
[nan, nan]
[nan, 'b3183,b3184,b3185,b3186']
[nan, 'b3208,b3209']
['b3220', nan]
[nan, 'b3221,b3222,b3223,b3224,b3225']
['b3233,b3234,b3235', nan]
[nan, 'b3249,b3250,b3251']
['b3260,b3261', nan]
['b3260,b3261', nan]
['b3262', nan]
[nan, 'b3264']
['b3265,b3266', 'b3264']
['b3267', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b3279', nan]
['b3324,b3325,b3326,b3327,b3328,b3329,b3330,b3331,b3332,b3333,b3334,b3335', 'b3322,b3323']
['b3324,b3325,b3326,b3327,b3328,b3329,b3330,

['b3575,b3576,b3577,b3578,b3579,b3580,b3581,b3582,b3583', nan]
['b3575,b3576,b3577,b3578,b3579,b3580,b3581,b3582,b3583', nan]
[nan, 'b3586,b3587']
[nan, 'b3588']
[nan, 'b3588']
[nan, 'b3589']
[nan, nan]
[nan, nan]
['b3593,b3594', nan]
['b3593,b3594', nan]
['b4651_1,b4651_2,b4615_1', nan]
['b4615_1,b4615_2', nan]
['b4615_1,b4615_2,b4652_1,b4652_2', nan]
[nan, 'b3608,b3609,b3610,b3611']
[nan, 'b3608,b3609,b3610,b3611']
[nan, 'b3608,b3609,b3610,b3611']
['b3612,b3613,b3614', nan]
[nan, 'b3615']
[nan, nan]
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
['b3633,b3634', 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3635,b3636,b3637,b3638']
['b3646', nan]
[nan, 'b3647']
['b3649,b3650,b3651,b3652', nan]
['b3660', nan]
[nan, 'b3663']
['b3665', 'b3664']
[nan, 'b3667,b3668,b3669,b3670,b3671,b3672']
['b4618,b3673', n

['b1164,b1165,b1166,b1167', nan]
['b1164,b1165,b1166,b1167,b1168', nan]
['b4491_1,b4491_2', nan]
['b1183,b1184', 'b1182']
[nan, 'b1202']
[nan, 'b1257,b1258,b1259']
[nan, 'b1345,b1346,b1347,b1348,b1349,b1350']
[nan, 'b1345,b1346,b1347,b1348,b1349,b1350,b1351']
['b1363', nan]
[nan, 'b1377,b1378']
['b4492_1', '']
['b4492_1', 'b4674']
['b4492_1', 'b4674']
['b1455', nan]
['b1455', nan]
['b1455', nan]
['b1455', nan]
['', nan]
['', nan]
['b1456,b1457', nan]
['b1456,b1457', nan]
['b1456,b1457', nan]
['b1456,b1457', nan]
['b1456,b1457', nan]
['b1456,b1457', nan]
['b1456,b1457', nan]
['b1456,b1457,b1459_1,b1459_2', nan]
['b1456,b1457,b1459_1,b1459_2', nan]
['b1456,b1457,b1459_1,b1459_2', nan]
['b1456,b1457,b1459_1,b1459_2', nan]
['b1459_1,b1459_2', nan]
['b1459_1,b1459_2', nan]
['b1459_1,b1459_2', nan]
['b1459_1,b1459_2,b1460', nan]
['b1459_1,b1459_2,b1460', nan]
['b1460', nan]
['b1460', nan]
['b1460', nan]
['b1460', nan]
['b1460', nan]
['b1461', nan]
[nan, 'b1469']
[nan, 'b1469,b1471_2,b1471_1,

['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
[nan, nan]
[nan, nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2,b3446', nan]
['b3446', nan]
['b3446', nan]
['b3483', nan]
['b3483', nan]
['b3483', nan]
['b3483,b4552', nan]
['b3483,b4552', nan]
['b4552', nan]
['b4552,b3484', nan]
['b4552,b3484', nan]
['b4552,b3484', nan]
['b4552,b3484', nan]
['b3484', nan]
['b3484', nan]
['b3484', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b3488']
[nan, 'b3488']
[nan, 'b3488']
[nan, 'b3488']
[nan, 'b3488']
[nan, 'b3488']
[nan, 

['yadGH' 'yadI']
['mltD' 'gloB']
['ykfM' 'yafU']
['yafK' 'dinJ-yafQ']
['gpt' 'frsA']
['gpt' 'frsA']
['yafY-ykfBF-yafX-ykfGH-yafW-ykfI' 'ykfL' 'ykfK']
['maa' 'tomB-hha']
['nfsB' 'ybdF']
['ybdF' 'ybdJ']
['rsfS-rlmH-mrdAB-rlpA' 'leuS-lptE-holA-nadD-cobC']
['rsfS-rlmH-mrdAB-rlpA' 'leuS-lptE-holA-nadD-cobC']
['ybfD' 'ybgA-phr']
['cydX-ybgE' 'ybgC-tolQRA']
['lrp' 'ftsK']
['lrp' 'ftsK']
['yceQ' 'rluC']
['ydaGF' 'racR']
['ortT' 'ydcY']
['yncG' 'yncH']
['ydfH' 'ydfZ']
['gnsB' 'ynfN']
['ydhR' 'ydhS']
['ydiV' 'nlpC']
['btuCED' 'thrS-infC-rpmI-rplT-pheMST-ihfA']
['ydiZ' 'yniA']
['fadD-sroD' 'tsaB-yeaY']
['yobD' 'mntP']
['ruvAB' 'yobI']
['yedK' 'yedL']
['cobUST' 'yeeH']
['plaP' 'yoeI']
['yegLK' 'ibsA']
['yegLK' 'ibsA']
['sanA-yeiS' 'preTA']
['insH-8' 'yejO']
['yfaS' 'yfaATS_1S_2QP']
['yfaS' 'yfaATS_1S_2QP']
['yfcG' 'folX-yfcH']
['yfcG' 'folX-yfcH']
['argT-hisJQMP' 'cvpA-purF-ubiX']
['gcvR' 'bcp']
['bamB-der' 'yfgM']
['ypjI_1' 'ypjI_2' 'yfjXY-ypjJ-yfjZ-ypjF']
['nlpD-rpoS' 'umpG-pcm']
['ygdR' 'tas']


['b0833,b0834', nan]
[nan, nan]
['b0842', 'b0841']
[nan, nan]
['b0846', 'b0844,b0845']
['b0848', 'b0847']
['b0848', 'b0847']
['b0848', 'b0847']
['b0848', 'b0847']
['b0848', '']
['b0850,b0851,b0852,b0853', 'b0849']
['b0850,b0851,b0852,b0853', 'b0849']
['b0850,b0851,b0852,b0853', 'b0849']
[nan, nan]
['b0854,b0855,b0856,b0857', nan]
['b0854,b0855,b0856,b0857', nan]
['b0854,b0855,b0856,b0857', nan]
['b0854,b0855,b0856,b0857', nan]
[nan, nan]
[nan, 'b0860']
[nan, 'b0861,b0862,b0863,b0864']
[nan, nan]
[nan, 'b0869,b0870,b0871,b0872,b0873']
[nan, nan]
[nan, nan]
[nan, 'b0874']
[nan, 'b0874']
['b0876', 'b0875']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b0885']
[nan, nan]
['b0889,b0890', nan]
['b0889,b0890', nan]
[nan, nan]
[nan, nan]
['b0891,b0892', nan]
[nan, nan]
[nan, nan]
['b0898', 'b0897']
['b0901', 'b0900']
['b0906', 'b0905']
['b0907,b0908', nan]
['b0907,b0908', nan]
[nan, nan]
['b0909', nan]
['b0909', nan]
['b0909', nan]
['b0909', nan]
['b0910,b0911,b0912', nan]
['b0910,b0911,b

[nan, nan]
[nan, nan]
['b2074,b2075,b2076,b2077,b2078,b2079', nan]
[nan, '']
[nan, 'b2082']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2101']
[nan, 'b2101']
[nan, 'b2103,b2104']
[nan, 'b2108,b2109,b2110,b2111']
['b2144,b2145,b2146,b2147', nan]
['b2146,b2147', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b2151']
[nan, 'b2151']
[nan, 'b2155']
['b2158', 'b2157']
['b2160', nan]
[nan, 'b2161']
[nan, 'b2161']
[nan, 'b2164']
[nan, 'b2165,b2166']
['b2171', 'b4502']
['b2176', nan]
['b2177,b2178,b2179,b2180', nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b2185', nan]
['b2185', nan]
[nan, 'b2186']
[nan, nan]
[nan, 'b2190_2,b2190_1']
['b2193', 'b2190_2,b2192,b2190_1']
[nan, nan]
[nan, 'b2194,b2195,b2196,b2197,b2198,b2199,b2200,b2201,b2202,b2203,b2204,b2205,b2206,b2207,b2208']
[nan, 'b2194,b2195,b2196,b2197,b2198,b2199,b2200,b2201,b2202,b2203,b2204,b2205,b2206,b2207,b2208']
[nan, 'b2194,b2195,b2196,b2197,b2198,b2199,b2200,b2201,b2202,b2203,b2204,b2205,b2206,b2207,b2208']
[nan, nan]
[n

['b3119', 'b4471,b3113,b3114,b3115,b3116,b3117,b3118']
['b3119', 'b4471,b3113,b3114,b3115,b3116,b3117,b3118']
['b3119', 'b4471,b3113,b3114,b3115,b3116,b3117,b3118']
['b3119,b3120,b3121', 'b4471,b3113,b3114,b3115,b3116,b3117,b3118']
['b3119,b3120,b3121', 'b4471,b3113,b3114,b3115,b3116,b3117,b3118']
['b3120,b3121', nan]
['b3120,b3121', nan]
[nan, nan]
[nan, nan]
[nan, 'b3124,b3125,b3126,b3127']
[nan, 'b3124,b3125,b3126,b3127']
[nan, nan]
[nan, 'b3124,b3125,b3126,b3127']
['b3129,b3130', nan]
['b3132,b3133,b3134,b3135', nan]
['b3132,b3133,b3134,b3135', nan]
['b3136,b3137,b3138,b3139,b3140,b3141', nan]
['b3136,b3137,b3138,b3139,b3140,b3141', nan]
['b3142', nan]
['b3143,b3144,b3145', nan]
['b3143,b3144,b3145', nan]
['b3143,b3144,b3145', nan]
[nan, nan]
['b3148,b3149', nan]
['b3153', nan]
['b3155', 'b3154']
[nan, 'b3156,b3157']
[nan, 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
['b3172', 'b3164,b3165,b3166,b3167,b3168,b3169,b3170']
['b3172', nan]
[nan, nan]
[nan, 'b3176,b3177']
[nan, 'b3176,b

[nan, 'b3754,b3755']
[nan, nan]
['b3764', 'b4480']
['b3766,b4669,b4488_1,b4488_2,b3769,b3770,b3771,b3772', 'b3765']
['b3766,b4669,b4488_1,b4488_2,b3769,b3770,b3771,b3772', 'b3765']
['b3766,b4669,b4488_1,b4488_2,b3769,b3770,b3771,b3772', 'b3765']
['b3766,b4669,b4488_1,b4488_2,b3769,b3770,b3771,b3772', nan]
[nan, nan]
['b3774', 'b3773']
[nan, 'b3775']
[nan, nan]
[nan, 'b3780']
['b3781', 'b3780']
['b3781', 'b3780']
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b3801']
[nan, 'b3801']
[nan, 'b3802,b3803,b3804,b3805']
[nan, nan]
[nan, 'b3802,b3803,b3804,b3805']
[nan, 'b3802,b3803,b3804,b3805']
['b455

['bcsQ' 'yhjR']
['yiaG' 'cspA']
['mokA' 'hokA']
['yibG' 'yibS']
['yibG' 'yibS']
['yibG' 'yibS' 'yibW_1' 'yibW_2']
['yibS' 'yibW_1' 'yibW_2']
['yibW_2' 'yibV_1']
['yibW_2' 'yibV_1']
['yibV_1' 'yibV_2']
['yibV_1' 'yibV_2' 'yibU_1']
['yibV_2' 'yibU_1' 'yibU_2']
['yibU_1' 'yibU_2']
['yibU_1' 'yibU_2']
['yicT' 'setC']
['yiiE' 'yiiF']
['mdtNOP' 'ytcA']
['yjfN' 'bsmA']
['yjfN' 'bsmA']
['topAI-yjhQ' 'yjhX']
['b0001,b0002,b0003,b0004', nan]
['b0019,b0020', nan]
['b0041,b0042,b0043,b0044', 'b0035,b0036,b0037,b0038,b0039,b0040']
['b0041,b0042,b0043,b0044', 'b0035,b0036,b0037,b0038,b0039,b0040']
['b4659_1,b4659_2', nan]
[nan, 'b0058,b0059']
[nan, 'b0071,b0072,b0073,b0074,b0075']
[nan, 'b0071,b0072,b0073,b0074,b0075']
['b0076', 'b0071,b0072,b0073,b0074,b0075']
['b0076', 'b0071,b0072,b0073,b0074,b0075']
['b0081,b0082,b0083,b0084,b0085,b0086,b0087,b0088,b0089,b0090,b0091,b0092,b0093,b0094,b0095,b0096', nan]
['', '']
[nan, nan]
[nan, 'b0135,b0136,b0137,b0138']
[nan, 'b0135,b0136,b0137,b0138']
[nan, 'b

[nan, 'b2037,b2038,b2039,b2040,b2041']
[nan, 'b2037,b2038,b2039,b2040,b2041']
[nan, 'b2037,b2038,b2039,b2040,b2041']
[nan, 'b2037,b2038,b2039,b2040,b2041']
[nan, 'b2046,b2047,b2048,b2049,b2050,b2051,b2052,b2053,b2054,b2055,b2056,b2057']
[nan, 'b2046,b2047,b2048,b2049,b2050,b2051,b2052,b2053,b2054,b2055,b2056,b2057']
['b2074,b2075,b2076,b2077,b2078,b2079', 'b4667,b4668']
['b2086', 'b2083,b2085']
[nan, nan]
[nan, nan]
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, nan]
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2091,b2092_2,b2092_1,b2093,b2094,b2095,b2096']
[nan, 'b2091,b2092_

[nan, 'b3515,b3516,b3517']
[nan, 'b3515,b3516,b3517']
['b3521', 'b3520']
['b3521', 'b3520']
['b3521', nan]
[nan, nan]
[nan, nan]
[nan, 'b3534']
['b3536,b3537,b3538', 'b3534,b3535']
['b3536,b3537,b3538', 'b3535']
['b3536,b3537,b3538', nan]
[nan, 'b3540,b3541,b3542,b3543,b3544']
['b3549,b3550', 'b3548']
['b3555,b3556', nan]
['b3556', nan]
['b3557', '']
['b3557', 'b4647,b4455']
['b3566,b3567,b3568,b3569', 'b3564,b3565']
['b3575,b3576,b3577,b3578,b3579,b3580,b3581,b3582,b3583', 'b3574']
['b3575,b3576,b3577,b3578,b3579,b3580,b3581,b3582,b3583', nan]
['b3585', 'b3584']
[nan, 'b3586,b3587']
[nan, 'b3586,b3587']
[nan, 'b3586,b3587']
[nan, 'b3586,b3587']
[nan, 'b3586,b3587']
['b3593,b3594', nan]
['b3593,b3594', nan]
['b3593,b3594', nan]
['b3593,b3594', nan]
['b3593,b3594', nan]
['b3595', nan]
['b3596', nan]
['b3596,b4650', nan]
['b3596,b4650', nan]
['b3596,b4650,b4651_1,b4651_2', nan]
['b4650,b4651_1,b4651_2', nan]
['b4651_2,b4615_1', nan]
['b4651_2,b4615_1', nan]
['b4615_1,b4615_2', nan]
['b46

['yqeL' 'yqeK']
['ygeLK' 'insCD-4C-4D-4-ygeONM']
['ibsD' 'ibsE']
['ibsD' 'ibsE']
['yhdN-zntR' 'rpsMKD-rpoA-rplQ']
['yhdN-zntR' 'rpsMKD-rpoA-rplQ']
['yhdN-zntR' 'rpsMKD-rpoA-rplQ']
['rpsMKD-rpoA-rplQ' 'rplNXE-rpsNH-rplFR-rpsE-rpmD-rplO-secY-rpmJ']
['rpsMKD-rpoA-rplQ' 'rplNXE-rpsNH-rplFR-rpsE-rpmD-rplO-secY-rpmJ']
['yhhH' 'yrhC']
['yrhC' 'yhhI']
['yhiS_1' 'slp-dctR']
['yhiS_1' 'slp-dctR']
['yiaG' 'cspA']
['yibG' 'yibS' 'yibW_1']
['yibW_2' 'yibV_1' 'yibV_2']
['yibU_1' 'yibU_2']
['rpmH-rnpA' 'yidD']
['adiC' 'adiY']
['yjdQ_2' 'yjdQ_1']
['yjdQ_2' 'yjdQ_1']
['b0001,b0002,b0003,b0004', nan]
['b0001,b0002,b0003,b0004', nan]
['b0001,b0002,b0003,b0004', nan]
['b0001,b0002,b0003,b0004', nan]
['b0001,b0002,b0003,b0004', nan]
[nan, nan]
[nan, 'b0018,b4412']
['b0024,b0025,b0026,b0027,b0028,b0029', 'b0021,b0022,b0023']
['b0024,b0025,b0026,b0027,b0028,b0029', 'b0023']
['b0041,b0042,b0043,b0044', 'b0035,b0036,b0037,b0038,b0039,b0040']
['b4659_1,b4659_2', nan]
[nan, 'b0071,b0072,b0073,b0074,b0075']
[nan,

[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, nan]
[nan, nan]
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 

['intF' 'yagP']
['ylcH' 'ybcN-ninE-ybcO-rusA-ylcG']
['zitB' 'ybgS']
['glnHPQ' 'dps']
['cybB' 'ydcA']
['ydcH' 'rimL']
['ortT' 'ydcY']
['yncG' 'yncH']
['ldtE' 'sufABCDSE']
['yeaK' 'yeaL']
['yobD' 'mntP']
['rlmA' 'yobF-cspC']
['ogrK' 'yegRZ']
['bamB-der' 'yfgM']
['ygaZH' 'mprA-emrAB']
['yqcG' 'ygcG']
['yqjF' 'yqjG']
['yhaH' 'yhaI']
['arfA' 'yhdN-zntR']
['yiaG' 'cspA']
['yibL' 'lldPRD']
['yicT' 'setC']
['tisB' 'emrD']
['yidE' 'ibpAB']
['rarD' 'yigI']
['thiCEFSGH' 'rsd']
['rpiB' 'yjdP']
['yjfN' 'bsmA']
['b0001,b0002,b0003,b0004', nan]
['b0019,b0020', nan]
['b0019,b0020', nan]
['b0032,b0033', nan]
['b0032,b0033', nan]
['b0034', nan]
[nan, 'b0035,b0036,b0037,b0038,b0039,b0040']
['b0048', nan]
['b0048', nan]
[nan, 'b0049,b0050,b0051,b0052,b0053,b0054']
['b4659_1,b4659_2', nan]
[nan, nan]
['b0097,b0098,b0099', nan]
['', '']
['b0110,b0111', 'b0109']
['b0119', nan]
[nan, nan]
[nan, 'b0139,b0140']
[nan, 'b0142,b0143']
['b0150,b0151,b0152,b0153', nan]
['b0190,b0191,b0192', nan]
[nan, nan]
[nan, 'b0

['b3710', nan]
['b3710', nan]
['b3715', 'b3714']
['b3716,b3717', nan]
[nan, 'b3718,b3719,b3720']
[nan, 'b3724,b3725,b3726,b3727,b3728']
[nan, nan]
[nan, nan]
[nan, nan]
['b3764', 'b4480']
['b3764', 'b4480']
['b3764', 'b4480']
['b3766,b4669,b4488_1,b4488_2,b3769,b3770,b3771,b3772', 'b3765']
['b3766,b4669,b4488_1,b4488_2,b3769,b3770,b3771,b3772', 'b3765']
[nan, 'b3775']
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
['b3784,b3785,b3786,b3787,b3788,b3789,b3790,b3791,b3792,b4481,b3793,b3794', nan]
[nan, nan]
['b3800', nan]
[nan, nan]
[nan, 'b3801']
[nan, nan]
['b3821', 'b3819,b3820']
['b3823', nan]
['b3832', nan]
['b3836,b3838,b3839,b4483', nan]
[nan, nan]
[nan, nan]
[nan, 'b3862']
['b3863', 'b3862']
['b3863', 'b3862']
['b3866', nan]
['b3867', nan]
[nan, '']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['', nan]
[nan, 'b3891,b3892,b3893,b3894']
['b3896', nan]
['b3908', 'b3907']
['b3917', nan]
['b3917', nan]
['b3918', nan]
[nan, 'b3919']
['b3921', 'b3920']
[

['', nan]
['b3918', nan]
[nan, nan]
[nan, nan]
['', nan]
['b3949,b3950', 'b3945,b3946,b3947']
[nan, nan]
[nan, 'b3974']
['b3980', nan]
['b3980', nan]
['b3981,b3982', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b3989', nan]
['b3989', nan]
['b3989', nan]
['b3989', nan]
['b3989', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b3990,b3991,b4407,b3992,b3993,b3994']
[nan, 'b4005,b4006']
[nan, 'b4005,b4006']
['b4011', nan]
['b4011', nan]
['b4013', 'b4012']
['b4013', 'b4012']
['b4013', nan]
['b4014,b4015,b4016', nan]
[nan, nan]
[nan, nan]
[nan, 'b4017']
[nan, 'b4017']
['b4019', 'b4018']
['b4019', 'b4018']
['b4022', 'b4021']
[nan, 'b4023']
['b4054', nan]
[nan, nan]
['b4059', 'b4058']
['b4111'

[nan, 'b3376,b3377,b3378,b3379,b3380,b3381']
['b3434', 'b3433']
['b3441', 'b3440']
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
[nan, 'b3454,b3455,b3456,b3457,b3458']
[nan, 'b3461']
['b3483', nan]
['b3483,b4552', nan]
['b4552', nan]
['b4552,b3484', nan]
['b4552,b3484', nan]
['b3484', nan]
[nan, 'b3488']
[nan, 'b3488']
[nan, 'b4660_2,b4660_1']
['b3491', 'b4660_2,b4660_1']
['b3504_1,b3504_2', nan]
['b3504_1,b3504_2', nan]
['b3504_1,b3504_2,b3506,b3507', 'b3505']
['b3504_1,b3504_2,b3506,b3507', 'b3505']
['b3512,b3513,b3514', nan]
['b3512,b3513,b3514', nan]
[nan, nan]
[nan, 'b3515,b3516,b3517']
[nan, 'b3515,b3516,b3517']
[nan, nan]
['b3555,b3556', nan]
['b3556', nan]
['b3556', nan]
[nan, 'b3559,b3560']
['b3575,b3576,b3577,b3578,b3579,b3580,b3581,b3582,b3583', 'b3574']
['b3593,b3594', nan]
['b3595', nan]
['b3596', nan]
['b3596,b4650,b4651_1,b4651_2', nan]
['b4615_1,b4615_2', nan]
['b4615_1,b4615_2', nan]
['b4615_2,b4652_1,b4652_2', nan]
['b3599,b3600

['b0791', 'b0788,b0789,b0790']
['b0799,b0800', 'b0798']
[nan, 'b0809,b0810,b0811']
[nan, 'b0812']
['b0814', 'b0813']
['b0814', 'b0813']
['b0817,b0818', 'b0815,b4705']
['b0817,b0818', 'b4705']
['b0817,b0818', 'b4705']
['b0820', 'b0819']
['b0820', 'b0819']
['b0820', 'b0819']
['b0833,b0834', nan]
['b0842', 'b0841']
['b0848', 'b0847']
['b0850,b0851,b0852,b0853', 'b0849']
['b0850,b0851,b0852,b0853', 'b0849']
['b0854,b0855,b0856,b0857', nan]
['b0854,b0855,b0856,b0857', nan]
[nan, nan]
[nan, 'b0874']
['b0876', 'b0875']
['b0881', 'b0880']
[nan, nan]
[nan, 'b0884']
[nan, 'b0885']
['b0889,b0890', nan]
['b0898', 'b0897']
['b0899', nan]
[nan, 'b0903,b0904']
['b0909', nan]
['b0910,b0911,b0912', nan]
['b0913,b0914,b0915,b0916', nan]
['b0913,b0914,b0915,b0916', nan]
['b0917,b0918', nan]
['b0925', nan]
[nan, nan]
[nan, 'b0929']
[nan, 'b0929']
['b0938', 'b0933,b0934,b0935,b0936,b0937']
['b0938', 'b0933,b0934,b0935,b0936,b0937']
['b0939,b0940,b0941,b0942,b0943,b0944', nan]
['b0950,b0951,b0952', nan]
['b

[nan, nan]
['b2504', 'b2503']
['b2509', 'b2507,b2508']
['b2509', 'b2507,b2508']
[nan, 'b2522']
[nan, 'b2536']
[nan, nan]
['b2558', 'b2557']
['b2561', 'b2559,b2560']
['b2574', 'b2570,b2571,b2572,b2573']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b2597', nan]
['b2597', nan]
['b2597,b2598,b2599', nan]
[nan, nan]
['b2625', 'b2623']
['b2625', 'b2623']
['b2626', nan]
['b2630,b2631', nan]
[nan, '']
[nan, nan]
[nan, nan]
[nan, nan]
['b4644_1', nan]
[nan, nan]
[nan, 'b2648']
[nan, nan]
[nan, 'b2650']
[nan, 'b2650']
['b4462', nan]
['b4462', nan]
['b4462', nan]
['b4462', nan]
['b4462', nan]
['b4462', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b2659,b2660,b2661,b2662,b2663', nan]
['b2659,b2660,b2661,b2662,b2663', nan]
['b2667,b2668', nan]
['b2670', nan]
['b2672,b2673,b2674,b2675,b2676', 'b2671']
['b2677,b2678,b2679', nan]
[nan, 'b2696']
['b2702,b2703,b2704,b2705,b2706,b2707,b2708', nan]
[nan, 'b2712,b2713']
['b2726,b2727,

[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
['b3633,b3634', 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
['b3640,b3641', nan]
['b3648', 'b3647']
[nan, 'b3656,b3657']
['b4653', 'b3656,b3657']
[nan, 'b3661']
[nan, nan]
[nan, 'b3667,b3668,b3669,b3670,b3671,b3672']
['b4618', 'b3667,b3668,b3669,b3670,b3671,b3672']
['b4618', 'b3667,b3668,b3669,b3670,b3671,b3672']
['b4618,b3673', nan]
['b3673', nan]
[nan, 'b3685,b3686,b3687']
['b3688', 'b3686,b3687']
[nan, nan]
['b3696', 'b3691,b4478,b4477,b3693,b4479']
['b3703,b3704', nan]
['b3707,b3708,b3709', nan]
['b3710', nan]
['b3715', 'b3714']
[nan, 'b3718,b3719,b3720']
[nan, 'b3721,b3722,b3723']
[nan, 'b3721,b3722,b3723']
[nan, 'b3724,b3725,b3726,b3727,b3728']
[nan, 'b3731,b3732,b3733,b3734,b3735,b3736,b3737,b3738,b3739']
[nan, 'b3740,b3741,b3742,b3743']
['b3748,b3749,b3750,b3751,b3752,b3753', nan]
[nan, 'b3754,b3755']
[nan, 'b3754,b3755']
[

[nan, nan]
[nan, nan]
[nan, 'b0903,b0904']
['b0938', 'b0933,b0934,b0935,b0936,b0937']
['b0938', 'b0933,b0934,b0935,b0936,b0937']
['b0938', 'b0933,b0934,b0935,b0936,b0937']
['b0939,b0940,b0941,b0942,b0943,b0944', nan]
['b1001', 'b0999,b1000']
['b1001', 'b0999,b1000']
['b1001', nan]
['b1001', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b1002', nan]
['b1002', nan]
['b1002', nan]
['b1025', 'b1021,b1022,b1023,b1024']
['b1025', 'b1021,b1022,b1023,b1024']
['b1025', 'b1021,b1022,b1023,b1024']
['b1025', nan]
['b1025', nan]
['b1025', nan]
['b1028,b1029', 'b1026,b1027']
[nan, 'b1037,b1038,b1039,b1040']
['b1041,b1042,b1043', 'b1037,b1038,b1039,b1040']
['b1041,b1042,b1043', nan]
['b1041,b1042,b1043', nan]
[nan, 'b1056,b1057']
['', '']
['', 'b1160']
[nan, 'b1160']
[nan, 'b1160']
[nan, 'b1160']
[nan, 'b1160']
[nan, 'b1160']
[nan, nan]
[nan, '']
[nan, 'b1161']
['b1164,b1165,b1166,b1167', nan]
['b1164,b1165,b1166,b1167', nan]
['b1164,b1165,b1166,b1167', nan]
['b1164,b1165,b1166,b1167', nan]
['b1

['b2877', 'b2876']
['b2878,b2879', nan]
['b2878,b2879', nan]
[nan, 'b2928,b2929,b2930,b4465,b2933,b2934']
[nan, 'b2928,b2929,b2930,b4465,b2933,b2934']
[nan, 'b2928,b2929,b2930,b4465,b2933,b2934']
[nan, 'b4466']
[nan, 'b4466']
[nan, 'b4466']
['b2986', 'b2984,b2985']
['b2986', 'b2984,b2985']
['b2986', 'b2984,b2985']
['b2986', 'b2984,b2985']
[nan, 'b2987']
[nan, 'b2987']
[nan, 'b2987']
[nan, 'b3027']
['b3028', 'b3027']
['b3028', 'b3027']
[nan, nan]
[nan, nan]
['b3043', nan]
['b3043', nan]
['b3043', nan]
['b3046_1,b3044,b3045,b3046_2,b3047,b3048', nan]
['b3046_1,b3044,b3045,b3046_2,b3047,b3048', nan]
['b3046_1,b3044,b3045,b3046_2,b3047,b3048', nan]
['b3046_1,b3044,b3045,b3046_2,b3047,b3048', nan]
['b3046_1,b3044,b3045,b3046_2,b3047,b3048', nan]
['b3046_1,b3044,b3045,b3046_2,b3047,b3048', nan]
[nan, nan]
['b3050,b3051', 'b3049']
['b3050,b3051', 'b3049']
['b3050,b3051', 'b3049']
['b3050,b3051', nan]
['b3050,b3051', nan]
['b3050,b3051', nan]
[nan, 'b3060']
['b3104', nan]
[nan, 'b4471,b3113,b3

[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, 'b3623,b3624,b3625,b3626,b3627,b3628,b3629,b3630,b3631,b3632']
[nan, nan]
['b3659', nan]
['b3659', nan]
['b3659', nan]
['b3665', 'b3664']
['b3665', 'b3664']
['b3680', nan]
['b3707,b3708,b3709', nan]
['b3707,b3708,b3709', nan]
['b3707,b3708,b3709', nan]
[nan, 'b3721,b3722,b3723']
[nan, 'b3721,b3722,b3723

[nan, 'b1377,b1378']
[nan, 'b1377,b1378']
['b4492_1', '']
['b4492_1', 'b4674']
['b4492_1', 'b4674']
['b4492_1', 'b4674']
['b1455', nan]
['b1455', nan]
['', nan]
['', nan]
['b1456,b1457', nan]
['b1456,b1457', nan]
['b1456,b1457', nan]
['b1456,b1457', nan]
['b1456,b1457', nan]
['b1456,b1457', nan]
['b1456,b1457,b1459_1,b1459_2', nan]
['b1456,b1457,b1459_1,b1459_2', nan]
['b1459_1,b1459_2', nan]
['b1459_1,b1459_2', nan]
['b1459_1,b1459_2,b1460', nan]
['b1459_1,b1459_2,b1460', nan]
['b1459_1,b1459_2,b1460', nan]
['b1460', nan]
['b1460', nan]
['b1460', nan]
[nan, 'b1469,b1471_2,b1471_1,b1472']
[nan, 'b1469,b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b1472']
[nan, 'b1471_2,b1471_1,b14

['b3227', 'b3226']
['b3265,b3266', 'b3264']
['b3265,b3266', 'b3264']
['b3265,b3266', 'b3264']
['b3265,b3266', 'b3264']
['b3324,b3325,b3326,b3327,b3328,b3329,b3330,b3331,b3332,b3333,b3334,b3335', 'b3322,b3323']
['b3324,b3325,b3326,b3327,b3328,b3329,b3330,b3331,b3332,b3333,b3334,b3335', 'b3322,b3323']
[nan, 'b3338']
[nan, 'b3338']
[nan, 'b3338']
['b3369', nan]
['b3369', nan]
['b3408,b3409,b3410', nan]
['b3441,b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
[nan, nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['b3446', nan]
['b3446', nan]
['b3446', nan]
['b3483', nan]
['b3

[nan, 'b4297,b4298,b4299']
[nan, nan]
[nan, 'b4309,b4310,b4311']
[nan, 'b4309,b4310,b4311']
[nan, 'b4309,b4310,b4311']
['b4312', nan]
['b4312', nan]
['b4312', nan]
['b4312', nan]
['b4312', nan]
['b4313', nan]
['b4313', nan]
[nan, 'b4325']
[nan, 'b4325']
[nan, 'b4325']
['b4326', 'b4325']
['b4326', 'b4325']
['b4326', 'b4325']
['b4342', nan]
['b4342', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b4345,b4346']
[nan, 'b4345,b4346']
[nan, nan]
[nan, 'b4356']
['b4365,b4366', 'b4364']
['b4365,b4366', 'b4364']
['b4365,b4366', 'b4364']
['yaaW' 'yaaI']
['yaaY' 'ribF-ileS-lspA-fkpB-ispH']
['yadI' 'yadE']
['sfsA-dksA-gluQ' 'thpR']
['sfsA-dksA-gluQ' 'thpR']
['ispU' 'cdsA']
['gpt' 'frsA']
['insAB-2A-2B-2-afuBC' 'yagAB-insX']
['yagML' 'yagN']
['intF' 'yagP']
['iraP' 'phoA-psiF']
['bolA' 'tig']
['acrR' 'mscK']
['ybaN' 'apt']
['ybaN' 'apt']
['intD' 'xisD']
['ybfE' 'ybfF']
['zitB' 'ybgS']
['opgE' 'rybA-mntS']
['clpS' 'clpA']
['clpS' 'clpA']
['lrp' 'ftsK']
['lrp' 'ftsK']
['ycaP' 'serC-aroA']
['ompA' 'sulA

[nan, 'b0692,b0693']
['b0707,b0708', nan]
['b0707,b0708', nan]
[nan, nan]
[nan, 'b0716,b0717,b0718']
[nan, 'b0720']
[nan, 'b0720']
[nan, 'b0720']
[nan, 'b0720']
['b0721,b0722,b0723,b0724,b0726,b0727,b0728,b0729', 'b0720']
['b0721,b0722,b0723,b0724,b0726,b0727,b0728,b0729', 'b0720']
['b0721,b0722,b0723,b0724,b0726,b0727,b0728,b0729', nan]
['b0721,b0722,b0723,b0724,b0726,b0727,b0728,b0729', nan]
['b0721,b0722,b0723,b0724,b0726,b0727,b0728,b0729', nan]
['b0721,b0722,b0723,b0724,b0726,b0727,b0728,b0729', nan]
['b0721,b0722,b0723,b0724,b0726,b0727,b0728,b0729', nan]
['b0721,b0722,b0723,b0724,b0726,b0727,b0728,b0729', nan]
['b0721,b0722,b0723,b0724,b0726,b0727,b0728,b0729', nan]
['b0721,b0722,b0723,b0724,b0726,b0727,b0728,b0729', nan]
['b0721,b0722,b0723,b0724,b0726,b0727,b0728,b0729', nan]
['b0733,b0734', nan]
[nan, nan]
['b0736,b0737,b0738,b0739', nan]
['b0736,b0737,b0738,b0739', nan]
['b0736,b0737,b0738,b0739', nan]
[nan, nan]
[nan, nan]
[nan, 'b0752,b0753']
[nan, 'b0760,b0761']
['b0763,b

['b1779,b1780', 'b1777,b1778']
['b1779,b1780', 'b1778']
['b1779,b1780', 'b1778']
['b1779,b1780', 'b1778']
['b1779,b1780', nan]
['b1779,b1780', nan]
['b1783,b1784', 'b1782']
[nan, 'b1798']
['b1817,b1818,b1819', 'b1816']
['b1817,b1818,b1819', 'b1816']
[nan, nan]
[nan, 'b1830,b1831']
[nan, 'b1830,b1831']
[nan, 'b1830,b1831']
[nan, 'b1830,b1831']
['b1833,b1834', 'b1830,b1831,b1832']
['b1833,b1834', 'b1832']
['b1833,b1834', 'b1832']
['b1833,b1834', 'b1832']
['b1833,b1834', 'b1832']
[nan, nan]
[nan, nan]
['b1833,b1834', nan]
['b1833,b1834', nan]
['b1833,b1834', nan]
[nan, 'b1847']
[nan, nan]
['b1854', nan]
[nan, 'b1856']
['b1858,b1859', 'b1857']
[nan, 'b1863,b1864,b1865']
['b1867,b1868', 'b1866']
['b1867,b1868', 'b1866']
['b1867,b1868', 'b1866']
['b1867,b1868', 'b1866']
['b1867,b1868', nan]
['b1867,b1868,b1869,b1870,b1871', nan]
['b1869,b1870,b1871', nan]
['b1869,b1870,b1871', nan]
['b1869,b1870,b1871', nan]
['b1876', 'b1874,b1875']
[nan, 'b1887,b1888,b1889,b1890']
[nan, 'b1891,b1892']
[nan,

['b2834', nan]
['b2837', nan]
[nan, 'b2840,b2841']
[nan, nan]
['b2872', nan]
['b2872', nan]
['b2880,b2881', nan]
[nan, 'b2890,b2891_2,b2891_1,b2892,b2893,b2894']
[nan, 'b2890,b2891_2,b2891_1,b2892,b2893,b2894']
[nan, 'b2890,b2891_2,b2891_1,b2892,b2893,b2894']
['b2895', 'b2890,b2891_2,b2891_1,b2892,b2893,b2894']
[nan, '']
['b2898', 'b2896,b2897']
['b2898', 'b2896,b2897']
['b2898', 'b2896,b2897']
['b2898', nan]
['b2901', 'b2900']
[nan, 'b2906,b2907,b2908,b2909']
[nan, nan]
[nan, 'b2913']
[nan, 'b2913']
[nan, 'b2913']
[nan, 'b2913']
[nan, 'b2913']
[nan, 'b2914']
['b2916', 'b2914,b2915']
['b2916', 'b2914,b2915']
['b2916', 'b2915']
['b2917,b2918,b2919,b2920', nan]
[nan, 'b2925,b2926,b2927']
[nan, 'b2925,b2926,b2927']
[nan, 'b2925,b2926,b2927']
[nan, nan]
[nan, nan]
['b2936', 'b2935']
[nan, 'b2937,b2938']
[nan, nan]
[nan, nan]
[nan, 'b2937,b2938']
['b2940', 'b2937,b2938']
['b2940', 'b2937,b2938,b2939']
['b2940,b2942', 'b2937,b2938,b2939']
['b2942', 'b2939']
['b2942', nan]
['b2942', nan]
['b2

[nan, 'b3343,b3344,b3345,b3346']
[nan, 'b3343,b3344,b3345,b3346']
[nan, 'b3343,b3344,b3345,b3346']
[nan, 'b3347']
['b3348', 'b3347']
[nan, 'b3349,b4551,b3350,b3351']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b4551,b3350,b3351']
['b3352,b3353,b3354', 'b4551,b3350,b3351']
['b3352,b3353,b3354', 'b4551,b3350,b3351']
['b3357', 'b3356']
['b3357', 'b3356']
['b3364', nan]
[nan, nan]
[nan, nan]
['b3365,b3366,b3367,b3368', nan]
['b3365,b3366,b3367,b3368', nan]
['b3365,b3366,b3367,b3368', nan]
[nan, 'b3384,b3385,b3386,b3387,b3388,b3389,b3390']
[nan, 'b3384,b3385,b3386,b3387,b3388,b3389,b3390']
[nan, 'b3384,b3385,b3386,b3387,b3388,b3389,b3390']
[nan, 'b3384,b3385,b3386,b3387,b3388,b3389,b3390']
[nan, 'b3384,b3385,b3386,b3387,b3388,b3389,b3390']
[nan, nan]
[nan, 'b3391,b3392,b3393,b3394,b3395']
[nan, 'b3391,b3392,b3393,b3394,b3395']
[nan, 'b3392,b3393,b3394,b3395']
['b3396', 'b3392,b3393,b3394,b3395']
['b3396', 'b3392,b3393,b3394,b3395']
['b3396', nan]
[nan, nan]
['b3406,b3407', 'b3404,b3405']
[nan, 

['b3939,b3940', 'b3937,b3938']
['b3939,b3940', 'b3938']
['b3939,b3940', 'b3938']
['b3939,b3940', 'b3938']
['b3941', nan]
['b3943', nan]
[nan, 'b3944']
[nan, 'b3945,b3946,b3947']
[nan, 'b3956']
[nan, 'b3956']
[nan, 'b3956']
[nan, 'b3956']
[nan, 'b3956']
[nan, nan]
[nan, nan]
[nan, 'b3957']
['b3958,b3959,b3960', 'b3957']
['b3958,b3959,b3960', 'b3957']
['b3958,b3959,b3960', 'b3957']
['b3958,b3959,b3960', 'b3957']
['b3958,b3959,b3960', nan]
['b3958,b3959,b3960', nan]
['b3958,b3959,b3960', nan]
[nan, nan]
[nan, nan]
['b3961', nan]
[nan, nan]
[nan, 'b3962']
['b3963,b3964', 'b3962']
['b3963,b3964', nan]
['b3963,b3964', nan]
['b3966,b3967', 'b3965']
['b3966,b3967', 'b3965']
['b3966,b3967', 'b3965']
['b3966,b3967', nan]
[nan, nan]
['b3966,b3967', nan]
['b3966,b3967', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b3974']
[nan, 'b3974']
[nan, 'b3974']
[nan, 'b3974']
[nan, 'b3974']
['b3980', nan]
['b3980', nan]
['b3980', nan]
['b3981,b3982', nan]
['b3981,

['b0081,b0082,b0083,b0084,b0085,b0086,b0087,b0088,b0089,b0090,b0091,b0092,b0093,b0094,b0095,b0096', nan]
['b0081,b0082,b0083,b0084,b0085,b0086,b0087,b0088,b0089,b0090,b0091,b0092,b0093,b0094,b0095,b0096', nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b0118', 'b0117']
['b0125', 'b0124']
[nan, nan]
['b0127,b0128', 'b0126']
['b0127,b0128', nan]
['b0127,b0128', nan]
['b0127,b0128', nan]
['b0127,b0128', nan]
['b0129,b0130', nan]
[nan, 'b0144,b0145,b0146']
['b0149', nan]
['b0156', nan]
[nan, nan]
[nan, 'b0166,b0167,b0168']
[nan, 'b0166,b0167,b0168']
['b0169,b0170', 'b0166,b0167,b0168']
['b0169,b0170', 'b0166,b0167,b0168']
['b0169,b0170', 'b0166,b0167,b0168']
['b0169,b0170', 'b0166,b0167,b0168']
['b0174,b0175', nan]
['b0190,b0191,b0192', nan]
['b0200', nan]
['b0222', 'b0221']
['b0222', 'b0221']
['b0222', 'b0221']
['b0222', 'b0221']
['b0222', 'b0221']
['b0223', nan]
['b0223', nan]
[nan, 'b0224']
['b0227', 'b0225,b0226']
['b0227', 'b0225,b0226']
['b0228', nan]
['b0231,b0232,b0233,b0234', nan]
[nan, n

[nan, 'b1771,b1772,b1773,b1774,b1775,b1776,b1777']
['b1779,b1780', 'b1778']
['b1779,b1780', nan]
['b1779,b1780', nan]
['b1779,b1780', nan]
['b1779,b1780', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b1781']
['b1783,b1784', 'b1782']
['b1783,b1784', 'b1782']
['b1783,b1784', nan]
['b1783,b1784', nan]
['b1810', nan]
['b1810', nan]
['b1810,b1812,b1813', '']
['b1817,b1818,b1819', 'b1816']
['b1817,b1818,b1819', nan]
[nan, 'b1829']
[nan, 'b1830,b1831']
[nan, 'b1830,b1831']
[nan, nan]
['b1854', nan]
['b1858,b1859', 'b1857']
[nan, 'b1891,b1892']
[nan, 'b4460,b1900,b1901']
[nan, nan]
['b1902', nan]
[nan, 'b1920,b1921,b1922']
['b1924,b1925,b1926,b1927', nan]
['b1953', 'b1952']
['b1955', 'b1952']
[nan, 'b1960,b1961']
['b1974', nan]
[nan, nan]
['b1982', nan]
[nan, 'b1991,b1992,b1993']
['b4538', '']
[nan, 'b2015']
['b2018,b2019,b2020,b2021,b2022,b2023,b2024,b2025,b2026', 'b4539,b2017']
[nan, nan]
[nan, 'b2072,b2073,b4667']
['b2074,b2075,b2076,b2077,b2078,b2079', 'b2072,b2073,b4667']
['b20

[nan, 'b3339,b3340,b3341,b3342,b3343,b3344,b3345,b3346']
[nan, 'b3343,b3344,b3345,b3346']
[nan, 'b3343,b3344,b3345,b3346']
[nan, nan]
[nan, 'b4551,b3350,b3351']
['b3352,b3353,b3354', 'b4551,b3350,b3351']
['b3365,b3366,b3367,b3368', nan]
[nan, 'b3384,b3385,b3386,b3387,b3388,b3389,b3390']
[nan, 'b3391,b3392,b3393,b3394,b3395']
['b3396', 'b3392,b3393,b3394,b3395']
[nan, nan]
[nan, nan]
['b3408,b3409,b3410', nan]
['b3411', nan]
['b3418', nan]
['b3434', 'b3433']
['b3434', 'b3433']
['b3434', 'b3433']
['b3434', 'b3433']
[nan, 'b4476,b3437,b3438']
[nan, 'b4476,b3437,b3438']
[nan, 'b3454,b3455,b3456,b3457,b3458']
[nan, 'b3462,b3463,b3464']
['b3468', 'b3467']
['b3482', nan]
['b3493', 'b3492']
['b3493', 'b3492']
['b3493', 'b3492']
[nan, '']
[nan, 'b3494']
['b3495', 'b3494']
['b3495', 'b3494']
['b3495', 'b3494']
['b3495', nan]
['b3495', nan]
['b3496', nan]
['b3496', nan]
['b3501,b3502,b3503', nan]
['b3506,b3507', nan]
[nan, 'b3508,b3509,b3510']
[nan, 'b3508,b3509,b3510']
[nan, 'b3508,b3509,b3510']

[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, nan]
['b1729', nan]
['b1729', nan]
['b1729', nan]
[nan, nan]
['b1750,b1751,b1752,b1753,b1754,b1755,b1756', nan]
['b1779,b1780', 'b1778']
['b1779,b1780', 'b1778']
['b1779,b1780', 'b1778']
['b1810', nan]
[nan, 'b1822,b1823,b1824']
[nan, 'b1823,b1824']
[nan, 'b1823,b1824']
[nan, 'b1838']
['b1902', nan]
['b1904', 'b4537,b4663']
[nan, 'b1908']
[nan, 'b1908']
[nan, 'b1908']
[nan, nan]
[nan, 'b1920,b1921,b1922']
['b1955', 'b1952']
[nan, 'b1960,b1961']
['b1978', nan]
[nan, nan]
[nan, nan]
[nan, 'b1985']
[nan, 'b2012,b2013']
['b2018,b2019,b2020,b2021,b2022,b2023,b2024,b2025,b2026', 'b4539,b2017']
['b2018,b2019,b2020,b2021,b2022,b2023,b2024,b2025,b2026', 'b4539,b2017']
[nan, 'b2037,b2038,b2039,b2040,b2041']
['b2074,b2075,b2076,b2077,b2078,b2079', 'b4667']
['b2074,b2075,b2076,b2077,b2078,b2079', 'b4667,b4668']
[nan, 'b2091

['b4312', nan]
['b4322,b4323', 'b4321']
['b4322,b4323', nan]
['b4326', nan]
['b4342', nan]
['b4342', nan]
[nan, nan]
[nan, 'b4367']
['b4567', 'b4367']
['b4567', 'b4367']
['', 'b4367']
['', 'b4367']
['b4381,b4382,b4383,b4384', nan]
['b4381,b4382,b4383,b4384', nan]
['b4402', 'b4401']
['b4402', 'b4401']
['insAB-1A-1B-1' 'rpsT']
['yaaY' 'ribF-ileS-lspA-fkpB-ispH']
['yaaY' 'ribF-ileS-lspA-fkpB-ispH']
['intF' 'yagP']
['maa' 'tomB-hha']
['acrR' 'mscK']
['ylcH' 'ybcN-ninE-ybcO-rusA-ylcG']
['opgE' 'rybA-mntS']
['cbdX' 'appCBXA']
['yceQ' 'rluC']
['recET-ralR-ydaC-xisR-intR' 'racC']
['recET-ralR-ydaC-xisR-intR' 'racC' 'kilR-ydaE']
['ydaGF' 'racR']
['narU' 'yddLKJ']
['ydhP' 'ynhF']
['ydhR' 'ydhS']
['holE' 'yobB-exoX']
['holE' 'yobB-exoX']
['yecJ' 'azuC']
['ibsA' 'ibsB']
['yfgG' 'yfgHI']
['yfgG' 'yfgHI']
['hscBA-fdx-iscX' 'iscRSUA']
['ftsB' 'ygbE']
['ibsD' 'ibsE']
['ibsD' 'ibsE']
['crp' 'yhfK']
['yhhH' 'yrhC']
['yiaG' 'cspA']
['rpmH-rnpA' 'yidD']
['yjdQ_2' 'yjdQ_1']
['yjdQ_2' 'yjdQ_1']
['b0001,b000

[nan, 'b3339,b3340,b3341,b3342']
[nan, 'b3339,b3340,b3341,b3342']
['b3357', 'b3356']
['b3357,b3358', nan]
[nan, 'b3376,b3377,b3378,b3379,b3380,b3381']
[nan, 'b3384,b3385,b3386,b3387,b3388,b3389,b3390']
[nan, 'b3384,b3385,b3386,b3387,b3388,b3389,b3390']
['b3398', 'b3397']
['b3415', nan]
[nan, 'b3428,b3429,b3430,b3431,b3432']
[nan, 'b4476,b3437,b3438']
['b3441', 'b3440']
['b3441', 'b3440']
['b3442,b3443_1,b3444,b3445,b3443_2', nan]
['', nan]
[nan, 'b3461']
[nan, 'b3461']
['b3483,b4552', nan]
[nan, nan]
['b3495', 'b3494']
['b3501,b3502,b3503', 'b4613']
['b3506,b3507', nan]
[nan, 'b3508,b3509,b3510']
[nan, 'b3508,b3509,b3510']
[nan, 'b3508,b3509,b3510']
['b3511', 'b3508,b3509,b3510']
['b3511', 'b3508,b3509,b3510']
['b3511', 'b3508,b3509,b3510']
['b3511', 'b3508,b3509,b3510']
['b3511', nan]
['b3511', nan]
[nan, nan]
['b3512,b3513,b3514', nan]
['b3512,b3513,b3514', nan]
[nan, 'b3515,b3516,b3517']
[nan, 'b3515,b3516,b3517']
[nan, nan]
[nan, 'b3515,b3516,b3517']
[nan, 'b3515,b3516,b3517']
[nan

['b2353', nan]
['', 'b2354,b2355,b2356,b2357,b2358']
['b2369,b2370', 'b2367,b2368']
[nan, 'b2371,b2372,b2373,b2374,b2375']
['b2415,b2416,b2417', nan]
[nan, 'b2421,b2422,b2423,b2424,b2425']
[nan, 'b2421,b2422,b2423,b2424,b2425']
['b2428,b2429,b2430', 'b2427']
[nan, nan]
[nan, 'b2431,b2432']
[nan, 'b2431,b2432']
[nan, nan]
[nan, nan]
['b2443', nan]
['b2448,b2449', nan]
['b2448,b2449', nan]
['b2448,b2449', nan]
['b2450', nan]
[nan, nan]
['b2501,b2502', nan]
['b2504,b2505,b2506', nan]
['b2505,b2506', nan]
[nan, 'b2553,b2554']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b2597,b2598,b2599', nan]
['b2616', nan]
[nan, nan]
[nan, nan]
['b2642', 'b2641_2,b2641_1']
['b2642', 'b2641_2,b2641_1']
[nan, 'b2648']
[nan, 'b2648']
[nan, 'b2650']
[nan, 'b2650']
['b4462', nan]
['b2670', 'b2669']
['b2670', nan]
[nan, 'b2698,b2699,b2700']
['b2726,b2727,b2

['b0150,b0151,b0152,b0153', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b1088,b1089,b1090,b1091,b1092,b1093,b1094,b1095', 'b1087']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1838']
['b2448,b2449', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b2912', nan]
['b2912', nan]
[nan, 'b2913']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3294,b3295,b3296,b3297,b3298']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3635,b3636,b3637,b3638']
['b3703,b3704', 'b3700,b3701,b3702']
[nan, 'b3754,b3755']
[nan, 'b3754,b3755']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b3766,b4669,b4488_1,b4488_2,b3769,b3770,b3771,b3772', nan]
[

['b1663', 'b1662']
['b1667', 'b1664']
['b1676', 'b1675']
['b1677', nan]
['b1677', nan]
['b1677', nan]
['', nan]
[nan, 'b1679,b1680,b1681,b1682,b1683,b1684']
[nan, 'b1685,b1686,b1687']
[nan, 'b1685,b1686,b1687']
['b1703', 'b1702']
['b1703', 'b1702']
['b1703', 'b1702']
[nan, 'b1706']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
[nan, nan]
['b4494_1,b4494_2', 'b1712,b1713,b1714,b1715,b1716,b1717,b1718,b1719']
['b1723', 'b1722']
['b1723', 'b1722']
['b1729', nan]
['b1729', nan]
['b1779,b1780', 'b1777,b1778']
['b1779,b1780', 'b1778'

[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b3302,b3303,b3304,b3305,b3306,b3307,b3308,b3309,b3310']
[nan, 'b3299,b3300,b3301,b33

[nan, 'b4300,b4301,b4302,b4303,b4304,b4565,b4305']
['b4312', nan]
['b4312', nan]
['b4312', nan]
['b4313', nan]
['b4313', nan]
['b4314,b4315,b4316,b4317,b4318,b4319,b4320', nan]
['b4314,b4315,b4316,b4317,b4318,b4319,b4320', nan]
['b4314,b4315,b4316,b4317,b4318,b4319,b4320', nan]
['b4339', 'b4336,b4337']
['b4342', nan]
['b4342', nan]
['b4365,b4366', nan]
[nan, nan]
[nan, nan]
[nan, 'b4367']
[nan, 'b4367']
['b4567', 'b4367']
['b4567', 'b4367']
['b4567', 'b4367']
['', 'b4367']
[nan, nan]
['b4381,b4382,b4383,b4384', nan]
['b4381,b4382,b4383,b4384', nan]
['b4397,b4398,b4399,b4400', 'b4396']
['b4402', 'b4401']
['b4403', 'b4401']
['b4403', 'b4401']
['yaaY' 'ribF-ileS-lspA-fkpB-ispH']
['insAB-1A-1B-1' 'rpsT']
['yaaY' 'ribF-ileS-lspA-fkpB-ispH']
['yaaY' 'ribF-ileS-lspA-fkpB-ispH']
['maa' 'tomB-hha']
['opgE' 'rybA-mntS']
['clpS' 'clpA']
['ompA' 'sulA']
['yceQ' 'rluC']
['yceQ' 'rluC']
['insZ_3' 'insZ_2' 'insZ_1']
['ymiA-yciX' 'acnA']
['cnu' 'ydgK-rsxABCDGE-nth']
['ydhP' 'ynhF']
['ydhP' 'ynhF']
['y

[nan, 'b2323']
['b2324', 'b2323']
[nan, 'b2340']
[nan, 'b2340']
['b2369,b2370', 'b2367,b2368']
['b2369,b2370', 'b2367,b2368']
['b2369,b2370', 'b2367,b2368']
['b2378', 'b2377']
['b2378', 'b2377']
['b2393', 'b2392']
[nan, 'b2395']
['b2398,b2399', 'b2395']
['b2398,b2399', nan]
[nan, 'b2400']
[nan, 'b2400']
[nan, 'b2400']
[nan, nan]
['b2413', 'b2412']
['b2413', 'b2412']
['b2414', nan]
['b2414', nan]
['b2415,b2416,b2417', nan]
['b2415,b2416,b2417', nan]
['b2435,b2436', 'b2433,b2434']
['b2435,b2436', 'b2433,b2434']
[nan, 'b2476']
['b2479', 'b2477,b2478']
['b2494,b2495', 'b2493']
['b2494,b2495', 'b2493']
['b2504', 'b2503']
['b2505,b2506', nan]
['b2505,b2506', nan]
['b2505,b2506', nan]
['b2509', 'b2507,b2508']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b2533', 'b2532']
['b2533', 'b2532']
['b2533', 'b2532']
[nan, 'b2556']
[nan, 'b2556']
[nan, 'b2556']
[nan, nan]
[nan, 'b2570,b2571,b2572,b2573']
[nan, 'b2570,b2571,b2572,b2573']
[nan, 'b2570,b2571,b2572,b2573']
[nan, 'b2570,b2571,b2572,b2573']

[nan, nan]
['b3847,b3848,b3849,b3850', nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, '']
['b3871', 'b3868,b3869,b3870']
['b3871', 'b3868,b3869,b3870']
['b3871', 'b3868,b3869,b3870']
['b3895', 'b3891,b3892,b3893,b3894']
['b4484,b3915', 'b3911,b3912']
['b4484,b3915', 'b3911,b3912']
['b4484,b3915', nan]
['b3917', nan]
['b3936', 'b3935']
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
[nan, nan]
['b3972,b3973', nan]
[nan, 'b3974']
[nan, 'b3974']
['b3980', nan]
['b3981,b3982', nan]
['b3981,b3982', nan]
['b3981,b3982', nan]
['b3981,b3982', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988', nan]
['b3983,b3984,b3985,b3986,b3987,b3988

['b1817,b1818,b1819', 'b1816']
[nan, 'b1822']
[nan, 'b1822']
[nan, 'b1823,b1824']
[nan, 'b1823,b1824']
[nan, 'b1823,b1824']
[nan, '']
[nan, 'b1830,b1831']
['b1833,b1834', 'b1832']
['', nan]
[nan, 'b1838']
[nan, 'b1838']
[nan, 'b1838']
[nan, 'b1838']
[nan, 'b1838']
['b1842,b1843,b1844', 'b1839,b1840,b1841']
[nan, nan]
[nan, 'b1908']
[nan, 'b1908']
[nan, 'b1908']
[nan, nan]
[nan, 'b1912']
['b1976', nan]
['b1976', nan]
['b1976', nan]
[nan, nan]
['b1978', nan]
['b1978', nan]
[nan, 'b1985']
[nan, 'b1985']
[nan, 'b1988']
['b2018,b2019,b2020,b2021,b2022,b2023,b2024,b2025,b2026', 'b4539,b2017']
[nan, 'b2037,b2038,b2039,b2040,b2041']
[nan, 'b2037,b2038,b2039,b2040,b2041']
[nan, 'b2037,b2038,b2039,b2040,b2041']
[nan, 'b2037,b2038,b2039,b2040,b2041']
[nan, 'b2042']
[nan, 'b2072,b2073']
[nan, 'b2072,b2073,b4667']
['b2074,b2075,b2076,b2077,b2078,b2079', 'b2072,b2073,b4667']
['b2074,b2075,b2076,b2077,b2078,b2079', 'b4667,b4668']
[nan, '']
[nan, 'b4498_1']
[nan, 'b4498_1']
[nan, 'b4498_1']
[nan, 'b20

In [83]:
len(df)

1921

In [None]:
len(locus)

In [74]:
# Save TF_list as 'TF_list.csv'; the path is org_folder with the file name appended.
TF_list.to_csv(org_folder+'TF_list.csv')

In [None]:
# Batch run over every peak table in `database`; the i-th entries of TF_list and
# TF_condition supply the TF name and condition passed along with that table.
for i in range (0, len(database)): 
    # Annotate peaks using a 500 nt margin, then replace missing annotations with ''.
    peak_annot_DF = annotate_peaks(TF_list[i], TF_condition[i],database[i],500,DF_gene_info).fillna('')
    final_annot_DF = validate_peak_info(peak_annot_DF,DF_gene_info)
    venn_files = Venn_data_gen(final_annot_DF)
    # Both results are written as record-oriented JSON, one file per TF.
    # NOTE(review): the table path is built by plain string concatenation while the
    # Venn path uses path.join -- out_data_table presumably must end with a path
    # separator; confirm.
    final_annot_DF.to_json(out_data_table+TF_list[i]+'_binding_table.json',orient='records')
    venn_files.to_json(path.join(out_data_venn, TF_list[i]+'_venn.json'),orient='records')
    # NOTE(review): binding_width_gen / peak_position_gen are defined outside this
    # chunk; presumably they write per-TF files into the given directories -- confirm.
    binding_width_gen(TF_list[i], database[i], '../../data/e_coli/NC_000913_3/binding_widths/')
    peak_position_gen(TF_list[i], final_annot_DF, '../../data/e_coli/NC_000913_3/positions/')

In [69]:
# Load a single curated peak file (tab-separated, no header row) for inspection.
file = 'phob_M9P_curated.gff'
gff_columns = ['ref', 'condition', 'condition_name',
               "binding_peak_start", 'binding_peak_end',
               'binding_peak_strength', 'direction', '.', 'ID']
df = pd.read_csv(
    org_folder + strain + "/curated_input/" + file,
    names=gff_columns,
    header=None,
    delimiter='\t',
    index_col=0,
)
# index_col=0 makes the 'ref' column the index; swap it for a 1-based row number.
row_numbers = pd.Series(range(1, len(df) + 1))
df = df.set_index(row_numbers)
df.head()

Unnamed: 0,condition,condition_name,binding_peak_start,binding_peak_end,binding_peak_strength,direction,.,ID
1,MACE,_filtered_0.95,417086,417115,1.92,+,.,SFB
2,MACE,_filtered_0.95,1198372,1198398,1.88,+,.,GSB
3,MACE,_filtered_0.95,2774093,2774126,1.82,+,.,SFB
4,MACE,_filtered_0.95,2774321,2774354,1.82,+,.,SRB
5,MACE,_filtered_0.95,3284518,3284522,1.23,+,.,GSB


In [70]:
# Annotate the peaks held in `df` as PhoB / M9P with a 500 nt margin,
# validate the result, and display the final table.
peak_annot_DF = annotate_peaks(
    TF_name='PhoB',
    TF_condition='M9P',
    peak_df=df,
    margin=500,
    gene_info=DF_gene_info,
)
final_annot_DF = validate_peak_info(peak_annot_DF, DF_gene_info)

final_annot_DF

Unnamed: 0,index,condition,binding_peak_start,binding_peak_end,binding_peak_strength,target_locus,target_genes
1,PhoB-1,phob + M9P,417086,417115,1.92,"b0399,b0400,b0397,b0398","phoB,phoR,sbcC,sbcD"
2,PhoB-2,phob + M9P,1198372,1198398,1.88,"b1139,b1137,b1138","lit,ymfD,ymfE"
3,PhoB-3,phob + M9P,2774093,2774126,1.82,,
4,PhoB-4,phob + M9P,2774321,2774354,1.82,,
5,PhoB-5,phob + M9P,3284518,3284522,1.23,"b3138,b3139,b3140,b3141","agaB,agaC,agaD,agaI"
6,PhoB-6,phob + M9P,3321253,3321291,1.69,b3173,yhbX
7,PhoB-7,phob + M9P,3321485,3321524,2.08,b3173,yhbX
8,PhoB-8,phob + M9P,3911549,3911584,8.13,"b3724,b3725,b3726,b3727,b3728","phoU,pstB,pstA,pstC,pstS"
9,PhoB-9,phob + M9P,3911629,3911670,6.93,"b3724,b3725,b3726,b3727,b3728","phoU,pstB,pstA,pstC,pstS"
10,PhoB-10,phob + M9P,4003031,4003074,2.05,"b3817,b3818","yigF,yigG"


In [60]:
len(df)

136

In [40]:
float('nan')

nan

In [47]:
[i for i in peak_annot_DF.genes_m][0]

nan

In [26]:
peak_annot_DF

Unnamed: 0,index,condition,binding_peak_start,binding_peak_end,binding_peak_strength,TU_p,genes_p,TU_m,genes_m
1,Dps-1,dps + expo,235,261,1.50,thrLABC,"b0001,b0002,b0003,b0004",,
2,Dps-2,dps + expo,111536,111543,2.28,,,,
3,Dps-3,dps + expo,167456,167466,1.95,fhuACDB,"b0150,b0151,b0152,b0153",,
4,Dps-4,dps + expo,246985,247015,1.13,yafL,b0227,dinJ-yafQ,"b0225,b0226"
5,Dps-5,dps + expo,256349,256373,1.54,"gpt,frsA","b0238,b0239",,
...,...,...,...,...,...,...,...,...,...
132,Dps-132,dps + expo,4406423,4406463,1.01,nsrR-rnr-rlmB-yjfIJ,"b4178,b4179,b4180,b4181,b4182",,
133,Dps-133,dps + expo,4474258,4474288,1.11,bdcR,b4251,bdcA,b4249
134,Dps-134,dps + expo,4527665,4527698,1.11,,,sgcXBCQAER,"b4300,b4301,b4302,b4303,b4304,b4565,b4305"
135,Dps-135,dps + expo,4566141,4566162,1.19,,,yjiML,"b4334,b4335"


In [None]:
def annotate_peaks(TF_name, TF_condition, peak_df, margin, gene_info):
    """Attach nearby operons and their genes to every binding peak.

    For each peak, genes whose ``start_codon_pos`` lies strictly within
    ``margin`` nt of ``binding_peak_start`` are collected and handled per
    strand. Genes that are completely transcribed before the peak are dropped,
    and every gene belonging to the remaining operons is reported.

    Parameters
    ----------
    TF_name : str
        Used for the per-peak labels (``<TF_name>-1``, ``<TF_name>-2``, ...)
        and, lower-cased, as the first part of the ``condition`` column.
    TF_condition : str
        Second part of the ``condition`` column (``"<tf> + <condition>"``).
    peak_df : pandas.DataFrame
        One row per peak. Must contain ``binding_peak_start``. The columns
        ``binding_peak_end`` and ``binding_peak_strength`` are carried into
        the result. The frame is not modified.
    margin : number
        Half-width of the search window around ``binding_peak_start``.
    gene_info : pandas.DataFrame
        Gene table with columns ``start_codon_pos``, ``strand``, ``start``,
        ``stop`` and ``operon``. Its index values are joined with ``','`` to
        form the gene lists, so they must be strings.

    Returns
    -------
    pandas.DataFrame
        Columns, in order: ``index``, ``condition``, ``binding_peak_start``,
        ``binding_peak_end``, ``binding_peak_strength``, ``TU_p``,
        ``genes_p``, ``TU_m``, ``genes_m``. A strand with no gene in the
        window is left as NaN. A strand whose nearby genes were all filtered
        out holds an empty string.
    """
    res_df = peak_df.copy()
    n_peaks = res_df.shape[0]

    # Annotations are collected by row position rather than written through
    # ``.loc[label]``: with repeated index labels a label-based write would hit
    # every row sharing the label and overwrite other peaks' annotations.
    missing = float('nan')
    annotations = {col: [missing] * n_peaks
                   for col in ('TU_p', 'genes_p', 'TU_m', 'genes_m')}

    for row_pos, pos in enumerate(res_df['binding_peak_start']):
        # Identify genes within MARGIN nt of binding peak
        close_genes = gene_info[(gene_info.start_codon_pos > pos - margin)
                                & (gene_info.start_codon_pos < pos + margin)]
        for strand, group in close_genes.groupby('strand'):
            # Remove genes that are completely transcribed before binding peak
            if strand == '+':
                group = group[group.stop > pos]
                suffix = 'p'
            else:
                group = group[group.start < pos]
                suffix = 'm'

            operon = group.operon.unique()
            # Report windows that span more than one operon on a strand;
            # all of them are still recorded below.
            if len(operon) > 1:
                print(operon)

            # Get all genes in operon
            bnums = gene_info[gene_info.operon.isin(operon)].index

            # Joining an empty selection yields '', which is kept as-is.
            annotations['TU_' + suffix][row_pos] = ','.join(operon)
            annotations['genes_' + suffix][row_pos] = ','.join(bnums)

    for col, values in annotations.items():
        res_df[col] = values

    res_df['index'] = [TF_name + '-' + str(i) for i in range(1, n_peaks + 1)]
    res_df['condition'] = [TF_name.lower() + " + " + TF_condition] * n_peaks
    cols = ['index', 'condition', 'binding_peak_start', 'binding_peak_end',
            'binding_peak_strength', 'TU_p', 'genes_p', 'TU_m', 'genes_m']
    return res_df.reindex(columns=cols)