## filter label tables

This code orders the flourocensce tables (label tables) such that each 'i' row in those tables will match the same 'i' row in the features table. 

In [1]:
import pandas as pd
import numpy as np
from os import chdir
import matplotlib.pyplot as plt

In [2]:
directory = r'/home/karinsio/my_project_dir/iGEM/Merge_Features'
chdir(directory)

In [3]:
normalized_features = pd.read_csv(r'normalized_updated_new_features_table.csv', index_col='ORF')
features = pd.read_csv(r'updated_new_features_table.csv', index_col='ORF')

In [4]:
normalized_features.index #ORF column

Index(['Q0045', 'Q0085', 'Q0105', 'Q0140', 'Q0250', 'Q0275', 'YAL001C',
       'YAL002W', 'YAL003W', 'YAL005C',
       ...
       'YPR188C', 'YPR189W', 'YPR190C', 'YPR191W', 'YPR192W', 'YPR194C',
       'YPR198W', 'YPR199C', 'YPR200C', 'YPR201W'],
      dtype='object', name='ORF', length=4665)

In [5]:
## load the original flourescence data (4 tables):
labels1 = pd.read_csv(r'flourescence_tables_original/flourescence_table_NATIVEpr_GFP.csv').drop(['Unnamed: 0'],axis=1).set_index('ORF')
labels2 = pd.read_csv(r'flourescence_tables_original/flourescence_table_NOP1pr_GFP.csv').drop(['Unnamed: 0'],axis=1).set_index('ORF')
labels3 = pd.read_csv(r'flourescence_tables_original/flourescence_table_TEF2pr_mCherry.csv').drop(['Unnamed: 0'],axis=1).set_index('ORF')
labels4 = pd.read_csv(r'flourescence_tables_original/flourescence_table_TEF2pr_VC.csv').drop(['Unnamed: 0'],axis=1).set_index('ORF')

In [6]:
labels1

Unnamed: 0_level_0,N' NATIVEpr-GFP in SD Intensity,one_hot_ER,"one_hot_ER,ambiguous","one_hot_ER,ambiguous,bud","one_hot_ER,bud","one_hot_ER,bud,neck","one_hot_ER,bud,punctate","one_hot_ER,cell,periphery","one_hot_ER,cell,periphery,punctate","one_hot_ER,cell,periphery,vacuole",...,"one_hot_nuclear,periphery,punctate",one_hot_nucleolus,"one_hot_nucleolus,nucleus","one_hot_nucleolus,punctate",one_hot_nucleus,"one_hot_nucleus,punctate",one_hot_punctate,"one_hot_punctate,vacuole",one_hot_threshold,one_hot_vacuole
ORF,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
YAL001C,18.81,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
YAL002W,21.12,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0
YAL003W,16.14,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
YAL004W,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
YAL005C,587.54,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
YAL007C,74.55,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0
YAL008W,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
YAL009W,22.58,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
YAL010C,20.62,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
YAL011W,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [7]:
## order the flourescence data according to the features data
labels1_filtered = labels1.loc[normalized_features.index]
labels2_filtered = labels2.loc[normalized_features.index]
labels3_filtered = labels3.loc[normalized_features.index]
labels4_filtered = labels4.loc[normalized_features.index]

In [8]:
## check that the order is correct (all output is true in the following loop):
for i in range(0,len(labels4_filtered.index)):
    print(labels4_filtered.index[i]==normalized_features.index[i])
    

True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True


True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True


True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True


In [9]:
labels1_filtered.to_csv(r'flourescence_tables/flourescence_table_NATIVEpr_GFP.csv')
labels2_filtered.to_csv(r'flourescence_tables/flourescence_table_NOP1pr_GFP.csv')
labels3_filtered.to_csv(r'flourescence_tables/flourescence_table_TEF2pr_mCherry.csv')
labels4_filtered.to_csv(r'flourescence_tables/flourescence_table_TEF2pr_VC.csv')

In [10]:
labels1_filtered.shape

(4665, 72)