#  Measuring TF abundance over growth rate

In [10]:
import numpy as np
import pandas as pd

import bokeh.io
import bokeh.models
import bokeh.palettes
import bokeh.plotting
import seaborn as sns
# Make seaborn's 'colorblind' palette the default color palette for plots.
sns.set_palette('colorblind')
# Configure Bokeh to display its output inline in the notebook.
bokeh.io.output_notebook()

## The problem

For the growth experiments, I'm interested in measuring the abundance of the lac repressor as a function of growth rate. To my knowledge, there hasn't been any explicit measure of the copy number change of a specific transcription factor as a function of growth rate and temperature with single-cell resolution. Probably the closest example of such a study was performed only a few years ago, in early 2015.

## Examining transcription-related proteins.

In [11]:
# Read the supplementary CSV into a DataFrame; `comment='#'` tells pandas to
# ignore everything from a '#' character to the end of the line.
data = pd.read_csv(
    '../../data/Nature_Bio_2015_Schmidt_supS7_2.csv',
    comment='#',
)

# Keep only the rows whose COG functional-group description is 'Transcription'.
tf_data = data.loc[
    data['Annotated functional COG group (description)'].eq('Transcription')
]
tf_data.head()

Unnamed: 0,Uniprot Accession,Description,Gene,Peptides.used.for.quantitation,Confidence.score,Molecular weight (Da),Dataset,Glucose,LB,Glycerol + AA,...,pH6 glucose COV,Xylose COV,Mannose COV,Galactose COV,Succinate COV,Fructose COV,Bnumber,Annotated functional COG groups (letter),Annotated functional COG group (description),Annotated functional COG class
0,P1A8T7,DNA-directed RNA polymerase subunit beta' OS=E...,rpoC,91,6145.53,155145.118,2,2779,7164,4513,...,6.14,6.27,16.15,22.87,16.45,9.29,b3988,K,Transcription,INFORMATION STORAGE AND PROCESSING
1,P1A8V2,DNA-directed RNA polymerase subunit beta OS=Es...,rpoB,89,5161.29,151521.2758,2,3957,8888,5199,...,5.93,4.27,13.51,19.75,13.6,7.77,b3987,K,Transcription,INFORMATION STORAGE AND PROCESSING
94,P1AG31,Transcription termination factor Rho OS=Escher...,rho,28,2197.93,46956.59113,2,3243,5934,4171,...,6.48,2.87,2.68,8.15,1.51,5.54,b3783,K,Transcription,INFORMATION STORAGE AND PROCESSING
98,P1AFF6,Transcription elongation protein nusA OS=Esche...,nusA,27,1899.11,54819.16259,2,5576,11125,7264,...,6.11,5.63,4.78,6.19,2.98,6.63,b3169,K,Transcription,INFORMATION STORAGE AND PROCESSING
99,P1A7Z4,DNA-directed RNA polymerase subunit alpha OS=E...,rpoA,27,1917.81,36471.13747,2,14575,35112,25313,...,6.6,3.74,1.45,8.13,6.18,3.13,b3295,K,Transcription,INFORMATION STORAGE AND PROCESSING


In [9]:
# Show the column labels of the transcription-only table.
tf_data.columns

Index(['Uniprot Accession', 'Description', 'Gene',
       'Peptides.used.for.quantitation', 'Confidence.score',
       'Molecular weight (Da)', 'Dataset', 'Glucose', 'LB', 'Glycerol + AA',
       'Acetate', 'Fumarate', 'Glucosamine', 'Glycerol', 'Pyruvate',
       'Chemostat mu=1.5', 'Chemostat mu=1.35', 'Chemostat mu=1.21',
       'Chemostat mu=1.12', 'Stationary phase 1 day',
       'Stationary phase 3 days', 'Osmotic-stress glucose', '42C glucose',
       'pH6 glucose', 'Xylose', 'Mannose', 'Galactose', 'Succinate',
       'Fructose', 'Glucose COV', 'LB COV', 'Glycerol + AA COV', 'Acetate COV',
       'Fumarate COV', 'Glucosamine COV', 'Glycerol COV', 'Pyruvate COV',
       'Chemostat mu=1.5 COV', 'Chemostat mu=1.35 COV',
       'Chemostat mu=1.21 COV', 'Chemostat mu=1.12 COV',
       'Stationary phase 1 day COV', 'Stationary phase 3 days COV',
       'Osmotic-stress glucose COV', '42C glucose COV', 'pH6 glucose COV',
       'Xylose COV', 'Mannose COV', 'Galactose COV ', 'Succinate 