In [4]:
import pandas as pd
import numpy as np
from collections import Counter

#########################################
# Calculating all activated CD4 T cells #
#########################################

def _group_fraction(grp, pct_column, pct_table=None):
    '''
    Return, as a fraction (percentage / 100), the value of `pct_column` for the
    (Age, Genotype) group that `grp` belongs to.

    Parameters:
         grp        : one group produced by a groupby on ["Age", "Genotype"];
                      age = grp.name[0], Genotype = str(grp.name[1])
         pct_column : name of the percentage column to read from the table
         pct_table  : table with 'Age', 'Genotype' and `pct_column` columns.
                      When None, the notebook-level GmCD44 table is used.
    Raises:
         IndexError if the table has no row for this (Age, Genotype) pair.
    '''
    if pct_table is None:
        # Looked up at call time so the table can be (re)built after this cell has run.
        pct_table = GmCD44

    age = grp.name[0]
    genotype = str(grp.name[1])

    # Single .loc call (row mask + column) instead of chained indexing.
    matches = pct_table.loc[
        (pct_table['Age'] == age) & (pct_table['Genotype'] == genotype),
        pct_column,
    ]
    if matches.empty:
        # Same exception type that .iloc[0] would raise, but naming the missing group.
        raise IndexError(
            "No {!r} value for Age={!r}, Genotype={!r} in the percentage table".format(
                pct_column, age, genotype
            )
        )

    # If several rows match, the first one is used.
    return matches.iloc[0] / 100


def NumOfActivatedCD4(grp, pct_table=None):
    '''
    Scale one (Age, Genotype) group of cell counts by that group's
    'pct_CD4_CD44_pos_CD62L_neg' percentage.

    Parameters:
         grp       : one group of counts from a groupby on ["Age", "Genotype"]
         pct_table : optional percentage table; defaults to the global GmCD44
    Requirement:
         age = grp.name[0]
         Genotype = str(grp.name[1])
    Returns:
         grp multiplied by (percentage / 100); same index as grp.
    Raises:
         IndexError if the table has no row for this (Age, Genotype) pair.
    '''
    return grp * _group_fraction(grp, 'pct_CD4_CD44_pos_CD62L_neg', pct_table)

###############################################
# Calculating all EARLY activated CD4 T cells #
###############################################

def NumOfEarlyActivation(grp, pct_table=None):
    '''
    Scale one (Age, Genotype) group of cell counts by that group's
    'pct_CD4_CD69_pos' percentage.

    Parameters:
         grp       : one group of counts from a groupby on ["Age", "Genotype"]
         pct_table : optional percentage table; defaults to the global GmCD44
    Requirement:
         age = grp.name[0]
         Genotype = str(grp.name[1])
    Returns:
         grp multiplied by (percentage / 100); same index as grp.
    Raises:
         IndexError if the table has no row for this (Age, Genotype) pair.
    '''
    return grp * _group_fraction(grp, 'pct_CD4_CD69_pos', pct_table)

In [5]:
###############################
# Loading the population data #
###############################
# Later cells read the 'Age', 'Genotype' and 'NoTregCD4CT' columns of this table.
pop_csv_path = "/mnt/c/Laptop Backups/HomestaticExpansionProject/ModelData/NaiveTregDifferentiation.csv"
pop = pd.read_csv(pop_csv_path)
# NOTE: no organ (spleen-only) filter is applied in this cell; every row of the file is kept in `pop`.

In [15]:
# Spleen-only selection is currently disabled; the unused filter was:
# Splnpop = pop.loc[pop['Organ'] == 'Spleen']

# Keep only the rows of `pop` whose Age is in this list
# (presumably the ages covered by the CD69 activation data -- confirm against the summary file)
CD69Ages = [0, 4, 7, 9, 12, 14, 18]
ActivatedCD4pop = pop.loc[pop["Age"].isin(CD69Ages)].copy()

#########################################
# Preparing Genevieve's Activation Data #
#########################################

activation_csv_path = '/mnt/c/Laptop Backups/HomestaticExpansionProject/ModelData/TCellActivationSummary_EdittedinR_D0.csv'
# Grouping keys followed by the two percentage columns used by the activation functions
activation_columns = ['Age', 'Genotype', 'pct_CD4_CD44_pos_CD62L_neg', 'pct_CD4_CD69_pos']

# Read the summary file and keep only the columns listed above
CD44df = pd.read_csv(activation_csv_path).loc[:, activation_columns]

# One row per (Age, Genotype) holding the mean of each percentage column
pct_by_group = CD44df.groupby(by=["Age", "Genotype"])
GmCD44 = pct_by_group.mean().reset_index()

In [19]:
# Each group function returns a Series with the same row labels as its input group.
# group_keys=False keeps those labels as the result index, so the result aligns with
# ActivatedCD4pop on assignment. Without it, whether the (Age, Genotype) keys get
# prepended to the index depends on the pandas version, and stripping them afterwards
# with reset_index(level=[0, 1]) fails when they were never added.
ActivatedCD4pop['ActivatedCD4CT'] = (
    ActivatedCD4pop.groupby(["Age", "Genotype"], group_keys=False)['NoTregCD4CT']
    .apply(NumOfActivatedCD4)
)

# NOTE(review): the CD69 percentage is applied to ActivatedCD4CT (already scaled by the
# CD44+CD62L- percentage), not to NoTregCD4CT -- confirm that 'pct_CD4_CD69_pos' is meant
# to be a fraction of the activated cells rather than of all CD4 cells.
ActivatedCD4pop['EarlyActivatedCD4CT'] = (
    ActivatedCD4pop.groupby(["Age", "Genotype"], group_keys=False)['ActivatedCD4CT']
    .apply(NumOfEarlyActivation)
)

In [20]:
# Write the table with the two derived columns to disk; index=True (the to_csv default)
# is spelled out so it is visible that the row index is written as the first column.
activated_csv_path = '/mnt/c/Laptop Backups/HomestaticExpansionProject/ModelData/ActivatedCD4pop2_0_2.csv'
ActivatedCD4pop.to_csv(activated_csv_path, index=True)