In [63]:
import pandas as pd
from scipy.stats import ttest_ind

dataset = pd.read_csv('green_TCPS_Cell.csv')

In [64]:
# change image numbers assigned by cellprofiler to cell type names
dataset.loc[dataset['ImageNumber'].isin([3]), 'CellType'] = 'M1'
dataset.loc[dataset['ImageNumber'].isin([4]), 'CellType'] = 'M2'

# divide the data into two datasets - for M1 and M2 cells data
dataset_m1 = dataset[dataset['CellType'] == 'M1']
dataset_m2 = dataset[dataset['CellType'] == 'M2']

In [65]:
t_test_results = pd.DataFrame(columns=['Measurement', 'mean_diff (M2 - M1)', 't_statistic', 'p_value'])

for column in range(2, 17):
    column_name = dataset_m1.columns[column] 
    t_statistic, p_value = ttest_ind(dataset_m1[column_name], dataset_m2[column_name])
    mean_diff = dataset_m2[column_name].mean() - dataset_m1[column_name].mean()
    t_test_results.loc[column] = [column_name, mean_diff, t_statistic, p_value]

In [66]:
# statistically significant difference
t_test_results[t_test_results['p_value'] < 0.05]

Unnamed: 0,Measurement,mean_diff (M2 - M1),t_statistic,p_value
2,Intensity_IntegratedIntensityEdge_Green,-0.814869,2.390357,0.0175152
3,Intensity_IntegratedIntensity_Green,-30.469256,2.780143,0.005814178
4,Intensity_LowerQuartileIntensity_Green,0.0155,-9.944072,4.588109e-20
6,Intensity_MassDisplacement_Green,-0.440957,2.835604,0.004918668
8,Intensity_MaxIntensity_Green,-0.048132,3.172933,0.001682843
9,Intensity_MeanIntensityEdge_Green,0.006903,-3.820479,0.0001652056
12,Intensity_MinIntensityEdge_Green,0.003707,-5.232972,3.345177e-07
13,Intensity_MinIntensity_Green,0.004654,-6.357938,8.641345e-10
15,Intensity_StdIntensity_Green,-0.013353,2.141984,0.0330862


In [32]:
# not statistically significant difference
t_test_results[t_test_results['p_value'] >= 0.05]

Unnamed: 0,Measurement,mean_diff (M2 - M1),t_statistic,p_value
2,Intensity_IntegratedIntensityEdge_Green,0.24594,-1.243769,0.21384
5,Intensity_MADIntensity_Green,0.001953,-1.834544,0.066833
6,Intensity_MassDisplacement_Green,-0.074615,0.555588,0.578602
8,Intensity_MaxIntensity_Green,0.019825,-1.957635,0.050516
15,Intensity_StdIntensity_Green,-0.004028,1.327794,0.184512
16,Intensity_UpperQuartileIntensity_Green,0.007293,-1.340125,0.180471


In [6]:
dataset_m1.describe()

Unnamed: 0,ImageNumber,ObjectNumber,Intensity_IntegratedIntensityEdge_Green,Intensity_IntegratedIntensity_Green,Intensity_LowerQuartileIntensity_Green,Intensity_MADIntensity_Green,Intensity_MassDisplacement_Green,Intensity_MaxIntensityEdge_Green,Intensity_MaxIntensity_Green,Intensity_MeanIntensityEdge_Green,...,Location_CenterMassIntensity_X_Green,Location_CenterMassIntensity_Y_Green,Location_CenterMassIntensity_Z_Green,Location_Center_X,Location_Center_Y,Location_Center_Z,Location_MaxIntensity_X_Green,Location_MaxIntensity_Y_Green,Location_MaxIntensity_Z_Green,Number_Object_Number
count,210.0,210.0,210.0,210.0,210.0,210.0,210.0,210.0,210.0,210.0,...,210.0,210.0,210.0,210.0,210.0,210.0,210.0,210.0,210.0,210.0
mean,2.028571,36.971429,6.013002,111.328046,0.032756,0.013762,1.648765,0.057385,0.186922,0.028791,...,478.162402,505.816639,0.0,478.223764,505.832752,0.0,478.380952,505.804762,0.0,36.971429
std,0.757194,22.808526,2.341931,95.091121,0.009126,0.027808,1.392358,0.094189,0.151197,0.013102,...,276.959593,287.162286,0.0,277.023316,287.038895,0.0,277.984815,288.008498,0.0,22.808526
min,1.0,1.0,0.384352,9.705376,0.005611,0.0,0.050647,0.011222,0.048542,0.00557,...,30.571349,30.296095,0.0,30.776786,30.771635,0.0,32.0,33.0,0.0,1.0
25%,1.0,18.0,4.526512,65.703689,0.02862,0.008699,0.868106,0.039842,0.126476,0.024687,...,243.947371,238.360823,0.0,243.573456,238.805828,0.0,240.5,240.75,0.0,18.0
50%,2.0,35.5,5.651471,93.385407,0.031426,0.011222,1.566751,0.042931,0.163023,0.027158,...,461.638735,499.333086,0.0,460.590441,500.659485,0.0,464.5,494.0,0.0,35.5
75%,3.0,53.0,7.49978,134.537629,0.034231,0.01431,2.055856,0.048542,0.193748,0.028058,...,704.579651,760.757434,0.0,703.796024,759.496807,0.0,705.0,757.25,0.0,53.0
max,3.0,90.0,20.566708,872.319416,0.077162,0.407843,15.688012,1.0,1.0,0.158205,...,978.348818,1002.719298,0.0,978.421647,1001.944834,0.0,990.0,1007.0,0.0,90.0


In [7]:
dataset_m2.describe()

Unnamed: 0,ImageNumber,ObjectNumber,Intensity_IntegratedIntensityEdge_Green,Intensity_IntegratedIntensity_Green,Intensity_LowerQuartileIntensity_Green,Intensity_MADIntensity_Green,Intensity_MassDisplacement_Green,Intensity_MaxIntensityEdge_Green,Intensity_MaxIntensity_Green,Intensity_MeanIntensityEdge_Green,...,Location_CenterMassIntensity_X_Green,Location_CenterMassIntensity_Y_Green,Location_CenterMassIntensity_Z_Green,Location_Center_X,Location_Center_Y,Location_Center_Z,Location_MaxIntensity_X_Green,Location_MaxIntensity_Y_Green,Location_MaxIntensity_Z_Green,Number_Object_Number
count,934.0,934.0,934.0,934.0,934.0,934.0,934.0,934.0,934.0,934.0,...,934.0,934.0,934.0,934.0,934.0,934.0,934.0,934.0,934.0,934.0
mean,5.018201,183.925054,6.258942,83.762282,0.046267,0.015715,1.57415,0.08586,0.206747,0.041732,...,511.478731,509.010696,0.0,511.46388,509.002473,0.0,512.068522,508.901499,0.0,183.925054
std,0.684142,132.915654,2.64137,60.685579,0.011638,0.008045,1.830526,0.063798,0.128069,0.009926,...,278.499847,283.249938,0.0,278.522054,283.239009,0.0,278.796014,283.217399,0.0,132.915654
min,4.0,1.0,0.454772,14.261108,0.005611,0.0,0.034679,0.01431,0.074356,0.006175,...,22.500337,15.140004,0.0,22.433315,14.201511,0.0,16.0,21.0,0.0,1.0
25%,5.0,78.25,4.433746,48.040012,0.039842,0.011505,0.625012,0.065657,0.131597,0.034668,...,276.6759,270.199952,0.0,276.289624,270.125822,0.0,275.5,268.25,0.0,78.25
50%,5.0,156.0,5.467004,70.584934,0.045736,0.01431,1.049474,0.082773,0.160218,0.041785,...,508.344889,495.407247,0.0,509.330057,494.30482,0.0,514.5,493.0,0.0,156.0
75%,5.0,263.75,7.512634,101.989346,0.054153,0.017116,1.746149,0.097083,0.23738,0.047667,...,743.387177,767.635813,0.0,743.99361,767.782805,0.0,739.0,766.0,0.0,263.75
max,6.0,497.0,19.673406,962.661675,0.079967,0.205492,15.569378,1.0,1.0,0.138485,...,1009.363875,1001.209061,0.0,1008.667442,1001.790102,0.0,1013.0,1004.0,0.0,497.0
