In [1]:
import os
import numpy as np
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
import matplotlib.patches as mpatches

from sklearn.decomposition import PCA
from sklearn.discriminant_analysis import LinearDiscriminantAnalysis
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import confusion_matrix, plot_confusion_matrix

from scipy import stats
from scipy.stats import wasserstein_distance

In [2]:
def get_pandas_dict(dirpath):
    """Load every ``.txt`` table found directly inside ``dirpath``.

    Each matching file is parsed by ``pd.read_csv`` as tab-separated text
    with ``header=2``, i.e. row 2 (zero-based) supplies the column names.

    Parameters
    ----------
    dirpath : str
        Directory to scan. Subdirectories are skipped, not descended into.

    Returns
    -------
    dict
        Maps the part of each filename before its first ``.`` to the
        ``DataFrame`` read from that file. Two files sharing that prefix
        map to the same key; the one later in sorted filename order wins.
    """
    pandas_dict = {}

    # os.listdir returns entries in arbitrary order; sort so the dict's
    # insertion order (and the winner of any key collision) is deterministic.
    for filename in sorted(os.listdir(dirpath)):
        filepath = os.path.join(dirpath, filename)
        if os.path.isdir(filepath):
            continue
        # Check the filename's extension rather than searching the whole path
        # for ".txt": a substring test lets every file through when a parent
        # directory name contains ".txt", and also accepts names such as
        # "old.txt.bak".
        if not filename.endswith(".txt"):
            continue
        pandas_dict[filename.split(".")[0]] = pd.read_csv(filepath, header=2, sep="\t")

    return pandas_dict

In [3]:
# Read all input feature tables into a dict of DataFrames
# (keyed by the filename text before the first dot).
feature_dir = "Deep Learning Baseline Analysis/Input Feature Files"
pd_dict = get_pandas_dict(dirpath=feature_dir)

In [4]:
# Names of the loaded tables, in sorted order; shown as the cell output.
keys = sorted(pd_dict)
keys

['F91SCTRL_0',
 'F91SDOX_0',
 'L4QCTRL_0',
 'L4QDOX_0',
 'R45HCTRL_0',
 'R45HDOX_0',
 'WTCTRL_0',
 'WTDOX_0']

In [6]:
# Column labels of the "WTCTRL_0" table, in sorted order; shown as the cell output.
features = sorted(pd_dict["WTCTRL_0"].columns)
features

['Area_M01',
 'Bkgd Mean_Ch02',
 'Bkgd StdDev_Ch02',
 'Bright Detail Intensity R7_M02_Ch02',
 'Bright Detail Intensity R7_M02_Ch02 / Intensity_MC_Ch02',
 'Circularity_M01',
 'Diameter_M01',
 'Gradient RMS_M01_Ch01',
 'Intensity_MC_Ch01',
 'Intensity_MC_Ch02',
 'Intensity_MC_Ch06',
 'Object Number',
 'Saturation Count_M02_Ch02']

In [11]:
condition_order = ['WT', 'F91S', 'L4Q', 'R45H']
treatment_order = ['CTRL', 'DOX']

# Print the mean of the "Bright Detail Intensity R7_M02_Ch02" column for each
# table, visiting conditions in the order above and, within each condition,
# CTRL before DOX. Table names follow the pattern <condition><treatment>_0.
for cond in condition_order:
    for treatment in treatment_order:
        key = "".join([cond, treatment, "_0"])
        bdi_array = np.array(pd_dict[key]["Bright Detail Intensity R7_M02_Ch02"])
        print(bdi_array.mean())

7547.176863661062
8810.641067402752
6799.022458779614
9397.494585491004
9160.910682177402
16161.442621639733
6420.518111722488
17366.01203383015
