## Import modules and tools

In [1]:
import scanpy as sc
import numpy as np
import pandas as pd
import seaborn as sb
import matplotlib.pyplot as plt
from os import path
from os import listdir
import datetime, time

In [2]:
# custom code (project-local helper module)

import ma_codes as codes
from ma_codes import mysize, mymap

#### Define a nice colour map for gene expression

In [3]:
from matplotlib import colors

# 128 evenly spaced samples across the full range of the "Reds" palette.
reds_samples = plt.cm.Reds(np.linspace(0, 1, 128))
# np.linspace(..., 0) requests zero samples, so this grey segment is empty
# and contributes no rows to the stacked colour table.
grey_samples = plt.cm.Greys_r(np.linspace(0.7, 0.8, 0))

# Stack the RGBA rows and interpolate them into a continuous colour map.
# Note: this rebinds `mymap`, replacing the object imported from ma_codes.
colorsComb = np.vstack([reds_samples, grey_samples])
mymap = colors.LinearSegmentedColormap.from_list('my_colormap', colorsComb)

In [4]:
# Use the same resolution (dots per inch) for figures written to disk
# ('savefig.dpi') and for figures rendered in the notebook ('figure.dpi').
plt.rcParams.update({
    'savefig.dpi': 200,
    'figure.dpi': 200,
})

In [5]:
import pandas as pd

# pandas display settings applied for the rest of the notebook.
pandas_display_options = {
    'display.max_columns': None,  # show all columns
    'display.max_rows': None,     # show all rows
    'max_colwidth': 100,          # show up to 100 characters per value (default is 50)
}
for option_name, option_value in pandas_display_options.items():
    pd.set_option(option_name, option_value)

#### Define a timestamp helper

In [6]:
def timestamp():
    """Return the current local time as a 'DD-MM-YYYY HH:MM:SS' string.

    Returns
    -------
    str
        The current local date and time formatted with
        '%d-%m-%Y %H:%M:%S'.
    """
    # The previous implementation called a misspelled attribute
    # (`fromtimFestamp`) and therefore raised AttributeError on every call.
    return datetime.datetime.now().strftime('%d-%m-%Y %H:%M:%S')

#### Working directory

In [7]:
# Project root directory (absolute, machine-specific path; note the trailing slash).
folder = "/media/qianjianghu/SG_QJData/DataAnlysis/Jupyter/WNT_PCLS/"

#### Scanpy settings and version

In [8]:
# Logging verbosity: 0='error', 1='warning', 2='info', 3='hint',
# 4=more details, 5=even more details, etc.
sc.settings.verbosity = 4
# Print the versions of scanpy and its main dependencies (provenance record).
sc.logging.print_header()
# Folder that stores the saved analysis objects. It is derived from `folder`
# so the project root is defined in one place only; the trailing '' keeps
# the trailing path separator that the original literal had.
Obj_folder = path.join(folder, 'Object_folder', '')

scanpy==1.6.0 anndata==0.7.5 umap==0.4.6 numpy==1.18.5 scipy==1.5.2 pandas==1.1.5 scikit-learn==0.23.2 statsmodels==0.12.0 python-igraph==0.8.3 louvain==0.6.1 leidenalg==0.8.3


## Reload adata

In [9]:
# Load the saved epithelial AnnData object. path.join avoids the doubled
# separator ('//') that concatenating a leading-slash file name onto
# Obj_folder (which already ends in '/') used to produce.
EPITHELIAL = sc.read(path.join(Obj_folder, "PP5_EPITHELIAL_cluster_WNT_PCLS.h5ad"))

## Rank marker genes for each cluster

In [10]:
# Display the AnnData summary (dimensions and the available annotation keys).
EPITHELIAL

AnnData object with n_obs × n_vars = 4343 × 23558
    obs: 'project', 'genome', 'groups', 'treatment', 'treated_days', 'estimated_cells', 'identifier', 'doublet_scores', 'predicted_doublets', 'n_counts', 'n_genes', 'percent.mito', 'size_factors', 'S_score', 'G2M_score', 'phase', 'louvain', 'leiden', 'leiden_0.3', 'TYPE', 'Epi_leiden_2', 'cell_type', 'Epi_leiden_4', 'Epi_leiden_5', 'Epi_leiden_6', 'cell_type_new', 'cluster'
    var: 'n_cells', 'highly_variable', 'mean', 'std'
    uns: 'Epi_leiden_2_colors', 'Epi_leiden_4_colors', 'Epi_leiden_5_colors', 'Epi_leiden_6_colors', 'TYPE_colors', 'cell_type_colors', 'cell_type_new_colors', 'cluster_colors', 'groups_colors', 'identifier_colors', 'leiden', 'leiden_colors', 'louvain', 'louvain_colors', 'neighbors', 'pca', 'rank_genes_cluster', 'rank_genes_groups', 'treated_days_colors', 'treatment_colors', 'umap'
    obsm: 'X_pca', 'X_umap'
    varm: 'PCs'
    layers: 'counts'
    obsp: 'connectivities', 'distances'

In [11]:
# Rank marker genes for every group in obs['cell_type_new'], keeping the
# top 500 genes per group. No `method` is passed, so scanpy's default
# statistical test is used. Results are written to their own key in .uns.
sc.tl.rank_genes_groups(
    EPITHELIAL,
    groupby='cell_type_new',
    n_genes=500,
    key_added='rank_genes_cluster_cell_type',
)

ranking genes
    consider 'cell_type_new' groups:
    with sizes: [403 346 329 325 309 174 232 210 203 185 181 180 161 160 121 110 102  92
  89  85  65  62  60  27  17 115]
    finished: added to `.uns['rank_genes_cluster_cell_type']`
    'names', sorted np.recarray to be indexed by group ids
    'scores', sorted np.recarray to be indexed by group ids
    'logfoldchanges', sorted np.recarray to be indexed by group ids
    'pvals', sorted np.recarray to be indexed by group ids
    'pvals_adj', sorted np.recarray to be indexed by group ids (0:00:07)


In [12]:
# Folder that receives the exported tables. It is derived from `folder` so
# the project root is defined in one place only; the trailing '' keeps the
# trailing path separator that the original literal had.
result_folder = path.join(folder, 'results', '')

#### Export markers with clusters laid out horizontally (wide format)

In [13]:
####
#### layout clusters horizontally
####

# Ranking results stored by rank_genes_groups: one record array per
# statistic, whose field names are the group (cluster) labels.
result = EPITHELIAL.uns['rank_genes_cluster_cell_type']
groups = result['names'].dtype.names

# Wide layout: for each cluster, four adjacent columns named
# 'Cluster<group>_<statistic>'; each row is one rank position.
wide_columns = {}
for group_name in groups:
    for stat_key in ['names', 'pvals','pvals_adj', 'logfoldchanges']:
        wide_columns['Cluster'+group_name + '_' + stat_key] = result[stat_key][group_name]
cluster_marker = pd.DataFrame(wide_columns)

In [14]:
# Preview the first rows (top-ranked genes) of the wide marker table.
cluster_marker.head()

Unnamed: 0,ClusterC0_names,ClusterC0_pvals,ClusterC0_pvals_adj,ClusterC0_logfoldchanges,ClusterC1_names,ClusterC1_pvals,ClusterC1_pvals_adj,ClusterC1_logfoldchanges,ClusterC2_Krt8_ADI_names,ClusterC2_Krt8_ADI_pvals,ClusterC2_Krt8_ADI_pvals_adj,ClusterC2_Krt8_ADI_logfoldchanges,ClusterC3_ciliated_names,ClusterC3_ciliated_pvals,ClusterC3_ciliated_pvals_adj,ClusterC3_ciliated_logfoldchanges,ClusterC4_basal_names,ClusterC4_basal_pvals,ClusterC4_basal_pvals_adj,ClusterC4_basal_logfoldchanges,ClusterC5_names,ClusterC5_pvals,ClusterC5_pvals_adj,ClusterC5_logfoldchanges,ClusterC6_ciliated_names,ClusterC6_ciliated_pvals,ClusterC6_ciliated_pvals_adj,ClusterC6_ciliated_logfoldchanges,ClusterC7_names,ClusterC7_pvals,ClusterC7_pvals_adj,ClusterC7_logfoldchanges,ClusterC8_basal_names,ClusterC8_basal_pvals,ClusterC8_basal_pvals_adj,ClusterC8_basal_logfoldchanges,ClusterC9_names,ClusterC9_pvals,ClusterC9_pvals_adj,ClusterC9_logfoldchanges,ClusterC10_ciliated_names,ClusterC10_ciliated_pvals,ClusterC10_ciliated_pvals_adj,ClusterC10_ciliated_logfoldchanges,ClusterC11_Club_names,ClusterC11_Club_pvals,ClusterC11_Club_pvals_adj,ClusterC11_Club_logfoldchanges,ClusterC12_AT2_names,ClusterC12_AT2_pvals,ClusterC12_AT2_pvals_adj,ClusterC12_AT2_logfoldchanges,ClusterC13_Club_names,ClusterC13_Club_pvals,ClusterC13_Club_pvals_adj,ClusterC13_Club_logfoldchanges,ClusterC14_ciliated_names,ClusterC14_ciliated_pvals,ClusterC14_ciliated_pvals_adj,ClusterC14_ciliated_logfoldchanges,ClusterC15_ciliated_names,ClusterC15_ciliated_pvals,ClusterC15_ciliated_pvals_adj,ClusterC15_ciliated_logfoldchanges,ClusterC16_names,ClusterC16_pvals,ClusterC16_pvals_adj,ClusterC16_logfoldchanges,ClusterC17_names,ClusterC17_pvals,ClusterC17_pvals_adj,ClusterC17_logfoldchanges,ClusterC18_AT2_names,ClusterC18_AT2_pvals,ClusterC18_AT2_pvals_adj,ClusterC18_AT2_logfoldchanges,ClusterC19_club_names,ClusterC19_club_pvals,ClusterC19_club_pvals_adj,ClusterC19_club_logfoldchanges,ClusterC20_club_names,ClusterC20_club_pvals,ClusterC2
0_club_pvals_adj,ClusterC20_club_logfoldchanges,ClusterC21_krt8High_names,ClusterC21_krt8High_pvals,ClusterC21_krt8High_pvals_adj,ClusterC21_krt8High_logfoldchanges,ClusterC22_krt8high_names,ClusterC22_krt8high_pvals,ClusterC22_krt8high_pvals_adj,ClusterC22_krt8high_logfoldchanges,ClusterC23_neuroendocrine_names,ClusterC23_neuroendocrine_pvals,ClusterC23_neuroendocrine_pvals_adj,ClusterC23_neuroendocrine_logfoldchanges,ClusterC24_AT1_names,ClusterC24_AT1_pvals,ClusterC24_AT1_pvals_adj,ClusterC24_AT1_logfoldchanges,ClusterC25_Krt8_ADI_2_names,ClusterC25_Krt8_ADI_2_pvals,ClusterC25_Krt8_ADI_2_pvals_adj,ClusterC25_Krt8_ADI_2_logfoldchanges
0,mt-Rnr2,1.815628e-265,4.277256e-261,1.852911,mt-Rnr2,1.07794e-204,2.539411e-200,1.925961,Tmsb4x,1.686682e-100,5.676408e-97,2.237518,Nupr1,8.588919000000001e-68,3.372296e-64,2.806788,mt-Rnr2,3.51147e-85,1.0340400000000001e-81,1.356172,Clu,4.028291e-38,1.216647e-35,2.54697,Tmem212,1.036238e-94,4.068617e-91,4.224972,Esd,2.414016e-35,1.263764e-32,1.677655,Fth1,4.946481e-42,1.9421530000000002e-39,1.656945,Clu,1.914625e-29,1.80419e-27,2.550858,Fth1,2.1247829999999997e-100,5.561736e-97,1.985962,Trf,4.815077e-58,5.401599e-55,5.199295,Sftpc,2.36406e-257,5.569252e-253,9.878492,Selenbp1,2.759313e-115,1.6250979999999999e-111,4.938071,Sec14l3,5.204444e-78,6.811460000000001e-75,5.871947,Tm4sf1,8.191721000000001e-31,2.412257e-27,2.738625,Hnrnpc,1e-06,1.1e-05,1.679872,Ccdc153,1.120141e-10,3.34029e-09,2.646315,Sftpc,2.947855e-56,7.54843e-54,8.415749,Wfdc2,1.14074e-34,2.465463e-32,2.918976,Scgb1a1,5.703205e-61,1.119634e-57,7.746153,Krt8,1.3638409999999999e-37,5.841704e-35,3.1009,mt-Rnr2,2.797602e-34,6.046413e-33,2.024664,Resp18,2.1e-05,0.000121,11.269704,Ager,6.861547e-14,3.195183e-13,7.902991,Clu,3.478355e-39,7.730481e-37,2.777132
1,Malat1,4.415912e-83,3.467668e-80,1.667595,Malat1,9.391336000000001e-128,5.531027e-124,1.999551,Krt8,1.954261e-70,1.705129e-67,2.396628,Fth1,1.508342e-47,1.7766759999999999e-44,1.326333,Rps12,1.221775e-31,8.591809999999999e-30,1.85301,Cldn4,2.435506e-24,3.9844200000000004e-22,2.43812,Ccdc153,1.096727e-87,2.583669e-84,3.873407,Ncl,7.220534e-35,3.697855e-32,1.623817,Gsta1,1.2509919999999998e-19,6.8062040000000004e-18,3.938409,Tmsb4x,2.316111e-29,2.165196e-27,1.533536,S100a6,2.306375e-94,4.5277989999999995e-91,2.207868,Hp,4.724282e-53,3.9748079999999995e-50,4.158727,Sftpa1,3.300357e-157,5.553559e-154,8.191777,Trf,1.29474e-99,3.389055e-96,6.348213,Ccdc153,1.982682e-65,1.415394e-62,4.681512,Clu,1.8508189999999998e-26,3.3539690000000004e-23,2.449037,Ppp1r15a,1.6e-05,0.000137,2.089035,Foxj1,4.523185e-10,1.223389e-08,2.13173,Sftpa1,5.17261e-46,7.761551e-44,6.467368,Cbr2,1.463733e-31,2.758611e-29,3.809022,Cbr2,1.495342e-47,1.560473e-44,5.006602,Krt18,3.7439950000000005e-27,8.480868e-25,2.745305,Gm42418,4.9946119999999995e-20,5.565897e-19,4.490399,Scg2,2.6e-05,0.000148,30.544918,Sparc,5.026762e-09,1.859034e-08,5.913456,Tpm1,3.3059640000000003e-28,4.554497e-26,2.111871
2,mt-Rnr1,3.012854e-36,2.628771e-34,1.311597,mt-Rnr1,4.659801e-65,2.335651e-62,1.702771,Krt18,2.102818e-67,1.3760609999999999e-64,2.297471,Gm19935,5.330207e-41,3.5876859999999997e-38,3.263643,Rps14,5.8825e-30,3.5808770000000003e-28,1.50607,Phldb2,1.9677250000000002e-23,2.897229e-21,2.228033,Foxj1,8.70104e-89,2.2775449999999998e-85,3.068495,Plin2,1.4509430000000001e-31,5.425605e-29,2.19788,Gsta4,1.2282620000000001e-18,6.053431000000001e-17,2.249505,Krt7,3.727022e-22,1.836845e-20,1.571898,Gsta4,2.346314e-71,2.909183e-68,3.272163,Npc2,4.07685e-50,2.667845e-47,2.922739,Lyz2,1.332946e-118,1.256062e-115,7.439246,Npc2,1.136365e-110,5.354098e-107,3.719419,Tppp3,1.1099769999999999e-57,5.9429200000000004e-55,3.912758,Nupr1,9.688447e-24,1.2012649999999999e-20,2.241548,Ptpn14,6.4e-05,0.000499,2.430466,Tuba1a,1.985523e-08,3.997859e-07,1.683689,Lyz2,4.3316459999999995e-38,4.576005e-36,5.938001,Cp,2.411183e-25,3.138267e-23,4.187604,Cyp2f2,1.4988749999999999e-36,7.846775e-34,6.394827,F3,2.282736e-24,4.336830000000001e-22,4.096493,Lars2,4.2903549999999994e-19,4.5528010000000004e-18,7.607462,Ptprn,4.2e-05,0.000235,7.846186,Cldn18,1.060037e-06,3.459255e-06,4.996635,Cldn4,2.728981e-26,3.365934e-24,3.119922
3,Gm8995,4.782e-26,2.213248e-24,3.179454,Akap12,8.698404e-32,8.776803999999999e-30,3.66653,Actb,1.745869e-66,1.082347e-63,1.728962,Tppp3,3.0301669999999998e-30,8.705449000000001e-28,2.350983,Tmsb4x,7.015126e-30,4.248389e-28,1.460171,Tpm1,8.194889e-24,1.245517e-21,1.383089,Nupr1,2.4548549999999997e-85,5.2574070000000004e-82,2.893992,Lgals3,1.3910180000000001e-31,5.285421e-29,1.652206,Scgb1a1,7.362790000000001e-18,3.354983e-16,2.482672,Actb,8.685873e-22,4.059956e-20,1.245195,Akr1b8,1.7015569999999997e-64,1.67022e-61,3.052373,Selenbp1,5.969136e-45,2.991934e-42,3.599046,Sftpb,2.021462e-104,1.360618e-101,5.252878,Hp,4.150324e-98,8.888486000000001e-95,5.589223,Cbr2,1.1325500000000001e-59,6.507469e-57,3.147283,Prxl2a,2.159813e-18,1.541845e-15,2.086487,Luc7l3,8.1e-05,0.000621,1.515287,Tppp3,5.488434e-08,1.022916e-06,1.935181,Npc2,2.335867e-31,1.725027e-29,2.97547,Trf,4.729882e-25,6.088883000000001e-23,4.996415,Hp,2.9186600000000003e-33,1.322265e-30,4.584358,Tpm1,3.206119e-22,5.1732699999999996e-20,2.164733,Gm26917,3.089036e-18,3.146196e-17,10.494974,Celf4,0.000107,0.000568,5.404445,Cavin2,3.572131e-06,1.132906e-05,4.88247,Fn1,6.992458e-26,8.427341e-24,3.88551
4,Akap12,1.176642e-17,2.828503e-16,2.696359,Gm8995,6.730212e-31,6.497965e-29,3.523536,Myl6,3.278309e-64,1.7960560000000002e-61,2.306008,Mt1,2.450559e-26,5.020022e-24,1.763277,Rpl12,8.695928e-28,4.396109e-26,1.707105,Krt19,7.799826999999999e-21,9.096452e-19,1.492403,Tppp3,2.004995e-82,3.6333589999999997e-79,3.154677,Akr1b8,2.898153e-29,9.868305000000001e-27,1.887856,Esd,1.317758e-16,5.031399e-15,1.638964,Krt8,8.268221e-21,3.4782629999999995e-19,1.597375,Esd,1.948097e-67,2.185394e-64,2.242618,Bsg,7.068337e-37,2.1077959999999998e-34,2.831198,Sftpd,3.675907e-89,1.8041039999999998e-86,4.704707,Bsg,1.539349e-98,3.6263980000000003e-95,3.859809,Calm1,1.72314e-46,6.765621999999999e-44,1.764807,1810037I17Rik,2.0434710000000002e-17,1.174149e-14,1.574555,Brd2,0.00011,0.00081,1.366851,Rsph1,6.471796e-08,1.193912e-06,1.992964,Hspa5,9.071827e-30,6.158908000000001e-28,3.258835,Selenbp1,9.142711000000001e-25,1.1517860000000001e-22,3.112191,Aldh1a1,5.117317e-22,7.581997e-20,3.96215,Rtn4,1.377903e-20,1.844354e-18,2.886471,Rn7sk,3.930607e-17,3.759531e-16,9.354913,Car8,0.000153,0.000791,3.292826,Emp2,4.613112e-06,1.449589e-05,4.424956,Krt19,1.351353e-24,1.515961e-22,1.850168


In [15]:
# Preview the last rows (lowest-ranked retained genes) of the wide marker table.
cluster_marker.tail()

Unnamed: 0,ClusterC0_names,ClusterC0_pvals,ClusterC0_pvals_adj,ClusterC0_logfoldchanges,ClusterC1_names,ClusterC1_pvals,ClusterC1_pvals_adj,ClusterC1_logfoldchanges,ClusterC2_Krt8_ADI_names,ClusterC2_Krt8_ADI_pvals,ClusterC2_Krt8_ADI_pvals_adj,ClusterC2_Krt8_ADI_logfoldchanges,ClusterC3_ciliated_names,ClusterC3_ciliated_pvals,ClusterC3_ciliated_pvals_adj,ClusterC3_ciliated_logfoldchanges,ClusterC4_basal_names,ClusterC4_basal_pvals,ClusterC4_basal_pvals_adj,ClusterC4_basal_logfoldchanges,ClusterC5_names,ClusterC5_pvals,ClusterC5_pvals_adj,ClusterC5_logfoldchanges,ClusterC6_ciliated_names,ClusterC6_ciliated_pvals,ClusterC6_ciliated_pvals_adj,ClusterC6_ciliated_logfoldchanges,ClusterC7_names,ClusterC7_pvals,ClusterC7_pvals_adj,ClusterC7_logfoldchanges,ClusterC8_basal_names,ClusterC8_basal_pvals,ClusterC8_basal_pvals_adj,ClusterC8_basal_logfoldchanges,ClusterC9_names,ClusterC9_pvals,ClusterC9_pvals_adj,ClusterC9_logfoldchanges,ClusterC10_ciliated_names,ClusterC10_ciliated_pvals,ClusterC10_ciliated_pvals_adj,ClusterC10_ciliated_logfoldchanges,ClusterC11_Club_names,ClusterC11_Club_pvals,ClusterC11_Club_pvals_adj,ClusterC11_Club_logfoldchanges,ClusterC12_AT2_names,ClusterC12_AT2_pvals,ClusterC12_AT2_pvals_adj,ClusterC12_AT2_logfoldchanges,ClusterC13_Club_names,ClusterC13_Club_pvals,ClusterC13_Club_pvals_adj,ClusterC13_Club_logfoldchanges,ClusterC14_ciliated_names,ClusterC14_ciliated_pvals,ClusterC14_ciliated_pvals_adj,ClusterC14_ciliated_logfoldchanges,ClusterC15_ciliated_names,ClusterC15_ciliated_pvals,ClusterC15_ciliated_pvals_adj,ClusterC15_ciliated_logfoldchanges,ClusterC16_names,ClusterC16_pvals,ClusterC16_pvals_adj,ClusterC16_logfoldchanges,ClusterC17_names,ClusterC17_pvals,ClusterC17_pvals_adj,ClusterC17_logfoldchanges,ClusterC18_AT2_names,ClusterC18_AT2_pvals,ClusterC18_AT2_pvals_adj,ClusterC18_AT2_logfoldchanges,ClusterC19_club_names,ClusterC19_club_pvals,ClusterC19_club_pvals_adj,ClusterC19_club_logfoldchanges,ClusterC20_club_names,ClusterC20_club_pvals,ClusterC2
0_club_pvals_adj,ClusterC20_club_logfoldchanges,ClusterC21_krt8High_names,ClusterC21_krt8High_pvals,ClusterC21_krt8High_pvals_adj,ClusterC21_krt8High_logfoldchanges,ClusterC22_krt8high_names,ClusterC22_krt8high_pvals,ClusterC22_krt8high_pvals_adj,ClusterC22_krt8high_logfoldchanges,ClusterC23_neuroendocrine_names,ClusterC23_neuroendocrine_pvals,ClusterC23_neuroendocrine_pvals_adj,ClusterC23_neuroendocrine_logfoldchanges,ClusterC24_AT1_names,ClusterC24_AT1_pvals,ClusterC24_AT1_pvals_adj,ClusterC24_AT1_logfoldchanges,ClusterC25_Krt8_ADI_2_names,ClusterC25_Krt8_ADI_2_pvals,ClusterC25_Krt8_ADI_2_pvals_adj,ClusterC25_Krt8_ADI_2_logfoldchanges
495,Arnt,0.032566,0.093396,1.832983,Tsc22d4,0.009018,0.036542,1.184173,Eif3b,0.041997,0.09515,0.447516,C230072F16Rik,0.041947,0.128004,1.664326,Tomm6,0.290014,0.418366,1.381117,Bin1,0.00078,0.009347,1.074733,mt-Nd1,4.172419e-13,1.136345e-11,0.87567,Dstn,2e-06,4.6e-05,0.791598,Abce1,0.183354,0.359744,0.678382,Pard3b,0.153584,0.315361,1.434699,Arl6,3.281982e-07,7e-06,1.922322,Lman2,0.119028,0.302619,0.715545,Rpl36a,0.000952,0.00626,0.733407,Atxn7l3b,3.212953e-07,6e-06,1.100454,Selenok,7e-06,9e-05,1.40758,Drc7,0.000508,0.008692,1.459904,Mgat2,0.096119,0.257725,1.133836,Psmc3ip,0.080204,0.243538,1.330889,Sltm,0.002328,0.010999,1.111825,Abcd3,0.00726,0.047893,0.96775,Wdr83os,0.052565,0.186045,1.388251,Cpsf6,0.000317,0.002985,2.12971,Hmg20b,0.183082,0.328064,1.248404,Oga,0.153543,0.321771,1.272359,Cpq,0.293007,0.409022,3.042598,Sdcbp2,0.000873,0.00877,1.816639
496,Chd1,0.032681,0.09365,0.728637,Phf11b,0.009076,0.036756,3.905086,Dhrs1,0.042406,0.095947,0.906173,Klhl12,0.043011,0.130405,1.282985,Hypk,0.290728,0.418366,0.531313,Irf2bpl,0.000788,0.009419,1.268461,2010001K21Rik,6.15521e-13,1.651531e-11,3.249036,Clic4,2e-06,4.5e-05,0.806389,Capg,0.183416,0.359775,0.58678,Lzts2,0.153567,0.315361,0.951293,Cspp1,3.196499e-07,7e-06,1.274906,Fgfr1,0.119565,0.303621,1.90169,Npr1,0.00099,0.006484,2.954659,Wdr45,3.437866e-07,6e-06,2.441287,Vapa,7e-06,9e-05,1.180699,Phf20l1,0.000509,0.008704,0.880578,Jmjd8,0.096458,0.258222,1.893682,Fam229b,0.080263,0.243538,2.349549,Ccng2,0.002362,0.011141,3.311383,Srsf5,0.007309,0.048147,0.770297,Puf60,0.052655,0.18628,1.061881,Runx1,0.000318,0.002999,1.317189,Dpp3,0.183139,0.328115,1.063566,Crb3,0.154256,0.323104,1.56493,Pwwp3a,0.293323,0.409022,2.319582,Cnih4,0.000866,0.008713,1.192521
497,Usf3,0.033133,0.094714,1.440059,Bod1l,0.009091,0.036803,0.748075,Amot,0.042925,0.096904,1.798419,Ndufv2,0.043287,0.131024,0.504476,Bex1,0.291479,0.418366,0.85394,Znhit6,0.000804,0.009586,1.699784,Ccdc114,6.242316e-13,1.672998e-11,3.007859,Uba1,2e-06,4.9e-05,0.919785,Gm10639,0.183523,0.359927,2.50002,Epb41l5,0.154985,0.317628,0.882477,Pygl,3.230626e-07,7e-06,1.645297,Tbx1,0.119818,0.304134,1.266537,Fam184a,0.000993,0.006501,2.387876,Eny2,3.481479e-07,6e-06,1.254556,Ift27,7e-06,9.3e-05,1.850911,Ktn1,0.000511,0.008717,0.796018,Msl1,0.096596,0.258534,0.893684,Snhg1,0.080293,0.243597,0.903597,H2afj,0.002346,0.011074,0.809327,Pygb,0.007455,0.048877,1.936892,Mir22hg,0.052671,0.186308,1.465283,Rnf114,0.000324,0.003042,1.419659,Ptprn2,0.183585,0.328689,5.569147,Ncam1,0.154319,0.323209,4.027638,Parva,0.293397,0.409022,1.190198,Atp13a1,0.000903,0.009031,2.741052
498,Inmt,0.033362,0.095234,3.313454,Gm42870,0.009218,0.03723,3.294126,Pdcd5,0.042907,0.096876,0.629606,1700016J18Rik,0.043857,0.132392,2.724003,Mycl,0.29463,0.418366,1.096514,Psmd4,0.000795,0.009498,0.662577,Lrrc36,6.506072e-13,1.741705e-11,4.005573,Mrpl33,3e-06,5.1e-05,0.897586,Gm7868,0.183681,0.360175,4.907669,Psmc2,0.155103,0.317843,0.486043,Appl2,3.208477e-07,7e-06,0.992601,Rbpjl,0.11986,0.304209,1.359751,Dhcr24,0.000993,0.006501,1.106378,Capzb,3.352514e-07,6e-06,0.809898,Wnt11,8e-06,9.6e-05,2.279153,Pdcd6,0.000514,0.008753,0.932989,Rpl19-ps9,0.097305,0.259989,23.814152,Ndufc2,0.080812,0.244642,0.622529,Prdm2,0.002384,0.01123,1.931939,Csad,0.007459,0.048892,1.603817,Palmd,0.053011,0.187148,2.246486,Sfr1,0.000331,0.003101,1.112814,Ephb3,0.183993,0.32919,2.153585,Hoxb3os,0.154603,0.323717,7.48677,Rab3ip,0.293821,0.409022,2.088846,Uba1,0.000884,0.008877,0.809803
499,Csf3r,0.033588,0.095739,5.195017,Slfn3,0.009271,0.037404,4.038545,Mlf2,0.043209,0.097445,0.65124,Ccdc148,0.043884,0.132455,1.885486,Dock4,0.296698,0.418366,1.409159,Ctbp2,0.000808,0.009621,1.203114,Amn1,6.633786e-13,1.771868e-11,2.341094,Slc25a51,3e-06,5.2e-05,1.186127,Cd3eap,0.184645,0.361495,0.7317,Smarcal1,0.155577,0.318582,1.405989,Mall,3.496696e-07,7e-06,2.026695,Vamp3,0.119962,0.304436,0.753128,Ddx17,0.000997,0.006525,1.062509,Mif,3.444627e-07,6e-06,0.84906,Scnn1a,8e-06,9.5e-05,1.751308,Mea1,0.000511,0.008719,0.89862,Pdcd11,0.097576,0.260565,1.070554,AC149090.1,0.080881,0.244785,1.103312,Mme,0.002453,0.011507,3.370503,Rbms3,0.00758,0.049545,2.275038,Chordc1,0.053095,0.187389,1.26428,Trmt10c,0.000341,0.003183,2.650565,Ep400,0.184004,0.32919,1.200516,Rasgrf1,0.154817,0.323964,2.735902,Ctnnd1,0.294201,0.409022,1.395643,Pcyox1,0.000906,0.009041,1.973412


In [16]:
# Write the wide marker table to CSV. path.join keeps the output path valid
# whether or not result_folder ends with a path separator.
cluster_marker.to_csv(path.join(result_folder, "EPITHELIAL_WNT_PCLS_cluster_marker_horizontally.csv"))

#### Export markers with clusters laid out vertically (long format)

In [17]:
####
#### layout clusters vertically
####

# Long layout: one row per (cluster, ranked gene), with the cluster label in
# its own column. The per-cluster frames are collected in a list and
# concatenated once; growing a frame with DataFrame.append inside the loop
# copies the data on every iteration and the method was removed in pandas 2.0.
marker_columns = ['names', 'scores', 'logfoldchanges', 'pvals', 'pvals_adj']
group_frames = []
for group in groups:
    group_marker = pd.DataFrame({key: result[key][group] for key in marker_columns})
    group_marker['cluster'] = group
    group_frames.append(group_marker)

if group_frames:
    # Each frame keeps its own 0..n-1 index here, as before.
    cluster_marker = pd.concat(group_frames)
else:
    # pd.concat rejects an empty list; fall back to an empty, correctly
    # labelled table when there are no groups.
    cluster_marker = pd.DataFrame(columns=marker_columns + ['cluster'])

In [18]:
# Preview the first rows of the long marker table.
cluster_marker.head()

Unnamed: 0,names,scores,logfoldchanges,pvals,pvals_adj,cluster
0,mt-Rnr2,45.305584,1.852911,1.815628e-265,4.277256e-261,C0
1,Malat1,22.482218,1.667595,4.415912e-83,3.467668e-80,C0
2,mt-Rnr1,13.649235,1.311597,3.012854e-36,2.628771e-34,C0
3,Gm8995,11.30928,3.179454,4.782e-26,2.213248e-24,C0
4,Akap12,8.949334,2.696359,1.176642e-17,2.828503e-16,C0


In [19]:
# Preview the last rows of the long marker table.
cluster_marker.tail()

Unnamed: 0,names,scores,logfoldchanges,pvals,pvals_adj,cluster
495,Sdcbp2,3.41652,1.816639,0.000873,0.00877,C25_Krt8_ADI_2
496,Cnih4,3.416517,1.192521,0.000866,0.008713,C25_Krt8_ADI_2
497,Atp13a1,3.408,2.741052,0.000903,0.009031,C25_Krt8_ADI_2
498,Uba1,3.407791,0.809803,0.000884,0.008877,C25_Krt8_ADI_2
499,Pcyox1,3.405408,1.973412,0.000906,0.009041,C25_Krt8_ADI_2


In [20]:
# Give the long table a fresh consecutive index starting at 0.
# drop=True discards the old index instead of inserting it as a column.
cluster_marker = cluster_marker.reset_index(drop=True)

In [21]:
# Write the long marker table to CSV. path.join keeps the output path valid
# whether or not result_folder ends with a path separator.
cluster_marker.to_csv(path.join(result_folder, "EPITHELIAL_WNT_PCLS_cluster_marker_vertically.csv"))