# Import packages and data 

In [1]:
import numpy as np
import pandas as pd
import scanpy as sc
import seaborn as sns
import scipy.stats
import anndata
import matplotlib.pyplot as plt
import matplotlib as mpl
from matplotlib.axes._axes import _log as matplotlib_axes_logger
from scipy import sparse
# Only let ERROR-level (and above) records through matplotlib's axes logger.
matplotlib_axes_logger.setLevel('ERROR')
# Silence NumbaPerformanceWarning.
# The warning class lives in `numba.core.errors` from numba 0.49 onwards and
# the old `numba.errors` module was removed in later releases, so try the new
# location first and fall back to the old one for older environments.
import warnings
try:
    from numba.core.errors import NumbaPerformanceWarning
except ImportError:
    try:
        from numba.errors import NumbaPerformanceWarning
    except ImportError:
        # The filter is purely cosmetic: do not abort the notebook if the
        # warning class cannot be imported at all.
        NumbaPerformanceWarning = None
if NumbaPerformanceWarning is not None:
    warnings.filterwarnings("ignore", category=NumbaPerformanceWarning)

  from pandas.core.index import RangeIndex


In [2]:
# scanpy logging level: 0 = errors, 1 = warnings, 2 = info, 3 = hints.
sc.settings.verbosity = 1
# Figure defaults picked so that annotation text stays legible: `dpi` is the
# on-screen resolution, `dpi_save` the resolution used when saving figures.
sc.settings.set_figure_params(dpi_save=1000, dpi=120)
# Print the versions of the packages used in this run.
sc.logging.print_versions()

scanpy==1.4.4 anndata==0.7.1 umap==0.3.10 numpy==1.18.1 scipy==1.4.1 pandas==1.0.2 scikit-learn==0.22.2.post1 statsmodels==0.11.1 python-igraph==0.8.0 louvain==0.6.1


# Save meta (and numbers) for YS progenitors

In [3]:
# Load the YS progenitor object (the fig. S5c YS/FBM enrichment-comparison
# file, going by its name); its `cell.labels` column is summarised below.
adata = sc.read("/Users/b8058304/Documents/PhD_work/Coding/manuscript_figs/data/figs5c_ys_fbm_progen_enrichment_comparison_20200514.h5ad")

In [4]:
# Number of cells per progenitor label.
# `size()` counts the rows of each group directly instead of calling Python's
# `len` on every materialised group frame; `observed=True` keeps only labels
# that actually occur, so no rows are emitted for unused categories.
cell_numbers = adata.obs.groupby(["cell.labels"], observed=True).size()
cell_numbers

cell.labels
CMP                    55
ELP                   174
GMP                    40
HSC                   105
MEMP                   55
MEP                    56
Monocyte precursor     26
macrophage             42
neut myeloid           18
dtype: int64

In [5]:
# Load the full YS annotation object; the progenitor labels from `adata` are
# attached to it in the next cell.
total = sc.read("/Users/b8058304/Documents/PhD_work/Coding/liver/data/ys_total_annotation_20191127.h5ad")

In [6]:
# Copy the progenitor labels onto the full object. The assignment aligns on the
# obs index: cells of `total` that are absent from `adata` receive NaN, and any
# cell of `adata` that is absent from `total` would be dropped without notice,
# so check for that case explicitly before assigning.
_unmatched = adata.obs.index.difference(total.obs.index)
assert _unmatched.empty, (
    f"{len(_unmatched)} cells in adata are missing from total; "
    "their labels would be dropped silently"
)
total.obs["cell.labels_progen"] = adata.obs["cell.labels"]

In [7]:
# Sanity check: per-label counts on the full object after the label transfer.
# Cells without a progenitor label (NaN) are excluded by groupby.
# `size()` counts rows per group directly instead of calling `len` on every
# group frame; `observed=True` keeps only labels that actually occur.
cell_numbers = total.obs.groupby(["cell.labels_progen"], observed=True).size()
cell_numbers

cell.labels_progen
CMP                    55
ELP                   174
GMP                    40
HSC                   105
MEMP                   55
MEP                    56
Monocyte precursor     26
macrophage             42
neut myeloid           18
dtype: int64

In [8]:
# Number of cells per (fetal sample, progenitor label) pair, written to CSV.
# `size()` counts rows per group directly instead of calling `len` on every
# group frame; `observed=True` restricts the result to sample/label pairs that
# actually occur, so no zero-count rows are emitted for unused combinations.
cell_numbers = total.obs.groupby(["fetal.ids", "cell.labels_progen"], observed=True).size()
# The Series is unnamed, so the count column in the CSV is headed "0".
pd.DataFrame(cell_numbers).to_csv("/Users/b8058304/Documents/PhD_work/Coding/manuscript_figs/resources_for_pipelines/ys_progen_nrs_by_sample.csv")
cell_numbers

fetal.ids          cell.labels_progen
F32_female_7+6PCW  CMP                     3
                   ELP                    12
                   GMP                     1
                   HSC                     5
                   MEMP                    8
                   MEP                     8
                   macrophage              2
F35_female_7+6PCW  CMP                    11
                   ELP                    19
                   GMP                     2
                   HSC                    19
                   MEMP                   23
                   MEP                    38
                   Monocyte precursor      2
                   macrophage              1
                   neut myeloid            6
F37_female_4PCW    CMP                    41
                   ELP                   143
                   GMP                    37
                   HSC                    81
                   MEMP                   24
                 

In [9]:
# Persist the object with the new `cell.labels_progen` column.
# NOTE: this is the same path the object was read from, so the original file
# is overwritten in place.
total.write("/Users/b8058304/Documents/PhD_work/Coding/liver/data/ys_total_annotation_20191127.h5ad")

# Save meta (and cell numbers) for liver progenitors

In [10]:
# Load the liver progenitor object (the fig. S5c FL/FBM enrichment-comparison
# file, going by its name); its `cell.labels` column is summarised below.
adata = sc.read("/Users/b8058304/Documents/PhD_work/Coding/manuscript_figs/data/figs5c_fl_fbm_progen_enrichment_comparison_20200518.h5ad")

In [11]:
# Number of cells per liver progenitor label.
# `size()` counts the rows of each group directly instead of calling Python's
# `len` on every materialised group frame; `observed=True` keeps only labels
# that actually occur, so no rows are emitted for unused categories.
cell_numbers = adata.obs.groupby(["cell.labels"], observed=True).size()
cell_numbers

cell.labels
ELP                        525
GMP                        362
HSC                        242
MEMP                       505
MEP                        639
MPP                       2012
early MK                    81
early erythroid            333
eo/baso/mast precursor      86
erythroid-MPP hybrid        14
macrophage                  81
myeloid DC progenitor       94
pDC progenitor              41
dtype: int64

In [12]:
# Load the full fetal liver object; the progenitor labels from `adata` are
# attached to it in the next cell.
total = sc.read("/Users/b8058304/Documents/PhD_work/Coding/liver/data/fetal_liver_alladata_Copy1.h5ad")

In [13]:
# Copy the progenitor labels onto the full object. The assignment aligns on the
# obs index: cells of `total` that are absent from `adata` receive NaN, and any
# cell of `adata` that is absent from `total` would be dropped without notice,
# so check for that case explicitly before assigning.
_unmatched = adata.obs.index.difference(total.obs.index)
assert _unmatched.empty, (
    f"{len(_unmatched)} cells in adata are missing from total; "
    "their labels would be dropped silently"
)
total.obs["cell.labels_progen"] = adata.obs["cell.labels"]

In [14]:
# Sanity check: per-label counts on the full object after the label transfer.
# Cells without a progenitor label (NaN) are excluded by groupby.
# `size()` counts rows per group directly instead of calling `len` on every
# group frame; `observed=True` keeps only labels that actually occur.
cell_numbers = total.obs.groupby(["cell.labels_progen"], observed=True).size()
cell_numbers

cell.labels_progen
ELP                        525
GMP                        362
HSC                        242
MEMP                       505
MEP                        639
MPP                       2012
early MK                    81
early erythroid            333
eo/baso/mast precursor      86
erythroid-MPP hybrid        14
macrophage                  81
myeloid DC progenitor       94
pDC progenitor              41
dtype: int64

In [15]:
# Number of cells per (fetal sample, progenitor label) pair, written to CSV.
# `size()` counts rows per group directly instead of calling `len` on every
# group frame; `observed=True` restricts the result to sample/label pairs that
# actually occur, so no zero-count rows are emitted for unused combinations.
cell_numbers = total.obs.groupby(["fetal.ids", "cell.labels_progen"], observed=True).size()
# The Series is unnamed, so the count column in the CSV is headed "0".
pd.DataFrame(cell_numbers).to_csv("/Users/b8058304/Documents/PhD_work/Coding/manuscript_figs/resources_for_pipelines/liver_progen_nrs_by_sample.csv")
cell_numbers

fetal.ids           cell.labels_progen    
F16_male_8+1PCW     ELP                        4
                    GMP                        3
                    HSC                        1
                    MEMP                       4
                    MEP                        9
                                              ..
F45_female_13+6PCW  eo/baso/mast precursor     8
                    erythroid-MPP hybrid       1
                    macrophage                18
                    myeloid DC progenitor     11
                    pDC progenitor             4
Length: 169, dtype: int64

In [16]:
# Persist the object with the new `cell.labels_progen` column.
# NOTE: this is the same path the object was read from, so the original file
# is overwritten in place.
total.write("/Users/b8058304/Documents/PhD_work/Coding/liver/data/fetal_liver_alladata_Copy1.h5ad")

# Save cell numbers for FBM

In [17]:
# Load the FBM object (stored under `bm_plus_19pcw`); only its obs table is
# used below, to count cells per label and per sample.
total = sc.read("/Users/b8058304/Documents/PhD_work/Coding/bm_plus_19pcw/data/bm_plus_19pcw_raw_dr_20200414.h5ad")

In [18]:
# Number of cells per label in the FBM object.
# `size()` counts the rows of each group directly instead of calling Python's
# `len` on every materialised group frame; `observed=True` keeps only labels
# that actually occur, so no rows are emitted for unused categories.
cell_numbers = total.obs.groupby(["cell.labels"], observed=True).size()
cell_numbers

cell.labels
CD4 T                  327
CD8 T                  171
CD14 monocyte         8787
CD56 bright NK         540
CMP                    425
                      ... 
schwann cells            9
sinusoidal EC          550
stromal macrophage    1493
tDC                    193
tip EC                 363
Length: 64, dtype: int64

In [19]:
# Number of cells per (fetal sample, label) pair, written to CSV.
# `size()` counts rows per group directly instead of calling `len` on every
# group frame; `observed=True` restricts the result to sample/label pairs that
# actually occur, so no zero-count rows are emitted for unused combinations.
cell_numbers = total.obs.groupby(["fetal.ids", "cell.labels"], observed=True).size()
# The Series is unnamed, so the count column in the CSV is headed "0".
pd.DataFrame(cell_numbers).to_csv("/Users/b8058304/Documents/PhD_work/Coding/manuscript_figs/resources_for_pipelines/fbm_progen_nrs_by_sample.csv")
cell_numbers

fetal.ids         cell.labels       
F21_male_16+2PCW  CD4 T                  12
                  CD8 T                  13
                  CD14 monocyte         217
                  CD56 bright NK         16
                  CMP                    19
                                       ... 
SB19PCW           promyelocyte          816
                  schwann cells           8
                  sinusoidal EC          42
                  stromal macrophage     40
                  tip EC                105
Length: 528, dtype: int64

# Save cell numbers for ABM

In [20]:
# Load the ABM object (stored under `adult_bm`); only its obs table is used
# below, to count cells per label and per sample.
total = sc.read("/Users/b8058304/Documents/PhD_work/Coding/adult_bm/data/adult_bm_raw_dr_20200311.h5ad")

In [21]:
# Number of cells per label in the ABM object.
# `size()` counts the rows of each group directly instead of calling Python's
# `len` on every materialised group frame; `observed=True` keeps only labels
# that actually occur, so no rows are emitted for unused categories.
cell_numbers = total.obs.groupby(["cell.labels"], observed=True).size()
cell_numbers

cell.labels
CD14 monocyte                   3094
CD16 monocyte                   1938
CD56 bright NK                  1228
CMP                              882
DC1                              135
DC2                              481
DC3                              550
EI macrophage                     77
ELP-B cell                        80
ELP-pDC                           63
GMP                              398
HSC                              862
MEMP                             505
MK                               577
MK progenitor                    280
MSC                              161
Pre B cell                       971
T reg                           6327
early MK                         136
early erythroid                 5441
immature B cell                 2728
interferon induced monocyte      576
late erythroid                  1150
mature CD8 T cell              15725
mature NK                       6074
memory B cell                   4106
memory CD4 T cell         

In [22]:
# Number of cells per (sample, label) pair, written to CSV.
# `size()` counts rows per group directly instead of calling `len` on every
# group frame; `observed=True` restricts the result to sample/label pairs that
# actually occur, so no zero-count rows are emitted for unused combinations.
cell_numbers = total.obs.groupby(["sample", "cell.labels"], observed=True).size()
# The Series is unnamed, so the count column in the CSV is headed "0".
pd.DataFrame(cell_numbers).to_csv("/Users/b8058304/Documents/PhD_work/Coding/manuscript_figs/resources_for_pipelines/abm_progen_nrs_by_sample.csv")
cell_numbers

sample     cell.labels        
MantonBM1  CD14 monocyte          614
           CD16 monocyte          244
           CD56 bright NK         240
           CMP                    195
           DC1                     55
                                 ... 
MantonBM6  pro B progenitor       313
           promyelocyte           544
           transitional B cell    204
           transitional DC         18
           transitional NK        130
Length: 180, dtype: int64

# Save cell numbers for CB

In [23]:
# Load the CB object (stored under `cord_blood`); only its obs table is used
# below, to count cells per label and per sample.
total = sc.read("/Users/b8058304/Documents/PhD_work/Coding/cord_blood/data/cord_blood_raw_dr_20200311.h5ad")

In [24]:
# Number of cells per label in the CB object.
# `size()` counts the rows of each group directly instead of calling Python's
# `len` on every materialised group frame; `observed=True` keeps only labels
# that actually occur, so no rows are emitted for unused categories.
cell_numbers = total.obs.groupby(["cell.labels"], observed=True).size()
cell_numbers

cell.labels
CD8 T cell          16345
CD14 monocyte       13324
CD16 monocyte         888
CD56 bright NK       4066
CMP                   272
DC1                    67
DC2                   155
DC precursor          169
GMP                   203
HSC                   194
ILC precursor        1519
MEMP                  338
MK                   1262
early MK              496
early erythroid       532
late erythroid        878
mature NK            7860
mid erythroid        2627
myelocyte            3726
naive B cell        19516
naive CD4 T cell    69338
neutrophil           3458
pDC                   242
preDC                 269
premonocyte           607
tDC                    91
dtype: int64

In [25]:
# Number of cells per (sample, label) pair, written to CSV.
# `size()` counts rows per group directly instead of calling `len` on every
# group frame; `observed=True` restricts the result to sample/label pairs that
# actually occur, so no zero-count rows are emitted for unused combinations.
cell_numbers = total.obs.groupby(["sample", "cell.labels"], observed=True).size()
# The Series is unnamed, so the count column in the CSV is headed "0".
pd.DataFrame(cell_numbers).to_csv("/Users/b8058304/Documents/PhD_work/Coding/manuscript_figs/resources_for_pipelines/cb_progen_nrs_by_sample.csv")
cell_numbers

sample     cell.labels   
MantonCB1  CD8 T cell        1739
           CD14 monocyte     5633
           CD16 monocyte      242
           CD56 bright NK     543
           CMP                 50
                             ... 
MantonCB6  neutrophil        1719
           pDC                 74
           preDC              146
           premonocyte        219
           tDC                 63
Length: 104, dtype: int64