In [None]:
import scanpy as sc
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns; sns.set(color_codes=True)
from pathlib import Path

# scanpy logging level: errors (0), warnings (1), info (2), hints (3).
sc.settings.verbosity = 3

# Figure defaults applied to the plots in this notebook:
# dpi for rendered figures, dpi_save for figures written to disk, and the colour map.
figure_defaults = dict(dpi=80, dpi_save=300, color_map='viridis')
sc.settings.set_figure_params(**figure_defaults)

In [None]:
# First input object, read from its .h5ad file.
# NOTE(review): absolute, user-specific path — the notebook only runs where this file exists.
data1_path = '/home/jovyan/YS_project/YS/Data_objects/YS_object_14092021/Combined_YS_Fliver_20210929.h5ad'
data1 = sc.read(data1_path)

# Display the AnnData summary of the loaded object.
data1

In [None]:
# Second input object (gastrulation dataset), read from its .h5ad file.
# NOTE(review): absolute, user-specific path — the notebook only runs where this file exists.
data2_path = '/home/jovyan/wgeted_files/gastrulation.h5ad'
data2 = sc.read(data2_path)

# Display the AnnData summary of the loaded object.
data2

In [None]:
# Keep only the cells labelled 'YS Endoderm_Yolk Sac_gastrulation' in `corr_concat`.
# Boolean indexing of an AnnData returns a *view*; the notebook later writes a new
# column into `data2.obs`, which on a view triggers an implicit copy and an
# ImplicitModificationWarning. Taking an explicit copy here makes `data2` an
# independent object that is safe to modify.
data2 = data2[data2.obs['corr_concat'].isin(['YS Endoderm_Yolk Sac_gastrulation'])].copy()

In [None]:
# Give both datasets a shared label column, `celltypes_for_dotplot`, filled from the
# annotation column each dataset already carries. The shared name lets the merged
# object be filtered and grouped with a single key.
for dataset, label_column in ((data1, 'broad_cell_labels_organ'), (data2, 'corr_concat')):
    dataset.obs['celltypes_for_dotplot'] = dataset.obs[label_column]

In [None]:
# Merge the two datasets into a single AnnData.
#   join='inner'          -> inner join of the two objects' variables
#   batch_categories=None -> no custom batch labels are supplied
#   index_unique=None     -> no suffix is added to make cell names unique
# NOTE(review): with index_unique=None, cell names shared by both inputs would stay
# duplicated in the merged object — confirm the inputs do not overlap.
adata_list = [data1, data2]
adata = adata_list[0].concatenate(
    *adata_list[1:],
    join='inner',
    batch_categories=None,
    index_unique=None,
)

In [None]:
# Labels (in `celltypes_for_dotplot`) of the three populations compared in the dot plots.
cells_to_keep = ['Endoderm_ys', 'Hepatocyte_fliv', 'YS Endoderm_Yolk Sac_gastrulation']

# Restrict the merged object to those populations. Boolean indexing returns a view;
# the preprocessing cells that follow modify `adata` in place, so take an explicit
# copy here instead of relying on an implicit copy-on-modify (and its warnings).
adata = adata[adata.obs['celltypes_for_dotplot'].isin(cells_to_keep)].copy()

# Number of cells per retained label. `value_counts` counts the column directly,
# avoiding a Python-level `groupby(...).apply(len)` over sub-frames (an apply that
# includes the grouping column is deprecated in recent pandas).
# Rows are ordered by count rather than by label.
adata.obs['celltypes_for_dotplot'].value_counts()

In [None]:
# Display the AnnData summary of the merged, filtered object as a sanity check.
adata

# Pre-Process data

In [None]:
# Normalise the counts of every cell; `adata` is modified in place (the return value is not used).
# No `target_sum` is passed, so scanpy's default per-cell target is used.
# NOTE(review): assumes adata.X still holds raw counts for both input datasets — TODO confirm.
sc.pp.normalize_total(adata)

In [None]:
# Log-transform the normalised values with log1p; `adata` is modified in place.
# NOTE(review): re-running this cell without re-running the cells above would
# log-transform the data a second time.
sc.pp.log1p(adata)

In [None]:
# Scale the data, capping scaled values at max_value=10.
sc.pp.scale(adata, max_value=10)

# After normalising, logging and scaling, adata.X contains negative values.
# Replace every negative entry with zero and leave all other entries untouched.
is_negative = adata.X < 0
adata.X = np.where(is_negative, 0, adata.X)
del is_negative  # the mask is as large as adata.X; do not keep it in the kernel

# Plot

In [None]:
# Order in which the groups are arranged in the dot plots.
dotplot_group_order = ['Endoderm_ys', 'YS Endoderm_Yolk Sac_gastrulation', 'Hepatocyte_fliv']

# Make the label column categorical and impose that order.
# reorder_categories raises if the column's categories are not exactly this set.
adata.obs["celltypes_for_dotplot"] = (
    adata.obs["celltypes_for_dotplot"]
    .astype('category')
    .cat.reorder_categories(dotplot_group_order)
)

In [None]:
# Gene symbols shown in the coagulation-factor dot plot, in plotting order.
# 'F9' is intentionally left out: it is not in this data.
Coagulation_factors = [
    "FGA", "FGB", "FGG",
    "F2", "F2R", "F3", "F5", "F7",
    "F10", "F11", "F12", "F13A1", "F13B",
    "KLKB1", "KNG1",
    "SERPINC1", "SERPIND1",
    "PROC", "PROS1",
]

In [None]:
# Gene symbols shown in the second dot plot, in plotting order.
# 'A1BG' was disabled in the original list and stays excluded here.
DEG_of_interest = [
    "MIF", "LGALS3", "LY6E", "PRSS3",
    "CLDN7", "GSTA2", "PPDPF", "TMSB10",
    "SERPINA4", "SERPINA5", "SERPINF2", "SERPING1",
    "ADH1A", "ADH6", "ALDOB", "ALDH1A1",
    "APOH", "CYP3A7", "CYP4A11", "CYP27A1",
    "ITIH1", "ITIH2", "GC", "ALB",
    "F12", "CPB2",
]

In [None]:
# List the variables of the merged object whose names begin with "A1".
# NOTE(review): presumably a check for A1BG, which is disabled in DEG_of_interest — confirm.
adata.var[adata.var_names.str.startswith("A1")]

In [None]:
# List the variables of the first input dataset whose names begin with "A1".
data1.var[data1.var_names.str.startswith("A1")]

In [None]:
# List the variables of the second input dataset whose names begin with "A1".
data2.var[data2.var_names.str.startswith("A1")]

In [None]:
# Dot plot of the coagulation-factor genes, grouped by `celltypes_for_dotplot`.
# use_raw=False plots the processed values in adata.X rather than adata.raw;
# `save` asks scanpy to write the figure to disk using this file-name suffix.
sc.pl.dotplot(
    adata,
    var_names=Coagulation_factors,
    groupby='celltypes_for_dotplot',
    swap_axes=False,
    figsize=(8, 2.5),
    use_raw=False,
    save='ext4e_with_gastrulation.pdf',
)

In [None]:
# Dot plot of the genes in DEG_of_interest, grouped by `celltypes_for_dotplot`.
# use_raw=False plots the processed values in adata.X rather than adata.raw;
# `save` asks scanpy to write the figure to disk using this file-name suffix.
sc.pl.dotplot(
    adata,
    var_names=DEG_of_interest,
    groupby='celltypes_for_dotplot',
    swap_axes=False,
    figsize=(10, 2.5),
    use_raw=False,
    save='ext4f_with_gastrulation.pdf',
)