In [3]:
import scanpy as sc
import numpy as np
import scipy as sp
import pandas as pd
import matplotlib.pyplot as plt
from matplotlib import rcParams
from matplotlib import colors
import seaborn as sb
import rpy2.rinterface_lib.callbacks
import logging
import scrublet as scr
from rpy2.robjects import pandas2ri
import anndata2ri

In [4]:
# Notebook-wide configuration: R bridge (rpy2), plotting defaults and scanpy logging.

# Raise the rpy2 callback logger to ERROR so that R warning messages are hidden.
# Note: comment this line out to get more verbose R output.
rpy2.rinterface_lib.callbacks.logger.setLevel(logging.ERROR)

# Automatically convert rpy2 outputs to pandas dataframes
# (anndata2ri presumably does the same for AnnData objects - TODO confirm).
pandas2ri.activate()
anndata2ri.activate()
# Load the rpy2 IPython extension. Running this cell again in the same kernel
# only prints an "already loaded" notice, as the saved output of this cell shows.
%load_ext rpy2.ipython

plt.rcParams['figure.figsize']=(8,8) # default figure size for all plots
sc.settings.verbosity = 3
# Optional higher-resolution figure settings, currently disabled:
#sc.set_figure_params(dpi=200, dpi_save=300)
# Print the versions of scanpy and its main dependencies for reproducibility.
sc.logging.print_header()

The rpy2.ipython extension is already loaded. To reload it, use:
  %reload_ext rpy2.ipython
scanpy==1.7.2 anndata==0.7.6 umap==0.5.1 numpy==1.19.5 scipy==1.6.3 pandas==1.2.4 scikit-learn==0.24.2 statsmodels==0.12.2 python-igraph==0.9.1 louvain==0.7.0


## Ptz5

In [5]:
# Annotate and export the two ileum biopsies (involved / uninvolved) of patient Ptz5.
# Each 10x count matrix is read, tagged with per-cell metadata in .obs and
# written to its own .h5ad file. Samples are handled one at a time, so only
# one count matrix is held in memory.
# NOTE(review): the Blood sample was commented out in the original cell and is
# not exported here - confirm that it is intentionally excluded.
ibd_counts_dir = "/mnt/lugli/spuccio/SP028_Autoimmunity/Cariplo/IBD_counts"
patient_no = "5"

# (input sub-directory / output file stem, value stored in obs['CellType'])
for tissue_state, cell_type in (("Ileum_Involved", "Involved"),
                                ("Ileum_Uninvolved", "UnInvolved")):
    sample = sc.read_10x_mtx(f"{ibd_counts_dir}/Ptz_{patient_no}_IBD/{tissue_state}/")

    # Columns are added in the same order as before: CellId first, dataset last.
    sample.obs['CellId'] = sample.obs.index  # keep the obs index as an explicit column
    # NOTE(review): the Tumor* column names presumably follow a schema shared
    # with tumor datasets - confirm before renaming.
    sample.obs['CellFromTumor'] = "Autoimmune"
    sample.obs['PatientNumber'] = f"Ptz{patient_no}"
    sample.obs['TumorType'] = "IBD"
    sample.obs['TumorSite'] = "Ileum"
    sample.obs['CellType'] = cell_type
    sample.obs['dataset'] = "GSE134809"

    sample.write(f"{ibd_counts_dir}/h5files/Ptz_{patient_no}_{tissue_state}.h5ad")
    del sample  # release the matrix before the next sample is read

--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical


## Ptz7

In [6]:
# Annotate and export the two ileum biopsies (involved / uninvolved) of patient Ptz7.
# Each 10x count matrix is read, tagged with per-cell metadata in .obs and
# written to its own .h5ad file. Samples are handled one at a time, so only
# one count matrix is held in memory.
# NOTE(review): the Blood sample was commented out in the original cell and is
# not exported here - confirm that it is intentionally excluded.
ibd_counts_dir = "/mnt/lugli/spuccio/SP028_Autoimmunity/Cariplo/IBD_counts"
patient_no = "7"

# (input sub-directory / output file stem, value stored in obs['CellType'])
for tissue_state, cell_type in (("Ileum_Involved", "Involved"),
                                ("Ileum_Uninvolved", "UnInvolved")):
    sample = sc.read_10x_mtx(f"{ibd_counts_dir}/Ptz_{patient_no}_IBD/{tissue_state}/")

    # Columns are added in the same order as before: CellId first, dataset last.
    sample.obs['CellId'] = sample.obs.index  # keep the obs index as an explicit column
    # NOTE(review): the Tumor* column names presumably follow a schema shared
    # with tumor datasets - confirm before renaming.
    sample.obs['CellFromTumor'] = "Autoimmune"
    sample.obs['PatientNumber'] = f"Ptz{patient_no}"
    sample.obs['TumorType'] = "IBD"
    sample.obs['TumorSite'] = "Ileum"
    sample.obs['CellType'] = cell_type
    sample.obs['dataset'] = "GSE134809"

    sample.write(f"{ibd_counts_dir}/h5files/Ptz_{patient_no}_{tissue_state}.h5ad")
    del sample  # release the matrix before the next sample is read

--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical


## Ptz8

In [7]:
# Annotate and export the two ileum biopsies (involved / uninvolved) of patient Ptz8.
# Each 10x count matrix is read, tagged with per-cell metadata in .obs and
# written to its own .h5ad file. Samples are handled one at a time, so only
# one count matrix is held in memory.
# NOTE(review): the Blood sample was commented out in the original cell and is
# not exported here - confirm that it is intentionally excluded.
ibd_counts_dir = "/mnt/lugli/spuccio/SP028_Autoimmunity/Cariplo/IBD_counts"
patient_no = "8"

# (input sub-directory / output file stem, value stored in obs['CellType'])
for tissue_state, cell_type in (("Ileum_Involved", "Involved"),
                                ("Ileum_Uninvolved", "UnInvolved")):
    sample = sc.read_10x_mtx(f"{ibd_counts_dir}/Ptz_{patient_no}_IBD/{tissue_state}/")

    # Columns are added in the same order as before: CellId first, dataset last.
    sample.obs['CellId'] = sample.obs.index  # keep the obs index as an explicit column
    # NOTE(review): the Tumor* column names presumably follow a schema shared
    # with tumor datasets - confirm before renaming.
    sample.obs['CellFromTumor'] = "Autoimmune"
    sample.obs['PatientNumber'] = f"Ptz{patient_no}"
    sample.obs['TumorType'] = "IBD"
    sample.obs['TumorSite'] = "Ileum"
    sample.obs['CellType'] = cell_type
    sample.obs['dataset'] = "GSE134809"

    sample.write(f"{ibd_counts_dir}/h5files/Ptz_{patient_no}_{tissue_state}.h5ad")
    del sample  # release the matrix before the next sample is read

--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical


## Ptz10

In [8]:
# Annotate and export the two ileum biopsies (involved / uninvolved) of patient Ptz10.
# Each 10x count matrix is read, tagged with per-cell metadata in .obs and
# written to its own .h5ad file. Samples are handled one at a time, so only
# one count matrix is held in memory.
# NOTE(review): the Blood sample was commented out in the original cell and is
# not exported here - confirm that it is intentionally excluded.
ibd_counts_dir = "/mnt/lugli/spuccio/SP028_Autoimmunity/Cariplo/IBD_counts"
patient_no = "10"

# (input sub-directory / output file stem, value stored in obs['CellType'])
for tissue_state, cell_type in (("Ileum_Involved", "Involved"),
                                ("Ileum_Uninvolved", "UnInvolved")):
    sample = sc.read_10x_mtx(f"{ibd_counts_dir}/Ptz_{patient_no}_IBD/{tissue_state}/")

    # Columns are added in the same order as before: CellId first, dataset last.
    sample.obs['CellId'] = sample.obs.index  # keep the obs index as an explicit column
    # NOTE(review): the Tumor* column names presumably follow a schema shared
    # with tumor datasets - confirm before renaming.
    sample.obs['CellFromTumor'] = "Autoimmune"
    sample.obs['PatientNumber'] = f"Ptz{patient_no}"
    sample.obs['TumorType'] = "IBD"
    sample.obs['TumorSite'] = "Ileum"
    sample.obs['CellType'] = cell_type
    sample.obs['dataset'] = "GSE134809"

    sample.write(f"{ibd_counts_dir}/h5files/Ptz_{patient_no}_{tissue_state}.h5ad")
    del sample  # release the matrix before the next sample is read

--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical


## Ptz11

In [9]:
# Annotate and export the two ileum biopsies (involved / uninvolved) of patient Ptz11.
# Each 10x count matrix is read, tagged with per-cell metadata in .obs and
# written to its own .h5ad file. Samples are handled one at a time, so only
# one count matrix is held in memory.
# NOTE(review): the Blood sample was commented out in the original cell and is
# not exported here - confirm that it is intentionally excluded.
ibd_counts_dir = "/mnt/lugli/spuccio/SP028_Autoimmunity/Cariplo/IBD_counts"
patient_no = "11"

# (input sub-directory / output file stem, value stored in obs['CellType'])
for tissue_state, cell_type in (("Ileum_Involved", "Involved"),
                                ("Ileum_Uninvolved", "UnInvolved")):
    sample = sc.read_10x_mtx(f"{ibd_counts_dir}/Ptz_{patient_no}_IBD/{tissue_state}/")

    # Columns are added in the same order as before: CellId first, dataset last.
    sample.obs['CellId'] = sample.obs.index  # keep the obs index as an explicit column
    # NOTE(review): the Tumor* column names presumably follow a schema shared
    # with tumor datasets - confirm before renaming.
    sample.obs['CellFromTumor'] = "Autoimmune"
    sample.obs['PatientNumber'] = f"Ptz{patient_no}"
    sample.obs['TumorType'] = "IBD"
    sample.obs['TumorSite'] = "Ileum"
    sample.obs['CellType'] = cell_type
    sample.obs['dataset'] = "GSE134809"

    sample.write(f"{ibd_counts_dir}/h5files/Ptz_{patient_no}_{tissue_state}.h5ad")
    del sample  # release the matrix before the next sample is read

--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical


## Ptz12

In [10]:
# Annotate and export the two ileum biopsies (involved / uninvolved) of patient Ptz12.
# Each 10x count matrix is read, tagged with per-cell metadata in .obs and
# written to its own .h5ad file. Samples are handled one at a time, so only
# one count matrix is held in memory.
# NOTE(review): the Blood sample was commented out in the original cell and is
# not exported here - confirm that it is intentionally excluded.
ibd_counts_dir = "/mnt/lugli/spuccio/SP028_Autoimmunity/Cariplo/IBD_counts"
patient_no = "12"

# (input sub-directory / output file stem, value stored in obs['CellType'])
for tissue_state, cell_type in (("Ileum_Involved", "Involved"),
                                ("Ileum_Uninvolved", "UnInvolved")):
    sample = sc.read_10x_mtx(f"{ibd_counts_dir}/Ptz_{patient_no}_IBD/{tissue_state}/")

    # Columns are added in the same order as before: CellId first, dataset last.
    sample.obs['CellId'] = sample.obs.index  # keep the obs index as an explicit column
    # NOTE(review): the Tumor* column names presumably follow a schema shared
    # with tumor datasets - confirm before renaming.
    sample.obs['CellFromTumor'] = "Autoimmune"
    sample.obs['PatientNumber'] = f"Ptz{patient_no}"
    sample.obs['TumorType'] = "IBD"
    sample.obs['TumorSite'] = "Ileum"
    sample.obs['CellType'] = cell_type
    sample.obs['dataset'] = "GSE134809"

    sample.write(f"{ibd_counts_dir}/h5files/Ptz_{patient_no}_{tissue_state}.h5ad")
    del sample  # release the matrix before the next sample is read

--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical


## Ptz13

In [11]:
# Annotate and export the two ileum biopsies (involved / uninvolved) of patient Ptz13.
# Each 10x count matrix is read, tagged with per-cell metadata in .obs and
# written to its own .h5ad file. Samples are handled one at a time, so only
# one count matrix is held in memory.
ibd_counts_dir = "/mnt/lugli/spuccio/SP028_Autoimmunity/Cariplo/IBD_counts"
patient_no = "13"

# (input sub-directory / output file stem, value stored in obs['CellType'])
for tissue_state, cell_type in (("Ileum_Involved", "Involved"),
                                ("Ileum_Uninvolved", "UnInvolved")):
    sample = sc.read_10x_mtx(f"{ibd_counts_dir}/Ptz_{patient_no}_IBD/{tissue_state}/")

    # Columns are added in the same order as before: CellId first, dataset last.
    sample.obs['CellId'] = sample.obs.index  # keep the obs index as an explicit column
    # NOTE(review): the Tumor* column names presumably follow a schema shared
    # with tumor datasets - confirm before renaming.
    sample.obs['CellFromTumor'] = "Autoimmune"
    sample.obs['PatientNumber'] = f"Ptz{patient_no}"
    sample.obs['TumorType'] = "IBD"
    sample.obs['TumorSite'] = "Ileum"
    sample.obs['CellType'] = cell_type
    sample.obs['dataset'] = "GSE134809"

    sample.write(f"{ibd_counts_dir}/h5files/Ptz_{patient_no}_{tissue_state}.h5ad")
    del sample  # release the matrix before the next sample is read

--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical


## Ptz14

In [12]:
# Annotate and export the two ileum biopsies (involved / uninvolved) of patient Ptz14.
# Each 10x count matrix is read, tagged with per-cell metadata in .obs and
# written to its own .h5ad file. Samples are handled one at a time, so only
# one count matrix is held in memory.
# NOTE(review): the Blood sample was commented out in the original cell and is
# not exported here - confirm that it is intentionally excluded.
ibd_counts_dir = "/mnt/lugli/spuccio/SP028_Autoimmunity/Cariplo/IBD_counts"
patient_no = "14"

# (input sub-directory / output file stem, value stored in obs['CellType'])
for tissue_state, cell_type in (("Ileum_Involved", "Involved"),
                                ("Ileum_Uninvolved", "UnInvolved")):
    sample = sc.read_10x_mtx(f"{ibd_counts_dir}/Ptz_{patient_no}_IBD/{tissue_state}/")

    # Columns are added in the same order as before: CellId first, dataset last.
    sample.obs['CellId'] = sample.obs.index  # keep the obs index as an explicit column
    # NOTE(review): the Tumor* column names presumably follow a schema shared
    # with tumor datasets - confirm before renaming.
    sample.obs['CellFromTumor'] = "Autoimmune"
    sample.obs['PatientNumber'] = f"Ptz{patient_no}"
    sample.obs['TumorType'] = "IBD"
    sample.obs['TumorSite'] = "Ileum"
    sample.obs['CellType'] = cell_type
    sample.obs['dataset'] = "GSE134809"

    sample.write(f"{ibd_counts_dir}/h5files/Ptz_{patient_no}_{tissue_state}.h5ad")
    del sample  # release the matrix before the next sample is read

--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical


## Ptz15

In [13]:
# Annotate and export the two ileum biopsies (involved / uninvolved) of patient Ptz15.
# Each 10x count matrix is read, tagged with per-cell metadata in .obs and
# written to its own .h5ad file. Samples are handled one at a time, so only
# one count matrix is held in memory.
# NOTE(review): the Blood sample was commented out in the original cell and is
# not exported here - confirm that it is intentionally excluded.
ibd_counts_dir = "/mnt/lugli/spuccio/SP028_Autoimmunity/Cariplo/IBD_counts"
patient_no = "15"

# (input sub-directory / output file stem, value stored in obs['CellType'])
for tissue_state, cell_type in (("Ileum_Involved", "Involved"),
                                ("Ileum_Uninvolved", "UnInvolved")):
    sample = sc.read_10x_mtx(f"{ibd_counts_dir}/Ptz_{patient_no}_IBD/{tissue_state}/")

    # Columns are added in the same order as before: CellId first, dataset last.
    sample.obs['CellId'] = sample.obs.index  # keep the obs index as an explicit column
    # NOTE(review): the Tumor* column names presumably follow a schema shared
    # with tumor datasets - confirm before renaming.
    sample.obs['CellFromTumor'] = "Autoimmune"
    sample.obs['PatientNumber'] = f"Ptz{patient_no}"
    sample.obs['TumorType'] = "IBD"
    sample.obs['TumorSite'] = "Ileum"
    sample.obs['CellType'] = cell_type
    sample.obs['dataset'] = "GSE134809"

    sample.write(f"{ibd_counts_dir}/h5files/Ptz_{patient_no}_{tissue_state}.h5ad")
    del sample  # release the matrix before the next sample is read

--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical


## Ptz16

In [14]:
# Annotate and export the two ileum biopsies (involved / uninvolved) of patient Ptz16.
# Each 10x count matrix is read, tagged with per-cell metadata in .obs and
# written to its own .h5ad file. Samples are handled one at a time, so only
# one count matrix is held in memory.
ibd_counts_dir = "/mnt/lugli/spuccio/SP028_Autoimmunity/Cariplo/IBD_counts"
patient_no = "16"

# (input sub-directory / output file stem, value stored in obs['CellType'])
for tissue_state, cell_type in (("Ileum_Involved", "Involved"),
                                ("Ileum_Uninvolved", "UnInvolved")):
    sample = sc.read_10x_mtx(f"{ibd_counts_dir}/Ptz_{patient_no}_IBD/{tissue_state}/")

    # Columns are added in the same order as before: CellId first, dataset last.
    sample.obs['CellId'] = sample.obs.index  # keep the obs index as an explicit column
    # NOTE(review): the Tumor* column names presumably follow a schema shared
    # with tumor datasets - confirm before renaming.
    sample.obs['CellFromTumor'] = "Autoimmune"
    sample.obs['PatientNumber'] = f"Ptz{patient_no}"
    sample.obs['TumorType'] = "IBD"
    sample.obs['TumorSite'] = "Ileum"
    sample.obs['CellType'] = cell_type
    sample.obs['dataset'] = "GSE134809"

    sample.write(f"{ibd_counts_dir}/h5files/Ptz_{patient_no}_{tissue_state}.h5ad")
    del sample  # release the matrix before the next sample is read

--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
--> This might be very slow. Consider passing `cache=True`, which enables much faster reading from a cache file.
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical
... storing 'CellFromTumor' as categorical
... storing 'PatientNumber' as categorical
... storing 'TumorType' as categorical
... storing 'TumorSite' as categorical
... storing 'CellType' as categorical
... storing 'dataset' as categorical
