### Notebook to format `AnnData` objects for `CellChat` cell-cell interaction (CCI) inference.

- **Developed by**: Carlos Talavera-López Ph.D
- **Institute of Computational Biology - Computational Health Centre - Helmholtz Munich**
- v230626

### Import required modules

In [None]:
import anndata
import numpy as np
import scipy as sp
import scanpy as sc
import pandas as pd

### Setting up working environment

In [None]:
# Raise scanpy's logging verbosity to level 3 and record the package versions
# used for this run.
sc.settings.verbosity = 3
sc.logging.print_versions()

# Figure defaults: on-screen resolution, saved-figure resolution, colour map,
# and SVG output with vector-friendly rendering enabled.
sc.settings.set_figure_params(
    dpi=200,
    dpi_save=300,
    color_map='RdPu',
    format='svg',
    vector_friendly=True,
)

### Read global epithelial object

In [None]:
# Load the input `.h5ad` file into an AnnData object; the bare `adata`
# expression at the end of the cell displays its summary.
adata = sc.read_h5ad('../../../data/Epithelial_MultiC_ctl230612_states.raw.h5ad')
adata

In [None]:
# Build a slimmed-down AnnData that carries over only the expression matrix
# (`X`), the per-cell annotations (`obs`) and the per-gene annotations (`var`)
# of the loaded object; no other slots of `adata` are passed along.
adata_new = anndata.AnnData(
    X=adata.X,
    obs=adata.obs,
    var=adata.var,
)
adata_new

### Make a subset of all populations

- Remove unwanted labels such as `nan` or doublets.

In [None]:
# List the categories of the categorical `fine_states` column in `obs`.
adata_new.obs['fine_states'].cat.categories

In [None]:
# Display the observation (row) index of the new object.
adata_new.obs_names

In [None]:
# Display the variable (column) index of the new object.
adata_new.var_names

### Subset per condition

In [None]:
# List the categories of the categorical `group` column; the subsets below
# select on these values.
adata_new.obs['group'].cat.categories

In [None]:
# Keep only the cells whose `group` is `healthy_ctrl`. `.copy()` materialises
# the slice as an independent AnnData instead of a view of `adata_new`, so
# later in-place preprocessing does not modify a view (anndata would otherwise
# have to convert it implicitly and emit an ImplicitModificationWarning).
adata_new_CTRL = adata_new[adata_new.obs['group'].isin(['healthy_ctrl'])].copy()
adata_new_CTRL

### Export CTRL

In [None]:
# Scale every cell to 1e6 total counts, then apply log(1 + x), both in place.
# NOTE(review): scanpy documents `normalize_per_cell` as deprecated in favour
# of `normalize_total`; the two are not drop-in equivalents, so confirm the
# downstream expectations before switching.
sc.pp.normalize_per_cell(adata_new_CTRL, counts_per_cell_after = 1e6)
sc.pp.log1p(adata_new_CTRL)
# Store the expression matrix as a SciPy CSC (column-compressed) sparse matrix
# before export — presumably for the R-side conversion; TODO confirm.
adata_new_CTRL.X = sp.sparse.csc_matrix(adata_new_CTRL.X)

In [None]:
# Write the processed control subset to disk.
# NOTE(review): the file name spells "anotated" with one "n"; left unchanged
# because downstream code may refer to this exact path.
adata_new_CTRL.write('../../../data/MultiC_Healthy-CTRL_anotated.h5ad')

### Export Conditions

In [None]:
# List the `group` categories again to pick the condition to export.
adata_new.obs['group'].cat.categories

In [None]:
# Keep only the cells whose `group` is `copd_iav`. `.copy()` turns the slice
# into an independent AnnData rather than a view of `adata_new`, so the
# in-place steps below do not modify a view (anndata would otherwise have to
# convert it implicitly and emit an ImplicitModificationWarning).
adata_new_COND = adata_new[adata_new.obs['group'].isin(['copd_iav'])].copy()

# Scale every cell to 1e6 total counts, then apply log(1 + x), both in place.
sc.pp.normalize_per_cell(adata_new_COND, counts_per_cell_after = 1e6)
sc.pp.log1p(adata_new_COND)

# Store the expression matrix as a SciPy CSC (column-compressed) sparse matrix
# before export, then display the object summary.
adata_new_COND.X = sp.sparse.csc_matrix(adata_new_COND.X)
adata_new_COND

In [None]:
# Write the processed `copd_iav` subset to disk.
# NOTE(review): this file name uses the prefix "Mixed_" whereas the control
# export uses "MultiC_", and "anotated" is spelled with one "n" — confirm both
# are intended before renaming, since downstream code may rely on this path.
adata_new_COND.write('../../../data/Mixed_COPD-IAV_anotated.h5ad')