# Find MitoCarta mitochondrial genes missing from each dataset

In [1]:
import scanpy as sc
import anndata as ad
import pandas as pd
import numpy as np

#### First trimester single cell

In [7]:
# Load the annotated first-trimester single-cell dataset (path is relative to the working directory)
adata = ad.read_h5ad('vt_22.04_annotated.h5ad')

In [8]:
# Read the MitoCarta table from disk
mt_df = pd.read_csv("./MitoCarta_full_transformed.csv")

# Distinct values of the 'Gene' column, in order of first appearance
mt_genes = pd.unique(mt_df['Gene'])

# Plain Python list of those gene symbols
mt_list = mt_genes.tolist()

In [9]:
# Number of distinct gene symbols taken from the MitoCarta table
len(mt_list)

1136

In [10]:
# Keep, in MitoCarta order, every gene symbol with no exact match in adata.var_names
missing_genes = list(filter(lambda symbol: symbol not in adata.var_names, mt_list))
missing_genes

['FASTKD5',
 'GARS1',
 'KARS1',
 'MARS2',
 'MRPL53',
 'MYG1',
 'MT-ATP6',
 'MT-ATP8',
 'MT-CO1',
 'MT-CO2',
 'MT-CO3',
 'MT-CYB',
 'MT-ND1',
 'MT-ND2',
 'MT-ND3',
 'MT-ND4',
 'MT-ND4L',
 'MT-ND5',
 'MT-ND6',
 'ACOD1',
 'ACSM4',
 'CYP11B1',
 'CYP11B2',
 'FTMT',
 'GLYAT',
 'GPX1',
 'HTD2',
 'MTARC1',
 'MTARC2',
 'OXCT2',
 'PDHA2',
 'PRODH',
 'SLC25A31',
 'SLC25A52',
 'MARCHF5',
 'RTL10',
 'SPATA19',
 'ATP5MF-PTCD1',
 'MCCD1',
 'RP11_469A15.2']

In [11]:
# Number of MitoCarta gene symbols not found in adata.var_names
len(missing_genes)

40

#### Third trimester single cell

In [2]:
# Load the annotated third-trimester single-cell dataset (path is relative to the working directory)
adata = ad.read_h5ad('./yang_24.06_annotated.h5ad')

In [3]:
# Read the MitoCarta table from disk
mt_df = pd.read_csv("./MitoCarta_full_transformed.csv")

# Distinct values of the 'Gene' column, in order of first appearance
mt_genes = pd.unique(mt_df['Gene'])

# Plain Python list of those gene symbols
mt_list = mt_genes.tolist()

In [4]:
# Number of distinct gene symbols taken from the MitoCarta table
len(mt_list)

1136

In [5]:
# Keep, in MitoCarta order, every gene symbol with no exact match in adata.var_names
missing_genes = list(filter(lambda symbol: symbol not in adata.var_names, mt_list))
missing_genes

['GARS1',
 'KARS1',
 'MARS2',
 'MYG1',
 'MT-ATP6',
 'MT-ATP8',
 'MT-CO1',
 'MT-CO2',
 'MT-CO3',
 'MT-CYB',
 'MT-ND1',
 'MT-ND2',
 'MT-ND3',
 'MT-ND4',
 'MT-ND4L',
 'MT-ND5',
 'MT-ND6',
 'ACSM2B',
 'ACSM4',
 'AGXT2',
 'CYP11B1',
 'CYP11B2',
 'FABP1',
 'FTMT',
 'GLYAT',
 'GPX1',
 'HAO2',
 'HTD2',
 'LIPT1',
 'MTARC1',
 'MTARC2',
 'OXCT2',
 'PDHA2',
 'PDP2',
 'PRODH',
 'SLC25A31',
 'SLC25A41',
 'SLC25A52',
 'SLC25A18',
 'SLC25A48',
 'SPHKAP',
 'MARCHF5',
 'SPATA19',
 'ATP5MF-PTCD1',
 'MCCD1',
 'RP11_469A15.2']

In [6]:
# Number of MitoCarta gene symbols not found in adata.var_names
len(missing_genes)

46

#### First trimester spatial

In [13]:
# Load the annotated first-trimester spatial dataset (path is relative to the working directory).
# Uses anndata's reader directly, as the single-cell sections of this notebook do;
# scanpy's read_h5ad is a re-export of the same anndata function.
adata = ad.read_h5ad('./Spatial/spatial1_annotated.h5ad')

In [14]:
# Read the MitoCarta table from disk
mt_df = pd.read_csv("./MitoCarta_full_transformed.csv")

# Distinct values of the 'Gene' column, in order of first appearance
mt_genes = pd.unique(mt_df['Gene'])

# Plain Python list of those gene symbols
mt_list = mt_genes.tolist()

In [15]:
# Number of distinct gene symbols taken from the MitoCarta table
len(mt_list)

1136

In [16]:
# Keep, in MitoCarta order, every gene symbol with no exact match in adata.var_names
missing_genes = list(filter(lambda symbol: symbol not in adata.var_names, mt_list))
missing_genes

['ATAD3A',
 'ATAD3B',
 'GARS1',
 'KARS1',
 'METTL15',
 'METTL5',
 'MPV17L2',
 'MRPL1',
 'MRPL10',
 'MRPL11',
 'MRPL12',
 'MRPL13',
 'MRPL14',
 'MRPL15',
 'MRPL16',
 'MRPL17',
 'MRPL18',
 'MRPL19',
 'MRPL2',
 'MRPL20',
 'MRPL21',
 'MRPL22',
 'MRPL23',
 'MRPL24',
 'MRPL27',
 'MRPL28',
 'MRPL3',
 'MRPL30',
 'MRPL32',
 'MRPL33',
 'MRPL34',
 'MRPL35',
 'MRPL36',
 'MRPL37',
 'MRPL38',
 'MRPL39',
 'MRPL4',
 'MRPL40',
 'MRPL41',
 'MRPL42',
 'MRPL43',
 'MRPL44',
 'MRPL45',
 'MRPL46',
 'MRPL47',
 'MRPL48',
 'MRPL49',
 'MRPL50',
 'MRPL51',
 'MRPL52',
 'MRPL53',
 'MRPL54',
 'MRPL55',
 'MRPL57',
 'MRPL58',
 'MRPL9',
 'MRPS10',
 'MRPS11',
 'MRPS12',
 'MRPS14',
 'MRPS15',
 'MRPS16',
 'MRPS17',
 'MRPS18A',
 'MRPS18B',
 'MRPS18C',
 'MRPS2',
 'MRPS21',
 'MRPS22',
 'MRPS23',
 'MRPS24',
 'MRPS25',
 'MRPS26',
 'MRPS27',
 'MRPS28',
 'MRPS30',
 'MRPS31',
 'MRPS33',
 'MRPS34',
 'MRPS35',
 'MRPS36',
 'MRPS5',
 'MRPS6',
 'MRPS7',
 'MRPS9',
 'MYG1',
 'PNPT1',
 'PTCD3',
 'TFAM',
 'TRMT1',
 'PMPCA',
 'TOMM20L',
 '

In [17]:
# Number of MitoCarta gene symbols not found in adata.var_names
len(missing_genes)

197

#### Third trimester spatial

In [19]:
# Load the annotated third-trimester spatial dataset (path is relative to the working directory).
# Uses anndata's reader directly, as the single-cell sections of this notebook do;
# scanpy's read_h5ad is a re-export of the same anndata function.
adata = ad.read_h5ad('./Spatial/spatial3_annotated.h5ad')

In [20]:
# Read the MitoCarta table from disk
mt_df = pd.read_csv("./MitoCarta_full_transformed.csv")

# Distinct values of the 'Gene' column, in order of first appearance
mt_genes = pd.unique(mt_df['Gene'])

# Plain Python list of those gene symbols
mt_list = mt_genes.tolist()

In [21]:
# Number of distinct gene symbols taken from the MitoCarta table
len(mt_list)

1136

In [22]:
# Keep, in MitoCarta order, every gene symbol with no exact match in adata.var_names
missing_genes = list(filter(lambda symbol: symbol not in adata.var_names, mt_list))
missing_genes

['ATAD3A',
 'ATAD3B',
 'GARS1',
 'KARS1',
 'METTL15',
 'METTL5',
 'MPV17L2',
 'MRPL1',
 'MRPL10',
 'MRPL11',
 'MRPL12',
 'MRPL13',
 'MRPL14',
 'MRPL15',
 'MRPL16',
 'MRPL17',
 'MRPL18',
 'MRPL19',
 'MRPL2',
 'MRPL20',
 'MRPL21',
 'MRPL22',
 'MRPL23',
 'MRPL24',
 'MRPL27',
 'MRPL28',
 'MRPL3',
 'MRPL30',
 'MRPL32',
 'MRPL33',
 'MRPL34',
 'MRPL35',
 'MRPL36',
 'MRPL37',
 'MRPL38',
 'MRPL39',
 'MRPL4',
 'MRPL40',
 'MRPL41',
 'MRPL42',
 'MRPL43',
 'MRPL44',
 'MRPL45',
 'MRPL46',
 'MRPL47',
 'MRPL48',
 'MRPL49',
 'MRPL50',
 'MRPL51',
 'MRPL52',
 'MRPL53',
 'MRPL54',
 'MRPL55',
 'MRPL57',
 'MRPL58',
 'MRPL9',
 'MRPS10',
 'MRPS11',
 'MRPS12',
 'MRPS14',
 'MRPS15',
 'MRPS16',
 'MRPS17',
 'MRPS18A',
 'MRPS18B',
 'MRPS18C',
 'MRPS2',
 'MRPS21',
 'MRPS22',
 'MRPS23',
 'MRPS24',
 'MRPS25',
 'MRPS26',
 'MRPS27',
 'MRPS28',
 'MRPS30',
 'MRPS31',
 'MRPS33',
 'MRPS34',
 'MRPS35',
 'MRPS36',
 'MRPS5',
 'MRPS6',
 'MRPS7',
 'MRPS9',
 'MYG1',
 'PNPT1',
 'PTCD3',
 'TFAM',
 'TRMT1',
 'PMPCA',
 'TOMM20L',
 '

In [23]:
# Number of MitoCarta gene symbols not found in adata.var_names
len(missing_genes)

187