# Analysis of RTG gene expression

## Reference
- Single-cell RNA-seq reveals intrinsic and extrinsic regulatory heterogeneity in yeast responding to stress
    - Article. https://doi.org/10.1371/journal.pbio.2004050  
    - RNA sequencing data (GSE102475). https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE102475

In [None]:
# Retrieve table
import pandas as pd
import numbers
# Load the tab-separated expression table into a DataFrame.
df = pd.read_csv("data/GSE102475_GASCH_NaCl-scRNAseq_NormData.txt", sep="\t")

In [None]:
def get_key(df, value):
    """Return every key of the mapping `df` whose value equals `value`.

    Despite its name, `df` only needs to provide ``.items()`` yielding
    (key, value) pairs, e.g. a plain dict.  Keys are returned in iteration
    order; the list is empty when nothing matches.
    """
    matches = []
    for key, candidate in df.items():
        if value == candidate:
            matches.append(key)
    return matches

## Check availability of RTG Genes

In [None]:
# Gene names: maps each common gene name to the identifier that is looked up
# in the table's "gene" column.
alias = {
    "RTG1": "YOL067C",
    "RTG2": "YGL252C",
    "RTG3": "YBL103C",
    "BMH1": "YER177W",
    "MKS1": "YNL076W",
    "CIT2": "YCR005C",
}

# Build the lookup set once instead of converting the whole column to a list
# (and scanning it linearly) for every gene.
measured_genes = set(df["gene"])

# Report, for each gene of interest, whether the table contains a row for it.
for name, gene_id in alias.items():
    if gene_id in measured_genes:
        print("{} is measured".format(name))
    else:
        print("{} not found".format(name))

## Get RTG gene expression table 

In [None]:
# Keep only the rows whose "gene" entry is one of the identifiers in `alias`.
# Take an explicit copy so that later edits never act on a slice of `df`.
df_filt = df[df["gene"].isin(alias.values())].copy()

# Drop every column that contains a zero in at least one of the kept rows.
# The original code bound `df_filt_zeroRemoved` to the same object as
# `df_filt` and deleted columns from it inside the loop, which silently
# modified `df_filt` as well; here the result is an independent frame.
has_zero = df_filt.eq(0).any(axis=0)
df_filt_zeroRemoved = df_filt.loc[:, ~has_zero].copy()

# Add an alias column: translate each identifier in "gene" back to its common
# name through the inverted `alias` mapping (the identifiers are unique).
gene_id_to_name = {gene_id: name for name, gene_id in alias.items()}
df_filt_zeroRemoved["gene_alias"] = df_filt_zeroRemoved["gene"].map(gene_id_to_name)

# Display the resulting table (notebook cell output).
df_filt_zeroRemoved

In [None]:
# Write the filtered expression table to CSV without the row index.
df_filt_zeroRemoved.to_csv(
    path_or_buf="data/RTG-Expression-Table_GSE102475.csv",
    index=False,
)