# Basic GTEx handling code

In [1]:
import polars as pl
from pathlib import Path
from pycomfort.files import *
from pycomfort import files

In [2]:
# Project layout, anchored at the parent of the current working directory.
base = Path("..").absolute().resolve()
data = base.joinpath("data")
# NOTE(review): `input` shadows the Python builtin of the same name; the name is
# kept here because other cells may refer to it.
input = data.joinpath("input")
gtex = input.joinpath("gtex")
# Create the GTEx folder (together with any missing parents) if it is absent.
gtex.mkdir(exist_ok=True, parents=True)
# Print the contents of the GTEx folder.
files.tprint(gtex)

gtex
	GTEx_8_tissues_snRNAseq_atlas_071421.public_obs.h5ad
	GTEx_8_tissues_snRNAseq_immune_atlas_071421.public_obs.h5ad
	GTEx_Analysis_2017-06-05_v8_RNASeQCv1.1.9_gene_tpm.gct


## Bulk RNA-Seq

In [3]:
# Collect the entries of the GTEx folder carrying the ".gct" extension and keep
# the first one.
gct_candidates = files.with_ext(gtex, ".gct")
gct = gct_candidates[0]
gct

PosixPath('/home/antonkulaga/rna-clock/data/input/gtex/GTEx_Analysis_2017-06-05_v8_RNASeQCv1.1.9_gene_tpm.gct')

In [6]:
# Load the .gct file as a tab-separated table, treating lines that start with
# "#" as comments.
# NOTE(review): newer polars releases rename these keywords (`separator`,
# `comment_prefix`) — confirm against the polars version pinned for this project.
rnas = pl.read_csv(
    gct,
    sep="\t",
    comment_char="#",
)
# Preview the first ten rows.
rnas.head(10)

Name,Description,GTEX-1117F-0226-SM-5GZZ7,GTEX-1117F-0426-SM-5EGHI,GTEX-1117F-0526-SM-5EGHJ,GTEX-1117F-0626-SM-5N9CS,GTEX-1117F-0726-SM-5GIEN,GTEX-1117F-1326-SM-5EGHH,GTEX-1117F-2426-SM-5EGGH,GTEX-1117F-2526-SM-5GZY6,GTEX-1117F-2826-SM-5GZXL,GTEX-1117F-2926-SM-5GZYI,GTEX-1117F-3026-SM-5GZYU,GTEX-1117F-3226-SM-5N9CT,GTEX-111CU-0126-SM-5GZWZ,GTEX-111CU-0226-SM-5GZXC,GTEX-111CU-0326-SM-5GZXO,GTEX-111CU-0426-SM-5GZY1,GTEX-111CU-0526-SM-5EGHK,GTEX-111CU-0626-SM-5EGHL,GTEX-111CU-0726-SM-5GZYD,GTEX-111CU-0826-SM-5EGIJ,GTEX-111CU-0926-SM-5EGIK,GTEX-111CU-1026-SM-5EGIL,GTEX-111CU-1126-SM-5EGIM,GTEX-111CU-1226-SM-5EGIN,GTEX-111CU-1326-SM-5NQ8L,GTEX-111CU-1426-SM-5GZYP,GTEX-111CU-1526-SM-5N9FS,GTEX-111CU-1726-SM-5EGHM,GTEX-111CU-1826-SM-5GZYN,GTEX-111CU-2026-SM-5GZZC,GTEX-111CU-2226-SM-5N9G5,GTEX-111FC-0126-SM-5N9DL,GTEX-111FC-0226-SM-5N9B8,GTEX-111FC-0326-SM-5GZZ1,GTEX-111FC-0426-SM-5N9CV,...,GTEX-ZZ64-0826-SM-5E449,GTEX-ZZ64-0926-SM-5E44L,GTEX-ZZ64-1026-SM-5GZXG,GTEX-ZZ64-1126-SM-5GZXY,GTEX-ZZ64-1226-SM-5E43R,GTEX-ZZ64-1326-SM-5E444,GTEX-ZZ64-1426-SM-5NQ8C,GTEX-ZZ64-1526-SM-5E43K,GTEX-ZZ64-1626-SM-5E43W,GTEX-ZZ64-1726-SM-5GZYB,GTEX-ZZPT-0226-SM-5E43X,GTEX-ZZPT-0626-SM-5GZXT,GTEX-ZZPT-0926-SM-5GICZ,GTEX-ZZPT-1326-SM-5E43H,GTEX-ZZPT-1426-SM-5N9C5,GTEX-ZZPT-2926-SM-5EQ5S,GTEX-ZZPT-3026-SM-5GZXH,GTEX-ZZPU-0126-SM-5E446,GTEX-ZZPU-0226-SM-5N9BV,GTEX-ZZPU-0326-SM-5N9BJ,GTEX-ZZPU-0426-SM-5GZYH,GTEX-ZZPU-0526-SM-5E44U,GTEX-ZZPU-0626-SM-5E43T,GTEX-ZZPU-0726-SM-5N9C8,GTEX-ZZPU-0826-SM-5GZX5,GTEX-ZZPU-0926-SM-5GZYT,GTEX-ZZPU-1026-SM-5E457,GTEX-ZZPU-1126-SM-5N9CW,GTEX-ZZPU-1226-SM-5N9CK,GTEX-ZZPU-1326-SM-5GZWS,GTEX-ZZPU-1426-SM-5GZZ6,GTEX-ZZPU-1826-SM-5E43L,GTEX-ZZPU-2126-SM-5EGIU,GTEX-ZZPU-2226-SM-5EGIV,GTEX-ZZPU-2426-SM-5E44I,GTEX-ZZPU-2626-SM-5E45Y,GTEX-ZZPU-2726-SM-5NQ8O
str,str,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,...,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64
"""ENSG0000022397...","""DDX11L1""",0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.01776,0.03757,0.04667,0.0,0.01832,0.0,0.0,0.06455,0.0,0.1064,0.0,0.0,0.0,0.0,0.01936,0.0,0.2137,0.0,0.0,0.02434,0.0,0.0,0.01768,0.0,...,0.0,0.0,0.0,0.392,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.02796,0.01816,0.0,0.06966,0.03126,0.01874,0.1319,0.02201,0.0,0.0218,0.04614,0.04273,0.03502,0.0,0.0,0.01989,0.0,0.03629,0.0,0.0,0.0,0.0,0.0,0.0,0.01965,0.02522
"""ENSG0000022723...","""WASH7P""",8.764,3.861,7.349,11.07,3.306,5.389,11.99,16.95,10.04,12.5,9.357,6.892,0.9295,1.823,1.794,2.338,0.7206,1.452,0.9525,1.828,1.2,0.838,4.459,1.909,2.198,1.235,4.252,3.101,3.082,1.036,4.753,5.766,4.2,1.197,3.378,...,4.077,11.49,4.14,4.703,2.466,4.744,5.785,1.819,4.201,8.683,4.186,3.604,2.341,4.139,7.497,3.907,2.123,2.747,2.322,1.454,1.135,2.733,2.003,1.938,6.115,1.016,2.252,1.606,2.268,5.386,2.31,2.456,4.023,1.922,2.857,0.8696,2.167
"""ENSG0000027826...","""MIR6859-1""",0.0,0.0,1.004,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.4723,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
"""ENSG0000024348...","""MIR1302-2HG""",0.07187,0.0,0.0,0.06761,0.0,0.0,0.0,0.0,0.0,0.06265,0.05905,0.0,0.0,0.04659,0.0,0.0,0.0425,0.05431,0.0,0.06094,0.07078,0.0378,0.0,0.0,0.0,0.0,0.0,0.06096,0.0,0.0,0.0486,0.0,0.04183,0.0,0.0,...,0.0,0.146,0.05038,0.0559,0.0,0.0,0.0,0.0,0.05113,0.0,0.04755,0.1116,0.0,0.0,0.0,0.0,0.0,0.1129,0.0,0.0,0.04352,0.09211,0.04265,0.03496,0.05935,0.0,0.0794,0.0,0.0,0.06073,0.0,0.08464,0.1435,0.0,0.05216,0.0,0.0
"""ENSG0000023761...","""FAM138A""",0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.03904,0.0,0.0,0.0,0.0,0.0,0.0331,0.0,0.02599,0.0,0.0,0.03052,0.04329,0.0,0.02685,0.04188,0.04332,0.0,0.0,0.05034,0.0,0.0,0.0,0.0,0.0,0.0,0.02508,0.0,...,0.0,0.03457,0.03579,0.0,0.05597,0.0,0.0,0.0,0.0,0.0,0.03378,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.03272,0.0,0.0,0.0,0.0,0.0,0.02429,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
"""ENSG0000026802...","""OR4G4P""",0.0,0.056,0.0,0.0,0.0,0.0613,0.09523,0.0,0.0555,0.1292,0.0,0.03656,0.07734,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.03897,0.1216,0.06287,0.0,0.07971,0.07306,0.0,0.0,0.0,0.0,0.0,0.0,0.07278,0.0,...,0.0,0.05017,0.0,0.1153,0.04061,0.1103,0.0,0.03886,0.0,0.0,0.09804,0.0,0.0,0.0,0.0,0.0,0.03857,0.03878,0.04531,0.0,0.04487,0.0,0.0,0.0,0.1224,0.0,0.1228,0.03526,0.0,0.0,0.04624,0.08726,0.0,0.0,0.0,0.04044,0.05191
"""ENSG0000024036...","""OR4G11P""",0.06621,0.05004,0.0,0.0,0.0,0.0,0.0,0.0,0.0992,0.0,0.1088,0.03267,0.1382,0.0,0.04296,0.0337,0.03915,0.0,0.03958,0.1684,0.0,0.2438,0.1629,0.05618,0.0,0.07123,0.06529,0.2247,0.1062,0.1098,0.04477,0.0,0.07707,0.09755,0.1224,...,0.05008,0.08967,0.04642,0.0515,0.03629,0.0,0.0,0.03473,0.1884,0.04887,0.08761,0.05143,0.03341,0.04716,0.04271,0.115,0.1034,0.0,0.08099,0.04028,0.08019,0.0,0.1179,0.0,0.05468,0.03417,0.03658,0.189,0.0,0.0,0.04132,0.07797,0.0,0.1108,0.0961,0.03614,0.0
"""ENSG0000018609...","""OR4F5""",0.0,0.1025,0.07434,0.0,0.04233,0.05609,0.1743,0.0,0.0,0.0591,0.0557,0.1004,0.07077,0.04395,0.04399,0.03451,0.08019,0.05124,0.08106,0.05748,0.1335,0.1426,0.0,0.05753,0.0,0.03647,0.1671,0.115,0.0,0.0,0.1375,0.0331,0.0,0.09989,0.06265,...,0.0,0.09181,0.04753,0.0,0.07433,0.1009,0.0,0.03556,0.0,0.0,0.1346,0.05266,0.06841,0.09658,0.0,0.0,0.0,0.1065,0.1244,0.0,0.08212,0.0869,0.1207,0.0,0.05599,0.06997,0.1124,0.129,0.1367,0.05729,0.1269,0.1198,0.06767,0.1135,0.0,0.148,0.0
"""ENSG0000023800...","""RP11-34P13.7""",0.0,0.04574,0.09953,0.0,0.07556,0.05006,0.03889,0.04627,0.0,0.05275,0.02486,0.02986,0.01579,0.0,0.03927,0.07701,0.01789,0.0,0.03617,0.07696,0.0,0.0,0.07446,0.02567,0.0,0.01628,0.02983,0.4107,0.0,0.03345,0.0,0.02954,0.07044,0.05944,0.0,...,0.0,0.08195,0.02121,0.6354,0.0,0.02252,0.04343,0.01587,0.04305,0.0,0.0,0.0,0.0,0.02155,0.03903,0.02627,0.01575,0.09502,0.03701,0.0,0.0,0.0,0.03592,0.0,0.0,0.01561,0.05014,0.0,0.01525,0.0,0.03776,0.03563,0.0604,0.0,0.1098,0.01651,0.0212
"""ENSG0000023375...","""CICP27""",0.03595,0.01359,0.0,0.0,0.0,0.0,0.0,0.02749,0.0,0.0,0.0,0.0,0.03753,0.05827,0.3966,0.8236,0.02126,0.0,0.4191,0.03049,0.03541,0.06618,0.08848,0.03051,0.1711,0.06769,0.04432,0.2897,0.173,0.0,0.02431,0.008777,0.0,0.0,0.0,...,0.08159,0.04869,0.0,0.1958,0.009854,0.0,0.0129,0.0,0.01279,0.07962,0.03568,0.0,0.0,0.03841,0.1739,0.01561,0.01872,1.656,0.4288,0.4484,0.09798,0.4839,0.1814,0.2186,0.08907,0.06494,0.2284,0.06843,0.09967,0.2583,0.03366,0.04234,0.3409,0.2709,0.05219,0.0,0.1134


In [7]:
# List the column names of the loaded table.
rnas.columns

['Name',
 'Description',
 'GTEX-1117F-0226-SM-5GZZ7',
 'GTEX-1117F-0426-SM-5EGHI',
 'GTEX-1117F-0526-SM-5EGHJ',
 'GTEX-1117F-0626-SM-5N9CS',
 'GTEX-1117F-0726-SM-5GIEN',
 'GTEX-1117F-1326-SM-5EGHH',
 'GTEX-1117F-2426-SM-5EGGH',
 'GTEX-1117F-2526-SM-5GZY6',
 'GTEX-1117F-2826-SM-5GZXL',
 'GTEX-1117F-2926-SM-5GZYI',
 'GTEX-1117F-3026-SM-5GZYU',
 'GTEX-1117F-3226-SM-5N9CT',
 'GTEX-111CU-0126-SM-5GZWZ',
 'GTEX-111CU-0226-SM-5GZXC',
 'GTEX-111CU-0326-SM-5GZXO',
 'GTEX-111CU-0426-SM-5GZY1',
 'GTEX-111CU-0526-SM-5EGHK',
 'GTEX-111CU-0626-SM-5EGHL',
 'GTEX-111CU-0726-SM-5GZYD',
 'GTEX-111CU-0826-SM-5EGIJ',
 'GTEX-111CU-0926-SM-5EGIK',
 'GTEX-111CU-1026-SM-5EGIL',
 'GTEX-111CU-1126-SM-5EGIM',
 'GTEX-111CU-1226-SM-5EGIN',
 'GTEX-111CU-1326-SM-5NQ8L',
 'GTEX-111CU-1426-SM-5GZYP',
 'GTEX-111CU-1526-SM-5N9FS',
 'GTEX-111CU-1726-SM-5EGHM',
 'GTEX-111CU-1826-SM-5GZYN',
 'GTEX-111CU-2026-SM-5GZZC',
 'GTEX-111CU-2226-SM-5N9G5',
 'GTEX-111FC-0126-SM-5N9DL',
 'GTEX-111FC-0226-SM-5N9B8',
 'GTEX-111FC-0326-

## Sc-RNA-Seq

In [None]:
# Fit a cross-validated LassoNet classifier and report its test score.
# NOTE(review): X_train, y_train, X_test and y_test are not defined in the part
# of the notebook visible here, and this cell has no execution count — confirm
# where the train/test split comes from before running.
from lassonet import LassoNetClassifierCV

model = LassoNetClassifierCV()  # alternative: LassoNetRegressorCV
path = model.fit(X_train, y_train)

test_score = model.score(X_test, y_test)
print("Best model scored", test_score)

best_lambda = model.best_lambda_
print("Lambda =", best_lambda)