# Concatonate All Deseq2 Data with AHR, DRE, RefGenome Metadata

## <br> 1. Import Required Packages

In [1]:
import numpy as np
import pandas as pd
import os

## <br> 2. Import Deseq2 Data and All Other Metadata

In [2]:
# Define the directory path
directory = './Results/03f_Named_lncRNAs_DEGs'

# Check if the directory exists
if not os.path.exists(directory):
    # If it does not exist, create the directory
    os.makedirs(directory)

print(f"Directory '{directory}' is ready.")

Directory './Results/03f_Named_lncRNAs_DEGs' is ready.


In [3]:
# Load a working copy of the DESeq2 master table for further analysis or modification
Deseq2_Master_Working = pd.read_csv('./Results/03d_MASTER_Deseq2_Concatonated/RDDR_Deseq2_Master_Wald_with_MGI.txt', 
                            delimiter = '\t')
Deseq2_Master_Working


Unnamed: 0.1,Unnamed: 0,Gene,MGI_Symbol,Celltype,Dose,Type,pDRE,AHR,baseMean,Chr,Start,End,Strand,NR_Annotation,log2FoldChange,Fold-Change,lfcSE,stat,pvalue,padj
0,0,lnc31752,Malat1,B Cells,0.01,lncRNA,0,2,5632.003911,chr19,5842642,5852983,-,lnc31752_Mascrna#Malat1,0.060929,1.043137,0.161392,0.377519,0.705788,1.000000
1,1,lnc4822,.,B Cells,0.01,lncRNA,0,1,3146.387654,chr6,3181101,3202501,+,lnc4822,-0.368362,0.774662,0.385441,-0.955691,0.339228,1.000000
2,2,Foxp1,9130401L11Rik,B Cells,0.01,NM,13,19,941.129495,chr6,98902302,99161922,-,,-0.079404,0.946448,0.359311,-0.220991,0.825099,1.000000
3,3,Foxp1,6030492E11Rik,B Cells,0.01,NM,13,19,941.129495,chr6,98902302,99161922,-,,-0.079404,0.946448,0.359311,-0.220991,0.825099,1.000000
4,4,Foxp1,Gm38865,B Cells,0.01,NM,13,19,941.129495,chr6,98902302,99161922,-,,-0.079404,0.946448,0.359311,-0.220991,0.825099,1.000000
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1443131,1443131,lnc1440,.,pDCs,30.00,lncRNA,0,0,2.409755,chr2,69058214,69067863,-,lnc1440,-4.176886,0.055288,1.226191,-3.406392,0.000658,0.004671
1443132,1443132,lnc1686,Gm34484,pDCs,30.00,lncRNA,0,1,0.496732,chr2,124519234,124553367,-,lnc1686,3.818752,14.111033,4.487664,0.850944,0.394800,0.614526
1443133,1443133,lnc2311,Gm40040,pDCs,30.00,lncRNA,3,3,2.592510,chr3,41395983,41447665,-,lnc2311_Platr4Gm40040,-4.979600,0.031695,1.133711,-4.392302,0.000011,0.000141
1443134,1443134,lnc2311,Platr4,pDCs,30.00,lncRNA,3,3,2.592510,chr3,41395983,41447665,-,lnc2311_Platr4Gm40040,-4.979600,0.031695,1.133711,-4.392302,0.000011,0.000141


In [4]:
# Identify DEGs for a specific cell type (COI) with fold-change threshold and adjusted p-value cutoff
COI = 'Periportal Hepatocytes'

# Ensure 'padj' is numeric to avoid comparison issues
Deseq2_Master_Working['padj'] = pd.to_numeric(Deseq2_Master_Working['padj'], errors='coerce')

# Filter DEGs: FC ≥ 1.5 or ≤ 1/1.5, padj ≤ 0.05, and matching Celltype
DEGs = Deseq2_Master_Working[((Deseq2_Master_Working['Fold-Change'] >= 1.5) | (Deseq2_Master_Working['Fold-Change'] <= 1/1.5)) & 
                            (Deseq2_Master_Working['padj'] <= 0.05) &
                            (Deseq2_Master_Working['Celltype'] == COI)]

DEGs

Unnamed: 0.1,Unnamed: 0,Gene,MGI_Symbol,Celltype,Dose,Type,pDRE,AHR,baseMean,Chr,Start,End,Strand,NR_Annotation,log2FoldChange,Fold-Change,lfcSE,stat,pvalue,padj
1017563,1017563,Cyp1a2,.,Periportal Hepatocytes,0.01,NM,0,4,4152.981320,chr9,57584219,57590938,-,,1.701873,3.253229,0.323246,5.264950,1.402274e-07,3.632731e-03
1020679,1020679,lnc12633,.,Periportal Hepatocytes,0.01,lncRNA,1,2,940.309980,chr15,62595995,62615851,-,lnc12633,1.365037,2.575830,0.289268,4.718934,2.370833e-06,3.070940e-02
1026031,1026031,lnc7984,.,Periportal Hepatocytes,0.01,lncRNA,3,6,222.878994,chr9,57572484,57578435,-,lnc7984,2.703680,6.514616,0.586952,4.606307,4.098830e-06,3.539477e-02
1048864,1048864,Cyp1a2,.,Periportal Hepatocytes,0.03,NM,0,4,4152.981320,chr9,57584219,57590938,-,,2.413671,5.328283,0.322258,7.489867,6.894333e-14,1.786046e-09
1048963,1048963,Cyp1a1,.,Periportal Hepatocytes,0.03,NM,5,8,3689.450961,chr9,57595210,57611107,+,,2.620539,6.149797,0.492478,5.321124,1.031282e-07,6.679096e-04
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1266741,1266741,lnc10125,Gm11707,Periportal Hepatocytes,30.00,lncRNA,0,1,4.928723,chr11,106856604,106864765,-,lnc10125_Gm11707,3.294156,9.809340,0.849509,3.877718,1.054407e-04,6.161848e-04
1266749,1266749,lnc15124,Mirt1,Periportal Hepatocytes,30.00,lncRNA,0,0,6.301579,chr19,53429551,53453555,-,lnc15124_Mirt1,4.895596,29.766043,0.924879,5.293229,1.201755e-07,1.319181e-06
1266758,1266758,lnc20433,.,Periportal Hepatocytes,30.00,lncRNA,0,0,3.966456,chr11,58208386,58209565,+,lnc20433,2.465864,5.524575,0.921379,2.676274,7.444578e-03,2.499148e-02
1266762,1266762,lnc24827,.,Periportal Hepatocytes,30.00,lncRNA,0,0,5.464672,chr13,110037102,110039284,-,lnc24827,3.122459,8.708707,0.882836,3.536849,4.049311e-04,2.048368e-03


In [5]:
DEGs[(DEGs['Type'] == 'lncRNA') |
       (DEGs['Type']== 'antisense') |
       (DEGs['Type']== 'lincRNA') |
       (DEGs['Type']== 'NR') |
       (DEGs['Type']== 'lncOfInterest')]['MGI_Symbol'].drop_duplicates(keep='first')


1020679                .
1089063          Gm46943
1092637          Actc1dt
1110348          Gm29966
1116655          Gm38585
               ...      
1266340          Gm41361
1266341    F830031D20Rik
1266494          Gm40621
1266741          Gm11707
1266749            Mirt1
Name: MGI_Symbol, Length: 1374, dtype: object

In [6]:
filtered_df = DEGs[((DEGs['Type'] == 'lncRNA') |
                   (DEGs['Type']== 'antisense') |
                   (DEGs['Type']== 'lincRNA') |
                   (DEGs['Type']== 'NR') |
                   (DEGs['Type']== 'lncOfInterest')) &
    (~DEGs['MGI_Symbol'].str.contains('Rik')) &
    (~DEGs['MGI_Symbol'].str.endswith('os')) & 
    (~DEGs['MGI_Symbol'].str.match(r'.*os\d$')) &
    (~DEGs['MGI_Symbol'].str.endswith('ps')) &
    (~DEGs['MGI_Symbol'].str.startswith('Gm'))&
    (~DEGs['MGI_Symbol'].str.startswith('Mir'))&
    (~DEGs['MGI_Symbol'].str.match(r'^[A-Z]{2}')) & 
    (DEGs['MGI_Symbol'] != '.')
]['MGI_Symbol'].drop_duplicates(keep='first').sort_values()

filtered_df


1092637      Actc1dt
1142319         Airn
1209673        Altre
1211785     Bach2it1
1230311          Bc1
1224793       C79798
1216270        Dancr
1206500        Dleu2
1265485         Dubr
1208310         Gas5
1125700       Gdap10
1265084     Hotairm1
1265083     Hotairm2
1265085      Hoxaas2
1208835          Jpx
1213994        Kantr
1235983     Kcnq1ot1
1235677      Lncpint
1142977     Lncppara
1223524        Lockd
1252404         Meg3
1211592        Mm2pr
1250952      Morrbid
1235494        Neat1
1239826      Platr22
1238794       Platr4
1144252         Pvt1
1263521      Slfnlnc
1213881        Snhg1
1258093       Snhg10
1215374       Snhg12
1215314       Snhg14
1217777       Snhg15
1218535       Snhg16
1213704       Snhg17
1242778       Snhg20
1214136        Snhg3
1254482        Snhg4
1248777        Snhg5
1251990        Snhg6
1244135        Snhg7
1246043        Snhg8
1242717        Tbrg3
1216196    Trp53cor1
1175896         Urml
1262754      Wbscr25
1215970        Zfas1
Name: MGI_Sym

In [7]:
lncRNA_DEGs = DEGs[((DEGs['Type'] == 'lncRNA') |
                   (DEGs['Type']== 'antisense') |
                   (DEGs['Type']== 'lincRNA') |
                   (DEGs['Type']== 'NR') |
                   (DEGs['Type']== 'lncOfInterest')) &
    (~DEGs['MGI_Symbol'].str.contains('Rik')) &
    (~DEGs['MGI_Symbol'].str.endswith('os')) & 
    (~DEGs['MGI_Symbol'].str.match(r'.*os\d$')) &
    (~DEGs['MGI_Symbol'].str.endswith('ps')) &
    (~DEGs['MGI_Symbol'].str.startswith('Gm'))&
    (~DEGs['MGI_Symbol'].str.startswith('Mir'))&
    (~DEGs['MGI_Symbol'].str.match(r'^[A-Z]{2}')) & 
    (DEGs['MGI_Symbol'] != '.') & 
    (DEGs['MGI_Symbol'] != 'C79798')          
]

lncRNA_DEGs_List = lncRNA_DEGs[['Gene']].drop_duplicates(keep='first').copy()

lncRNA_DEGs_AHR = lncRNA_DEGs[(lncRNA_DEGs['AHR'] != 0)]
lncRNA_DEGs_AHR_List = lncRNA_DEGs_AHR[['Gene']].drop_duplicates(keep='first').copy()

lncRNA_DEGs_DRE = lncRNA_DEGs[(lncRNA_DEGs['pDRE'] != 0)]
lncRNA_DEGs_DRE_List = lncRNA_DEGs_DRE[['Gene']].drop_duplicates(keep='first').copy()

lncRNA_DEGs

Unnamed: 0.1,Unnamed: 0,Gene,MGI_Symbol,Celltype,Dose,Type,pDRE,AHR,baseMean,Chr,Start,End,Strand,NR_Annotation,log2FoldChange,Fold-Change,lfcSE,stat,pvalue,padj
1092637,1092637,lnc1630,Actc1dt,Periportal Hepatocytes,0.1,lncRNA,2,2,98.811525,chr2,113884876,113895240,+,lnc1630_C130080G10Rik,-5.036642,0.030466,1.267935,-3.972318,7.117650e-05,4.835494e-02
1125700,1125700,lnc10508,Gdap10,Periportal Hepatocytes,0.3,lncRNA,1,1,55.621736,chr12,32874114,32876907,+,lnc10508_Gdap10,1.295739,2.455027,0.358117,3.618203,2.966553e-04,4.950345e-02
1142319,1142319,lnc13654,Airn,Periportal Hepatocytes,1.0,lncRNA,5,4,7463.530593,chr17,12960071,13079068,+,lnc13654_Airn,1.652342,3.143436,0.446405,3.701440,2.143796e-04,2.124400e-02
1142977,1142977,lnc12813,Lncppara,Periportal Hepatocytes,1.0,lncRNA,4,5,2842.507977,chr15,85529670,85599726,+,lnc12813_Mirlet7c-2#Mirlet7b#LncpparaAC162302.1,0.942870,1.922349,0.253531,3.718961,2.000437e-04,2.062419e-02
1144252,1144252,lnc12608,Pvt1,Periportal Hepatocytes,1.0,lncRNA,9,11,1986.818100,chr15,61909692,62139305,+,lnc12608_Pvt1,2.024089,4.067351,0.426494,4.745883,2.075989e-06,4.320132e-04
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1263521,1263521,AI662270,Slfnlnc,Periportal Hepatocytes,30.0,NR,0,0,17.126892,chr11,83114401,83117410,+,,5.595643,48.356673,0.771058,7.257101,3.954757e-13,1.095743e-11
1265083,1265083,lnc5147,Hotairm2,Periportal Hepatocytes,30.0,lncRNA,2,1,6.383223,chr6,52134912,52151060,+,lnc5147_Hotairm1#Hotairm2#Gm15050#Hoxaas2,2.350850,5.101246,0.773365,3.039766,2.367618e-03,9.483948e-03
1265084,1265084,lnc5147,Hotairm1,Periportal Hepatocytes,30.0,lncRNA,2,1,6.383223,chr6,52134912,52151060,+,lnc5147_Hotairm1#Hotairm2#Gm15050#Hoxaas2,2.350850,5.101246,0.773365,3.039766,2.367618e-03,9.483948e-03
1265085,1265085,lnc5147,Hoxaas2,Periportal Hepatocytes,30.0,lncRNA,2,1,6.383223,chr6,52134912,52151060,+,lnc5147_Hotairm1#Hotairm2#Gm15050#Hoxaas2,2.350850,5.101246,0.773365,3.039766,2.367618e-03,9.483948e-03


In [8]:
lncRNA_DEGs.to_csv('./Results/03f_Named_lncRNAs_DEGs/RDDR_named_lncRNA_FULL_TABLE_in_'+ COI + '.txt', sep='\t', index=False)


lncRNA_DEGs['Row_Name'] = lncRNA_DEGs['MGI_Symbol'] + ' (' + lncRNA_DEGs['Gene'] + ')'

lncRNA_DEGs = lncRNA_DEGs['Row_Name'].drop_duplicates(keep='first')
lncRNA_DEGs.to_csv('./Results/03f_Named_lncRNAs_DEGs/RDDR_named_lncRNA_DEGs_in_'+ COI + '.txt', sep='\t', index=False)


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  lncRNA_DEGs['Row_Name'] = lncRNA_DEGs['MGI_Symbol'] + ' (' + lncRNA_DEGs['Gene'] + ')'


In [9]:
######################################################
# Print Out Counts
######################################################
print("##################")
print("### " + COI)
print("##################")
print("--------------------------------------------------------")
print("--------------------------------------------------------")
print()
print("lncRNA DEGs:", len(lncRNA_DEGs_List))
print()
print("lncRNA DEGs with AHR:", len(lncRNA_DEGs_AHR_List))
print()
print("lncRNA DEGs with DRE:", len(lncRNA_DEGs_DRE_List))
print()
print("--------------------------------------------------------")
print("--------------------------------------------------------")

##################
### Periportal Hepatocytes
##################
--------------------------------------------------------
--------------------------------------------------------

lncRNA DEGs: 47

lncRNA DEGs with AHR: 31

lncRNA DEGs with DRE: 29

--------------------------------------------------------
--------------------------------------------------------


In [10]:
COI = 'Centrilobular Hepatocytes'

Deseq2_Master_Working['padj'] = pd.to_numeric(Deseq2_Master_Working['padj'], errors='coerce')


DEGs = Deseq2_Master_Working[((Deseq2_Master_Working['Fold-Change'] >= 1.5) | (Deseq2_Master_Working['Fold-Change'] <= 1/1.5)) & 
                            (Deseq2_Master_Working['padj'] <= 0.05) &
                            (Deseq2_Master_Working['Celltype'] == COI)]

DEGs

Unnamed: 0.1,Unnamed: 0,Gene,MGI_Symbol,Celltype,Dose,Type,pDRE,AHR,baseMean,Chr,Start,End,Strand,NR_Annotation,log2FoldChange,Fold-Change,lfcSE,stat,pvalue,padj
106193,106193,Cyp1a2,.,Centrilobular Hepatocytes,0.01,NM,0,4,2740.961191,chr9,57584219,57590938,-,,2.019151,4.053451,0.291374,6.929746,4.215961e-12,9.235484e-08
133186,133186,Cyp1a2,.,Centrilobular Hepatocytes,0.03,NM,0,4,2740.961191,chr9,57584219,57590938,-,,2.470874,5.543794,0.290694,8.499914,1.897318e-17,2.078132e-13
133352,133352,Cyp1a1,.,Centrilobular Hepatocytes,0.03,NM,5,8,2101.857316,chr9,57595210,57611107,+,,6.407706,84.900812,0.596546,10.741345,6.508943e-27,1.425849e-22
143064,143064,lnc7984,.,Centrilobular Hepatocytes,0.03,lncRNA,3,6,86.243459,chr9,57572484,57578435,-,lnc7984,5.385475,41.801275,0.837168,6.432971,1.251335e-10,9.137246e-07
143195,143195,lnc4777,Gm46943,Centrilobular Hepatocytes,0.03,lncRNA,3,3,81.319867,chr5,147848112,147855661,+,lnc4777,2.438875,5.422187,0.487511,5.002708,5.653059e-07,2.476718e-03
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
321516,321516,lnc25261,.,Centrilobular Hepatocytes,30.00,lncRNA,0,0,3.747565,chr14,31316156,31319726,-,lnc25261,2.661279,6.325934,1.026311,2.593054,9.512795e-03,2.717622e-02
321522,321522,lnc31218,Gm5095,Centrilobular Hepatocytes,30.00,lncRNA,5,2,2.682039,chr18,47670801,47851703,+,lnc31218_Gm5095,5.057910,33.310614,1.369176,3.694128,2.206429e-04,1.034547e-03
321523,321523,lnc31218,Gm32660,Centrilobular Hepatocytes,30.00,lncRNA,5,2,2.682039,chr18,47670801,47851703,+,lnc31218_Gm5095,5.057910,33.310614,1.369176,3.694128,2.206429e-04,1.034547e-03
321531,321531,lnc35186,.,Centrilobular Hepatocytes,30.00,lncRNA,0,0,3.929996,chr2,177678292,177678904,-,lnc35186,2.442242,5.434856,0.889557,2.745457,6.042668e-03,1.843420e-02


In [11]:
DEGs[(DEGs['Type'] == 'lncRNA') |
       (DEGs['Type']== 'antisense') |
       (DEGs['Type']== 'lincRNA') |
       (DEGs['Type']== 'NR') |
       (DEGs['Type']== 'lncOfInterest')]['MGI_Symbol'].drop_duplicates(keep='first')


143064                .
143195          Gm46943
160166          Gm35190
161979          Gm31190
167452          Gm57111
              ...      
321075          Gm16098
321135          Gm33519
321188    2810457G06Rik
321274          Gm31603
321404         Mir223hg
Name: MGI_Symbol, Length: 1380, dtype: object

In [12]:
filtered_df = DEGs[((DEGs['Type'] == 'lncRNA') |
                   (DEGs['Type']== 'antisense') |
                   (DEGs['Type']== 'lincRNA') |
                   (DEGs['Type']== 'NR') |
                   (DEGs['Type']== 'lncOfInterest')) &
    (~DEGs['MGI_Symbol'].str.contains('Rik')) &
    (~DEGs['MGI_Symbol'].str.endswith('os')) & 
    (~DEGs['MGI_Symbol'].str.match(r'.*os\d$')) &
    (~DEGs['MGI_Symbol'].str.endswith('ps')) &
    (~DEGs['MGI_Symbol'].str.startswith('Gm'))&
    (~DEGs['MGI_Symbol'].str.startswith('Mir'))&
    (~DEGs['MGI_Symbol'].str.match(r'^[A-Z]{2}')) & 
    (DEGs['MGI_Symbol'] != '.')
]['MGI_Symbol'].drop_duplicates(keep='first').sort_values()

filtered_df


226181          Actc1dt
213602             Airn
273756            Altre
273725         Bach2it1
313860      D17Ertd648e
277394            Dancr
296735            Dleu2
271445             Gas5
305188    Gt(ROSA)26Sor
299711              Jpx
249406            Kantr
268092         Kcnq1ot1
215112         Lncppara
294559           Malat1
245882             Meg3
274639            Mm2pr
312127          Morrbid
267569            Neat1
314976            Peg13
277693          Platr22
312283        Ppp1r36dn
215294             Pvt1
276255            Snhg1
315191           Snhg10
278238           Snhg12
277400           Snhg14
307414           Snhg15
280604           Snhg16
303726           Snhg17
301576           Snhg20
304057            Snhg3
313106            Snhg4
307842            Snhg5
310540            Snhg6
303448            Snhg7
304841            Snhg8
305372            Snhg9
302191            Tbrg3
279179        Trp53cor1
217409             Urml
320564          Wbscr25
278910          

In [13]:
lncRNA_DEGs = DEGs[((DEGs['Type'] == 'lncRNA') |
                   (DEGs['Type']== 'antisense') |
                   (DEGs['Type']== 'lincRNA') |
                   (DEGs['Type']== 'NR') |
                   (DEGs['Type']== 'lncOfInterest')) &
    (~DEGs['MGI_Symbol'].str.contains('Rik')) &
    (~DEGs['MGI_Symbol'].str.endswith('os')) & 
    (~DEGs['MGI_Symbol'].str.match(r'.*os\d$')) &
    (~DEGs['MGI_Symbol'].str.endswith('ps')) &
    (~DEGs['MGI_Symbol'].str.startswith('Gm'))&
    (~DEGs['MGI_Symbol'].str.startswith('Mir'))&
    (~DEGs['MGI_Symbol'].str.match(r'^[A-Z]{2}')) & 
    (DEGs['MGI_Symbol'] != '.') & 
    (DEGs['MGI_Symbol'] != 'D17Ertd648e')          
]

lncRNA_DEGs_List = lncRNA_DEGs[['Gene']].drop_duplicates(keep='first').copy()

lncRNA_DEGs_AHR = lncRNA_DEGs[(lncRNA_DEGs['AHR'] != 0)]
lncRNA_DEGs_AHR_List = lncRNA_DEGs_AHR[['Gene']].drop_duplicates(keep='first').copy()

lncRNA_DEGs_DRE = lncRNA_DEGs[(lncRNA_DEGs['pDRE'] != 0)]
lncRNA_DEGs_DRE_List = lncRNA_DEGs_DRE[['Gene']].drop_duplicates(keep='first').copy()

lncRNA_DEGs

Unnamed: 0.1,Unnamed: 0,Gene,MGI_Symbol,Celltype,Dose,Type,pDRE,AHR,baseMean,Chr,Start,End,Strand,NR_Annotation,log2FoldChange,Fold-Change,lfcSE,stat,pvalue,padj
213602,213602,lnc13654,Airn,Centrilobular Hepatocytes,1.0,lncRNA,5,4,12429.883037,chr17,12960071,13079068,+,lnc13654_Airn,1.223871,2.335725,0.318409,3.843710,0.000121,0.008561
215112,215112,lnc12813,Lncppara,Centrilobular Hepatocytes,1.0,lncRNA,4,5,1274.152548,chr15,85529670,85599726,+,lnc12813_Mirlet7c-2#Mirlet7b#LncpparaAC162302.1,0.870411,1.828184,0.184094,4.728076,0.000002,0.000268
215294,215294,lnc12608,Pvt1,Centrilobular Hepatocytes,1.0,lncRNA,9,11,1210.942926,chr15,61909692,62139305,+,lnc12608_Pvt1,1.321717,2.499634,0.380484,3.473777,0.000513,0.026490
217409,217409,lnc11523,Urml,Centrilobular Hepatocytes,1.0,lncRNA,2,1,532.392784,chr13,68360651,68401078,-,lnc11523_Urml,-1.087721,0.470504,0.309473,-3.514755,0.000440,0.023508
226181,226181,lnc1630,Actc1dt,Centrilobular Hepatocytes,1.0,lncRNA,2,2,41.528784,chr2,113884876,113895240,+,lnc1630_C130080G10Rik,5.165016,35.877716,1.268462,4.071871,0.000047,0.003908
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
312470,312470,lnc25734,Dleu2,Centrilobular Hepatocytes,30.0,lncRNA,0,0,16.317379,chr14,61883871,61885571,-,lnc25734_Dleu2,-2.076409,0.237104,0.530143,-3.916693,0.000090,0.000470
313106,313106,lnc30999,Snhg4,Centrilobular Hepatocytes,30.0,lncRNA,1,0,14.208258,chr18,35690084,35691385,+,lnc30999_Snhg4#Snora74a,2.075450,4.214759,0.580176,3.577279,0.000347,0.001542
314976,314976,lnc12652,Peg13,Centrilobular Hepatocytes,30.0,lncRNA,3,0,9.240352,chr15,72677448,72682173,-,lnc12652_Peg13,-1.582477,0.333908,0.592614,-2.670332,0.007578,0.022402
315191,315191,lnc10895,Snhg10,Centrilobular Hepatocytes,30.0,lncRNA,0,1,12.038520,chr12,104996875,104998570,-,lnc10895_Snhg10#Mir3069#Scarna13,2.972093,7.846739,0.641879,4.630299,0.000004,0.000027


In [14]:
lncRNA_DEGs.to_csv('./Results/03f_Named_lncRNAs_DEGs/RDDR_named_lncRNA_FULL_TABLE_in_'+ COI + '.txt', sep='\t', index=False)

lncRNA_DEGs['Row_Name'] = lncRNA_DEGs['MGI_Symbol'] + ' (' + lncRNA_DEGs['Gene'] + ')'

lncRNA_DEGs = lncRNA_DEGs['Row_Name'].drop_duplicates(keep='first')
lncRNA_DEGs.to_csv('./Results/03f_Named_lncRNAs_DEGs/RDDR_named_lncRNA_DEGs_in_'+ COI + '.txt', sep='\t', index=False)


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  lncRNA_DEGs['Row_Name'] = lncRNA_DEGs['MGI_Symbol'] + ' (' + lncRNA_DEGs['Gene'] + ')'


In [15]:
######################################################
# Print Out Counts
######################################################
print("##################")
print("### " + COI)
print("##################")
print("--------------------------------------------------------")
print("--------------------------------------------------------")
print()
print("lncRNA DEGs:", len(lncRNA_DEGs_List))
print()
print("lncRNA DEGs with AHR:", len(lncRNA_DEGs_AHR_List))
print()
print("lncRNA DEGs with DRE:", len(lncRNA_DEGs_DRE_List))
print()
print("--------------------------------------------------------")
print("--------------------------------------------------------")

##################
### Centrilobular Hepatocytes
##################
--------------------------------------------------------
--------------------------------------------------------

lncRNA DEGs: 47

lncRNA DEGs with AHR: 28

lncRNA DEGs with DRE: 25

--------------------------------------------------------
--------------------------------------------------------
