In [2]:
%matplotlib inline
import numpy as np
import scipy as sp
import matplotlib as mpl
import matplotlib.cm as cm
import matplotlib.pyplot as plt
import pandas as pd
import time
# Widen the pandas display limits (500 characters, up to 100 columns) for wide tables.
pd.set_option('display.width', 500)
pd.set_option('display.max_columns', 100)
# Render DataFrames as HTML tables in the notebook.
pd.set_option('display.notebook_repr_html', True)
import seaborn as sns
# Global seaborn look: white grid background, 'poster' plotting context.
sns.set_style('whitegrid')
sns.set_context('poster')

In [3]:
import csv
import random

In [4]:
def find_csv_length(file_to_read):
    '''
    Counts the data rows of a csv file, i.e. every row after the header.

    params:
        file_to_read (string) (file.csv) path to some existing csv file to read

    returns:
        (int) number of rows following the header; 0 when the file is empty
        or holds only a header
    '''
    # newline='' hands line-ending handling to the csv module, as its
    # documentation recommends for files passed to csv.reader.
    with open(file_to_read, 'r', newline='') as file_in:
        csv_in = csv.reader(file_in)

        # Skip the header. The default stops an empty file from raising
        # StopIteration.
        next(csv_in, None)

        return sum(1 for _ in csv_in)
            

In [5]:
def select_random_rows(file_to_read, file_to_write, num_rows, seed=None):
    '''
    Takes an input csv file and writes a smaller csv file containing the header
    plus num_rows rows randomly selected (without replacement) from the input
    csv file. As well, it returns the indices of the chosen rows.

    params:
        file_to_read (string) (file.csv) path to some existing csv file to read
        file_to_write (string) (file.csv) path to csv file to write as output
        num_rows (int) number of rows to randomly select
        seed (optional) when given, the sample is drawn from a private
            random.Random(seed) so the same rows are chosen on every run;
            when None the module-level random generator is used

    returns:
        row_list (list) 0-based indices (header not counted) of the rows
            included in the new file, in the order they were sampled. The rows
            themselves are written in input-file order.

    raises:
        ValueError (from random.sample) if num_rows is negative or larger than
            the number of data rows. The output file is not created then.
    '''
    # Draw the sample before touching the output file, so an invalid num_rows
    # does not leave a header-only file behind.
    length = find_csv_length(file_to_read)
    rng = random if seed is None else random.Random(seed)
    row_list = rng.sample(range(length), num_rows)

    # Set membership is O(1); the list is kept only for the return value.
    wanted = set(row_list)
    remaining = len(wanted)

    # newline='' on both files: the csv module handles line endings itself
    # (otherwise the writer emits blank rows on Windows).
    with open(file_to_read, 'r', newline='') as file_in, \
            open(file_to_write, 'w', newline='') as file_out:

        csv_in = csv.reader(file_in)
        csv_out = csv.writer(file_out)

        header = next(csv_in, None)
        if header is not None:
            csv_out.writerow(header)

        for i, line in enumerate(csv_in):
            # Stop reading as soon as every sampled row has been written.
            if remaining == 0:
                break
            if i in wanted:
                csv_out.writerow(line)
                remaining -= 1

    print(f'A file named {file_to_write} has been created with {num_rows} rows.')

    return row_list

In [11]:
# Write 10 randomly chosen rows of test_sample.csv to test_sample_10.csv; `a` holds the sampled row indices.
a = select_random_rows('test_sample.csv', 'test_sample_10.csv', 10)

A file named test_sample_10.csv has been created with 10 rows.


In [12]:
# Show the sampled row indices returned by select_random_rows.
a

[32, 24, 52, 164, 93, 22, 45, 47, 126, 87]

In [13]:
# Read the 10-row sample back in to inspect what was written.
df = pd.read_csv('test_sample_10.csv')

In [14]:
# Display the sampled frame.
df

Unnamed: 0,course_id,user_id,registered,viewed,explored,certified,completed,ip,cc_by_ip,countryLabel,continent,city,region,subdivision,postalCode,un_major_region,un_economic_group,un_developing_nation,un_special_region,latitude,longitude,LoE,YoB,gender,grade,passing_grade,start_time,first_event,last_event,nevents,ndays_act,nplay_video,nchapters,nforum_posts,nforum_votes,nforum_endorsed,nforum_threads,nforum_comments,nforum_pinned,roles,nprogcheck,nproblem_check,nforum_events,mode,is_active,cert_created_date,cert_modified_date,cert_status,verified_enroll_time,verified_unenroll_time,profile_country,y1_anomalous,email_domain,language_brwsr,language_brwsr_country,language_brwsr_sec,language_brwsr_sec_country,language_brwsr_code,language_brwsr_subcode,language_brwsr_sec_code,language_brwsr_sec_subcode,language_brwsr_nevents,language_brwsr_ndiff,language,language_download,language_nevents,language_ndiff,ntranscript,nshow_answer,nvideo,nvideos_unique_viewed,nvideos_total_watched,nseq_goto,nseek_video,npause_video,avg_dt,sdv_dt,max_dt,n_dt,sum_dt,roles_isBetaTester,roles_isInstructor,roles_isStaff,roles_isCCX,roles_isFinance,roles_isLibrary,roles_isSales,forumRoles_isAdmin,forumRoles_isCommunityTA,forumRoles_isModerator,forumRoles_isStudent
0,HarvardX/PH525.1x/1T2018,2938910,True,False,,False,False,138.246.2.124,DE,Germany,Europe,Munich,BY,Bavaria,80469,Western Europe,Developed regions,,,48.15,11.5833,,,,,0.7,2018-04-24 13:12:07,2018-04-24 13:12:07.098634,2018-04-24 13:12:14.881608,3,1,0,,,,,,,,Student,0,0,0,audit,1,,,,,,,,gmail.com,German,Germany,English,United States,de,DE,en,US,3.0,1.0,,,,,0,0,0,,,0,0,0,3.891487,0.164682,4.007935,2,7.782974,,,,,,,,,,,1
1,HarvardX/PH525.1x/1T2018,3486642,True,True,False,False,False,109.246.19.122,GB,United Kingdom,Europe,Preston,LAN,Lancashire,PR1,Northern Europe,Developed regions,,,53.7361,-2.7195,m,1982.0,m,,0.7,2018-03-13 23:13:55,2018-03-13 23:13:54.877029,2018-03-13 23:16:11.870773,20,2,0,1.0,,,,,,,Student,0,0,0,audit,1,,,,,,,,gmail.com,English,United States,,,en,US,,,4.0,1.0,,,,,0,0,0,,,0,0,0,15.221527,21.948681,59.801161,18,273.987488,,,,,,,,,,,1
2,HarvardX/PH525.1x/1T2018,5142536,True,False,,False,False,46.99.60.25,AL,Albania,Europe,,,,,Southern Europe,Developed regions,,,41.0,20.0,b,1992.0,m,,0.7,2018-03-24 08:48:09,2018-03-24 08:48:09.319671,2018-03-24 08:52:38.297648,8,2,0,,,,,,,,Student,0,0,0,audit,1,,,,,,XK,,gmail.com,English,United Kingdom,,,en,GB,,,2.0,1.0,,,,,0,0,0,,,0,0,0,89.659326,75.20413,139.776028,6,537.955954,,,,,,,,,,,1
3,HarvardX/PH525.1x/1T2018,7547010,True,True,False,False,False,187.114.109.178,BR,Brazil,Americas,Fortaleza,PI,Piaui,,South America,Developing_Nations,,Latin America and the Caribbean,-3.3167,-41.4167,,,,,0.7,2018-03-08 20:20:11,2018-03-08 00:00:00,2018-03-08 20:28:32.492233,24,2,2,1.0,,,,,,,Student,0,0,0,audit,1,,,,,,BR,,gmail.com,Portuguese,Brazil,English,United States,pt,BR,en,US,7.0,1.0,en,0.0,1.0,1.0,0,0,2,1.0,0.027027,0,0,0,9.783005,17.018062,48.571808,20,195.660102,,,,,,,,,,,1
4,HarvardX/PH525.1x/1T2018,7939044,True,False,,False,False,156.17.14.204,PL,Poland,Europe,Wroclaw,DS,Lower Silesian Voivodeship,,Eastern Europe,Developed regions,,,51.1,17.0333,,,m,,0.7,2018-01-30 20:31:52,2018-01-30 20:31:52.360470,2018-02-10 16:28:59.820000,57,2,6,,,,,,,,Student,0,0,0,audit,1,,,,,,PL,,gmail.com,,,,,,,,,,,,,,,0,0,6,5.0,0.135135,0,38,5,12.072759,24.105686,104.64,54,651.929,,,,,,,,,,,1
5,HarvardX/PH525.1x/1T2018,8926674,True,False,,False,False,189.40.79.25,BR,Brazil,Americas,Brasília,DF,Federal,,South America,Developing_Nations,,Latin America and the Caribbean,-15.7833,-47.9167,b,1991.0,m,,0.7,2018-03-20 21:55:47,2018-03-20 21:55:49.498569,2018-04-02 13:26:37.331467,4,4,0,,,,,,,,Student,0,0,0,audit,1,,,,,,BR,,hotmail.com,,,,,,,,,,,,,,,0,0,0,,,0,0,0,,,,0,,,,,,,,,,,,1
6,HarvardX/PH525.1x/1T2018,13754754,True,True,False,False,False,124.124.244.211,IN,India,Asia,Delhi,DL,National Capital Territory of Delhi,,Southern Asia,Developing_Nations,,,28.6667,77.2167,b,1991.0,f,,0.7,2018-05-09 07:46:21,2018-05-09 00:00:00,2018-05-29 10:17:00.405261,57,4,3,2.0,,,,,,,Student,0,0,0,audit,1,,,,,,IN,,metlife.com,English,United States,,,en,US,,,50.0,1.0,en,0.0,3.0,1.0,0,0,3,1.0,0.027027,0,0,3,30.96268,72.146906,236.391108,53,2050.7993,,,,,,,,,,,1
7,HarvardX/PH525.1x/1T2018,14499189,True,True,False,False,False,88.255.172.39,TR,Turkey,Asia,Istanbul,34,Istanbul,,Western Asia,Developing_Nations,,,41.0186,28.9647,p,1971.0,f,,0.7,2018-01-31 05:48:05,2018-01-31 05:48:05.212482,2018-02-08 13:27:53.297527,14,3,0,1.0,,,,,,,Student,0,0,0,audit,1,,,,,,TR,,gmail.com,Turkish,Turkey,English,United States,tr,TR,en,US,7.0,1.0,en,0.0,1.0,1.0,0,0,0,,,0,0,0,10.406883,21.605931,68.644435,10,131.572753,,,,,,,,,,,1
8,HarvardX/PH525.1x/1T2018,17430364,True,True,False,False,False,14.23.165.230,CN,China,Asia,Guangzhou,44,Guangdong,,Eastern Asia,Developing_Nations,,,23.1167,113.25,,,,,0.7,2018-03-19 14:26:40,2018-03-19 14:26:39.869650,2018-06-06 16:00:43.555222,102,9,9,2.0,,,,,,,Student,0,0,0,audit,1,,,,,,CN,,gmail.com,Chinese,China,,,zh,CN,,,68.0,1.0,en,0.0,7.0,1.0,0,0,9,1.0,0.027027,3,6,9,17.302403,43.226622,190.041146,90,2018.29208,,,,,,,,,,,1
9,HarvardX/PH525.1x/1T2018,18176841,True,True,False,False,False,128.179.139.229,CH,Switzerland,Europe,Lausanne,VD,Vaud,1006,Western Europe,Developed regions,,,46.5112,6.6371,,,,,0.7,2018-04-13 12:29:30,2018-04-13 12:29:29.761094,2018-04-13 12:33:59.392435,20,2,0,1.0,,,,,,,Student,0,0,0,audit,0,,,,,,CH,,epfl.ch,French,France,English,United States,fr,FR,en,US,20.0,1.0,en,0.0,1.0,1.0,0,0,0,,,0,0,0,29.959038,63.4408,194.967446,18,539.262682,,,,,,,,,,,1


In [5]:
# Same sampling on the beta-value file; the returned index list is the cell output and is not stored.
select_random_rows('beta_post_Funnorm_PPMI_EPICn524final030618.csv', 'test_subset.csv', 10)

A file named test_subset.csv has been created with 10 rows.


[271592, 495174, 542673, 709310, 275584, 646188, 66543, 239268, 236789, 479490]

In [6]:
# NOTE(review): rebinds `df`, which another cell uses for test_sample_10.csv.
df = pd.read_csv('test_subset.csv')

In [7]:
# Display the 10-row subset of the beta-value file.
df

Unnamed: 0,200973410159_R03C01,200991620021_R01C01,200991620021_R03C01,200989060105_R03C01,200989060135_R07C01,200989060162_R04C01,200973410167_R04C01,200973410143_R01C01,200973410143_R06C01,200973410167_R05C01,200973410167_R08C01,200989060001_R06C01,200989060130_R01C01,201004820204_R02C01,200973410121_R04C01,201004820204_R01C01,201004820204_R07C01,200989060051_R05C01,200973410159_R07C01,200989060143_R08C01,200989060061_R07C01,200973410144_R07C01,200989060002_R01C01,201004820064_R05C01,201004820067_R08C01,201050360014_R02C01,200989060162_R02C01,200989060162_R01C01,200973410159_R02C01,200991620021_R05C01,201050360065_R07C01,201050360065_R08C01,200989060105_R05C01,200989060135_R04C01,200989060135_R01C01,200989060135_R06C01,200989060152_R03C01,200989060152_R06C01,200989060140_R08C01,200989060018_R03C01,200989060088_R03C01,200989060130_R03C01,200989060140_R07C01,200989060104_R03C01,200989060149_R05C01,200989060076_R05C01,200989060076_R06C01,200989060019_R08C01,200989060051_R03C01,200989060063_R08C01,...,200991620029_R02C01,200989060128_R06C01,200991620011_R05C01,200989060063_R01C01,200973410144_R05C01,200989060051_R02C01,201050360013_R02C01,201004820182_R04C01,200989060059_R03C01,201004820182_R02C01,200989060002_R07C01,200989060002_R06C01,200989060059_R02C01,200989060002_R05C01,201050360013_R03C01,200989060002_R08C01,200989060002_R04C01,201004820064_R03C01,201004820064_R02C01,200989060016_R01C01,200989060155_R04C01,200989060016_R03C01,201004820067_R01C01,201050360080_R01C01,200989060015_R06C01,201004820067_R03C01,200989060015_R05C01,200989060155_R02C01,201004820067_R02C01,201004820064_R01C01,200989060016_R02C01,200989060155_R01C01,200989060155_R03C01,200989060111_R02C01,200989060089_R05C01,200989060089_R08C01,200973410143_R03C01,200989060089_R06C01,200973410143_R02C01,200989060089_R07C01,200989060089_R02C01,200989060089_R01C01,200989060089_R04C01,200973410143_R08C01,200973410143_R07C01,200989060089_R03C01,200989060150_R04C01,200989060150_R05C01,200989060150_R06C01,20099
1620049_R08C01
cg18960668,0.256975,0.277177,0.35753,0.367134,0.251264,0.284267,0.219275,0.459903,0.389783,0.253656,0.252398,0.352431,0.434733,0.294749,0.235902,0.253067,0.333933,0.252929,0.30501,0.278288,0.24678,0.281498,0.295087,0.138535,0.269945,0.394037,0.341489,0.32164,0.292208,0.298687,0.303668,0.341673,0.183512,0.194883,0.325746,0.303578,0.290345,0.378482,0.191072,0.44538,0.320847,0.240428,0.276578,0.226885,0.241421,0.319824,0.344236,0.394822,0.266479,0.187986,...,0.227245,0.328055,0.544253,0.341666,0.303988,0.364942,0.230998,0.299757,0.394859,0.272427,0.372679,0.30544,0.199017,0.321034,0.276072,0.335665,0.164864,0.33374,0.249588,0.277997,0.374598,0.362052,0.250194,0.296107,0.242079,0.263068,0.263829,0.295185,0.227499,0.29465,0.274623,0.42559,0.285756,0.293035,0.212176,0.19232,0.30286,0.203462,0.220526,0.237262,0.395729,0.311049,0.305205,0.349104,0.223146,0.342854,0.252918,0.329668,0.366928,0.132065
cg08276579,0.917048,0.932091,0.946874,0.935778,0.909927,0.924693,0.901925,0.921999,0.930833,0.90616,0.907885,0.931083,0.906888,0.919985,0.898346,0.910233,0.919028,0.922876,0.928737,0.928224,0.90908,0.926413,0.925341,0.92782,0.919599,0.942851,0.928895,0.899855,0.933629,0.919195,0.914107,0.931366,0.922984,0.918625,0.920117,0.912433,0.922123,0.927205,0.909225,0.910421,0.901358,0.919976,0.914881,0.938746,0.929763,0.850622,0.930372,0.926803,0.934228,0.925328,...,0.917755,0.933847,0.935803,0.911014,0.934507,0.909457,0.907676,0.912865,0.922605,0.925176,0.933357,0.914722,0.901166,0.942945,0.930564,0.925183,0.921706,0.920002,0.911658,0.920015,0.924458,0.924182,0.919936,0.921416,0.916589,0.931743,0.916437,0.919909,0.937091,0.905099,0.93224,0.914545,0.9304,0.935356,0.916832,0.917713,0.919173,0.911739,0.935597,0.908673,0.924914,0.920789,0.917459,0.916209,0.92283,0.919223,0.941675,0.921676,0.93247,0.90445
cg16451938,0.824158,0.825078,0.844017,0.860181,0.772778,0.843168,0.744988,0.766682,0.867499,0.768923,0.769303,0.882682,0.854419,0.86911,0.6593,0.86325,0.873713,0.879329,0.74086,0.858301,0.86464,0.829599,0.755926,0.793869,0.786152,0.869864,0.79227,0.687352,0.814421,0.879943,0.859232,0.837791,0.857852,0.838723,0.794744,0.812206,0.84366,0.824347,0.744665,0.869098,0.759367,0.865463,0.839376,0.852593,0.864477,0.852449,0.82624,0.796121,0.871475,0.812554,...,0.853972,0.866219,0.848272,0.859662,0.894095,0.890692,0.811104,0.861463,0.813719,0.879346,0.827088,0.813546,0.844121,0.832741,0.841852,0.825378,0.789433,0.826265,0.791708,0.830953,0.833859,0.810609,0.844257,0.88013,0.824703,0.832955,0.866813,0.844172,0.881417,0.81575,0.852035,0.804627,0.847669,0.833193,0.763412,0.820362,0.743927,0.817059,0.817595,0.856446,0.796688,0.813422,0.851047,0.785096,0.799164,0.871334,0.844973,0.852625,0.813722,0.83946
cg18732713,0.370261,0.372602,0.366068,0.374701,0.325756,0.368244,0.325568,0.324586,0.497594,0.329173,0.315361,0.372661,0.336496,0.342554,0.366421,0.37046,0.346015,0.392462,0.312042,0.331466,0.385344,0.356714,0.37181,0.339759,0.332552,0.374207,0.339879,0.323354,0.363893,0.353373,0.330421,0.366811,0.37549,0.338081,0.422694,0.337283,0.365272,0.391834,0.323054,0.366123,0.362112,0.345785,0.382889,0.390674,0.392255,0.343747,0.352538,0.341169,0.396176,0.357272,...,0.373322,0.376145,0.400539,0.378252,0.354711,0.34402,0.412506,0.348947,0.37897,0.35789,0.375036,0.33352,0.404012,0.363331,0.367471,0.309576,0.365314,0.319464,0.341404,0.363753,0.389981,0.345063,0.384831,0.365735,0.405841,0.33923,0.311535,0.363764,0.331792,0.360971,0.376939,0.470141,0.316704,0.359775,0.306314,0.335784,0.369048,0.315856,0.395908,0.335852,0.342946,0.349053,0.344732,0.308025,0.340391,0.325218,0.360706,0.373311,0.361985,0.424937
cg19125992,0.942156,0.906924,0.901853,0.909107,0.895392,0.909833,0.917347,0.911649,0.909696,0.913529,0.908927,0.932533,0.913139,0.921911,0.875666,0.902626,0.92733,0.910488,0.906164,0.926327,0.930088,0.935409,0.920489,0.923896,0.889812,0.932977,0.924132,0.913332,0.930868,0.909135,0.925186,0.934081,0.903172,0.896208,0.920851,0.909986,0.878773,0.941103,0.927014,0.91041,0.910125,0.940971,0.924246,0.907296,0.920134,0.910225,0.904142,0.930029,0.916259,0.912904,...,0.923302,0.93786,0.935646,0.90929,0.937354,0.926656,0.933931,0.925579,0.924997,0.893877,0.916712,0.941432,0.519249,0.930561,0.927937,0.913766,0.890234,0.917715,0.907519,0.545162,0.90552,0.911657,0.902333,0.911597,0.924181,0.912701,0.918379,0.920699,0.939166,0.913932,0.894188,0.923503,0.913449,0.921836,0.912405,0.917185,0.924086,0.931156,0.94123,0.942037,0.930324,0.934094,0.945962,0.914928,0.935997,0.927292,0.919837,0.931478,0.896949,0.924712
cg01613414,0.820081,0.781646,0.799927,0.77125,0.80811,0.817099,0.730764,0.800454,0.787824,0.765905,0.802552,0.836259,0.882079,0.820827,0.857499,0.753766,0.839529,0.788522,0.836626,0.836326,0.851233,0.84501,0.870732,0.760378,0.797337,0.807317,0.746872,0.7469,0.853495,0.715503,0.673203,0.846529,0.864476,0.777603,0.81544,0.757649,0.68981,0.736872,0.806597,0.745207,0.728881,0.851294,0.825734,0.859939,0.835767,0.797297,0.785037,0.814392,0.810297,0.837966,...,0.848369,0.81398,0.895919,0.854267,0.849776,0.803898,0.807639,0.791204,0.774993,0.814889,0.868045,0.860788,0.794008,0.814642,0.8506,0.881612,0.846885,0.840053,0.813854,0.841011,0.82941,0.824253,0.798534,0.744514,0.781248,0.801545,0.83457,0.816964,0.779968,0.810158,0.760449,0.79441,0.78403,0.802639,0.74177,0.835907,0.811765,0.806645,0.822815,0.857698,0.806517,0.750211,0.747549,0.829358,0.779118,0.77098,0.803469,0.851511,0.814526,0.854951
cg25579969,0.910342,0.903379,0.911472,0.866271,0.892252,0.890847,0.834386,0.901089,0.919612,0.867267,0.88377,0.929256,0.90483,0.885325,0.894512,0.909533,0.932048,0.929113,0.904045,0.903861,0.934836,0.881522,0.908997,0.900598,0.915869,0.925815,0.837731,0.918465,0.920265,0.887927,0.879953,0.895989,0.926119,0.91455,0.907521,0.895898,0.90434,0.89781,0.907061,0.853297,0.864707,0.924362,0.922141,0.919272,0.914586,0.931386,0.915253,0.921356,0.917198,0.867231,...,0.912453,0.892346,0.924202,0.899501,0.932989,0.909127,0.921704,0.895858,0.907923,0.903523,0.923881,0.938136,0.933871,0.920124,0.849956,0.908574,0.918591,0.917678,0.912616,0.894585,0.919774,0.90055,0.911576,0.891951,0.890605,0.89727,0.908447,0.908404,0.901829,0.904758,0.843322,0.906844,0.897808,0.928688,0.889094,0.921685,0.910296,0.913423,0.915361,0.889815,0.919183,0.911619,0.916178,0.917283,0.92062,0.919666,0.914754,0.916549,0.906335,0.933476
cg26944011,0.02258,0.020582,0.015355,0.01529,0.01811,0.012918,0.028174,0.01655,0.016285,0.018063,0.023859,0.017,0.02355,0.016766,0.015548,0.018543,0.016516,0.014628,0.014604,0.014324,0.017475,0.015438,0.018292,0.015445,0.014848,0.018051,0.014737,0.015252,0.020719,0.01503,0.01736,0.018233,0.021703,0.016201,0.015906,0.016783,0.016901,0.017853,0.02329,0.023146,0.019743,0.015869,0.018997,0.016219,0.012732,0.014102,0.013874,0.014627,0.016035,0.020368,...,0.016531,0.015657,0.014305,0.016657,0.018946,0.014062,0.013657,0.017804,0.013034,0.016156,0.013386,0.013151,0.019069,0.014201,0.015447,0.013333,0.014802,0.014549,0.014118,0.017482,0.016743,0.012862,0.014733,0.015997,0.01619,0.014315,0.014769,0.022064,0.015009,0.017409,0.01551,0.017265,0.016037,0.01587,0.013355,0.017803,0.020255,0.013589,0.014384,0.016606,0.015397,0.015018,0.012934,0.017196,0.014662,0.018811,0.013355,0.014412,0.016296,0.018505
cg27539852,0.67029,0.586824,0.588272,0.581855,0.545991,0.547786,0.562232,0.463629,0.581356,0.520879,0.574631,0.712815,0.59358,0.625242,0.580561,0.586202,0.670337,0.566834,0.570992,0.572692,0.608896,0.581311,0.592687,0.543066,0.603604,0.598684,0.655984,0.560537,0.620965,0.568307,0.582212,0.646963,0.61749,0.557901,0.649937,0.543164,0.546972,0.598025,0.478732,0.579463,0.51115,0.620933,0.674963,0.627085,0.595182,0.566039,0.54953,0.685963,0.606891,0.564721,...,0.607586,0.663114,0.677242,0.589014,0.611951,0.625557,0.591022,0.560843,0.582605,0.564523,0.626868,0.562503,0.492824,0.624898,0.642641,0.592194,0.633133,0.58851,0.568243,0.590548,0.637021,0.595179,0.62995,0.592914,0.543564,0.613443,0.574237,0.645094,0.489905,0.602395,0.603666,0.675024,0.617386,0.590052,0.582616,0.588763,0.600753,0.590869,0.613613,0.594793,0.534048,0.540621,0.636297,0.612931,0.600083,0.550631,0.682466,0.60773,0.631579,0.468912
cg07741793,0.02189,0.017741,0.023963,0.027288,0.018343,0.033426,0.017127,0.02012,0.019409,0.023237,0.015539,0.018108,0.020676,0.016761,0.017196,0.024817,0.02177,0.022674,0.023851,0.02947,0.01916,0.024969,0.020175,0.025869,0.020405,0.024555,0.02677,0.026236,0.022173,0.033123,0.023956,0.024203,0.026657,0.021347,0.02522,0.024086,0.022674,0.031793,0.029542,0.064887,0.024738,0.017396,0.022337,0.021253,0.018425,0.022617,0.017482,0.025421,0.017266,0.022971,...,0.015684,0.026027,0.019498,0.029495,0.019803,0.021546,0.034171,0.022807,0.025056,0.019356,0.016718,0.016184,0.019478,0.015729,0.026529,0.020057,0.01396,0.019134,0.023196,0.027758,0.021379,0.022713,0.021557,0.052614,0.022683,0.021659,0.019995,0.018695,0.027353,0.025584,0.025852,0.021043,0.018576,0.022852,0.021524,0.015868,0.021777,0.015962,0.013882,0.018475,0.017647,0.015155,0.019644,0.01781,0.015628,0.018968,0.023713,0.020342,0.017195,0.025952


In [8]:
# Count the data rows (header excluded) of the full beta-value file.
L = find_csv_length('beta_post_Funnorm_PPMI_EPICn524final030618.csv')
L

864067

In [20]:
def select_rows_in(file_to_read, file_to_write, rows):
    '''
    Takes an input csv file and writes a smaller csv file containing the header
    plus every row whose first field is one of the keys in rows. Rows are
    written in input-file order; a key that occurs on several rows keeps all
    of them.

    params:
        file_to_read (string) (file.csv) path to some existing csv file to read
        file_to_write (string) (file.csv) path to csv file to write as output
        rows (iterable) keys to keep; each key is compared, as a string, with
            the first field of every row. A single string is treated as one
            key.

    returns:
        count (int) number of data rows written to the new file
    '''
    # A bare string would otherwise be iterated character by character.
    if isinstance(rows, str):
        rows = [rows]

    # csv fields are always strings, so normalise the keys to str. A set
    # gives O(1) lookups per input row instead of a scan of the whole list.
    wanted = {str(key) for key in rows}

    count = 0
    # newline='' on both files: the csv module handles line endings itself
    # (otherwise the writer emits blank rows on Windows).
    with open(file_to_read, 'r', newline='') as file_in, \
            open(file_to_write, 'w', newline='') as file_out:

        csv_in = csv.reader(file_in)
        csv_out = csv.writer(file_out)

        header = next(csv_in, None)
        if header is not None:
            csv_out.writerow(header)

        for line in csv_in:
            # csv.reader yields [] for a blank line; skip it rather than
            # fail on line[0].
            if line and line[0] in wanted:
                csv_out.writerow(line)
                count += 1

    print(f'A file named {file_to_write} has been created with {count} rows.')

    return count
          

In [8]:
# Load the small sample file and keep its course_id column in `names`.
df_test = pd.read_csv('test_sample.csv')
names = df_test.course_id

In [15]:
# Display the sample frame.
df_test

Unnamed: 0,course_id,user_id,registered,viewed,explored,certified,completed,ip,cc_by_ip,countryLabel,continent,city,region,subdivision,postalCode,un_major_region,un_economic_group,un_developing_nation,un_special_region,latitude,longitude,LoE,YoB,gender,grade,passing_grade,start_time,first_event,last_event,nevents,ndays_act,nplay_video,nchapters,nforum_posts,nforum_votes,nforum_endorsed,nforum_threads,nforum_comments,nforum_pinned,roles,nprogcheck,nproblem_check,nforum_events,mode,is_active,cert_created_date,cert_modified_date,cert_status,verified_enroll_time,verified_unenroll_time,profile_country,y1_anomalous,email_domain,language_brwsr,language_brwsr_country,language_brwsr_sec,language_brwsr_sec_country,language_brwsr_code,language_brwsr_subcode,language_brwsr_sec_code,language_brwsr_sec_subcode,language_brwsr_nevents,language_brwsr_ndiff,language,language_download,language_nevents,language_ndiff,ntranscript,nshow_answer,nvideo,nvideos_unique_viewed,nvideos_total_watched,nseq_goto,nseek_video,npause_video,avg_dt,sdv_dt,max_dt,n_dt,sum_dt,roles_isBetaTester,roles_isInstructor,roles_isStaff,roles_isCCX,roles_isFinance,roles_isLibrary,roles_isSales,forumRoles_isAdmin,forumRoles_isCommunityTA,forumRoles_isModerator,forumRoles_isStudent
0,HarvardX/PH525.1x/1T2018,49605,True,True,True,False,False,50.232.62.163,US,United States,Americas,Temperance,MI,Michigan,48182,Northern America,Developed regions,,,41.7940,-83.5879,b,,m,,0.7,2018-01-26 17:36:56,2018-01-26 17:36:56.323525,2018-06-01 02:16:01.923220,1858.0,95.0,119.0,4.0,,,,,,,Student,0.0,192.0,0.0,verified,1,,,,2018-02-20 00:12:25.437347,,US,,gmail.com,English,United States,,,en,US,,,950.0,1.0,en,4.0,153.0,1.0,1.0,19.0,119.0,16.0,0.432432,195.0,59.0,88.0,8.646717,42.820852,286.956932,1572.0,26288.841328,,,,,,,,,,,1.0
1,HarvardX/PH525.1x/1T2018,58453,True,True,False,False,False,181.113.152.43,EC,Ecuador,Americas,Guayaquil,G,Provincia del Guayas,,South America,Developing_Nations,,Latin America and the Caribbean,-2.1667,-79.9000,a,1980.0,m,,0.7,2018-01-03 15:42:35,2018-01-03 15:42:35.381842,2018-03-15 16:08:38.344821,119.0,7.0,11.0,2.0,,,,,,,Student,0.0,12.0,0.0,audit,1,,,,,,EC,,gmail.com,Spanish; Castilian,Mexico,Spanish; Castilian,,es,MX,es,,49.0,1.0,en,0.0,4.0,1.0,0.0,0.0,11.0,2.0,0.054054,0.0,2.0,11.0,22.991269,57.936367,283.841825,100.0,2861.397814,,,,,,,,,,,1.0
2,HarvardX/PH525.1x/1T2018,70351,True,False,,False,False,213.74.81.45,TR,Turkey,Asia,Antalya,07,Antalya,,Western Asia,Developing_Nations,,,36.9081,30.6956,,,,,0.7,2018-05-01 00:07:38,2018-05-01 00:07:38.150497,2018-05-01 00:34:09.598821,20.0,4.0,0.0,,,,,,,,Student,0.0,0.0,0.0,audit,0,,,,,,,,gmail.com,Turkish,Turkey,English,United States,tr,TR,en,US,10.0,1.0,,,,,0.0,0.0,0.0,,,0.0,0.0,0.0,26.583604,38.480580,70.941777,12.0,319.003248,,,,,,,,,,,1.0
3,HarvardX/PH525.1x/1T2018,70954,True,True,False,False,False,69.73.78.100,US,United States,Americas,Palm Harbor,FL,Florida,34683,Northern America,Developed regions,,,28.0859,-82.7625,,,,,0.7,2018-03-08 04:32:17,2018-03-08 04:32:17.267452,2018-03-16 22:41:28.448171,20.0,4.0,0.0,1.0,,,,,,,Student,0.0,0.0,0.0,audit,1,,,,,,,,gmail.com,English,United States,,,en,US,,,3.0,1.0,,,,,0.0,0.0,0.0,,,0.0,0.0,0.0,1.323438,1.049496,3.051486,12.0,12.765054,,,,,,,,,,,1.0
4,HarvardX/PH525.1x/1T2018,203176,True,True,False,False,False,189.102.101.16,BR,Brazil,Americas,São Paulo,SP,Sao Paulo,,South America,Developing_Nations,,Latin America and the Caribbean,-24.5157,-48.4219,b,1985.0,f,,0.7,2018-03-30 01:35:03,2018-03-30 00:00:00,2018-04-03 14:12:05.498351,180.0,6.0,24.0,2.0,,,,,,,Student,0.0,4.0,0.0,audit,1,,,,,,,,gmail.com,English,United States,,,en,US,,,73.0,1.0,en,0.0,10.0,1.0,0.0,0.0,24.0,2.0,0.054054,8.0,16.0,24.0,31.097345,44.176848,243.795929,162.0,4585.006562,,,,,,,,,,,1.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
195,HarvardX/PH525.1x/1T2018,19405699,True,True,False,False,False,158.109.244.250,ES,Spain,Europe,Premiá De Mar,B,Barcelona,08330,Southern Europe,Developed regions,,,41.4921,2.3652,,,,,0.7,2018-05-30 14:20:08,2018-05-30 00:00:00,2018-06-08 13:34:35.708034,74.0,4.0,1.0,2.0,,,,,,,Student,0.0,6.0,0.0,audit,1,,,,,,ES,,gmail.com,Spanish; Castilian,,English,,es,419,en,,49.0,1.0,en,0.0,5.0,1.0,0.0,0.0,1.0,1.0,0.027027,1.0,0.0,1.0,23.132751,45.663992,269.146997,65.0,1262.338666,,,,,,,,,,,1.0
196,HarvardX/PH525.1x/1T2018,19419074,True,False,,False,False,115.154.235.36,CN,China,Asia,Tong,54,Tibet Autonomous Region,,Eastern Asia,Developing_Nations,,,29.5000,87.6000,b,1998.0,m,,0.7,2018-05-31 13:57:25,2018-05-31 13:57:25.382363,2018-05-31 13:58:24.265149,3.0,1.0,0.0,,,,,,,,Student,0.0,0.0,0.0,audit,1,,,,,,CN,,qq.com,Chinese,China,,,zh,CN,,,1.0,1.0,,,,,0.0,0.0,0.0,,,0.0,0.0,0.0,29.441393,36.039363,54.925071,2.0,58.882786,,,,,,,,,,,1.0
197,HarvardX/PH525.1x/1T2018,19445101,True,False,,False,False,184.187.147.53,US,United States,Americas,Lafayette,LA,Louisiana,70503,Northern America,Developed regions,,,30.1689,-92.0599,,,f,,0.7,2018-06-02 23:10:05,2018-06-02 23:10:04.629683,2018-06-10 03:49:21.362218,19.0,5.0,1.0,,,,,,,,Student,0.0,0.0,0.0,audit,1,,,,,,US,,gmail.com,English,United States,,,en,US,,,12.0,1.0,en,0.0,1.0,1.0,0.0,0.0,1.0,,,0.0,0.0,0.0,11.792554,26.124575,97.756919,14.0,163.339562,,,,,,,,,,,1.0
198,HarvardX/ER22.1x/1T2018,152554,True,False,,False,False,85.72.96.176,GR,Greece,Europe,Athens,I,Attica,,Southern Europe,Developed regions,,,37.9833,23.7333,,,,,0.6,2018-01-20 13:01:25,2018-01-20 13:01:25.178838,2018-01-20 13:01:38.072479,4.0,1.0,0.0,,,,,,,,Student,0.0,0.0,0.0,audit,1,,,,,,,,gmail.com,English,United States,,,en,US,,,1.0,1.0,,,,,0.0,0.0,0.0,,,0.0,0.0,0.0,4.297880,5.301080,10.297196,3.0,12.893641,,,,,,,,,,,1.0


In [17]:
# Look up the course_id stored under index label 199.
names[199]

'HarvardX/ER22.1x/1T2018'

In [18]:
# Key to match against the first csv column when this list is passed as `rows` to select_rows_in.
keep = ['HarvardX/ER22.1x/1T2018']

In [21]:
# Copy every row of test_sample.csv whose first field is in `keep` to test_sample_keep.csv.
select_rows_in('test_sample.csv',  'test_sample_keep.csv', rows=keep)

A file named test_sample_keep.csv has been created with 2 rows.


In [22]:
# Read the filtered file back in and display it.
df_keep = pd.read_csv('test_sample_keep.csv')
df_keep

Unnamed: 0,course_id,user_id,registered,viewed,explored,certified,completed,ip,cc_by_ip,countryLabel,continent,city,region,subdivision,postalCode,un_major_region,un_economic_group,un_developing_nation,un_special_region,latitude,longitude,LoE,YoB,gender,grade,passing_grade,start_time,first_event,last_event,nevents,ndays_act,nplay_video,nchapters,nforum_posts,nforum_votes,nforum_endorsed,nforum_threads,nforum_comments,nforum_pinned,roles,nprogcheck,nproblem_check,nforum_events,mode,is_active,cert_created_date,cert_modified_date,cert_status,verified_enroll_time,verified_unenroll_time,profile_country,y1_anomalous,email_domain,language_brwsr,language_brwsr_country,language_brwsr_sec,language_brwsr_sec_country,language_brwsr_code,language_brwsr_subcode,language_brwsr_sec_code,language_brwsr_sec_subcode,language_brwsr_nevents,language_brwsr_ndiff,language,language_download,language_nevents,language_ndiff,ntranscript,nshow_answer,nvideo,nvideos_unique_viewed,nvideos_total_watched,nseq_goto,nseek_video,npause_video,avg_dt,sdv_dt,max_dt,n_dt,sum_dt,roles_isBetaTester,roles_isInstructor,roles_isStaff,roles_isCCX,roles_isFinance,roles_isLibrary,roles_isSales,forumRoles_isAdmin,forumRoles_isCommunityTA,forumRoles_isModerator,forumRoles_isStudent
0,HarvardX/ER22.1x/1T2018,152554,True,False,,False,False,85.72.96.176,GR,Greece,Europe,Athens,I,Attica,,Southern Europe,Developed regions,,,37.9833,23.7333,,,,,0.6,2018-01-20 13:01:25,2018-01-20 13:01:25.178838,2018-01-20 13:01:38.072479,4,1,0,,,,,,,,Student,0,0,0,audit,1,,,,,,,,gmail.com,English,United States,,,en,US,,,1,1,,,,,0,0,0,,,0,0,0,4.29788,5.30108,10.297196,3,12.893641,,,,,,,,,,,1
1,HarvardX/ER22.1x/1T2018,157833,True,True,False,False,False,,,,,,,,,,,,,,,b,1979.0,m,,0.6,2018-02-04 18:32:13,2018-02-04 18:32:13.167948,2018-02-10 13:48:06.117000,260,5,0,1.0,,,,,,,Student,0,0,0,audit,1,,,,,,,,yahoo.es,Spanish; Castilian,Spain,English,,es,ES,en,,1,1,,,,,0,0,0,,,0,0,0,11.611371,41.550799,294.0,243,2977.188138,,,,,,,,,,,1


In [28]:
# Build the key list from the CpGMarker column of keycpgs.csv.
# NOTE(review): rebinds `keep`, which another cell sets to a course_id list.
df_353 = pd.read_csv('keycpgs.csv')
keep = list(df_353.CpGMarker)

In [29]:
# Show the key list.
keep

['cg00075967',
 'cg00374717',
 'cg00864867',
 'cg00945507',
 'cg01027739',
 'cg01353448',
 'cg01584473',
 'cg01644850',
 'cg01656216',
 'cg01873645',
 'cg01968178',
 'cg02085507',
 'cg02154074',
 'cg02217159',
 'cg02331561',
 'cg02332492',
 'cg02364642',
 'cg02388150',
 'cg02479575',
 'cg02489552',
 'cg02580606',
 'cg02654291',
 'cg02827112',
 'cg02972551',
 'cg03103192',
 'cg03167275',
 'cg03270204',
 'cg03565323',
 'cg03588357',
 'cg03760483',
 'cg04084157',
 'cg04126866',
 'cg04528819',
 'cg04836038',
 'cg05250458',
 'cg05294243',
 'cg05365729',
 'cg05675373',
 'cg05755779',
 'cg05921699',
 'cg05960024',
 'cg06121469',
 'cg06144905',
 'cg06361108',
 'cg06462291',
 'cg06493994',
 'cg06557358',
 'cg06738602',
 'cg06810647',
 'cg06952310',
 'cg06993413',
 'cg07285276',
 'cg07291563',
 'cg07337598',
 'cg07455279',
 'cg07595943',
 'cg08030082',
 'cg08090772',
 'cg08124722',
 'cg08251036',
 'cg08370996',
 'cg08413469',
 'cg08434234',
 'cg08771731',
 'cg08965235',
 'cg09019938',
 'cg091186

In [30]:
# Copy the rows of the beta-value file whose first field is in `keep` to beta_post_kept.csv.
select_rows_in('beta_post_Funnorm_PPMI_EPICn524final030618.csv',  'beta_post_kept.csv', rows=keep)

A file named beta_post_kept.csv has been created with 335 rows.


In [32]:
# Read the filtered beta-value file back in.
df_beta_keep = pd.read_csv('beta_post_kept.csv')

In [33]:
# Display the filtered beta-value frame.
df_beta_keep

Unnamed: 0,200973410159_R03C01,200991620021_R01C01,200991620021_R03C01,200989060105_R03C01,200989060135_R07C01,200989060162_R04C01,200973410167_R04C01,200973410143_R01C01,200973410143_R06C01,200973410167_R05C01,200973410167_R08C01,200989060001_R06C01,200989060130_R01C01,201004820204_R02C01,200973410121_R04C01,201004820204_R01C01,201004820204_R07C01,200989060051_R05C01,200973410159_R07C01,200989060143_R08C01,200989060061_R07C01,200973410144_R07C01,200989060002_R01C01,201004820064_R05C01,201004820067_R08C01,201050360014_R02C01,200989060162_R02C01,200989060162_R01C01,200973410159_R02C01,200991620021_R05C01,201050360065_R07C01,201050360065_R08C01,200989060105_R05C01,200989060135_R04C01,200989060135_R01C01,200989060135_R06C01,200989060152_R03C01,200989060152_R06C01,200989060140_R08C01,200989060018_R03C01,200989060088_R03C01,200989060130_R03C01,200989060140_R07C01,200989060104_R03C01,200989060149_R05C01,200989060076_R05C01,200989060076_R06C01,200989060019_R08C01,200989060051_R03C01,200989060063_R08C01,...,200991620029_R02C01,200989060128_R06C01,200991620011_R05C01,200989060063_R01C01,200973410144_R05C01,200989060051_R02C01,201050360013_R02C01,201004820182_R04C01,200989060059_R03C01,201004820182_R02C01,200989060002_R07C01,200989060002_R06C01,200989060059_R02C01,200989060002_R05C01,201050360013_R03C01,200989060002_R08C01,200989060002_R04C01,201004820064_R03C01,201004820064_R02C01,200989060016_R01C01,200989060155_R04C01,200989060016_R03C01,201004820067_R01C01,201050360080_R01C01,200989060015_R06C01,201004820067_R03C01,200989060015_R05C01,200989060155_R02C01,201004820067_R02C01,201004820064_R01C01,200989060016_R02C01,200989060155_R01C01,200989060155_R03C01,200989060111_R02C01,200989060089_R05C01,200989060089_R08C01,200973410143_R03C01,200989060089_R06C01,200973410143_R02C01,200989060089_R07C01,200989060089_R02C01,200989060089_R01C01,200989060089_R04C01,200973410143_R08C01,200973410143_R07C01,200989060089_R03C01,200989060150_R04C01,200989060150_R05C01,200989060150_R06C01,20099
1620049_R08C01
cg13319175,0.916345,0.876005,0.881291,0.899211,0.867874,0.897708,0.871227,0.865747,0.869889,0.857018,0.892127,0.927430,0.898095,0.901209,0.878139,0.897519,0.919912,0.909166,0.897363,0.899597,0.913324,0.906904,0.898545,0.861094,0.902422,0.921204,0.899402,0.874042,0.936332,0.875255,0.876821,0.931561,0.883577,0.896184,0.878123,0.875765,0.880811,0.889130,0.882632,0.858117,0.862757,0.886989,0.902004,0.880851,0.926401,0.900353,0.914724,0.907060,0.905040,0.884370,...,0.920556,0.875876,0.915823,0.876539,0.914493,0.894515,0.898725,0.890642,0.875103,0.904435,0.893954,0.913948,0.886439,0.876601,0.852615,0.895850,0.895640,0.885598,0.890469,0.891203,0.910783,0.911835,0.849204,0.868406,0.886590,0.862745,0.897424,0.890681,0.883839,0.890066,0.893017,0.886585,0.896447,0.908400,0.896727,0.889071,0.895682,0.919407,0.892414,0.890483,0.903454,0.874479,0.886547,0.903353,0.874404,0.901497,0.901106,0.904594,0.906945,0.900819
cg21211748,0.047419,0.030216,0.076499,0.034195,0.041080,0.039377,0.064212,0.030131,0.027508,0.075733,0.061607,0.042668,0.038038,0.045508,0.039002,0.045152,0.037788,0.029904,0.055917,0.032440,0.049021,0.040951,0.041700,0.040622,0.032647,0.028520,0.044752,0.076612,0.044435,0.042660,0.045388,0.033342,0.048191,0.045820,0.041412,0.034575,0.066650,0.034762,0.069202,0.057960,0.054692,0.030165,0.068611,0.022271,0.040550,0.032001,0.032455,0.044891,0.044013,0.069246,...,0.034591,0.034910,0.030977,0.046048,0.032656,0.041572,0.036654,0.038555,0.034846,0.045215,0.050157,0.038743,0.027520,0.034853,0.102066,0.028284,0.032630,0.040133,0.056641,0.056894,0.043156,0.052440,0.035643,0.051339,0.040201,0.035783,0.038368,0.042958,0.037987,0.040536,0.044133,0.033566,0.046383,0.048084,0.030749,0.028954,0.027162,0.024336,0.024664,0.029273,0.042628,0.026849,0.032234,0.027519,0.032025,0.034256,0.031233,0.034991,0.039544,0.045187
cg19420968,0.935816,0.882283,0.937541,0.899474,0.889517,0.941420,0.925693,0.906165,0.918314,0.931796,0.934539,0.931074,0.930660,0.930587,0.921493,0.916475,0.907264,0.923141,0.922356,0.918700,0.922848,0.924055,0.921169,0.891853,0.904941,0.947824,0.931094,0.930029,0.951262,0.902234,0.889663,0.945333,0.929708,0.891502,0.875043,0.914225,0.948413,0.919984,0.934099,0.839931,0.910730,0.944695,0.942856,0.941273,0.921449,0.939859,0.904658,0.918985,0.933108,0.911612,...,0.917614,0.925623,0.939414,0.930139,0.933994,0.928292,0.920399,0.904126,0.923681,0.916562,0.937830,0.938737,0.949337,0.915748,0.938315,0.931722,0.942630,0.899282,0.908845,0.908341,0.923580,0.932190,0.823493,0.930873,0.921128,0.927002,0.929968,0.922248,0.906646,0.902595,0.894574,0.883304,0.908161,0.926374,0.908853,0.940152,0.932815,0.933807,0.925806,0.947019,0.916057,0.923495,0.926400,0.913651,0.918014,0.930116,0.924397,0.943358,0.940351,0.917752
cg14992253,0.113106,0.220858,0.160648,0.128289,0.126839,0.183459,0.150445,0.111694,0.118929,0.150319,0.156461,0.118659,0.125346,0.144135,0.116116,0.132270,0.098547,0.161780,0.166939,0.143203,0.152033,0.113414,0.119850,0.154022,0.161299,0.159121,0.270407,0.164418,0.167658,0.192471,0.225667,0.125642,0.111332,0.103792,0.138385,0.127778,0.319838,0.299768,0.100364,0.208824,0.163354,0.101373,0.168132,0.122001,0.144978,0.119378,0.137831,0.133496,0.173509,0.150132,...,0.127445,0.136089,0.160049,0.163845,0.117725,0.135493,0.198408,0.138479,0.150312,0.122839,0.107963,0.129341,0.092611,0.104589,0.114758,0.136132,0.072262,0.137010,0.117421,0.147897,0.080690,0.162826,0.134996,0.281434,0.134502,0.131412,0.114952,0.147279,0.119274,0.123644,0.171979,0.065506,0.163898,0.144405,0.141162,0.099437,0.133085,0.098226,0.085858,0.095625,0.130786,0.113597,0.147672,0.074254,0.119721,0.158719,0.107109,0.108319,0.155217,0.103635
cg26372517,0.412038,0.311121,0.313840,0.341520,0.399415,0.330026,0.398900,0.422172,0.365501,0.222714,0.272880,0.288781,0.353669,0.445083,0.275665,0.319735,0.294355,0.362118,0.321096,0.323320,0.324136,0.235142,0.387763,0.224873,0.254749,0.337570,0.470419,0.414921,0.441531,0.318563,0.376382,0.337760,0.193545,0.201479,0.250123,0.296171,0.540038,0.446971,0.211144,0.385929,0.324609,0.247135,0.437256,0.271226,0.463403,0.301198,0.374377,0.232330,0.377852,0.452804,...,0.386909,0.245356,0.269991,0.326956,0.309796,0.358394,0.303241,0.312452,0.232956,0.207225,0.315192,0.265754,0.348933,0.258418,0.289011,0.332591,0.392771,0.317997,0.206850,0.324121,0.312818,0.254848,0.269391,0.368929,0.333468,0.311867,0.304701,0.301322,0.253058,0.334909,0.435284,0.186879,0.470016,0.395888,0.280699,0.249270,0.220112,0.343489,0.334678,0.376989,0.290872,0.368072,0.310332,0.172419,0.257962,0.312521,0.348701,0.256887,0.175009,0.161334
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
cg11932564,0.020158,0.023174,0.017405,0.016433,0.014904,0.019076,0.019297,0.015787,0.030293,0.020950,0.019273,0.015444,0.017906,0.018769,0.017828,0.017002,0.017502,0.015665,0.017320,0.012204,0.016333,0.013246,0.016368,0.018062,0.015716,0.013472,0.015942,0.015282,0.016723,0.016270,0.018650,0.020333,0.013984,0.013190,0.017736,0.015477,0.016649,0.016682,0.024782,0.027172,0.019482,0.017286,0.018462,0.016535,0.014618,0.013083,0.013502,0.021184,0.016546,0.019383,...,0.013786,0.019093,0.015200,0.019398,0.012493,0.016236,0.017738,0.013040,0.014257,0.013643,0.014224,0.012704,0.014950,0.013815,0.011800,0.014371,0.012879,0.013960,0.013829,0.015019,0.016842,0.016805,0.018617,0.022275,0.014303,0.016017,0.012799,0.019101,0.014739,0.015463,0.016396,0.014849,0.017109,0.015217,0.015816,0.017031,0.017601,0.015031,0.015472,0.015775,0.014947,0.018116,0.016419,0.013387,0.016238,0.027973,0.016935,0.014461,0.018425,0.017338
cg26453588,0.524586,0.498783,0.544513,0.476794,0.446309,0.453400,0.562225,0.428903,0.554503,0.495106,0.482119,0.538680,0.532973,0.562343,0.515401,0.531157,0.542460,0.467905,0.526458,0.429302,0.507425,0.486692,0.471455,0.444624,0.557265,0.611528,0.645554,0.433972,0.505977,0.540428,0.558596,0.546744,0.571587,0.492550,0.509657,0.570132,0.590317,0.555349,0.418218,0.538689,0.484731,0.469568,0.471765,0.551559,0.544250,0.475052,0.538024,0.459502,0.529372,0.454250,...,0.525862,0.482137,0.546774,0.494551,0.562117,0.473997,0.481989,0.486641,0.486611,0.482645,0.484040,0.515651,0.501674,0.452415,0.588210,0.440306,0.463709,0.433048,0.500910,0.577659,0.535054,0.523870,0.602011,0.533073,0.566427,0.512239,0.478257,0.487700,0.439007,0.451047,0.554606,0.316252,0.484776,0.488698,0.557134,0.457409,0.529737,0.497830,0.510540,0.553170,0.460952,0.550750,0.560237,0.476549,0.490693,0.670780,0.446466,0.558492,0.543867,0.389627
cg26394940,0.041061,0.127253,0.097200,0.190352,0.063016,0.110756,0.072319,0.073846,0.140488,0.067683,0.088953,0.124914,0.034840,0.081097,0.018473,0.097369,0.046601,0.130190,0.038882,0.064215,0.084891,0.047237,0.054772,0.035593,0.037484,0.074996,0.089179,0.051416,0.084300,0.201744,0.062412,0.101049,0.050877,0.084571,0.034747,0.105991,0.090762,0.046095,0.080043,0.147209,0.126841,0.026583,0.115295,0.018769,0.055626,0.066939,0.085516,0.069818,0.129040,0.061889,...,0.062541,0.094435,0.021426,0.081869,0.061575,0.142160,0.042970,0.050425,0.102778,0.060405,0.036848,0.042067,0.059875,0.066523,0.047604,0.054219,0.045345,0.040006,0.049527,0.025835,0.083914,0.080608,0.079077,0.184023,0.073556,0.043785,0.041944,0.098253,0.062309,0.058219,0.178361,0.026611,0.077470,0.042071,0.040488,0.030404,0.024811,0.035947,0.038628,0.043991,0.069933,0.082184,0.211747,0.065737,0.155777,0.084738,0.035516,0.051450,0.112723,0.038591
cg13269407,0.066466,0.147126,0.142710,0.239307,0.105967,0.152722,0.090906,0.092356,0.163214,0.095290,0.121744,0.137083,0.070855,0.124598,0.040288,0.143673,0.068133,0.187694,0.053848,0.140641,0.119108,0.085627,0.075509,0.070858,0.085957,0.085526,0.138121,0.104084,0.106275,0.194135,0.101069,0.122398,0.104917,0.169435,0.068124,0.129566,0.113337,0.067098,0.155457,0.155105,0.174008,0.069346,0.165375,0.060664,0.089428,0.093921,0.079257,0.103750,0.172024,0.091322,...,0.084487,0.153321,0.052074,0.083524,0.091345,0.168825,0.091945,0.079378,0.138403,0.103800,0.077265,0.074950,0.118042,0.125098,0.086352,0.047383,0.081237,0.063279,0.068529,0.043837,0.144385,0.107634,0.123209,0.203998,0.088172,0.084785,0.079614,0.100506,0.100228,0.096888,0.180998,0.066029,0.086344,0.070610,0.050918,0.053722,0.056842,0.056503,0.060835,0.044348,0.103203,0.128064,0.223256,0.088225,0.228685,0.133757,0.065732,0.100730,0.109772,0.060828
