In [1]:
# Dependency bootstrap: make sure every third-party package used by this
# notebook is importable, installing it into the kernel's environment if not.
import importlib
import importlib.util
import pprint  # standard library, so it never needs an install fallback
import re
import subprocess
import sys


def pip(args):
    """Run ``python -m pip <args>`` with the interpreter backing this kernel.

    Stands in for ``pip._internal.main``: pip does not offer a supported
    in-process Python API, and its documentation recommends invoking it as a
    subprocess of ``sys.executable`` instead.

    Parameters
    ----------
    args : list of str
        Command-line arguments for pip, e.g. ``['install', 'requests']``.

    Returns
    -------
    int
        Exit status of the pip process (0 on success).
    """
    return subprocess.call([sys.executable, '-m', 'pip', *args])


def _ensure_installed(module_name, package_name=None):
    """Install ``package_name`` (default: ``module_name``) if the module is missing."""
    if importlib.util.find_spec(module_name) is None:
        pip(['install', package_name or module_name])
        # Packages installed while the interpreter is running are only picked
        # up reliably after the import system's finder caches are cleared.
        importlib.invalidate_caches()


for _module in ('requests', 'pandas', 'simplejson'):
    _ensure_installed(_module)

import requests
import pandas as pd
import simplejson as json  # NOTE: the name `json` refers to simplejson in this notebook

# Notebook-wide pandas display settings: show complete cell contents and
# (practically) all rows and columns of the frames rendered below.
# `None` means "no column-width limit". The former spelling `-1` has been
# deprecated since pandas 1.0 and is rejected with a ValueError by current
# releases (the option must be a non-negative integer or None).
pd.set_option('display.max_colwidth', None)
pd.set_option('display.max_rows', 99999)
pd.set_option('display.max_columns', 99999)

## Select EdelweissData server and authenticate

In [2]:
# Import the EdelweissData client, installing it on first use.
try:
    from edelweiss_data import API, QueryExpression as Q
except ImportError:
    # Retrying the import without installing anything can never succeed, so
    # install the package first (same pattern as the other dependencies).
    # `pip` is the installer callable defined in the first cell.
    pip(['install', 'edelweiss_data'])
    from edelweiss_data import API, QueryExpression as Q

# Server that all queries in this notebook are sent to.
edelweiss_api_url = 'https://api.develop.edelweiss.douglasconnect.com'
api = API(edelweiss_api_url)
# NOTE(review): presumably starts an interactive login flow - confirm against
# the edelweiss_data documentation before running unattended.
api.authenticate()

## List metadata of all TG-GATES datasets on the server

In [3]:
# Extra result columns, given as (column title, JSON path into the dataset
# metadata) pairs. Single-quoted literals avoid escaping the quoted key
# "Study type" inside its path.
# Presumably a ('Metadata', '$') pair would add the whole metadata document
# as a column - confirm before relying on it.
columns = [
    ('Compound', '$.Compound.Name'),
    ('SMILES', '$.Compound.SMILES'),
    ('Organism', '$.Assay.Organism'),
    ('Study type', '$.Assay."Study type"'),
    ('Organ', '$.Assay.Organ'),
    ('Dose', '$.Assay.Exposure.Dose'),
    ('Duration', '$.Assay.Exposure.Duration'),
]

# Search the published datasets for the term "TG-GATES" and request at most
# 200 results together with the columns defined above.
condition = Q.search_anywhere('TG-GATES')
TGGATES = api.get_published_datasets(
    condition=condition,
    columns=columns,
    limit=200,
)

In [4]:
# Keep only the human, liver, in-vitro datasets. The comparison values carry
# literal double quotes, matching how the metadata values appear in the table
# output below.
is_human = TGGATES['Organism'] == '"Human"'
is_liver = TGGATES['Organ'] == '"Liver"'
is_in_vitro = TGGATES['Study type'] == '"in_vitro"'

TGGATES = TGGATES[is_human & is_liver & is_in_vitro]
TGGATES

Unnamed: 0_level_0,Unnamed: 1_level_0,dataset,Compound,SMILES,Organism,Study type,Organ,Dose,Duration
id,version,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
472755fe-211b-40a0-a05b-696a2a384aff,1,<PublishedDataset '472755fe-211b-40a0-a05b-696a2a384aff':1 - TG-GATES-ORN_cs_aoplink_WY-14643_Human_Liver_in vitro_24_hr_high_FOLD_CHANGES>,"""WY-14643""","""CC1=C(C(=CC=C1)NC2=CC(=NC(=N2)SCC(=O)O)Cl)C""","""Human""","""in_vitro""","""Liver""","""high""",24
ece66bab-bee8-47f1-8f16-b154f6e3f359,1,<PublishedDataset 'ece66bab-bee8-47f1-8f16-b154f6e3f359':1 - TG-GATES-ORN_cs_aoplink_WY-14643_Human_Liver_in vitro_24_hr_low_FOLD_CHANGES>,"""WY-14643""","""CC1=C(C(=CC=C1)NC2=CC(=NC(=N2)SCC(=O)O)Cl)C""","""Human""","""in_vitro""","""Liver""","""low""",24
a7908788-399f-4449-820d-f321ca387232,1,<PublishedDataset 'a7908788-399f-4449-820d-f321ca387232':1 - TG-GATES-ORN_cs_aoplink_fenofibrate_Human_Liver_in vitro_24_hr_high_FOLD_CHANGES>,"""fenofibrate""","""CC(C)OC(=O)C(C)(C)OC1=CC=C(C=C1)C(=O)C2=CC=C(C=C2)Cl""","""Human""","""in_vitro""","""Liver""","""high""",24
66f8d3e3-d470-49a4-af08-2625d3ec42aa,1,<PublishedDataset '66f8d3e3-d470-49a4-af08-2625d3ec42aa':1 - TG-GATES-ORN_cs_aoplink_WY-14643_Human_Liver_in vitro_8_hr_middle_FOLD_CHANGES>,"""WY-14643""","""CC1=C(C(=CC=C1)NC2=CC(=NC(=N2)SCC(=O)O)Cl)C""","""Human""","""in_vitro""","""Liver""","""middle""",8
e40ebbc7-844d-4b79-b5c0-10c36fd6eb77,1,<PublishedDataset 'e40ebbc7-844d-4b79-b5c0-10c36fd6eb77':1 - TG-GATES-ORN_cs_aoplink_fenofibrate_Human_Liver_in vitro_8_hr_middle_FOLD_CHANGES>,"""fenofibrate""","""CC(C)OC(=O)C(C)(C)OC1=CC=C(C=C1)C(=O)C2=CC=C(C=C2)Cl""","""Human""","""in_vitro""","""Liver""","""middle""",8
912b41ce-bb1f-47fb-8b8f-e88cb8744315,1,<PublishedDataset '912b41ce-bb1f-47fb-8b8f-e88cb8744315':1 - TG-GATES-ORN_cs_aoplink_lofibrate_Human_Liver_in vitro_24_hr_low_FOLD_CHANGES>,"""clofibrate""","""CCOC(=O)C(C)(C)OC1=CC=C(C=C1)Cl""","""Human""","""in_vitro""","""Liver""","""low""",24
530f243f-ded1-4fe1-a01e-37995296dde3,1,<PublishedDataset '530f243f-ded1-4fe1-a01e-37995296dde3':1 - TG-GATES-ORN_cs_aoplink_WY-14643_Human_Liver_in vitro_8_hr_low_FOLD_CHANGES>,"""WY-14643""","""CC1=C(C(=CC=C1)NC2=CC(=NC(=N2)SCC(=O)O)Cl)C""","""Human""","""in_vitro""","""Liver""","""low""",8
0d2ce56e-ee3f-47fa-bbbf-b0853b5d4151,1,<PublishedDataset '0d2ce56e-ee3f-47fa-bbbf-b0853b5d4151':1 - TG-GATES-ORN_cs_aoplink_lofibrate_Human_Liver_in vitro_8_hr_middle_FOLD_CHANGES>,"""clofibrate""","""CCOC(=O)C(C)(C)OC1=CC=C(C=C1)Cl""","""Human""","""in_vitro""","""Liver""","""middle""",8
acb77d9b-9d0e-425a-a67a-c78bb5c4663d,1,<PublishedDataset 'acb77d9b-9d0e-425a-a67a-c78bb5c4663d':1 - TG-GATES-ORN_cs_aoplink_lofibrate_Human_Liver_in vitro_8_hr_high_FOLD_CHANGES>,"""clofibrate""","""CCOC(=O)C(C)(C)OC1=CC=C(C=C1)Cl""","""Human""","""in_vitro""","""Liver""","""high""",8
4b6aa018-0cf8-47a5-8ce0-1a5551e9f634,1,<PublishedDataset '4b6aa018-0cf8-47a5-8ce0-1a5551e9f634':1 - TG-GATES-ORN_cs_aoplink_gemfibrozil_Human_Liver_in vitro_8_hr_high_FOLD_CHANGES>,"""gemfibrozil""","""CC1=CC(=C(C=C1)C)OCCCC(C)(C)C(=O)O""","""Human""","""in_vitro""","""Liver""","""high""",8


## Access the data of the first dataset

In [5]:
# Take the first row of the filtered listing and fetch the data of the
# dataset object stored in its 'dataset' column.
first_row = TGGATES.iloc[0]
data = first_row['dataset'].get_data()
data

Unnamed: 0,PROBEID,SYMBOL,ENSEMBL,ENTREZID,logFC,AveExpr,t,P.Value,adj.P.Val,B
1,205999_x_at,CYP3A4,ENSG00000160868,1576,1.722137,1.626904,50.46183,0.0,0.0,1253.587116
2,205939_at,CYP3A7,ENSG00000160870,1551,1.337397,1.301707,39.188226,0.0,0.0,753.2932
3,211843_x_at,CYP3A7-CYP3A51P,ENSG00000282301,100861540,1.310793,1.581767,38.408686,1.686483e-318,3.073616e-314,723.350212
4,208367_x_at,CYP3A4,ENSG00000160868,1576,1.299005,0.970862,38.063261,6.567899e-313,8.977497e-309,710.274423
5,243015_at,CYP3A5,ENSG00000106258,1577,1.141211,1.132945,33.439605,1.03694e-242,1.1338939999999999e-238,546.622619
6,218245_at,TSKU,ENSG00000182704,25987,1.131982,2.062511,33.169183,7.125215999999999e-239,6.492852999999999e-235,537.706288
7,221433_at,FGF21,ENSG00000105550,26291,1.033026,0.880748,30.269606,1.293684e-199,8.84152e-196,446.651787
8,217779_s_at,PNRC2,ENSG00000189266,55629,-0.974653,2.068771,-28.559154,4.427444e-178,2.689672e-174,396.842252
9,209921_at,SLC7A11,ENSG00000151012,23657,0.910682,0.767476,26.684687,7.104468e-156,3.884368000000001e-152,345.582858
10,205998_x_at,CYP3A4,ENSG00000160868,1576,0.907741,0.885971,26.598513,6.8737089999999994e-155,3.416546e-151,343.309978
