In [24]:
# Enable the IPython autoreload extension; mode 2 reloads all imported modules
# before each cell is executed, so edits to library source files are picked up
# without restarting the kernel.
%load_ext autoreload
%autoreload 2

import pandas as pd
from IPython.display import display



The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


# Working with PK-DB data
To easily work with PK-DB data we provide the `pkdb_analysis` Python library.
It includes helper functions for querying data and filtering existing data sets. In the following we provide an overview of the typical functionality when working with PK-DB data.

The main class to work with is `PKData`. It is possible to directly query the database or to load data from file.

## Load data from file
`PKData` can be serialized to HDF5 files or zip archives. In the following we load the test data set from a zip archive via `PKData.from_archive` and print an overview.

In [39]:
from pkdb_analysis import PKData, PKFilter
from pkdb_analysis.test import TESTDATA_CONCISE_FALSE_ZIP

# Load the test data set provided by `pkdb_analysis.test` from its zip archive.
data = PKData.from_archive(TESTDATA_CONCISE_FALSE_ZIP)
# Overview of the data as loaded.
print(data)
# NOTE(review): `_concise()` is a private method that changes `data` in place
# (both printouts report the same object id); afterwards fewer studies, groups
# and individuals are listed. Presumably it drops entries that are not
# referenced by the remaining data — TODO confirm.
data._concise()
print(data)

------------------------------
PKData (139812198895440)
------------------------------
studies           505  (  505)
groups           1456  (11993)
individuals      6395  (57683)
interventions    1209  ( 1865)
outputs         72206  (72206)
timecourses      3113  ( 3113)
scatters           42  (   42)
------------------------------
------------------------------
PKData (139812198895440)
------------------------------
studies           444  (  444)
groups            932  ( 8340)
individuals      5957  (53939)
interventions    1209  ( 1865)
outputs         72206  (72206)
timecourses      3113  ( 3113)
scatters           42  (   42)
------------------------------


## Load data from database
Alternatively data can be loaded from the database using the `PKDB.query()` function.
This is documented in the `Querying PK-DB` section.

## Accessing groups, individuals, interventions, outputs and timecourses
Every `PKData` instance consists of consistent information on:
- `studies`: PK-DB studies, uniquely identified via a `study_sid`
- `groups`: groups, uniquely identified via `group_pk`
- `individuals`: individuals, uniquely identified via `individual_pk`
- `interventions`: interventions, uniquely identified via `intervention_pk`
- `outputs`: outputs, uniquely identified via `output_pk`
- `timecourses`: timecourses, uniquely identified via `subset_pk`
- `scatters`: scatters, uniquely identified via `subset_pk`


The `print` function provides a simple overview of the content.

In [3]:
# Print the summary: one line per table with two counts. The number in
# parentheses matches the row count of the table (e.g. `groups`); the first
# number is presumably the count of unique items — TODO confirm.
print(data)

------------------------------
PKData (139813265808400)
------------------------------
studies           505  (  505)
groups           1456  (11993)
individuals      6395  (57683)
interventions    1209  ( 1865)
outputs         72206  (72206)
timecourses       423  (  423)
scatters           42  (   42)
------------------------------


We can access the information via the respective fields, e.g., groups via `data.groups` or the multi-index data via `data.groups_mi`.

In [4]:
# Flat groups table: `group_pk` and `characteristica_pk` are ordinary columns.
data.groups

Unnamed: 0.1,Unnamed: 0,study_name,study_sid,measurement_type,group_count,group_name,max,substance,count,group_parent_pk,...,unit,se,min,cv,median,group_pk,characteristica_pk,mean,choice,value
0,0,Abernethy1982,PKDB00198,sex,42,all,,,25,-1,...,,,,,,1,8,,F,
1,1,Abernethy1982,PKDB00198,species,42,all,,,42,-1,...,,,,,,1,5,,homo sapiens,
2,2,Abernethy1982,PKDB00198,healthy,42,all,,,42,-1,...,,,,,,1,6,,Y,
3,3,Abernethy1982,PKDB00198,sex,42,all,,,17,-1,...,,,,,,1,7,,M,
4,4,Abernethy1982,PKDB00198,species,21,obese,,,42,1,...,,,,,,2,5,,homo sapiens,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
11988,11988,Zhang2016,PKDB00275,sex,24,all,,,24,-1,...,,,,,,1504,28452,,M,
11989,11989,Zhang2016,PKDB00275,age,24,all,40.0,,24,-1,...,year,,18.0,,,1504,28453,,,
11990,11990,Zhang2016,PKDB00275,bmi,24,all,24.0,,24,-1,...,kilogram / meter ** 2,,19.0,,,1504,28454,,,
11991,11991,Zhang2016,PKDB00275,overnight fast,24,all,,,24,-1,...,,,,,,1504,28455,,Y,


       Unnamed: 0     study_name  study_sid measurement_type  group_count  \
0               0  Abernethy1982  PKDB00198              sex           42   
1               1  Abernethy1982  PKDB00198          species           42   
2               2  Abernethy1982  PKDB00198          healthy           42   
3               3  Abernethy1982  PKDB00198              sex           42   
4               4  Abernethy1982  PKDB00198          species           21   
...           ...            ...        ...              ...          ...   
11988       11988      Zhang2016  PKDB00275              sex           24   
11989       11989      Zhang2016  PKDB00275              age           24   
11990       11990      Zhang2016  PKDB00275              bmi           24   
11991       11991      Zhang2016  PKDB00275   overnight fast           24   
11992       11992      Zhang2016  PKDB00275          species           24   

      group_name   max substance  count  group_parent_pk  ...  \
0         

In [11]:
# Groups table with a (`group_pk`, `characteristica_pk`) MultiIndex.
data.groups_mi

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 0,study_name,study_sid,measurement_type,group_count,group_name,max,substance,count,group_parent_pk,sd,unit,se,min,cv,median,mean,choice,value
group_pk,characteristica_pk,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1
312,6576,4370,Chiew2010,PKDB00026,species,9,all,,,9,-1,,,,,,,,homo sapiens,
312,6577,4371,Chiew2010,PKDB00026,healthy,9,all,,,9,-1,,,,,,,,Y,
312,6578,4372,Chiew2010,PKDB00026,overnight fast,9,all,,,9,-1,,,,,,,,Y,
312,6579,4373,Chiew2010,PKDB00026,sex,9,all,,,8,-1,,,,,,,,M,
312,6580,4374,Chiew2010,PKDB00026,sex,9,all,,,1,-1,,,,,,,,F,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1853,37445,11616,Mohammed1993,PKDB00102,overnight fast,5,healthy,,,10,1851,,,,,,,,Y,
1853,37446,11617,Mohammed1993,PKDB00102,sex,5,healthy,,,10,1851,,,,,,,,NR,
1853,37460,11618,Mohammed1993,PKDB00102,weight,5,healthy,88.0,,5,1851,11.0,kilogram,,58.0,,,75.0,,
1853,37461,11619,Mohammed1993,PKDB00102,age,5,healthy,24.0,,5,1851,1.0,year,,22.0,,,23.0,,


                             Unnamed: 0    study_name  study_sid  \
group_pk characteristica_pk                                        
312      6576                      4370     Chiew2010  PKDB00026   
         6577                      4371     Chiew2010  PKDB00026   
         6578                      4372     Chiew2010  PKDB00026   
         6579                      4373     Chiew2010  PKDB00026   
         6580                      4374     Chiew2010  PKDB00026   
...                                 ...           ...        ...   
1853     37445                    11616  Mohammed1993  PKDB00102   
         37446                    11617  Mohammed1993  PKDB00102   
         37460                    11618  Mohammed1993  PKDB00102   
         37461                    11619  Mohammed1993  PKDB00102   
         37462                    11620  Mohammed1993  PKDB00102   

                            measurement_type  group_count group_name   max  \
group_pk characteristica_pk          

To access the number of items use the respective `*_count` attribute, e.g. `data.groups_count`.

In [12]:
# The `*_count` attributes report the number of items, here for the groups.
print(f"Number of groups: {data.groups_count}")

Number of groups: 1404


The `groups`, `individuals`, `interventions`, `outputs` and `timecourses` are `pandas.DataFrame` instances, so all the classical pandas operations can be applied on the data.
For instance to access a single `group` use logical indexing by the `group_pk` field.
E.g. to get the group `312` use

In [15]:
# A boolean mask on the `group_pk` column selects all rows belonging to group 312.
data.groups[data.groups.group_pk==312]

Unnamed: 0.1,Unnamed: 0,study_name,study_sid,measurement_type,group_count,group_name,max,substance,count,group_parent_pk,...,unit,se,min,cv,median,group_pk,characteristica_pk,mean,choice,value
4370,4370,Chiew2010,PKDB00026,species,9,all,,,9,-1,...,,,,,,312,6576,,homo sapiens,
4371,4371,Chiew2010,PKDB00026,healthy,9,all,,,9,-1,...,,,,,,312,6577,,Y,
4372,4372,Chiew2010,PKDB00026,overnight fast,9,all,,,9,-1,...,,,,,,312,6578,,Y,
4373,4373,Chiew2010,PKDB00026,sex,9,all,,,8,-1,...,,,,,,312,6579,,M,
4374,4374,Chiew2010,PKDB00026,sex,9,all,,,1,-1,...,,,,,,312,6580,,F,
4375,4375,Chiew2010,PKDB00026,abstinence,9,all,,paracetamol,9,-1,...,day,,7.0,,,312,6581,,,
4376,4376,Chiew2010,PKDB00026,medication,9,all,,,9,-1,...,,,,,,312,6582,,N,
4377,4377,Chiew2010,PKDB00026,age,9,all,46.0,,9,-1,...,year,,27.0,,,312,6583,34.0,,
4378,4378,Chiew2010,PKDB00026,weight,9,all,84.0,,9,-1,...,kilogram,,62.0,,,312,6584,73.11,,


      Unnamed: 0 study_name  study_sid measurement_type  group_count  \
4370        4370  Chiew2010  PKDB00026          species            9   
4371        4371  Chiew2010  PKDB00026          healthy            9   
4372        4372  Chiew2010  PKDB00026   overnight fast            9   
4373        4373  Chiew2010  PKDB00026              sex            9   
4374        4374  Chiew2010  PKDB00026              sex            9   
4375        4375  Chiew2010  PKDB00026       abstinence            9   
4376        4376  Chiew2010  PKDB00026       medication            9   
4377        4377  Chiew2010  PKDB00026              age            9   
4378        4378  Chiew2010  PKDB00026           weight            9   

     group_name   max    substance  count  group_parent_pk  ...      unit  se  \
4370        all   NaN          nan      9               -1  ...       NaN NaN   
4371        all   NaN          nan      9               -1  ...       NaN NaN   
4372        all   NaN          nan  

In the group tables multiple rows exist which belong to a single group! This is important for understanding the filtering of the data later on. For instance, in this example the information on `species`, `healthy`, `overnight fast`, `sex` and `age` is stored in separate rows of the `groups` table, but all of these rows belong to a single group.

When looking at the multi-index table this becomes clearer. We now get the group `312` from `groups_mi`. We can simply use `.loc` to look up the group by its `group_pk`.

In [17]:
# `.loc[312]` selects on the first index level (`group_pk`); the result is
# indexed by the remaining level, `characteristica_pk`.
data.groups_mi.loc[312]

Unnamed: 0_level_0,Unnamed: 0,study_name,study_sid,measurement_type,group_count,group_name,max,substance,count,group_parent_pk,sd,unit,se,min,cv,median,mean,choice,value
characteristica_pk,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1
6576,4370,Chiew2010,PKDB00026,species,9,all,,,9,-1,,,,,,,,homo sapiens,
6577,4371,Chiew2010,PKDB00026,healthy,9,all,,,9,-1,,,,,,,,Y,
6578,4372,Chiew2010,PKDB00026,overnight fast,9,all,,,9,-1,,,,,,,,Y,
6579,4373,Chiew2010,PKDB00026,sex,9,all,,,8,-1,,,,,,,,M,
6580,4374,Chiew2010,PKDB00026,sex,9,all,,,1,-1,,,,,,,,F,
6581,4375,Chiew2010,PKDB00026,abstinence,9,all,,paracetamol,9,-1,,day,,7.0,,,,,
6582,4376,Chiew2010,PKDB00026,medication,9,all,,,9,-1,,,,,,,,N,
6583,4377,Chiew2010,PKDB00026,age,9,all,46.0,,9,-1,,year,,27.0,,,34.0,,
6584,4378,Chiew2010,PKDB00026,weight,9,all,84.0,,9,-1,,kilogram,,62.0,,,73.11,,


                    Unnamed: 0 study_name  study_sid measurement_type  \
characteristica_pk                                                      
6576                      4370  Chiew2010  PKDB00026          species   
6577                      4371  Chiew2010  PKDB00026          healthy   
6578                      4372  Chiew2010  PKDB00026   overnight fast   
6579                      4373  Chiew2010  PKDB00026              sex   
6580                      4374  Chiew2010  PKDB00026              sex   
6581                      4375  Chiew2010  PKDB00026       abstinence   
6582                      4376  Chiew2010  PKDB00026       medication   
6583                      4377  Chiew2010  PKDB00026              age   
6584                      4378  Chiew2010  PKDB00026           weight   

                    group_count group_name   max    substance  count  \
characteristica_pk                                                     
6576                          9        all   NaN    

In a similar manner we can explore the other information, i.e. `individuals`, `interventions`, `outputs` and `timecourses`.

In [18]:
# Individuals table indexed by (`individual_pk`, `individual_name`, `characteristica_pk`).
data.individuals_mi

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 0,study_name,study_sid,measurement_type,max,substance,count,individual_group_pk,sd,unit,se,min,cv,median,mean,choice,value
individual_pk,individual_name,characteristica_pk,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1
1341,LP,6591,8142,Clements1976,PKDB00186,species,,,4,313,,,,,,,,homo sapiens,
1341,LP,6592,8137,Clements1976,PKDB00186,sex,,,4,313,,,,,,,,M,
1341,LP,6593,8138,Clements1976,PKDB00186,healthy,,,4,313,,,,,,,,Y,
1341,LP,6594,8139,Clements1976,PKDB00186,overnight fast,,,4,313,,,,,,,,Y,
1341,LP,6595,8140,Clements1976,PKDB00186,age,37.0,,4,313,,year,,28.0,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
8589,P8,37345,59275,Caraco1999,10381807,sex,,,18,1847,,,,,,,,M,
8589,P8,37346,59276,Caraco1999,10381807,smoking,,,18,1847,,,,,,,,N,
8589,P8,37358,59278,Caraco1999,10381807,ethnicity,,,8,1847,,,,,,,,chinese,
8589,P8,37389,59277,Caraco1999,10381807,age,,,1,1847,,year,,,,,,,41.0


                                                  Unnamed: 0    study_name  \
individual_pk individual_name characteristica_pk                             
1341          LP              6591                      8142  Clements1976   
                              6592                      8137  Clements1976   
                              6593                      8138  Clements1976   
                              6594                      8139  Clements1976   
                              6595                      8140  Clements1976   
...                                                      ...           ...   
8589          P8              37345                    59275    Caraco1999   
                              37346                    59276    Caraco1999   
                              37358                    59278    Caraco1999   
                              37389                    59277    Caraco1999   
                              37390                    59279    

In [19]:
# Interventions table indexed by `intervention_pk`.
data.interventions_mi

Unnamed: 0_level_0,Unnamed: 0,study_sid,study_name,raw_pk,normed,name,route,form,application,time,...,substance,value,mean,median,min,max,sd,se,cv,unit
intervention_pk,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
0,242,PKDB00026,Chiew2010,671,True,paracetamol,oral,tablet,single dose,0.0,...,paracetamol,0.000079,,,0.000077,0.000083,,,,count
1,243,PKDB00026,Chiew2010,673,True,PEx,oral,tablet,single dose,0.0,...,panadol extend,0.000079,,,0.000075,0.000081,,,,count
2,244,PKDB00186,Clements1976,675,True,paracetamol12mg/kg_iv,iv,solution,single dose,0.0,...,paracetamol,0.000012,,,,,,,,count
3,245,PKDB00188,Clements1978,677,True,paracetamol20mg/kg_po,oral,solution,single dose,0.0,...,paracetamol,0.000020,,,,,,,,count
4,245,PKDB00188,Clements1978,677,True,paracetamol20mg/kg_po,oral,solution,single dose,0.0,...,paracetamol,0.000020,,,,,,,,count
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1171,1381,10381807,Caraco1999,3597,True,COD,oral,capsule,single dose,0.0,...,codeine phosphate,0.120000,,,,,,,,gram
1172,1381,10381807,Caraco1999,3597,True,COD,oral,capsule,single dose,0.0,...,codeine phosphate,0.120000,,,,,,,,gram
1172,1383,10381807,Caraco1999,3601,True,QUI,oral,capsule,single dose,,...,quinidine,0.100000,,,,,,,,gram
1173,1384,PKDB00096,Kronstrand2001,3607,True,COD,oral,NR,single dose,0.0,...,codeine phosphate,0.100000,,,,,,,,gram


                 Unnamed: 0  study_sid      study_name  raw_pk  normed  \
intervention_pk                                                          
0                       242  PKDB00026       Chiew2010     671    True   
1                       243  PKDB00026       Chiew2010     673    True   
2                       244  PKDB00186    Clements1976     675    True   
3                       245  PKDB00188    Clements1978     677    True   
4                       245  PKDB00188    Clements1978     677    True   
...                     ...        ...             ...     ...     ...   
1171                   1381   10381807      Caraco1999    3597    True   
1172                   1381   10381807      Caraco1999    3597    True   
1172                   1383   10381807      Caraco1999    3601    True   
1173                   1384  PKDB00096  Kronstrand2001    3607    True   
1174                   1385  PKDB00102    Mohammed1993    3609    True   

                                  nam

In [20]:
# Outputs table indexed by (`output_pk`, `intervention_pk`, `group_pk`, `individual_pk`).
data.outputs_mi

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 0,study_name,measurement_type,tissue,sd,se,min,time_unit,normed,calculated,...,method,max,substance,label,unit,cv,median,mean,time,choice
output_pk,intervention_pk,group_pk,individual_pk,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1
29987,0,312,-1,31210,Chiew2010,cmax,plasma,,0.021276,,,True,False,...,,,paracetamol,paracetamol,gram / liter,0.746605,,0.085492,,
29988,0,312,-1,32535,Chiew2010,cmax,plasma,,0.007244,,,True,False,...,,,paracetamol glucuronide,paracetamol,gram / liter,0.198094,,0.109713,,
29989,0,312,-1,31213,Chiew2010,cmax,plasma,,0.002045,,,True,False,...,,,paracetamol sulfate,paracetamol,gram / liter,0.276726,,0.022172,,
29990,0,312,-1,33656,Chiew2010,tmax,plasma,,0.404200,,,True,False,...,,,paracetamol,paracetamol,hour,0.873002,,1.389000,,
29991,0,312,-1,29717,Chiew2010,tmax,plasma,,0.175700,,,True,False,...,,,paracetamol glucuronide,paracetamol,hour,0.148228,,3.556000,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
186700,1174,1852,-1,99176,Mohammed1993,cmax,plasma,,,,,True,True,...,,,codeine,,gram / liter,,,0.000143,,
186701,1174,1852,-1,99167,Mohammed1993,kel,plasma,,,,,True,True,...,,,codeine,,1 / minute,,,0.004981,,
186702,1174,1852,-1,99156,Mohammed1993,thalf,plasma,,,,,True,True,...,,,codeine,,hour,,,2.319383,,
186703,1174,1852,-1,99191,Mohammed1993,tmax,plasma,,,,,True,True,...,,,codeine,,hour,,,0.750000,,


                                                  Unnamed: 0    study_name  \
output_pk intervention_pk group_pk individual_pk                             
29987     0               312      -1                  31210     Chiew2010   
29988     0               312      -1                  32535     Chiew2010   
29989     0               312      -1                  31213     Chiew2010   
29990     0               312      -1                  33656     Chiew2010   
29991     0               312      -1                  29717     Chiew2010   
...                                                      ...           ...   
186700    1174            1852     -1                  99176  Mohammed1993   
186701    1174            1852     -1                  99167  Mohammed1993   
186702    1174            1852     -1                  99156  Mohammed1993   
186703    1174            1852     -1                  99191  Mohammed1993   
186704    1174            1852     -1                  99285  Mo

In [21]:
# Timecourses table indexed by (`subset_pk`, `intervention_pk`, `group_pk`, `individual_pk`).
data.timecourses_mi

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 0,study_sid,study_name,output_pk,subset_name,normed,tissue,tissue_label,method,method_label,...,substance_label,value,mean,median,min,max,sd,se,cv,unit
subset_pk,intervention_pk,group_pk,individual_pk,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1
690,,312,-1,444,PKDB00026,Chiew2010,"(30125, 30126, 30127, 30128, 30129, 30130...",fig2__PEx_paracetamol glucuronide,True,serum,serum,,,...,paracetamol glucuronide,,"[0.00146388329555856, 0.009858915141736, 0.018...",,,,"[None, 0.007682712100943999, 0.008779730711669...","[None, 0.0025609040336480003, 0.00292657690388...","[None, 0.779265465874696, 0.4807891924497527, ...",gram / liter
691,,316,-1,401,PKDB00188,Clements1978,"(30545, 30546, 30547, 30548, 30549, 30550...",pentazocine_study_paracetamol20mg/kg_po_pentaz...,True,plasma,plasma,,,...,paracetamol,,"[None, 0.0006, None, 0.0013000000000000002, 0....",,,,"[None, 0.0011, None, 0.0026000000000000003, 0....","[None, 0.00055, None, 0.0013000000000000002, 0...","[None, 1.8333333333333337, None, 2.0, 1.6875, ...",gram / liter
692,,317,-1,460,PKDB00188,Clements1978,"(30565, 30566, 30567, 30568, 30569, 30570...",pentazocine_naloxone study_paracetamol20mg/kg_...,True,plasma,plasma,,,...,paracetamol,,"[None, 0.0013000000000000002, None, 0.0033, 0....",,,,"[None, 0.0001, None, 0.0011, 0.0048, 0.003, 0....","[None, 5e-05, None, 0.00055, 0.0024, 0.0015, 0...","[None, 0.07692307692307691, None, 0.3333333333...",gram / liter
693,,-1,1346,449,PKDB00188,Clements1978,"(30682, 30683, 30684, 30685, 30686, 30687...",subject2__20mg/kg,True,plasma,plasma,,,...,paracetamol,"[0.0, 2.7624309e-05, 0.0005524861999999999, 0....",,,,,,,,gram / liter
694,,314,-1,406,PKDB00188,Clements1978,"(30509, 30510, 30511, 30512, 30513, 30514...",all_paracetamol20mg/kg_po,True,plasma,plasma,,,...,paracetamol,,"[0.0175, 0.019600000000000003, 0.02, 0.0188, 0...",,,,"[0.0079, 0.007200000000000001, 0.0052000000000...","[0.0027930717856868626, 0.002545584412271571, ...","[0.45142857142857146, 0.36734693877551017, 0.2...",gram / liter
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3962,,1844,-1,2880,Test4,Test4,"(185590, 185591, 185592, 185593, 185594, ...",caf,True,plasma,plasma,,,...,caffeine,,"[0.0035442116, 0.0033748657999999993, 0.003074...",,,,"[0.0003674772, 0.0003820028, 0.000459372, 0.00...","[9.18693e-05, 9.55007e-05, 0.000114843, 0.0001...","[0.10368376425380471, 0.1131905156050946, 0.14...",gram / liter
3963,,1844,-1,2885,Test4,Test4,"(185617, 185618, 185602, 185603, 185604, ...",caf (lome),True,plasma,plasma,,,...,caffeine,,"[6.1484754e-05, 3.8633807e-07, 0.00014989601, ...",,,,"[0.000106382306, 5.319748493e-05, 0.0001885994...","[2.65955765e-05, 1.32993712325e-05, 4.71498725...","[1.7302225198786676, 137.69671968905368, 1.258...",gram / liter
3968,,1846,-1,2906,10381807,Caraco1999,"(186179, 186180, 186181, 186182, 186183, ...",caucasian_quinidine,True,plasma,plasma,,,...,quinidine,,"[0.0, 0.00024116978, 0.00026011735000000004, 0...",,,,,"[None, 6.6e-05, 4.6e-05, 4.2999999999999995e-0...","[None, 0.8209983854527712, 0.5305297781943418,...",gram / liter
3974,,1847,-1,2910,10381807,Caraco1999,"(186132, 186133, 186134, 186135, 186136, ...",morphine-6-glucuronide,True,plasma,plasma,,,...,morphine-6-glucuronide,,"[0.0, 1.1371890815142e-05, 1.38441064196046e-0...",,,,,"[None, 3.0636716549844004e-06, 6.5319184065738...","[None, 0.7619992269654697, 1.334506875186959, ...",gram / liter


                                                  Unnamed: 0  study_sid  \
subset_pk intervention_pk group_pk individual_pk                          
690       NaN              312     -1                    444  PKDB00026   
691       NaN              316     -1                    401  PKDB00188   
692       NaN              317     -1                    460  PKDB00188   
693       NaN             -1        1346                 449  PKDB00188   
694       NaN              314     -1                    406  PKDB00188   
...                                                      ...        ...   
3962      NaN              1844    -1                   2880      Test4   
3963      NaN              1844    -1                   2885      Test4   
3968      NaN              1846    -1                   2906   10381807   
3974      NaN              1847    -1                   2910   10381807   
3979      NaN              1850    -1                   2896  PKDB00096   

                        

In [7]:
# Flat scatters table: one row per subset (`subset_pk`), with `x_*`/`y_*`
# columns, several of which hold lists of values.
data.scatters



Unnamed: 0.1,Unnamed: 0,study_sid,study_name,subset_pk,subset_name,x_outputs_pk,x_interventions,x_group_pk,x_individual_pk,x_normed,...,y_mean,y_median,y_min,y_max,y_sd,y_se,y_cv,y_unit,y_dimension,y_data_point
0,0,PKDB00002,Akinyinka2000,783,metabolic_ratio_corr,"[35815, 35816, 35817, 35818, 35819, 35820, 358...","(814,)",,"[1827, 1828, 1829, 1830, 1831, 1832, 1833, 183...",True,...,,,,,,,,none,1,"[7615, 7616, 7617, 7618, 7619, 7620, 7621, 762..."
1,1,PKDB00002,Akinyinka2000,784,caf_corr,"[35563, 35564, 35565, 35566, 35567, 35568, 355...","(814,)",,"[1746, 1747, 1748, 1749, 1750, 1751, 1752, 175...",True,...,,,,,,,,gram / liter,1,"[7625, 7626, 7627, 7628, 7629, 7630, 7631, 763..."
2,2,PKDB00002,Akinyinka2000,785,px_corr,"[35725, 35726, 35727, 35728, 35729, 35730, 357...","(814,)",,"[1792, 1793, 1794, 1795, 1796, 1797, 1798, 179...",True,...,,,,,,,,gram / liter,1,"[7671, 7672, 7673, 7674, 7675, 7676, 7677, 767..."
3,3,PKDB00210,Blanchard1983,927,elderly_po,"[41150, 41151, 41152, 41153, 41154, 41155, 41156]","(897,)",,"[2094, 2095, 2096, 2097, 2098, 2099, 2100]",True,...,,,,,,,,milliliter / meter ** 2 / minute,1,"[8551, 8552, 8553, 8554, 8555, 8556, 8557]"
4,4,PKDB00210,Blanchard1983,928,elderly_iv,"[41157, 41158, 41159, 41160, 41161, 41162, 411...","(898,)",,"[2101, 2102, 2103, 2104, 2105, 2106, 2107, 2108]",True,...,,,,,,,,milliliter / meter ** 2 / minute,1,"[8558, 8559, 8560, 8561, 8562, 8563, 8564, 8565]"
5,5,PKDB00210,Blanchard1983,929,young_po,"[41165, 41166, 41167, 41168, 41169, 41170, 411...","(897,)",,"[2109, 2110, 2111, 2112, 2113, 2114, 2115, 2116]",True,...,,,,,,,,milliliter / meter ** 2 / minute,1,"[8566, 8567, 8568, 8569, 8570, 8571, 8572, 8573]"
6,6,PKDB00210,Blanchard1983,930,young_iv,"[41173, 41174, 41175, 41176, 41177, 41178, 411...","(898,)",,"[2117, 2118, 2119, 2120, 2121, 2122, 2123, 2124]",True,...,,,,,,,,milliliter / meter ** 2 / minute,1,"[8574, 8575, 8576, 8577, 8578, 8579, 8580, 8581]"
7,7,PKDB00015,Campbell1987a,971,OC,"[42949, 42950, 42951, 42952, 42953]","(920,)",,"[2141, 2142, 2143, 2144, 2145]",True,...,,,,,,,,liter / hour / kilogram,1,"[8929, 8930, 8931, 8932, 8933]"
8,8,PKDB00015,Campbell1987a,972,NonSmokers,"[42954, 42955, 42956, 42957, 42958]","(920,)",,"[2146, 2147, 2148, 2149, 2150]",True,...,,,,,,,,liter / hour / kilogram,1,"[8934, 8935, 8936, 8937, 8938]"
9,9,PKDB00015,Campbell1987a,973,Smokers,"[42959, 42960, 42961, 42962, 42963]","(920,)",,"[2151, 2152, 2153, 2154, 2155]",True,...,,,,,,,,liter / hour / kilogram,1,"[8939, 8940, 8941, 8942, 8943]"


    Unnamed: 0      study_sid      study_name  subset_pk  \
0            0      PKDB00002   Akinyinka2000        783   
1            1      PKDB00002   Akinyinka2000        784   
2            2      PKDB00002   Akinyinka2000        785   
3            3      PKDB00210   Blanchard1983        927   
4            4      PKDB00210   Blanchard1983        928   
5            5      PKDB00210   Blanchard1983        929   
6            6      PKDB00210   Blanchard1983        930   
7            7      PKDB00015   Campbell1987a        971   
8            8      PKDB00015   Campbell1987a        972   
9            9      PKDB00015   Campbell1987a        973   
10          10        2921843    Holstege1989       1075   
11          11        2921843    Holstege1989       1076   
12          12        2921843    Holstege1989       1077   
13          13        2921843    Holstege1989       1078   
14          14        2921843    Holstege1989       1079   
15          15        2921843    Holsteg