In [1]:
# Install packages not available in the docker image
!pip install psycopg2-binary==2.9.3

Collecting psycopg2-binary==2.9.3
  Downloading psycopg2_binary-2.9.3-cp39-cp39-manylinux_2_24_aarch64.whl (3.4 MB)
     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 3.4/3.4 MB 10.4 MB/s eta 0:00:00
Installing collected packages: psycopg2-binary
Successfully installed psycopg2-binary-2.9.3


In [2]:
import os
from urllib.parse import quote

import pandas as pd
from sqlalchemy import create_engine

# Create the connection from the environment variables defined in docker-compose.yml.
# The user name and password are percent-encoded so that reserved characters
# in the credentials (e.g. "@", ":", "/", "%") cannot corrupt the URL; the
# driver URL parser decodes them again before connecting.
conn_url = "postgresql+psycopg2://%s:%s@db:5432/%s" % (
    quote(os.environ["POSTGRES_USER"], safe=""),
    quote(os.environ["POSTGRES_PASSWORD"], safe=""),
    os.environ["POSTGRES_DB"],
)
# Connections handed out by this engine use the AUTOCOMMIT isolation level.
engine = create_engine(conn_url, isolation_level="AUTOCOMMIT")

### Show available datasets

In [3]:
from IPython.display import Markdown, display

# Load every table into `dfs` (table name -> DataFrame) and preview each one.
# Each frame is indexed by the first column whose name ends in "_id".
table_names = (
    "buyers",
    "merchants",
    "orders_creation",
    "orders_decision",
    "orders_payment",
    "datasets",
)

dfs = {}
with engine.begin() as connection:
    for tbl in table_names:
        df = pd.read_sql(f"SELECT * FROM {tbl}", connection)

        # Column order decides which "*_id" column wins when there are several.
        index_col = next(filter(lambda col: col.endswith("_id"), df.columns))
        indexed = df.set_index(index_col)
        dfs[tbl] = indexed

        # Bold table name followed by the first ten rows.
        display(Markdown(f"**{tbl}**"), indexed.head(10))

**buyers**

Unnamed: 0_level_0,first_name,last_name,email,created_at
buyer_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
1,Felicitas,Dowerg,weinhagekarl-heinz@example.org,2019-01-05 16:03:48.065322
2,Hellmuth,Etzold,stiffeljohanne@example.net,2019-01-06 02:18:23.014051
3,Dieter,Scheel,bbeckmann@example.org,2019-01-06 18:14:18.912525
4,Heinz-Jürgen,Heintze,rosehans-uwe@example.net,2019-01-07 23:18:11.857542
5,Friedlinde,Trapp,chartmann@example.net,2019-01-08 10:44:52.550876
6,Karl-Hans,Albers,hildaloeffler@example.com,2019-01-08 17:48:44.117045
7,Karl-Hans,Förster,vanessawilms@example.com,2019-01-10 16:08:24.980765
8,Edmund,Davids,wdietz@example.com,2019-01-12 15:39:50.044459
9,Dörte,Hettner,wagnervalerij@example.net,2019-01-13 09:43:09.301140
10,Faruk,Kostolzin,roehrdanzklaus-michael@example.net,2019-01-13 21:40:06.053150


**merchants**

Unnamed: 0_level_0,name,created_at
merchant_id,Unnamed: 1_level_1,Unnamed: 2_level_1
1,Dowerg,2019-01-01 18:36:21.374000
2,Weinhage GbR,2019-01-30 18:17:05.389742
3,Hauffer AG & Co. KG,2019-03-08 06:13:25.480632
4,Dobes,2019-03-10 12:02:26.723510
5,Weinhage,2019-03-15 18:53:56.577648
6,Christoph,2019-04-11 11:14:38.032554
7,Löffler,2019-04-23 09:05:19.099020
8,Becker AG,2019-04-24 14:47:02.835260
9,Heintze GmbH & Co. OHG,2019-06-23 06:27:02.565517
10,Bauer,2019-07-27 21:52:33.768389


**orders_creation**

Unnamed: 0_level_0,buyer_id,merchant_id,total_price_cents,created_at
order_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
1,1,1,36995,2019-01-05 16:03:48.065322
2,2,1,46197,2019-01-06 02:18:23.014051
3,3,1,37392,2019-01-06 18:14:18.912525
4,4,1,34974,2019-01-07 23:18:11.857542
5,5,1,41176,2019-01-08 10:44:52.550876
6,6,1,31138,2019-01-08 17:48:44.117045
7,5,1,44352,2019-01-09 00:17:37.327339
8,7,1,35963,2019-01-10 16:08:24.980765
9,6,1,52109,2019-01-10 17:15:11.111957
10,6,1,31782,2019-01-10 23:25:57.600129


**orders_decision**

Unnamed: 0_level_0,decision,due_date,created_at
order_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
1,ACCEPT,2019-02-04 16:03:48.248094,2019-01-05 16:03:48.248094
2,ACCEPT,2019-02-05 02:18:23.093798,2019-01-06 02:18:23.093798
3,ACCEPT,2019-02-05 18:14:19.026141,2019-01-06 18:14:19.026141
4,ACCEPT,2019-02-06 23:18:11.898825,2019-01-07 23:18:11.898825
5,ACCEPT,2019-02-07 10:44:52.943724,2019-01-08 10:44:52.943724
6,ACCEPT,2019-02-07 17:48:44.200912,2019-01-08 17:48:44.200912
7,ACCEPT,2019-02-08 00:17:37.363524,2019-01-09 00:17:37.363524
8,ACCEPT,2019-02-09 16:08:25.024673,2019-01-10 16:08:25.024673
9,ACCEPT,2019-02-09 17:15:11.205784,2019-01-10 17:15:11.205784
10,ACCEPT,2019-02-09 23:25:57.642529,2019-01-10 23:25:57.642529


**orders_payment**

Unnamed: 0_level_0,created_at
order_id,Unnamed: 1_level_1
1,2019-02-10 08:16:48.757377
2,2019-02-07 10:43:44.381343
3,2019-02-01 04:58:48.207862
4,2019-02-07 12:06:58.226781
5,2019-02-06 03:41:38.824075
6,2019-02-11 02:17:47.622723
7,2019-02-07 19:46:51.983749
8,2019-02-08 19:50:00.076555
9,2019-02-04 17:07:21.860173
10,2019-02-11 10:15:28.055798


**datasets**

Unnamed: 0_level_0,dataset_type
order_id,Unnamed: 1_level_1
1,train
2,train
3,train
4,train
5,train
6,train
7,train
8,train
9,train
10,train
