From 30d3dbdb371796a06de4b5f72bc57b2b36fa2123 Mon Sep 17 00:00:00 2001
From: Geert Jan Bex <geertjan.bex@uhasselt.be>
Date: Wed, 16 Jul 2025 14:22:11 +0200
Subject: [PATCH 01/10] Add initial work on duckdb

---
 source-code/README.md                         |   2 +
 .../duckdb/data/patient_experiment.csv        |  63 ++++++++
 source-code/duckdb/data/patient_metadata.csv  |  11 ++
 source-code/duckdb/patients.ipynb             | 147 ++++++++++++++++++
 4 files changed, 223 insertions(+)
 create mode 100644 source-code/duckdb/data/patient_experiment.csv
 create mode 100644 source-code/duckdb/data/patient_metadata.csv
 create mode 100644 source-code/duckdb/patients.ipynb

diff --git a/source-code/README.md b/source-code/README.md
index 064c59f..4f9bfdc 100644
--- a/source-code/README.md
+++ b/source-code/README.md
@@ -22,6 +22,8 @@ to create it.  There is some material not covered in the presentation as well.
   soup and graph representation using networkx.
 * [`xarray`](xarray): illustrates the xarray library for pandas-like operations
   on multi-dimensional arrays.
+* [`duckdb`](duckdb): illustrates the DuckDB library for SQL-like operations
+  on dataframes, including integration with pandas and polars.
 
 **Note:** material on dashboards has been moved to a [dedicated
 repository](https://github.com/gjbex/Python-dashboards).
diff --git a/source-code/duckdb/data/patient_experiment.csv b/source-code/duckdb/data/patient_experiment.csv
new file mode 100644
index 0000000..034e2c7
--- /dev/null
+++ b/source-code/duckdb/data/patient_experiment.csv
@@ -0,0 +1,63 @@
+,patient,dose,date,temperature
+0,1,0.0,2012-10-02 10:00:00,38.3
+1,1,2.0,2012-10-02 11:00:00,38.5
+2,1,2.0,2012-10-02 12:00:00,38.1
+3,1,2.0,2012-10-02 13:00:00,37.3
+4,1,0.0,2012-10-02 14:00:00,37.5
+5,1,0.0,2012-10-02 15:00:00,37.1
+6,1,0.0,2012-10-02 16:00:00,36.8
+7,2,0.0,2012-10-02 10:00:00,39.3
+8,2,5.0,2012-10-02 11:00:00,39.4
+9,2,5.0,2012-10-02 12:00:00,38.1
+10,2,5.0,2012-10-02 13:00:00,37.3
+11,2,0.0,2012-10-02 14:00:00,36.8
+12,2,0.0,2012-10-02 15:00:00,36.8
+13,2,0.0,2012-10-02 16:00:00,36.8
+14,3,0.0,2012-10-02 10:00:00,37.9
+15,3,2.0,2012-10-02 11:00:00,39.5
+16,3,5.0,2012-10-02 12:00:00,38.3
+17,3,2.0,2012-10-02 13:00:00,
+18,3,2.0,2012-10-02 14:00:00,37.7
+19,3,2.0,2012-10-02 15:00:00,37.1
+20,3,0.0,2012-10-02 16:00:00,36.7
+21,4,0.0,2012-10-02 10:00:00,38.1
+22,4,5.0,2012-10-02 11:00:00,37.2
+23,4,5.0,2012-10-02 12:00:00,36.1
+24,4,0.0,2012-10-02 13:00:00,35.9
+25,4,,2012-10-02 14:00:00,36.3
+26,4,0.0,2012-10-02 15:00:00,36.6
+27,4,0.0,2012-10-02 16:00:00,36.7
+28,5,0.0,2012-10-02 10:00:00,37.9
+29,5,3.0,2012-10-02 11:00:00,39.5
+30,5,7.0,2012-10-02 12:00:00,38.3
+31,5,5.0,2012-10-02 13:00:00,38.5
+32,5,9.0,2012-10-02 14:00:00,39.4
+33,5,3.0,2012-10-02 15:00:00,37.9
+34,5,0.0,2012-10-02 16:00:00,37.2
+35,6,0.0,2012-10-02 10:00:00,37.5
+36,6,2.0,2012-10-02 11:00:00,38.1
+37,6,3.0,2012-10-02 12:00:00,37.9
+38,6,2.0,2012-10-02 13:00:00,37.7
+39,6,1.0,2012-10-02 14:00:00,37.2
+40,6,0.0,2012-10-02 15:00:00,36.8
+41,7,0.0,2012-10-02 10:00:00,39.5
+42,7,10.0,2012-10-02 11:00:00,40.7
+43,7,5.0,2012-10-02 12:00:00,39.8
+44,7,8.0,2012-10-02 13:00:00,40.2
+45,7,3.0,2012-10-02 14:00:00,38.3
+46,7,3.0,2012-10-02 15:00:00,37.6
+47,7,1.0,2012-10-02 16:00:00,37.3
+48,8,0.0,2012-10-02 10:00:00,37.8
+49,8,0.0,2012-10-02 11:00:00,37.9
+50,8,0.0,2012-10-02 12:00:00,37.4
+51,8,0.0,2012-10-02 13:00:00,37.6
+52,8,0.0,2012-10-02 14:00:00,37.3
+53,8,0.0,2012-10-02 15:00:00,37.1
+54,8,0.0,2012-10-02 16:00:00,36.8
+55,9,0.0,2012-10-02 10:00:00,38.3
+56,9,10.0,2012-10-02 11:00:00,39.5
+57,9,12.0,2012-10-02 12:00:00,40.2
+58,9,4.0,2012-10-02 13:00:00,39.1
+59,9,4.0,2012-10-02 14:00:00,37.9
+60,9,0.0,2012-10-02 15:00:00,37.1
+61,9,0.0,2012-10-02 16:00:00,37.3
diff --git a/source-code/duckdb/data/patient_metadata.csv b/source-code/duckdb/data/patient_metadata.csv
new file mode 100644
index 0000000..59e23ac
--- /dev/null
+++ b/source-code/duckdb/data/patient_metadata.csv
@@ -0,0 +1,11 @@
+,patient,gender,condition
+0,1,M,A
+1,2,F,A
+2,3,M,A
+3,5,M,A
+4,6,F,B
+5,7,M,B
+6,8,F,B
+7,9,M,B
+8,10,F,B
+9,11,M,B
diff --git a/source-code/duckdb/patients.ipynb b/source-code/duckdb/patients.ipynb
new file mode 100644
index 0000000..ca19c8f
--- /dev/null
+++ b/source-code/duckdb/patients.ipynb
@@ -0,0 +1,147 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "4c0d0975-71ce-4e9a-986c-ac6cbfb251bb",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import duckdb\n",
+    "import pandas as pd"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 33,
+   "id": "861daf66-0810-48d9-968c-18e1dabe0e4f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "conn = duckdb.connect('data/patient_experiment.csv')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 37,
+   "id": "c0f56de5-2351-4473-b768-234a89a705ac",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>patient</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>5</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>9</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>2</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>8</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>3</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>6</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>4</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7</th>\n",
+       "      <td>7</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8</th>\n",
+       "      <td>1</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "   patient\n",
+       "0        5\n",
+       "1        9\n",
+       "2        2\n",
+       "3        8\n",
+       "4        3\n",
+       "5        6\n",
+       "6        4\n",
+       "7        7\n",
+       "8        1"
+      ]
+     },
+     "execution_count": 37,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.execute('SELECT DISTINCT patient FROM \"data/patient_experiment.csv\";').df()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "0c4e1ad8-a9ae-4808-901b-c036e4e0ee17",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.11"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}

From 53da957572b9e3128bb88fc605c9db4c4a68ebcd Mon Sep 17 00:00:00 2001
From: Geert Jan Bex <geertjan.bex@uhasselt.be>
Date: Wed, 15 Oct 2025 09:03:12 +0200
Subject: [PATCH 02/10] Add material requirements

---
 docs/README.md | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/docs/README.md b/docs/README.md
index 1d2c156..24a5947 100644
--- a/docs/README.md
+++ b/docs/README.md
@@ -54,6 +54,14 @@ from scratch.  Familiarity with numpy is not required, but would be beneficial.
 If you plan to do Python programming in a Linux or HPC environment you should
 be familiar with these as well.
 
+For following along hands-on, you need
+* laptop or desktop with internet access.
+* a system set up so you can connect to an HPC system, an account on an HPC
+  system (e.g., VSC, CECI, ...), compute credits if that is required to run
+  jobs on the HPC system if you want to use an HPC system;
+* a Python environment that can run Jupyter Lab if you want to use your own system;
+* access to Google Colaboratory if you prefer not to install software.
+
 
 ## Level
 

From 014249d12482c5ca1a5b14febf6b35378785951e Mon Sep 17 00:00:00 2001
From: Geert Jan Bex <geertjan.bex@uhasselt.be>
Date: Tue, 4 Nov 2025 11:56:50 +0100
Subject: [PATCH 03/10] Added pivot operation

---
 source-code/duckdb/patients.ipynb | 336 ++++++++++++++++++++++++++++--
 1 file changed, 313 insertions(+), 23 deletions(-)

diff --git a/source-code/duckdb/patients.ipynb b/source-code/duckdb/patients.ipynb
index ca19c8f..380233b 100644
--- a/source-code/duckdb/patients.ipynb
+++ b/source-code/duckdb/patients.ipynb
@@ -13,7 +13,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 33,
+   "execution_count": 2,
    "id": "861daf66-0810-48d9-968c-18e1dabe0e4f",
    "metadata": {},
    "outputs": [],
@@ -23,7 +23,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 37,
+   "execution_count": 25,
    "id": "c0f56de5-2351-4473-b768-234a89a705ac",
    "metadata": {},
    "outputs": [
@@ -54,39 +54,39 @@
        "  <tbody>\n",
        "    <tr>\n",
        "      <th>0</th>\n",
-       "      <td>5</td>\n",
+       "      <td>1</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>1</th>\n",
-       "      <td>9</td>\n",
+       "      <td>3</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>2</th>\n",
-       "      <td>2</td>\n",
+       "      <td>6</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>3</th>\n",
-       "      <td>8</td>\n",
+       "      <td>7</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>4</th>\n",
-       "      <td>3</td>\n",
+       "      <td>8</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>5</th>\n",
-       "      <td>6</td>\n",
+       "      <td>5</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>6</th>\n",
-       "      <td>4</td>\n",
+       "      <td>9</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>7</th>\n",
-       "      <td>7</td>\n",
+       "      <td>2</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>8</th>\n",
-       "      <td>1</td>\n",
+       "      <td>4</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
@@ -94,32 +94,322 @@
       ],
       "text/plain": [
        "   patient\n",
-       "0        5\n",
-       "1        9\n",
-       "2        2\n",
-       "3        8\n",
-       "4        3\n",
-       "5        6\n",
-       "6        4\n",
-       "7        7\n",
-       "8        1"
+       "0        1\n",
+       "1        3\n",
+       "2        6\n",
+       "3        7\n",
+       "4        8\n",
+       "5        5\n",
+       "6        9\n",
+       "7        2\n",
+       "8        4"
       ]
      },
-     "execution_count": 37,
+     "execution_count": 25,
      "metadata": {},
      "output_type": "execute_result"
     }
    ],
    "source": [
-    "conn.execute('SELECT DISTINCT patient FROM \"data/patient_experiment.csv\";').df()"
+    "conn.execute('SELECT DISTINCT patient FROM \"patient_experiment\";').df()"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 15,
    "id": "0c4e1ad8-a9ae-4808-901b-c036e4e0ee17",
    "metadata": {},
    "outputs": [],
+   "source": [
+    "sql_pivot = '''\n",
+    "CREATE TABLE time_series AS\n",
+    "  PIVOT \"data/patient_experiment.csv\"\n",
+    "  ON patient\n",
+    "  USING\n",
+    "    first(temperature) AS temperature,\n",
+    "    first(dose) AS dose\n",
+    "  GROUP BY date;\n",
+    "'''"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 16,
+   "id": "6ff65df2-1997-4983-b3c8-1753034c3218",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<duckdb.duckdb.DuckDBPyConnection at 0x762650c61bf0>"
+      ]
+     },
+     "execution_count": 16,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.execute(sql_pivot)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 18,
+   "id": "95b029d4-0329-4462-8737-94f036dc8147",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>date</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>2012-10-02 14:00:00</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>2012-10-02 11:00:00</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>2012-10-02 13:00:00</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>2012-10-02 12:00:00</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>2012-10-02 15:00:00</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                 date\n",
+       "0 2012-10-02 14:00:00\n",
+       "1 2012-10-02 11:00:00\n",
+       "2 2012-10-02 10:00:00\n",
+       "3 2012-10-02 13:00:00\n",
+       "4 2012-10-02 12:00:00\n",
+       "5 2012-10-02 15:00:00\n",
+       "6 2012-10-02 16:00:00"
+      ]
+     },
+     "execution_count": 18,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.execute('SELECT date FROM time_series;').df()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 23,
+   "id": "78a996cf-4bc2-40dc-8bce-27bcc6731b7b",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>name</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>file</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>patient_experiment</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>time_series</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                 name\n",
+       "0                file\n",
+       "1  patient_experiment\n",
+       "2         time_series"
+      ]
+     },
+     "execution_count": 23,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.execute('show tables;').df()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 24,
+   "id": "ea5cf7e3-1b67-45fd-bdde-1ee294575149",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>table_schema</th>\n",
+       "      <th>table_name</th>\n",
+       "      <th>table_type</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>main</td>\n",
+       "      <td>time_series</td>\n",
+       "      <td>BASE TABLE</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>main</td>\n",
+       "      <td>file</td>\n",
+       "      <td>VIEW</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>main</td>\n",
+       "      <td>patient_experiment</td>\n",
+       "      <td>VIEW</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "  table_schema          table_name  table_type\n",
+       "0         main         time_series  BASE TABLE\n",
+       "1         main                file        VIEW\n",
+       "2         main  patient_experiment        VIEW"
+      ]
+     },
+     "execution_count": 24,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.sql(\"\"\"\n",
+    "    SELECT table_schema, table_name, table_type\n",
+    "    FROM information_schema.tables\n",
+    "    WHERE table_schema NOT IN ('information_schema', 'pg_catalog')\n",
+    "\"\"\").df()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 28,
+   "id": "843f9d0f-8384-4977-916e-49ef59e5cbad",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "┌─────────────┬─────────────┬─────────┬─────────┬─────────┬─────────┐\n",
+       "│ column_name │ column_type │  null   │   key   │ default │  extra  │\n",
+       "│   varchar   │   varchar   │ varchar │ varchar │ varchar │ varchar │\n",
+       "├─────────────┼─────────────┼─────────┼─────────┼─────────┼─────────┤\n",
+       "│ column0     │ BIGINT      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+       "│ patient     │ BIGINT      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+       "│ dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+       "│ date        │ TIMESTAMP   │ YES     │ NULL    │ NULL    │ NULL    │\n",
+       "│ temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+       "└─────────────┴─────────────┴─────────┴─────────┴─────────┴─────────┘"
+      ]
+     },
+     "execution_count": 28,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.sql('''dESCRIBE patient_experiment;''')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "8570b365-09d5-4993-908e-4eaac974204d",
+   "metadata": {},
+   "outputs": [],
    "source": []
   }
  ],

From f01bc969eb0187aeca9913822df91cc19b19f677 Mon Sep 17 00:00:00 2001
From: Geert Jan Bex <geertjan.bex@uhasselt.be>
Date: Thu, 20 Nov 2025 17:33:53 +0100
Subject: [PATCH 04/10] Add notebook on apply method

---
 source-code/pandas/README.md   |   5 +-
 source-code/pandas/apply.ipynb | 360 +++++++++++++++++++++++++++++++++
 2 files changed, 364 insertions(+), 1 deletion(-)
 create mode 100644 source-code/pandas/apply.ipynb

diff --git a/source-code/pandas/README.md b/source-code/pandas/README.md
index 746a50d..313b336 100644
--- a/source-code/pandas/README.md
+++ b/source-code/pandas/README.md
@@ -25,7 +25,10 @@ easy to use.
 1. `pipes.ipynb`: consolidating data processing using pipes.
 1. `screenshots`: screenshots made for the slides.
 1. `generate_csv_files.py`: script to generate CSV files in different
-    formats.
+    formatg.
 1. `copy_on_write.ipynb`: Jupyter notebook that illustrates how data is shared
    between related notebooks and the role Copy-on-Write plays in order to
    prevent accidental data modifications in more than one dataframe.
+1. `apply.ipynb`: Jupyter notebook that illustrates the use of the `apply` method
+   in pandas dataframes for applying functions along rows or columns. It includes
+   a comparison of performance between using `apply` and vectorized operations.
diff --git a/source-code/pandas/apply.ipynb b/source-code/pandas/apply.ipynb
new file mode 100644
index 0000000..35fc9c7
--- /dev/null
+++ b/source-code/pandas/apply.ipynb
@@ -0,0 +1,360 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "c507c033-f47a-40f3-9d9d-d24d23e25474",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import numpy as np\n",
+    "import pandas as pd"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "c973633e-eccd-4a0f-873d-faf43fa3b836",
+   "metadata": {},
+   "source": [
+    "## apply"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "f1401362-5955-495e-be57-5436a7446530",
+   "metadata": {},
+   "source": [
+    "Code that uses `.apply()` looks clean, but it is rather slow when used row-wise (`axis=1`). To quantify this, you can run the example below."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 31,
+   "id": "af048047-df04-4c5f-8b36-d48f53d021ae",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "size = 100_000\n",
+    "df = pd.DataFrame({\n",
+    "    'A': np.random.uniform(0.0, 1.0, size=size),\n",
+    "    'B': np.random.uniform(0.0, 1.0, size=size),\n",
+    "})"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 32,
+   "id": "84b3d0d6-d9c3-4921-8561-80ef6d766f6f",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "<class 'pandas.core.frame.DataFrame'>\n",
+      "RangeIndex: 100000 entries, 0 to 99999\n",
+      "Data columns (total 2 columns):\n",
+      " #   Column  Non-Null Count   Dtype  \n",
+      "---  ------  --------------   -----  \n",
+      " 0   A       100000 non-null  float64\n",
+      " 1   B       100000 non-null  float64\n",
+      "dtypes: float64(2)\n",
+      "memory usage: 1.5 MB\n"
+     ]
+    }
+   ],
+   "source": [
+    "df.info()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "9dfd0c4b-996d-4426-8b58-d66c78124a8f",
+   "metadata": {},
+   "source": [
+    "Note that this dataframe is fairly small."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "d0b672e5-9762-496e-932f-4c5729c62061",
+   "metadata": {},
+   "source": [
+    "### Evaluating a condition"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 38,
+   "id": "093ddcde-ee7f-4d66-847d-221e8181b9dc",
+   "metadata": {
+    "editable": true,
+    "slideshow": {
+     "slide_type": ""
+    },
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "551 ms ± 8.9 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n"
+     ]
+    }
+   ],
+   "source": [
+    "%timeit df.apply(lambda x: 0 if x.A + x.B < 1.0 else 1, axis=1)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 39,
+   "id": "6b10519f-26b5-4c74-af2f-ee34af35e96d",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "1.17 ms ± 5.24 μs per loop (mean ± std. dev. of 7 runs, 1,000 loops each)\n"
+     ]
+    }
+   ],
+   "source": [
+    "%timeit np.select([df.A + df.B < 1.0, df.A + df.B >= 1.0], [0, 1])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 40,
+   "id": "e8b003c0-7445-475e-9ece-68a9783b1388",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "510 μs ± 4.17 μs per loop (mean ± std. dev. of 7 runs, 1,000 loops each)\n"
+     ]
+    }
+   ],
+   "source": [
+    "%timeit np.where(df.A + df.B < 1.0, 0, 1)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "35ebd7e1-48bb-4d3b-860d-f0d765ffa62e",
+   "metadata": {},
+   "source": [
+    "Clearly, `.apply()` is very slow comparted to `np.select()` and `np.where()`.  Note that `np.where()` is faster than `np.select()` by a factor of 2."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 50,
+   "id": "9bc83bfe-680e-4b3d-8017-970cf08fd956",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "assert np.array_equal(\n",
+    "    df.apply(lambda x: 0 if x.A + x.B < 1.0 else 1, axis=1).to_numpy(),\n",
+    "    np.where(df.A + df.B < 1.0, 0, 1),\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 51,
+   "id": "de5e05b5-154e-498c-a565-3116e490ae11",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "assert np.array_equal(\n",
+    "    df.apply(lambda x: 0 if x.A + x.B < 1.0 else 1, axis=1).to_numpy(),\n",
+    "    np.select([df.A + df.B < 1.0, df.A + df.B >= 1.0], [0, 1]),\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "9b46cd48-f1ce-4041-9560-6c1b09556d53",
+   "metadata": {},
+   "source": [
+    "All three approaches produce the same results."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "c63e4df2-6fed-4072-aadd-3256a7c8cede",
+   "metadata": {},
+   "source": [
+    "### Adding a column"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 41,
+   "id": "ef441507-f6f5-4485-b03f-36636259a848",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "563 ms ± 8.58 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n"
+     ]
+    }
+   ],
+   "source": [
+    "%timeit df['C'] = df.apply(lambda x: x.A + x.B, axis=1)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 42,
+   "id": "bd13d78b-b7fd-40c0-8b0e-3bdafdef4b33",
+   "metadata": {
+    "editable": true,
+    "slideshow": {
+     "slide_type": ""
+    },
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "176 μs ± 2.21 μs per loop (mean ± std. dev. of 7 runs, 10,000 loops each)\n"
+     ]
+    }
+   ],
+   "source": [
+    "%timeit df['C'] = df.A + df.B"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "3f092bfc-9f32-4636-ba95-52b2c07d2fdb",
+   "metadata": {},
+   "source": [
+    "Clearly, `.apply()` is very slow comparted to a straightforward column definition.  The difference is a factor of 1,000."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 48,
+   "id": "5c8f3b66-1eea-4e58-9035-f6db4af3df3f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "assert df.apply(lambda x: x.A + x.B, axis=1).equals(df.A + df.B)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "c31c53ea-e297-4658-b55b-35ab47987237",
+   "metadata": {},
+   "source": [
+    "Both approaches yield the same result."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "a32a0791-8063-40ac-83d0-93a5ab796c70",
+   "metadata": {},
+   "source": [
+    "### Aggregating columns"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "8be8ec5b-878b-4452-9815-9c0a23f97d9d",
+   "metadata": {},
+   "source": [
+    "Although less dramatically so, applying `.apply()` along axis 0 is also slower than its numpy counterpart."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 52,
+   "id": "47d6aca2-f52e-4746-a139-119fcdfe3030",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "303 μs ± 4.28 μs per loop (mean ± std. dev. of 7 runs, 1,000 loops each)\n"
+     ]
+    }
+   ],
+   "source": [
+    "%timeit df.apply(np.sum, axis=0)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 54,
+   "id": "1e4ed799-08fd-4c14-bdf0-f6db5b829c0c",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "179 μs ± 10.2 μs per loop (mean ± std. dev. of 7 runs, 10,000 loops each)\n"
+     ]
+    }
+   ],
+   "source": [
+    "%timeit np.sum(df.to_numpy(), axis=0)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 55,
+   "id": "d0504d19-a6d8-4f3d-a4ff-73e9c04152e4",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "assert np.array_equal(df.apply(np.sum, axis=0), np.sum(df.to_numpy(), axis=0))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "ce8fb4ac-795e-43e3-ae72-fa528df86855",
+   "metadata": {},
+   "source": [
+    "Again, both produce the same result."
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.12"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}

From a841ab6918c550d8efb25fd715b00d8a1f12d5a5 Mon Sep 17 00:00:00 2001
From: Geert Jan Bex <geertjan.bex@uhasselt.be>
Date: Thu, 20 Nov 2025 18:32:09 +0100
Subject: [PATCH 05/10] Display pandas version

---
 source-code/pandas/copy_on_write.ipynb | 25 +++++++++++++++++++++++--
 1 file changed, 23 insertions(+), 2 deletions(-)

diff --git a/source-code/pandas/copy_on_write.ipynb b/source-code/pandas/copy_on_write.ipynb
index 744c29b..199cb6f 100644
--- a/source-code/pandas/copy_on_write.ipynb
+++ b/source-code/pandas/copy_on_write.ipynb
@@ -10,7 +10,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 14,
+   "execution_count": 1,
    "id": "9550bae2-79e5-4db6-b8eb-4b64dbc1b4e1",
    "metadata": {},
    "outputs": [],
@@ -37,6 +37,27 @@
     "The answer to that question seems to depend on the version of `pandas`."
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "44918d07-7c0c-45ba-a1bc-04a0fa27c06d",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'2.3.3'"
+      ]
+     },
+     "execution_count": 3,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "pd.__version__"
+   ]
+  },
   {
    "cell_type": "markdown",
    "id": "ea08f1e0-78c1-463c-994c-92066363b006",
@@ -1688,7 +1709,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.12.7"
+   "version": "3.12.12"
   }
  },
  "nbformat": 4,

From abe85d1d31b4642c219caed27459dbd7f5c3198d Mon Sep 17 00:00:00 2001
From: Geert Jan Bex <geertjan.bex@uhasselt.be>
Date: Fri, 21 Nov 2025 10:32:27 +0100
Subject: [PATCH 06/10] Fix typo

---
 source-code/pandas/copy_on_write.ipynb | 728 ++++++++++++-------------
 1 file changed, 364 insertions(+), 364 deletions(-)

diff --git a/source-code/pandas/copy_on_write.ipynb b/source-code/pandas/copy_on_write.ipynb
index 199cb6f..d18c56d 100644
--- a/source-code/pandas/copy_on_write.ipynb
+++ b/source-code/pandas/copy_on_write.ipynb
@@ -39,7 +39,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 2,
    "id": "44918d07-7c0c-45ba-a1bc-04a0fa27c06d",
    "metadata": {},
    "outputs": [
@@ -49,7 +49,7 @@
        "'2.3.3'"
       ]
      },
-     "execution_count": 3,
+     "execution_count": 2,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -76,7 +76,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 15,
+   "execution_count": 3,
    "id": "520bc27d-5d55-46dc-a7bf-5b9b12162b9d",
    "metadata": {},
    "outputs": [],
@@ -91,7 +91,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 16,
+   "execution_count": 4,
    "id": "432772e9-3031-4001-81e3-c346cb7f9c76",
    "metadata": {},
    "outputs": [
@@ -127,7 +127,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 17,
+   "execution_count": 5,
    "id": "eb6f4dad-6df3-493e-869f-204d06b0cc7d",
    "metadata": {},
    "outputs": [
@@ -168,50 +168,50 @@
        "    </tr>\n",
        "    <tr>\n",
        "      <th>mean</th>\n",
-       "      <td>4.225888</td>\n",
-       "      <td>1.284407</td>\n",
-       "      <td>-2.830820</td>\n",
-       "      <td>0.143920</td>\n",
+       "      <td>-0.666188</td>\n",
+       "      <td>-0.175422</td>\n",
+       "      <td>4.077410</td>\n",
+       "      <td>2.294040</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>std</th>\n",
-       "      <td>577.759840</td>\n",
-       "      <td>577.063194</td>\n",
-       "      <td>577.528168</td>\n",
-       "      <td>576.729627</td>\n",
+       "      <td>576.312351</td>\n",
+       "      <td>576.718069</td>\n",
+       "      <td>577.017098</td>\n",
+       "      <td>577.149466</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>min</th>\n",
-       "      <td>-999.977694</td>\n",
-       "      <td>-999.908941</td>\n",
+       "      <td>-999.995592</td>\n",
+       "      <td>-999.992864</td>\n",
        "      <td>-999.000000</td>\n",
        "      <td>-999.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>25%</th>\n",
-       "      <td>-495.491551</td>\n",
-       "      <td>-497.783061</td>\n",
-       "      <td>-506.000000</td>\n",
+       "      <td>-499.708991</td>\n",
+       "      <td>-497.766770</td>\n",
+       "      <td>-496.000000</td>\n",
        "      <td>-499.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>50%</th>\n",
-       "      <td>4.748510</td>\n",
-       "      <td>2.103870</td>\n",
-       "      <td>-4.000000</td>\n",
-       "      <td>0.000000</td>\n",
+       "      <td>-1.080819</td>\n",
+       "      <td>-0.135347</td>\n",
+       "      <td>2.000000</td>\n",
+       "      <td>6.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>75%</th>\n",
-       "      <td>505.160586</td>\n",
-       "      <td>500.502871</td>\n",
-       "      <td>497.000000</td>\n",
-       "      <td>498.000000</td>\n",
+       "      <td>498.134233</td>\n",
+       "      <td>495.339400</td>\n",
+       "      <td>504.000000</td>\n",
+       "      <td>501.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>max</th>\n",
-       "      <td>999.992940</td>\n",
-       "      <td>999.947904</td>\n",
+       "      <td>999.976901</td>\n",
+       "      <td>999.997666</td>\n",
        "      <td>999.000000</td>\n",
        "      <td>999.000000</td>\n",
        "    </tr>\n",
@@ -222,16 +222,16 @@
       "text/plain": [
        "             column1        column2        column3        column4\n",
        "count  100000.000000  100000.000000  100000.000000  100000.000000\n",
-       "mean        4.225888       1.284407      -2.830820       0.143920\n",
-       "std       577.759840     577.063194     577.528168     576.729627\n",
-       "min      -999.977694    -999.908941    -999.000000    -999.000000\n",
-       "25%      -495.491551    -497.783061    -506.000000    -499.000000\n",
-       "50%         4.748510       2.103870      -4.000000       0.000000\n",
-       "75%       505.160586     500.502871     497.000000     498.000000\n",
-       "max       999.992940     999.947904     999.000000     999.000000"
+       "mean       -0.666188      -0.175422       4.077410       2.294040\n",
+       "std       576.312351     576.718069     577.017098     577.149466\n",
+       "min      -999.995592    -999.992864    -999.000000    -999.000000\n",
+       "25%      -499.708991    -497.766770    -496.000000    -499.000000\n",
+       "50%        -1.080819      -0.135347       2.000000       6.000000\n",
+       "75%       498.134233     495.339400     504.000000     501.000000\n",
+       "max       999.976901     999.997666     999.000000     999.000000"
       ]
      },
-     "execution_count": 17,
+     "execution_count": 5,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -250,7 +250,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 18,
+   "execution_count": 6,
    "id": "1a43e7eb-a7ad-4089-95ba-15879f5920ce",
    "metadata": {},
    "outputs": [],
@@ -260,7 +260,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 19,
+   "execution_count": 7,
    "id": "1af4b0bc-81eb-4dab-9a65-fb5f71d004c2",
    "metadata": {},
    "outputs": [
@@ -296,56 +296,56 @@
        "      <th>count</th>\n",
        "      <td>50000.000000</td>\n",
        "      <td>50000.000000</td>\n",
-       "      <td>50000.00000</td>\n",
+       "      <td>50000.000000</td>\n",
        "      <td>50000.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>mean</th>\n",
-       "      <td>4.828118</td>\n",
-       "      <td>0.964712</td>\n",
-       "      <td>-2.11148</td>\n",
-       "      <td>-3.656300</td>\n",
+       "      <td>-0.119765</td>\n",
+       "      <td>-2.058561</td>\n",
+       "      <td>-0.764240</td>\n",
+       "      <td>3.063220</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>std</th>\n",
-       "      <td>577.936131</td>\n",
-       "      <td>577.971021</td>\n",
-       "      <td>577.96331</td>\n",
-       "      <td>576.181292</td>\n",
+       "      <td>575.680081</td>\n",
+       "      <td>578.254495</td>\n",
+       "      <td>577.348834</td>\n",
+       "      <td>577.086857</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>min</th>\n",
-       "      <td>-999.944283</td>\n",
-       "      <td>-999.897600</td>\n",
-       "      <td>-999.00000</td>\n",
+       "      <td>-999.933748</td>\n",
+       "      <td>-999.992864</td>\n",
+       "      <td>-999.000000</td>\n",
        "      <td>-999.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>25%</th>\n",
-       "      <td>-493.817751</td>\n",
-       "      <td>-500.003775</td>\n",
-       "      <td>-504.00000</td>\n",
-       "      <td>-503.000000</td>\n",
+       "      <td>-499.293681</td>\n",
+       "      <td>-499.616524</td>\n",
+       "      <td>-501.000000</td>\n",
+       "      <td>-498.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>50%</th>\n",
-       "      <td>4.462345</td>\n",
-       "      <td>3.577384</td>\n",
-       "      <td>-6.00000</td>\n",
-       "      <td>-2.000000</td>\n",
+       "      <td>-1.213840</td>\n",
+       "      <td>-4.281987</td>\n",
+       "      <td>-3.000000</td>\n",
+       "      <td>10.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>75%</th>\n",
-       "      <td>503.114598</td>\n",
-       "      <td>500.886860</td>\n",
-       "      <td>501.00000</td>\n",
-       "      <td>494.000000</td>\n",
+       "      <td>498.062126</td>\n",
+       "      <td>495.209044</td>\n",
+       "      <td>500.000000</td>\n",
+       "      <td>499.250000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>max</th>\n",
-       "      <td>999.964569</td>\n",
-       "      <td>999.864196</td>\n",
-       "      <td>999.00000</td>\n",
+       "      <td>999.976901</td>\n",
+       "      <td>999.997666</td>\n",
+       "      <td>999.000000</td>\n",
        "      <td>999.000000</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
@@ -353,18 +353,18 @@
        "</div>"
       ],
       "text/plain": [
-       "            column1       column2      column3       column4\n",
-       "count  50000.000000  50000.000000  50000.00000  50000.000000\n",
-       "mean       4.828118      0.964712     -2.11148     -3.656300\n",
-       "std      577.936131    577.971021    577.96331    576.181292\n",
-       "min     -999.944283   -999.897600   -999.00000   -999.000000\n",
-       "25%     -493.817751   -500.003775   -504.00000   -503.000000\n",
-       "50%        4.462345      3.577384     -6.00000     -2.000000\n",
-       "75%      503.114598    500.886860    501.00000    494.000000\n",
-       "max      999.964569    999.864196    999.00000    999.000000"
+       "            column1       column2       column3       column4\n",
+       "count  50000.000000  50000.000000  50000.000000  50000.000000\n",
+       "mean      -0.119765     -2.058561     -0.764240      3.063220\n",
+       "std      575.680081    578.254495    577.348834    577.086857\n",
+       "min     -999.933748   -999.992864   -999.000000   -999.000000\n",
+       "25%     -499.293681   -499.616524   -501.000000   -498.000000\n",
+       "50%       -1.213840     -4.281987     -3.000000     10.000000\n",
+       "75%      498.062126    495.209044    500.000000    499.250000\n",
+       "max      999.976901    999.997666    999.000000    999.000000"
       ]
      },
-     "execution_count": 19,
+     "execution_count": 7,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -383,7 +383,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 20,
+   "execution_count": 8,
    "id": "65dfb904-0b0a-4b4a-baab-77011a840910",
    "metadata": {},
    "outputs": [
@@ -391,7 +391,7 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "/tmp/ipykernel_565/3787905307.py:1: FutureWarning: A value is trying to be set on a copy of a DataFrame or Series through chained assignment using an inplace method.\n",
+      "/tmp/ipykernel_15868/3787905307.py:1: FutureWarning: A value is trying to be set on a copy of a DataFrame or Series through chained assignment using an inplace method.\n",
       "The behavior will change in pandas 3.0. This inplace method will never work because the intermediate object on which we are setting values always behaves as a copy.\n",
       "\n",
       "For example, when doing 'df[col].method(value, inplace=True)', try using 'df.method({col: value}, inplace=True)' or df[col] = df[col].method(value) instead, to perform the operation inplace on the original object.\n",
@@ -407,7 +407,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 21,
+   "execution_count": 9,
    "id": "cbeb2db9-7018-4cac-9dd4-2880d2f7a214",
    "metadata": {},
    "outputs": [
@@ -443,56 +443,56 @@
        "      <th>count</th>\n",
        "      <td>50000.000000</td>\n",
        "      <td>50000.000000</td>\n",
-       "      <td>50000.00000</td>\n",
+       "      <td>50000.000000</td>\n",
        "      <td>50000.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>mean</th>\n",
-       "      <td>2.605923</td>\n",
-       "      <td>0.964712</td>\n",
-       "      <td>-2.11148</td>\n",
-       "      <td>-3.656300</td>\n",
+       "      <td>0.147446</td>\n",
+       "      <td>-2.058561</td>\n",
+       "      <td>-0.764240</td>\n",
+       "      <td>3.063220</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>std</th>\n",
-       "      <td>408.136559</td>\n",
-       "      <td>577.971021</td>\n",
-       "      <td>577.96331</td>\n",
-       "      <td>576.181292</td>\n",
+       "      <td>407.380662</td>\n",
+       "      <td>578.254495</td>\n",
+       "      <td>577.348834</td>\n",
+       "      <td>577.086857</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>min</th>\n",
        "      <td>-500.000000</td>\n",
-       "      <td>-999.897600</td>\n",
-       "      <td>-999.00000</td>\n",
+       "      <td>-999.992864</td>\n",
+       "      <td>-999.000000</td>\n",
        "      <td>-999.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>25%</th>\n",
-       "      <td>-493.817751</td>\n",
-       "      <td>-500.003775</td>\n",
-       "      <td>-504.00000</td>\n",
-       "      <td>-503.000000</td>\n",
+       "      <td>-499.293681</td>\n",
+       "      <td>-499.616524</td>\n",
+       "      <td>-501.000000</td>\n",
+       "      <td>-498.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>50%</th>\n",
-       "      <td>4.462345</td>\n",
-       "      <td>3.577384</td>\n",
-       "      <td>-6.00000</td>\n",
-       "      <td>-2.000000</td>\n",
+       "      <td>-1.213840</td>\n",
+       "      <td>-4.281987</td>\n",
+       "      <td>-3.000000</td>\n",
+       "      <td>10.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>75%</th>\n",
+       "      <td>498.062126</td>\n",
+       "      <td>495.209044</td>\n",
        "      <td>500.000000</td>\n",
-       "      <td>500.886860</td>\n",
-       "      <td>501.00000</td>\n",
-       "      <td>494.000000</td>\n",
+       "      <td>499.250000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>max</th>\n",
        "      <td>500.000000</td>\n",
-       "      <td>999.864196</td>\n",
-       "      <td>999.00000</td>\n",
+       "      <td>999.997666</td>\n",
+       "      <td>999.000000</td>\n",
        "      <td>999.000000</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
@@ -500,18 +500,18 @@
        "</div>"
       ],
       "text/plain": [
-       "            column1       column2      column3       column4\n",
-       "count  50000.000000  50000.000000  50000.00000  50000.000000\n",
-       "mean       2.605923      0.964712     -2.11148     -3.656300\n",
-       "std      408.136559    577.971021    577.96331    576.181292\n",
-       "min     -500.000000   -999.897600   -999.00000   -999.000000\n",
-       "25%     -493.817751   -500.003775   -504.00000   -503.000000\n",
-       "50%        4.462345      3.577384     -6.00000     -2.000000\n",
-       "75%      500.000000    500.886860    501.00000    494.000000\n",
-       "max      500.000000    999.864196    999.00000    999.000000"
+       "            column1       column2       column3       column4\n",
+       "count  50000.000000  50000.000000  50000.000000  50000.000000\n",
+       "mean       0.147446     -2.058561     -0.764240      3.063220\n",
+       "std      407.380662    578.254495    577.348834    577.086857\n",
+       "min     -500.000000   -999.992864   -999.000000   -999.000000\n",
+       "25%     -499.293681   -499.616524   -501.000000   -498.000000\n",
+       "50%       -1.213840     -4.281987     -3.000000     10.000000\n",
+       "75%      498.062126    495.209044    500.000000    499.250000\n",
+       "max      500.000000    999.997666    999.000000    999.000000"
       ]
      },
-     "execution_count": 21,
+     "execution_count": 9,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -564,7 +564,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 22,
+   "execution_count": 10,
    "id": "b4cff949-c4aa-4f7d-b1e4-b4b78bf0284b",
    "metadata": {},
    "outputs": [],
@@ -582,7 +582,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 23,
+   "execution_count": 11,
    "id": "6bb4fec9-0623-4482-8ebd-9077723956e0",
    "metadata": {},
    "outputs": [],
@@ -597,7 +597,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 24,
+   "execution_count": 12,
    "id": "f005ad9f-3b19-40bf-b01a-4f7fd8f4d024",
    "metadata": {},
    "outputs": [],
@@ -607,7 +607,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 25,
+   "execution_count": 13,
    "id": "91499993-8461-437d-b7b1-7f0caf20d7d6",
    "metadata": {},
    "outputs": [
@@ -648,50 +648,50 @@
        "    </tr>\n",
        "    <tr>\n",
        "      <th>mean</th>\n",
-       "      <td>1.695724</td>\n",
-       "      <td>-3.040382</td>\n",
-       "      <td>4.001460</td>\n",
-       "      <td>0.511100</td>\n",
+       "      <td>0.455395</td>\n",
+       "      <td>5.588258</td>\n",
+       "      <td>1.329300</td>\n",
+       "      <td>1.763540</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>std</th>\n",
-       "      <td>578.627560</td>\n",
-       "      <td>576.453798</td>\n",
-       "      <td>576.244217</td>\n",
-       "      <td>578.301376</td>\n",
+       "      <td>577.070175</td>\n",
+       "      <td>577.342945</td>\n",
+       "      <td>577.130306</td>\n",
+       "      <td>575.554149</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>min</th>\n",
-       "      <td>-999.983952</td>\n",
-       "      <td>-999.968792</td>\n",
+       "      <td>-999.965920</td>\n",
+       "      <td>-999.963945</td>\n",
        "      <td>-999.000000</td>\n",
        "      <td>-999.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>25%</th>\n",
-       "      <td>-502.160012</td>\n",
-       "      <td>-500.333306</td>\n",
-       "      <td>-492.250000</td>\n",
-       "      <td>-498.000000</td>\n",
+       "      <td>-500.420461</td>\n",
+       "      <td>-495.503431</td>\n",
+       "      <td>-497.000000</td>\n",
+       "      <td>-493.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>50%</th>\n",
-       "      <td>4.057258</td>\n",
-       "      <td>-4.377464</td>\n",
+       "      <td>3.895165</td>\n",
+       "      <td>9.582978</td>\n",
        "      <td>3.000000</td>\n",
-       "      <td>0.000000</td>\n",
+       "      <td>1.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>75%</th>\n",
-       "      <td>502.159214</td>\n",
-       "      <td>494.614704</td>\n",
-       "      <td>499.000000</td>\n",
-       "      <td>500.250000</td>\n",
+       "      <td>496.851678</td>\n",
+       "      <td>505.826690</td>\n",
+       "      <td>501.000000</td>\n",
+       "      <td>499.250000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>max</th>\n",
-       "      <td>999.998666</td>\n",
-       "      <td>999.913716</td>\n",
+       "      <td>999.979256</td>\n",
+       "      <td>999.948488</td>\n",
        "      <td>999.000000</td>\n",
        "      <td>999.000000</td>\n",
        "    </tr>\n",
@@ -702,16 +702,16 @@
       "text/plain": [
        "            column1       column2       column3       column4\n",
        "count  50000.000000  50000.000000  50000.000000  50000.000000\n",
-       "mean       1.695724     -3.040382      4.001460      0.511100\n",
-       "std      578.627560    576.453798    576.244217    578.301376\n",
-       "min     -999.983952   -999.968792   -999.000000   -999.000000\n",
-       "25%     -502.160012   -500.333306   -492.250000   -498.000000\n",
-       "50%        4.057258     -4.377464      3.000000      0.000000\n",
-       "75%      502.159214    494.614704    499.000000    500.250000\n",
-       "max      999.998666    999.913716    999.000000    999.000000"
+       "mean       0.455395      5.588258      1.329300      1.763540\n",
+       "std      577.070175    577.342945    577.130306    575.554149\n",
+       "min     -999.965920   -999.963945   -999.000000   -999.000000\n",
+       "25%     -500.420461   -495.503431   -497.000000   -493.000000\n",
+       "50%        3.895165      9.582978      3.000000      1.000000\n",
+       "75%      496.851678    505.826690    501.000000    499.250000\n",
+       "max      999.979256    999.948488    999.000000    999.000000"
       ]
      },
-     "execution_count": 25,
+     "execution_count": 13,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -722,7 +722,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 26,
+   "execution_count": 14,
    "id": "abf7f30b-2bd0-4b3b-94fd-f9b6f183b26b",
    "metadata": {},
    "outputs": [
@@ -730,7 +730,7 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "/tmp/ipykernel_565/3016868282.py:1: ChainedAssignmentError: A value is trying to be set on a copy of a DataFrame or Series through chained assignment using an inplace method.\n",
+      "/tmp/ipykernel_15868/3016868282.py:1: ChainedAssignmentError: A value is trying to be set on a copy of a DataFrame or Series through chained assignment using an inplace method.\n",
       "When using the Copy-on-Write mode, such inplace method never works to update the original DataFrame or Series, because the intermediate object on which we are setting values always behaves as a copy.\n",
       "\n",
       "For example, when doing 'df[col].method(value, inplace=True)', try using 'df.method({col: value}, inplace=True)' instead, to perform the operation inplace on the original object.\n",
@@ -754,7 +754,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 28,
+   "execution_count": 15,
    "id": "34e80602-a9fa-44d2-9fbb-3b6d4bd6a3d3",
    "metadata": {},
    "outputs": [
@@ -795,50 +795,50 @@
        "    </tr>\n",
        "    <tr>\n",
        "      <th>mean</th>\n",
-       "      <td>1.695724</td>\n",
-       "      <td>-3.040382</td>\n",
-       "      <td>4.001460</td>\n",
-       "      <td>0.511100</td>\n",
+       "      <td>0.455395</td>\n",
+       "      <td>5.588258</td>\n",
+       "      <td>1.329300</td>\n",
+       "      <td>1.763540</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>std</th>\n",
-       "      <td>578.627560</td>\n",
-       "      <td>576.453798</td>\n",
-       "      <td>576.244217</td>\n",
-       "      <td>578.301376</td>\n",
+       "      <td>577.070175</td>\n",
+       "      <td>577.342945</td>\n",
+       "      <td>577.130306</td>\n",
+       "      <td>575.554149</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>min</th>\n",
-       "      <td>-999.983952</td>\n",
-       "      <td>-999.968792</td>\n",
+       "      <td>-999.965920</td>\n",
+       "      <td>-999.963945</td>\n",
        "      <td>-999.000000</td>\n",
        "      <td>-999.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>25%</th>\n",
-       "      <td>-502.160012</td>\n",
-       "      <td>-500.333306</td>\n",
-       "      <td>-492.250000</td>\n",
-       "      <td>-498.000000</td>\n",
+       "      <td>-500.420461</td>\n",
+       "      <td>-495.503431</td>\n",
+       "      <td>-497.000000</td>\n",
+       "      <td>-493.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>50%</th>\n",
-       "      <td>4.057258</td>\n",
-       "      <td>-4.377464</td>\n",
+       "      <td>3.895165</td>\n",
+       "      <td>9.582978</td>\n",
        "      <td>3.000000</td>\n",
-       "      <td>0.000000</td>\n",
+       "      <td>1.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>75%</th>\n",
-       "      <td>502.159214</td>\n",
-       "      <td>494.614704</td>\n",
-       "      <td>499.000000</td>\n",
-       "      <td>500.250000</td>\n",
+       "      <td>496.851678</td>\n",
+       "      <td>505.826690</td>\n",
+       "      <td>501.000000</td>\n",
+       "      <td>499.250000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>max</th>\n",
-       "      <td>999.998666</td>\n",
-       "      <td>999.913716</td>\n",
+       "      <td>999.979256</td>\n",
+       "      <td>999.948488</td>\n",
        "      <td>999.000000</td>\n",
        "      <td>999.000000</td>\n",
        "    </tr>\n",
@@ -849,16 +849,16 @@
       "text/plain": [
        "            column1       column2       column3       column4\n",
        "count  50000.000000  50000.000000  50000.000000  50000.000000\n",
-       "mean       1.695724     -3.040382      4.001460      0.511100\n",
-       "std      578.627560    576.453798    576.244217    578.301376\n",
-       "min     -999.983952   -999.968792   -999.000000   -999.000000\n",
-       "25%     -502.160012   -500.333306   -492.250000   -498.000000\n",
-       "50%        4.057258     -4.377464      3.000000      0.000000\n",
-       "75%      502.159214    494.614704    499.000000    500.250000\n",
-       "max      999.998666    999.913716    999.000000    999.000000"
+       "mean       0.455395      5.588258      1.329300      1.763540\n",
+       "std      577.070175    577.342945    577.130306    575.554149\n",
+       "min     -999.965920   -999.963945   -999.000000   -999.000000\n",
+       "25%     -500.420461   -495.503431   -497.000000   -493.000000\n",
+       "50%        3.895165      9.582978      3.000000      1.000000\n",
+       "75%      496.851678    505.826690    501.000000    499.250000\n",
+       "max      999.979256    999.948488    999.000000    999.000000"
       ]
      },
-     "execution_count": 28,
+     "execution_count": 15,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -877,7 +877,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 29,
+   "execution_count": 16,
    "id": "acc94632-2ed2-4dc1-a067-6d9518044c7b",
    "metadata": {},
    "outputs": [
@@ -913,56 +913,56 @@
        "      <th>count</th>\n",
        "      <td>100000.000000</td>\n",
        "      <td>100000.000000</td>\n",
-       "      <td>100000.00000</td>\n",
+       "      <td>100000.000000</td>\n",
        "      <td>100000.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>mean</th>\n",
-       "      <td>1.623964</td>\n",
-       "      <td>-3.764614</td>\n",
-       "      <td>1.34378</td>\n",
-       "      <td>1.478400</td>\n",
+       "      <td>0.540672</td>\n",
+       "      <td>4.948220</td>\n",
+       "      <td>1.349060</td>\n",
+       "      <td>1.572440</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>std</th>\n",
-       "      <td>577.971329</td>\n",
-       "      <td>577.167935</td>\n",
-       "      <td>575.56337</td>\n",
-       "      <td>577.826276</td>\n",
+       "      <td>577.009925</td>\n",
+       "      <td>577.169270</td>\n",
+       "      <td>576.321436</td>\n",
+       "      <td>576.108494</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>min</th>\n",
-       "      <td>-999.983952</td>\n",
-       "      <td>-999.980827</td>\n",
-       "      <td>-999.00000</td>\n",
+       "      <td>-999.965920</td>\n",
+       "      <td>-999.988117</td>\n",
+       "      <td>-999.000000</td>\n",
        "      <td>-999.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>25%</th>\n",
-       "      <td>-499.179172</td>\n",
-       "      <td>-503.072353</td>\n",
-       "      <td>-497.00000</td>\n",
-       "      <td>-497.000000</td>\n",
+       "      <td>-499.069860</td>\n",
+       "      <td>-494.820546</td>\n",
+       "      <td>-496.000000</td>\n",
+       "      <td>-496.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>50%</th>\n",
-       "      <td>3.133260</td>\n",
-       "      <td>-5.691740</td>\n",
-       "      <td>1.00000</td>\n",
-       "      <td>2.000000</td>\n",
+       "      <td>2.821413</td>\n",
+       "      <td>5.823958</td>\n",
+       "      <td>3.000000</td>\n",
+       "      <td>1.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>75%</th>\n",
-       "      <td>502.454035</td>\n",
-       "      <td>495.773629</td>\n",
-       "      <td>497.00000</td>\n",
+       "      <td>499.807599</td>\n",
+       "      <td>505.991898</td>\n",
        "      <td>501.000000</td>\n",
+       "      <td>500.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>max</th>\n",
-       "      <td>999.998666</td>\n",
-       "      <td>999.985790</td>\n",
-       "      <td>999.00000</td>\n",
+       "      <td>999.984508</td>\n",
+       "      <td>999.948488</td>\n",
+       "      <td>999.000000</td>\n",
        "      <td>999.000000</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
@@ -970,18 +970,18 @@
        "</div>"
       ],
       "text/plain": [
-       "             column1        column2       column3        column4\n",
-       "count  100000.000000  100000.000000  100000.00000  100000.000000\n",
-       "mean        1.623964      -3.764614       1.34378       1.478400\n",
-       "std       577.971329     577.167935     575.56337     577.826276\n",
-       "min      -999.983952    -999.980827    -999.00000    -999.000000\n",
-       "25%      -499.179172    -503.072353    -497.00000    -497.000000\n",
-       "50%         3.133260      -5.691740       1.00000       2.000000\n",
-       "75%       502.454035     495.773629     497.00000     501.000000\n",
-       "max       999.998666     999.985790     999.00000     999.000000"
+       "             column1        column2        column3        column4\n",
+       "count  100000.000000  100000.000000  100000.000000  100000.000000\n",
+       "mean        0.540672       4.948220       1.349060       1.572440\n",
+       "std       577.009925     577.169270     576.321436     576.108494\n",
+       "min      -999.965920    -999.988117    -999.000000    -999.000000\n",
+       "25%      -499.069860    -494.820546    -496.000000    -496.000000\n",
+       "50%         2.821413       5.823958       3.000000       1.000000\n",
+       "75%       499.807599     505.991898     501.000000     500.000000\n",
+       "max       999.984508     999.948488     999.000000     999.000000"
       ]
      },
-     "execution_count": 29,
+     "execution_count": 16,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -1000,7 +1000,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 30,
+   "execution_count": 17,
    "id": "1b86dd08-d8de-4b03-a363-80d18201b4da",
    "metadata": {},
    "outputs": [],
@@ -1018,7 +1018,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 31,
+   "execution_count": 18,
    "id": "dea886ac-e1a2-4903-b550-e73a2be70507",
    "metadata": {},
    "outputs": [
@@ -1059,50 +1059,50 @@
        "    </tr>\n",
        "    <tr>\n",
        "      <th>mean</th>\n",
-       "      <td>1.695724</td>\n",
-       "      <td>-3.040382</td>\n",
-       "      <td>4.001460</td>\n",
-       "      <td>0.511100</td>\n",
+       "      <td>0.455395</td>\n",
+       "      <td>5.588258</td>\n",
+       "      <td>1.329300</td>\n",
+       "      <td>1.763540</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>std</th>\n",
-       "      <td>578.627560</td>\n",
-       "      <td>576.453798</td>\n",
-       "      <td>576.244217</td>\n",
-       "      <td>578.301376</td>\n",
+       "      <td>577.070175</td>\n",
+       "      <td>577.342945</td>\n",
+       "      <td>577.130306</td>\n",
+       "      <td>575.554149</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>min</th>\n",
-       "      <td>-999.983952</td>\n",
-       "      <td>-999.968792</td>\n",
+       "      <td>-999.965920</td>\n",
+       "      <td>-999.963945</td>\n",
        "      <td>-999.000000</td>\n",
        "      <td>-999.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>25%</th>\n",
-       "      <td>-502.160012</td>\n",
-       "      <td>-500.333306</td>\n",
-       "      <td>-492.250000</td>\n",
-       "      <td>-498.000000</td>\n",
+       "      <td>-500.420461</td>\n",
+       "      <td>-495.503431</td>\n",
+       "      <td>-497.000000</td>\n",
+       "      <td>-493.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>50%</th>\n",
-       "      <td>4.057258</td>\n",
-       "      <td>-4.377464</td>\n",
+       "      <td>3.895165</td>\n",
+       "      <td>9.582978</td>\n",
        "      <td>3.000000</td>\n",
-       "      <td>0.000000</td>\n",
+       "      <td>1.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>75%</th>\n",
-       "      <td>502.159214</td>\n",
-       "      <td>494.614704</td>\n",
-       "      <td>499.000000</td>\n",
-       "      <td>500.250000</td>\n",
+       "      <td>496.851678</td>\n",
+       "      <td>505.826690</td>\n",
+       "      <td>501.000000</td>\n",
+       "      <td>499.250000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>max</th>\n",
-       "      <td>999.998666</td>\n",
-       "      <td>999.913716</td>\n",
+       "      <td>999.979256</td>\n",
+       "      <td>999.948488</td>\n",
        "      <td>999.000000</td>\n",
        "      <td>999.000000</td>\n",
        "    </tr>\n",
@@ -1113,16 +1113,16 @@
       "text/plain": [
        "            column1       column2       column3       column4\n",
        "count  50000.000000  50000.000000  50000.000000  50000.000000\n",
-       "mean       1.695724     -3.040382      4.001460      0.511100\n",
-       "std      578.627560    576.453798    576.244217    578.301376\n",
-       "min     -999.983952   -999.968792   -999.000000   -999.000000\n",
-       "25%     -502.160012   -500.333306   -492.250000   -498.000000\n",
-       "50%        4.057258     -4.377464      3.000000      0.000000\n",
-       "75%      502.159214    494.614704    499.000000    500.250000\n",
-       "max      999.998666    999.913716    999.000000    999.000000"
+       "mean       0.455395      5.588258      1.329300      1.763540\n",
+       "std      577.070175    577.342945    577.130306    575.554149\n",
+       "min     -999.965920   -999.963945   -999.000000   -999.000000\n",
+       "25%     -500.420461   -495.503431   -497.000000   -493.000000\n",
+       "50%        3.895165      9.582978      3.000000      1.000000\n",
+       "75%      496.851678    505.826690    501.000000    499.250000\n",
+       "max      999.979256    999.948488    999.000000    999.000000"
       ]
      },
-     "execution_count": 31,
+     "execution_count": 18,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -1141,7 +1141,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 32,
+   "execution_count": 19,
    "id": "c73063c8-4e9d-42ba-9804-1286b769ad54",
    "metadata": {},
    "outputs": [
@@ -1177,56 +1177,56 @@
        "      <th>count</th>\n",
        "      <td>100000.000000</td>\n",
        "      <td>100000.000000</td>\n",
-       "      <td>100000.00000</td>\n",
+       "      <td>100000.000000</td>\n",
        "      <td>100000.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>mean</th>\n",
-       "      <td>1.174175</td>\n",
-       "      <td>-3.764614</td>\n",
-       "      <td>1.34378</td>\n",
-       "      <td>1.478400</td>\n",
+       "      <td>0.653302</td>\n",
+       "      <td>4.948220</td>\n",
+       "      <td>1.349060</td>\n",
+       "      <td>1.572440</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>std</th>\n",
-       "      <td>408.414807</td>\n",
-       "      <td>577.167935</td>\n",
-       "      <td>575.56337</td>\n",
-       "      <td>577.826276</td>\n",
+       "      <td>408.053983</td>\n",
+       "      <td>577.169270</td>\n",
+       "      <td>576.321436</td>\n",
+       "      <td>576.108494</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>min</th>\n",
        "      <td>-500.000000</td>\n",
-       "      <td>-999.980827</td>\n",
-       "      <td>-999.00000</td>\n",
+       "      <td>-999.988117</td>\n",
+       "      <td>-999.000000</td>\n",
        "      <td>-999.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>25%</th>\n",
-       "      <td>-499.179172</td>\n",
-       "      <td>-503.072353</td>\n",
-       "      <td>-497.00000</td>\n",
-       "      <td>-497.000000</td>\n",
+       "      <td>-499.069860</td>\n",
+       "      <td>-494.820546</td>\n",
+       "      <td>-496.000000</td>\n",
+       "      <td>-496.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>50%</th>\n",
-       "      <td>3.133260</td>\n",
-       "      <td>-5.691740</td>\n",
-       "      <td>1.00000</td>\n",
-       "      <td>2.000000</td>\n",
+       "      <td>2.821413</td>\n",
+       "      <td>5.823958</td>\n",
+       "      <td>3.000000</td>\n",
+       "      <td>1.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>75%</th>\n",
-       "      <td>500.000000</td>\n",
-       "      <td>495.773629</td>\n",
-       "      <td>497.00000</td>\n",
+       "      <td>499.807599</td>\n",
+       "      <td>505.991898</td>\n",
        "      <td>501.000000</td>\n",
+       "      <td>500.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>max</th>\n",
        "      <td>500.000000</td>\n",
-       "      <td>999.985790</td>\n",
-       "      <td>999.00000</td>\n",
+       "      <td>999.948488</td>\n",
+       "      <td>999.000000</td>\n",
        "      <td>999.000000</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
@@ -1234,18 +1234,18 @@
        "</div>"
       ],
       "text/plain": [
-       "             column1        column2       column3        column4\n",
-       "count  100000.000000  100000.000000  100000.00000  100000.000000\n",
-       "mean        1.174175      -3.764614       1.34378       1.478400\n",
-       "std       408.414807     577.167935     575.56337     577.826276\n",
-       "min      -500.000000    -999.980827    -999.00000    -999.000000\n",
-       "25%      -499.179172    -503.072353    -497.00000    -497.000000\n",
-       "50%         3.133260      -5.691740       1.00000       2.000000\n",
-       "75%       500.000000     495.773629     497.00000     501.000000\n",
-       "max       500.000000     999.985790     999.00000     999.000000"
+       "             column1        column2        column3        column4\n",
+       "count  100000.000000  100000.000000  100000.000000  100000.000000\n",
+       "mean        0.653302       4.948220       1.349060       1.572440\n",
+       "std       408.053983     577.169270     576.321436     576.108494\n",
+       "min      -500.000000    -999.988117    -999.000000    -999.000000\n",
+       "25%      -499.069860    -494.820546    -496.000000    -496.000000\n",
+       "50%         2.821413       5.823958       3.000000       1.000000\n",
+       "75%       499.807599     505.991898     501.000000     500.000000\n",
+       "max       500.000000     999.948488     999.000000     999.000000"
       ]
      },
-     "execution_count": 32,
+     "execution_count": 19,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -1264,7 +1264,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 33,
+   "execution_count": 20,
    "id": "1151d8a4-db49-4524-b7f3-bd38866e3d5e",
    "metadata": {},
    "outputs": [],
@@ -1274,7 +1274,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 34,
+   "execution_count": 21,
    "id": "bd8ce0d1-73cb-4982-b4fe-65e7d2144943",
    "metadata": {},
    "outputs": [
@@ -1310,56 +1310,56 @@
        "      <th>count</th>\n",
        "      <td>100000.000000</td>\n",
        "      <td>100000.000000</td>\n",
-       "      <td>100000.00000</td>\n",
+       "      <td>100000.000000</td>\n",
        "      <td>100000.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>mean</th>\n",
-       "      <td>1.174175</td>\n",
-       "      <td>-2.876739</td>\n",
-       "      <td>1.34378</td>\n",
-       "      <td>1.478400</td>\n",
+       "      <td>0.653302</td>\n",
+       "      <td>3.035664</td>\n",
+       "      <td>1.349060</td>\n",
+       "      <td>1.572440</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>std</th>\n",
-       "      <td>408.414807</td>\n",
-       "      <td>408.107880</td>\n",
-       "      <td>575.56337</td>\n",
-       "      <td>577.826276</td>\n",
+       "      <td>408.053983</td>\n",
+       "      <td>408.488775</td>\n",
+       "      <td>576.321436</td>\n",
+       "      <td>576.108494</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>min</th>\n",
        "      <td>-500.000000</td>\n",
        "      <td>-500.000000</td>\n",
-       "      <td>-999.00000</td>\n",
+       "      <td>-999.000000</td>\n",
        "      <td>-999.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>25%</th>\n",
-       "      <td>-499.179172</td>\n",
-       "      <td>-500.000000</td>\n",
-       "      <td>-497.00000</td>\n",
-       "      <td>-497.000000</td>\n",
+       "      <td>-499.069860</td>\n",
+       "      <td>-494.820546</td>\n",
+       "      <td>-496.000000</td>\n",
+       "      <td>-496.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>50%</th>\n",
-       "      <td>3.133260</td>\n",
-       "      <td>-5.691740</td>\n",
-       "      <td>1.00000</td>\n",
-       "      <td>2.000000</td>\n",
+       "      <td>2.821413</td>\n",
+       "      <td>5.823958</td>\n",
+       "      <td>3.000000</td>\n",
+       "      <td>1.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>75%</th>\n",
+       "      <td>499.807599</td>\n",
        "      <td>500.000000</td>\n",
-       "      <td>495.773629</td>\n",
-       "      <td>497.00000</td>\n",
        "      <td>501.000000</td>\n",
+       "      <td>500.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>max</th>\n",
        "      <td>500.000000</td>\n",
        "      <td>500.000000</td>\n",
-       "      <td>999.00000</td>\n",
+       "      <td>999.000000</td>\n",
        "      <td>999.000000</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
@@ -1367,18 +1367,18 @@
        "</div>"
       ],
       "text/plain": [
-       "             column1        column2       column3        column4\n",
-       "count  100000.000000  100000.000000  100000.00000  100000.000000\n",
-       "mean        1.174175      -2.876739       1.34378       1.478400\n",
-       "std       408.414807     408.107880     575.56337     577.826276\n",
-       "min      -500.000000    -500.000000    -999.00000    -999.000000\n",
-       "25%      -499.179172    -500.000000    -497.00000    -497.000000\n",
-       "50%         3.133260      -5.691740       1.00000       2.000000\n",
-       "75%       500.000000     495.773629     497.00000     501.000000\n",
-       "max       500.000000     500.000000     999.00000     999.000000"
+       "             column1        column2        column3        column4\n",
+       "count  100000.000000  100000.000000  100000.000000  100000.000000\n",
+       "mean        0.653302       3.035664       1.349060       1.572440\n",
+       "std       408.053983     408.488775     576.321436     576.108494\n",
+       "min      -500.000000    -500.000000    -999.000000    -999.000000\n",
+       "25%      -499.069860    -494.820546    -496.000000    -496.000000\n",
+       "50%         2.821413       5.823958       3.000000       1.000000\n",
+       "75%       499.807599     500.000000     501.000000     500.000000\n",
+       "max       500.000000     500.000000     999.000000     999.000000"
       ]
      },
-     "execution_count": 34,
+     "execution_count": 21,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -1397,7 +1397,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 35,
+   "execution_count": 22,
    "id": "bea974f5-367b-4432-893f-a33a449dda6f",
    "metadata": {},
    "outputs": [
@@ -1438,50 +1438,50 @@
        "    </tr>\n",
        "    <tr>\n",
        "      <th>mean</th>\n",
-       "      <td>1.695724</td>\n",
-       "      <td>-3.040382</td>\n",
-       "      <td>4.001460</td>\n",
-       "      <td>0.511100</td>\n",
+       "      <td>0.455395</td>\n",
+       "      <td>5.588258</td>\n",
+       "      <td>1.329300</td>\n",
+       "      <td>1.763540</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>std</th>\n",
-       "      <td>578.627560</td>\n",
-       "      <td>576.453798</td>\n",
-       "      <td>576.244217</td>\n",
-       "      <td>578.301376</td>\n",
+       "      <td>577.070175</td>\n",
+       "      <td>577.342945</td>\n",
+       "      <td>577.130306</td>\n",
+       "      <td>575.554149</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>min</th>\n",
-       "      <td>-999.983952</td>\n",
-       "      <td>-999.968792</td>\n",
+       "      <td>-999.965920</td>\n",
+       "      <td>-999.963945</td>\n",
        "      <td>-999.000000</td>\n",
        "      <td>-999.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>25%</th>\n",
-       "      <td>-502.160012</td>\n",
-       "      <td>-500.333306</td>\n",
-       "      <td>-492.250000</td>\n",
-       "      <td>-498.000000</td>\n",
+       "      <td>-500.420461</td>\n",
+       "      <td>-495.503431</td>\n",
+       "      <td>-497.000000</td>\n",
+       "      <td>-493.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>50%</th>\n",
-       "      <td>4.057258</td>\n",
-       "      <td>-4.377464</td>\n",
+       "      <td>3.895165</td>\n",
+       "      <td>9.582978</td>\n",
        "      <td>3.000000</td>\n",
-       "      <td>0.000000</td>\n",
+       "      <td>1.000000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>75%</th>\n",
-       "      <td>502.159214</td>\n",
-       "      <td>494.614704</td>\n",
-       "      <td>499.000000</td>\n",
-       "      <td>500.250000</td>\n",
+       "      <td>496.851678</td>\n",
+       "      <td>505.826690</td>\n",
+       "      <td>501.000000</td>\n",
+       "      <td>499.250000</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>max</th>\n",
-       "      <td>999.998666</td>\n",
-       "      <td>999.913716</td>\n",
+       "      <td>999.979256</td>\n",
+       "      <td>999.948488</td>\n",
        "      <td>999.000000</td>\n",
        "      <td>999.000000</td>\n",
        "    </tr>\n",
@@ -1492,16 +1492,16 @@
       "text/plain": [
        "            column1       column2       column3       column4\n",
        "count  50000.000000  50000.000000  50000.000000  50000.000000\n",
-       "mean       1.695724     -3.040382      4.001460      0.511100\n",
-       "std      578.627560    576.453798    576.244217    578.301376\n",
-       "min     -999.983952   -999.968792   -999.000000   -999.000000\n",
-       "25%     -502.160012   -500.333306   -492.250000   -498.000000\n",
-       "50%        4.057258     -4.377464      3.000000      0.000000\n",
-       "75%      502.159214    494.614704    499.000000    500.250000\n",
-       "max      999.998666    999.913716    999.000000    999.000000"
+       "mean       0.455395      5.588258      1.329300      1.763540\n",
+       "std      577.070175    577.342945    577.130306    575.554149\n",
+       "min     -999.965920   -999.963945   -999.000000   -999.000000\n",
+       "25%     -500.420461   -495.503431   -497.000000   -493.000000\n",
+       "50%        3.895165      9.582978      3.000000      1.000000\n",
+       "75%      496.851678    505.826690    501.000000    499.250000\n",
+       "max      999.979256    999.948488    999.000000    999.000000"
       ]
      },
-     "execution_count": 35,
+     "execution_count": 22,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -1528,7 +1528,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 42,
+   "execution_count": 23,
    "id": "e4aa3b34-c948-4efe-b523-37e3ab2b2522",
    "metadata": {},
    "outputs": [],
@@ -1538,7 +1538,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 43,
+   "execution_count": 24,
    "id": "018ed5c4-de6f-4a18-bc11-ae3917dcf481",
    "metadata": {},
    "outputs": [],
@@ -1553,7 +1553,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 44,
+   "execution_count": 25,
    "id": "08daae66-9e28-4394-8021-b64cd806a4ab",
    "metadata": {},
    "outputs": [
@@ -1561,7 +1561,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "6.94 ms ± 638 μs per loop (mean ± std. dev. of 7 runs, 100 loops each)\n"
+      "7.19 ms ± 1.07 ms per loop (mean ± std. dev. of 7 runs, 100 loops each)\n"
      ]
     }
    ],
@@ -1572,7 +1572,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 45,
+   "execution_count": 26,
    "id": "04dd1afc-11cb-46a6-9e15-28461c9e96b3",
    "metadata": {},
    "outputs": [
@@ -1580,7 +1580,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "946 μs ± 49.5 μs per loop (mean ± std. dev. of 7 runs, 1,000 loops each)\n"
+      "962 μs ± 137 μs per loop (mean ± std. dev. of 7 runs, 1,000 loops each)\n"
      ]
     }
    ],
@@ -1591,7 +1591,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 46,
+   "execution_count": 27,
    "id": "5bc546df-96b7-446c-be09-3bdc48b6e86b",
    "metadata": {},
    "outputs": [],
@@ -1601,7 +1601,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 47,
+   "execution_count": 28,
    "id": "e8d2d195-0c5f-48ee-956f-895c6ae45fa3",
    "metadata": {},
    "outputs": [],
@@ -1616,7 +1616,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 48,
+   "execution_count": 29,
    "id": "5d455f94-47f4-4582-8019-15763457198b",
    "metadata": {},
    "outputs": [
@@ -1624,7 +1624,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "778 ms ± 78.8 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n"
+      "971 ms ± 162 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n"
      ]
     }
    ],
@@ -1635,7 +1635,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 49,
+   "execution_count": 30,
    "id": "b8b68166-7010-41d7-b2ea-f6536dc2d147",
    "metadata": {},
    "outputs": [
@@ -1643,7 +1643,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "49 ms ± 6.72 ms per loop (mean ± std. dev. of 7 runs, 10 loops each)\n"
+      "66.8 ms ± 13.7 ms per loop (mean ± std. dev. of 7 runs, 10 loops each)\n"
      ]
     }
    ],
@@ -1657,7 +1657,7 @@
    "id": "ca530907-9cda-408f-816a-f6f34351e0d9",
    "metadata": {},
    "source": [
-    "As you can see, assigning the column to perform an in--place operations is significantly faster."
+    "As you can see, assigning the column to perform an in-place operations is significantly faster."
    ]
   },
   {

From fde9090824a69df62f9e8cbe2077a6f75904d973 Mon Sep 17 00:00:00 2001
From: Geert Jan Bex <geertjan.bex@uhasselt.be>
Date: Mon, 24 Nov 2025 11:00:12 +0100
Subject: [PATCH 07/10] Add numba example

---
 source-code/pandas/README.md              |   2 +
 source-code/pandas/numba_and_pandas.ipynb | 327 ++++++++++++++++++++++
 2 files changed, 329 insertions(+)
 create mode 100644 source-code/pandas/numba_and_pandas.ipynb

diff --git a/source-code/pandas/README.md b/source-code/pandas/README.md
index 313b336..1bb6cf9 100644
--- a/source-code/pandas/README.md
+++ b/source-code/pandas/README.md
@@ -32,3 +32,5 @@ easy to use.
 1. `apply.ipynb`: Jupyter notebook that illustrates the use of the `apply` method
    in pandas dataframes for applying functions along rows or columns. It includes
    a comparison of performance between using `apply` and vectorized operations.
+1. `numba_and_pandas.ipynb`: Jupyter notebook that demonstrates how to use Numba
+   to optimize performance of operations on pandas dataframes.
diff --git a/source-code/pandas/numba_and_pandas.ipynb b/source-code/pandas/numba_and_pandas.ipynb
new file mode 100644
index 0000000..6dc82e0
--- /dev/null
+++ b/source-code/pandas/numba_and_pandas.ipynb
@@ -0,0 +1,327 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "4be65a5f-39d9-42f6-a1ec-beee22363ce3",
+   "metadata": {},
+   "source": [
+    "## Requirements"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "2c930efe-41a4-4665-a419-7d1ad683cc82",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import matplotlib.pyplot as plt\n",
+    "from numba import njit\n",
+    "import numpy as np\n",
+    "import pandas as pd\n",
+    "import time"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "8cfbec4d-90d1-4e45-9c9e-310475a395f0",
+   "metadata": {},
+   "source": [
+    "## Using numba"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "8ec085cd-5fce-420b-8f12-46b9a9e56269",
+   "metadata": {},
+   "source": [
+    "Consider the following dataframe with 2 million rows."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "31f2457e-b51a-4e6c-91fb-852c088c6792",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "size = 2_000_000\n",
+    "df = pd.DataFrame({\n",
+    "    'x': np.random.rand(size),\n",
+    "    'y': np.random.rand(size),\n",
+    "})"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "7203ebcd-b1ba-4877-90ef-e1b9665d1029",
+   "metadata": {},
+   "source": [
+    "You want to create a series computed as $\\sqrt{x^2 + y^2}$.  You can consider three approoaches:\n",
+    "1. pandas' `.apply()` method,\n",
+    "2. numpy expressions, and\n",
+    "3. using a numba function."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "id": "20974ffd-621b-4ba5-a168-01f27a307712",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 8.93 s, sys: 288 ms, total: 9.22 s\n",
+      "Wall time: 9.22 s\n"
+     ]
+    }
+   ],
+   "source": [
+    "%time df.apply(lambda row: np.sqrt(row['x']**2 + row['y']**2), axis=1);"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "id": "b15fabcb-22d5-487e-bd79-72d1f6924e7f",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 34.4 ms, sys: 16.1 ms, total: 50.5 ms\n",
+      "Wall time: 48.9 ms\n"
+     ]
+    }
+   ],
+   "source": [
+    "%time np.sqrt(df['x']**2 + df['y']**2);"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "0f53a473-d8bc-40b3-ba63-7b4db3ec81ca",
+   "metadata": {},
+   "source": [
+    "It is clear that the using numpy is much more efficient, the speedup is 250."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "id": "4bddc8bb-5e68-4a7c-9c45-589f797dac12",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "@njit\n",
+    "def score_numba(x, y):\n",
+    "    result = np.empty_like(x)\n",
+    "    for i in range(len(x)):\n",
+    "        result[i] = np.sqrt(x[i]**2 + y[i]**2)\n",
+    "    return result"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "bd7cc279-76d1-4b2d-a300-24142d0fafa2",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 248 ms, sys: 47.8 ms, total: 296 ms\n",
+      "Wall time: 433 ms\n"
+     ]
+    }
+   ],
+   "source": [
+    "%time score_numba(df.x.values, df.y.values);"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "a5b4731e-593d-41ee-8354-54a066992c8c",
+   "metadata": {},
+   "source": [
+    "Using numba is about 25 times faster than the pandas `.apply()` method, but 10 slower than numpy, so is there a point?\n",
+    "\n",
+    "There is if you run that function multiple times."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "8339e439-3d9c-4404-af22-3af502ecf941",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 5.7 ms, sys: 0 ns, total: 5.7 ms\n",
+      "Wall time: 5.77 ms\n"
+     ]
+    }
+   ],
+   "source": [
+    "%time score_numba(df.x.values, df.y.values);"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "d6900b2d-3dd1-4e90-aee2-a526b8dd058d",
+   "metadata": {},
+   "source": [
+    "As you can see, numba is now more than 2,000 times faster then the equivalent `.apply()` method call.  Once the initial compilation has been done, there is little or no overhead on subsequent calls."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "7b302dd6-97e9-4294-8b3c-2236fd3c03a2",
+   "metadata": {},
+   "source": [
+    "This can be compared to a similar implementation with a non-compiled Python function."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "024672ee-7e66-4e6b-a199-b78c81489735",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def score_python(x, y):\n",
+    "    result = np.empty_like(x)\n",
+    "    for i in range(len(x)):\n",
+    "        result[i] = np.sqrt(x[i]**2 + y[i]**2)\n",
+    "    return result"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "796d265e-4c6b-4f70-ac08-dfe7d90036db",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 1.74 s, sys: 0 ns, total: 1.74 s\n",
+      "Wall time: 1.74 s\n"
+     ]
+    }
+   ],
+   "source": [
+    "%time score_python(df.x.values, df.y.values);"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "26476f95-fb22-4751-8ac9-80d90f210c6c",
+   "metadata": {},
+   "source": [
+    "Even this approach is faster than pandas' `.apply()`, but still more than 200 times slower than numba (once compiled)."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "f613ea5c-eddc-4517-a31b-980ae613d072",
+   "metadata": {},
+   "source": [
+    "## Benchmark"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 17,
+   "id": "15f830eb-3ea7-43b7-a31f-c2b234735df7",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAnEAAAHACAYAAADN8z51AAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjgsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvwVt1zgAAAAlwSFlzAAAPYQAAD2EBqD+naQAAbqZJREFUeJzt3Qd4E/X/B/BPFy17lT3K3lCmbCjKEBBBpqKIDJUlS0UQUYbIUkBkCC7UnygiFP8qW7ZsKEOW7I3sWejM/3l/46VJmrRJmjbr/Xqee5LcXS53uUvyyXd8vn46nU4nRERERORR/F29A0RERERkPwZxRERERB6IQRwRERGRB2IQR0REROSBGMQREREReSAGcUREREQeiEEcERERkQdiEEdERETkgQJdvQPuLjExUS5fvizZs2cXPz8/V+8OEREReTGdTif379+XwoULi79/ymVtDOJSgQCuWLFizjw/RERERCm6cOGCFC1aNMV1GMSlAiVw2puZI0eO1FaXuLg4WbNmjbRs2VKCgoLEl/DYed597ZoHXve87n3tuvflaz4jjv/evXuq8EiLP1LCIC4VWhUqAjhbg7gsWbKodX3t4uax87z72jUPvO553fvade/L13xGHr8tTbjYsYGIiIjIAzGIIyIiIvJADOKIiIiIPBCDOCIiIiIP5BNB3HPPPSe5c+eWzp07u3pXiIiIiJzCJ4K4wYMHy3fffefq3SAiIiJyGp8I4po1a2ZTvhUiIiIiT+H2QdzmzZulXbt2avgJ5ExZvnx5snXmzp0rJUuWlJCQEKlVq5Zs2bLFJftKRERElFHcPoh7+PChhIeHy+zZsy0uX7x4sQwdOlRGjx4tUVFR0rhxY2ndurWcP38+w/eViIiIKKO4/YgNCMgwWTN9+nTp06eP9O3bVz2eOXOmrF69WubNmyeTJk2y+/ViYmLUZDz8hZahGVNqtHVsWdfb8Nh53n0Rr3te977Gl695SUiQhI0bpcjmzZIQHCwSESESEODUl7DnfXX7IC4lsbGxsnfvXhk5cqTJfIxntm3bNoe2icBv3LhxyeZjnDQMs2GrtWvXiq/isfsmXz7vvn78PHbf5GvnvdD27VL1yy8l882bUhszpk+XR3nzyqG+feVK/fpOe53o6GjfCOJu3LghCQkJUqBAAZP5eHz16lXD41atWsm+fftU1WzRokUlMjJS6tSpY3Gbo0aNkuHDhycbiBaBoa1jp+LCbtGihc+NKcdj53n3tWseeN3zuve1694Xr3m/yEgJmDpVRKczmR9y65bUmTpVEn76SXTPPeeU19JqAL0+iLM2SKxOpzOZh+pVWwUHB6vJHC5Uey5We9f3Jjx2nndfxOue172v8ZlrPiFB5M03kwVw4Id5fn4S+NZbIp06OaVq1Z731KODuNDQUAkICDApdYNr164lK52z15w5c9SEkj4iIiLycomJInfuiFy/njRduyaya5fIxYvWn4dA7sIFEWTGQBu5DOTRQVymTJlUShEU62JUBg0et2/fPk3bHjhwoJpQrJkzZ04n7C0RERFlaFB2+7Y+EDMOzLTgzHweprQU3Fy5IhnN7YO4Bw8eyMmTJw2Pz5w5I/v375c8efJI8eLFVfu1Hj16SO3ataV+/fqyYMEClV6kX79+Lt1vIiIiciIEWLdupRyIXTOad/OmY0EZ2r/ny5c0xceLrFyZ+vMKFZKM5vZB3J49e9SICxqt00HPnj1l4cKF0q1bN7l586aMHz9erly5IlWqVJEVK1ZIWFiYC/eaiIiIUoTgCIGWLaVkmIcADqVr9sqZUx+M5c9vGpxZm2feLh6BYIkSIpcuWWwXhzZxUrSoSOPGGX7C3T6Ii4iIUB0VUjJgwAA1ORPbxBEREdkZlN24YXtJGYKyVH7fLcqdO/VALP9/80JD0fYqbacRnRU+/VSkc2d9wGa8z1onypkznZ4vziuCOFdhmzgiIvJpSDprod2Y/5UrEr5vnwR8801SSRqCM7Q/c0SePLaXkiEoc0WP2I4dRX75RWTIENNODiiBQwCH5S7AII6IiMgXxMamXG1p/hg9NS1AeVMJa6+Bkqm8eVMOxowfY91ADwlFOnYUad9e4jdskP0rV0r11q0lEM29XFACp/GQd46IiIhMPH5suYeltWpMO5LIGvj76wMto8ArIW9eOXH7tpRt2FACChY0DdCwrguDmnQXECC6pk3lEsZ1b9rU5cfKIM4KtokjIqIM9eiR7e3JMN2/b/9rIOhAlaQt7ckwof2ZWaCSGBcnx1eskNJt2kiALyT7dWMM4qxgmzgiIkqThw9tLyXDLda3F6oizYOwlIKzXLn0pWvkFRjEERERpQY9Eo2CMr/Ll6X4+vXif+RIUu4y8wDNjoHMDVCyZWspGSYEZWZDT5LvYBBHRES+GZShOtKekjK0QTP68axhy+sgvYWtPS8xD4lmGZSRjRjEWcE2cUREHhaUoeG+re3JMMXE2P86ISEq4NKFhso1Pz/JV7Gi+GOsbmvBWfbsDMoo3TCIs4Jt4oiIXByUmQ9GnlJaDCSZRQoNe2XOnHIKDPN5WbOqoCw+Lk52rFghbdq0EX827icXYRBHRETpD8MlaUGZLSVlCMqQbNZeCLLsGWIJ6xN5KAZxRETkWFB244Zku3BB/LZs0WfrTyk4Q1DmyGDkqI60tT0ZblGyRuQjGMQREZE+wLLWy9JKSVlQYqI8Ze97h4b79pSUoQ0aEVnEIM4KdmwgolQlJIjfpk1SZPNm8UO1nIuH4Ek2GLk2rqUtPS+xrgODkcdmzSpBhQqJnxaApTYYeXBwuhwukS9iEGcFOzYQUYqWLVODYQdevCi18Xj6dP1g2J9+mj6DYSMoQ5WkrT0vUarmQFCmMvTbWEoWlzOnrFy3TjXuD2LjfqIMxyCOiMiRAK5z5+RB0qVL+vm//JJ6IIeelAjKbB2QHG3O7IV8Y3ny2N6eDONe2hOMOdLxgIichkEcEZG9bceGDLFcyoV5CJz69dNn99eqMy2VlKGnpr2wbbPByFMMzrAuhmUiIq/ETzcRka0QeC1aJHLxovV1EMghSHv55dS3hzEs7RmMHKVq7tLmjohcjkEcEZF5EIYg7dgxkaNHTW+vXrX9vapUSaRq1ZSDM7Q/42DkROQgBnFE5JvQJu3kyeSBGiZUhVqDKkpUk6ZmzhyRiAin7jIRkTEGcVYwxQiRF1WBasGZccB2+rT15LNoR1amjEiFCiIVKybdli+vz/BfooS+E4OldnFot4Zeqo0bp/uhEZFvYxBnBVOMEPlAFShGAzAP1HBbunTKvTSRRgS9UBGwGQdyeAwzZ7LtGhGlOwZxROT9VaCFCycP1HBbqFBS4GUPpA9BGhH0UjXu5IASOARw6ZEnjojIDIM4IvKMKlBMp045VgWKoZ6cDYFa+/YSv2GD7F+5Uqq3bi2B7jRiAxF5PQZxROQ+VaDa/fSoAk0PAQGia9pULj18KOFNmzKAI6IMxSCOiDK2CtQ4aMvIKlAiIi/DII6InOPuXX2wZh6ouVMVKBGRF2EQR0SOVYH+F6gFHD0qrQ4ckKCUxvZ0pypQIiIvwSDOCuaJI5+mVYGap+w4flzkwQOTVf1FJER7wCpQIqIMwyDOCuaJI5+pArWUW82OKtD4MmXkr1u3pEGvXhKE0QyIiChDMIgj8sEqUGf2AtXFxcmdFSvYho2IKIMxiCPywSpQE6wCJSLySAziiHywCpS9QImIPB+DOKK0SkgQv02bpMjmzeKHwdGdkbUfVaAYYN3S8FJXrlh/HnuBEhH5DAZxRGmxbJkaPzPw4kWpjcfTp+vHz8QA6baMn2mpClSbWAVKREQpYBBHlJYArnNnfamZMZSgYT4GSNcCOfMqUO0+q0CJiMhBDOKIHIG2Z0OGJA/gQJvXs6fIZ5/pOxawCpSIiJyMQRyRI7Zs0aftSAmqQzduTHrMXqBEROREDOKIHJFSyZqxfv1EevfmWKBEROR0DOKI7IGq0vXrRaZOtW39bt1E6tThe0xERE6HYQ/JytiplSpVkjr8ASZITBT59VeRevVEmjcX2b8/5ffFz0+kWDGRxo35/hERUbpgEJfC2KlHjhyR3bt3p887T54hPl5k0SKR8HCRDh1Edu0SCQkReeMNkc8/1wdrmIxpj2fOTHu+OCIiIitYnUpkSUyMyLffikyZInL6tH5ejhyI7kWGDhXJn18/L18+fS9V404OyBOHAM6WPHFEREQOYhBHZOzhQ5EFC0Q+/ljk8mX9vNBQfeCGAC5XLtP3C4Fa+/YSv2GD7F+5Uqq3bi2BzhixgYiIKBUM4ojg9m2R2bP1Iy3cvKl/T4oUEXn7bZG+fUUwnJY1AQGia9pULj18KOFNmzKAIyKiDMEgjnzbv/+KzJghMneuyP37+nmlS4uMHCnSo4dIcLCr95CIiMgiBnHkm86dE5k2TeSrr0QeP9bPq1pV5N139UNmBfKjQURE7o2/VORbMGYpOiv873/6nqdQt67I6NEibduK+LPDNhEReQYGceQboqJEPvpIZOnSpLFNn3pKX/KGjgjmaUKIiIjcHIM48m5bt+qDt5Urk+a1by8yapS+BI6IiMhDMYgj74OStjVrRCZO1A9UD6gmfeEFfYeFKlVcvYdERERpxiCOvGtorMhIfcnbvn36eZkyibzyisiIEfpep0RERF6CQRx5vrg4kR9/FJk0Sd9xAbJkEenXT2T4cH2+NyIiIi/DII4816NHIt98IzJ1qj5lCGBEBYxrOniwfqQFIiIiL8UgjjwPkvLOmycyfbo+WS9gLFOUuvXvrx/jlIiIyMv5RFKs33//XcqXLy9ly5aVL7/80tW7Q47CcFgffCBSvLjIO+/oAzjcx3BZZ8/q5zGAIyIiH+H1JXHx8fEyfPhw2bBhg+TIkUNq1qwpHTt2lDx58rh618hWGIj+k09E5s/XD1AP5cvre5q++KJIUBDfSyIi8jleXxK3a9cuqVy5shQpUkSyZ88ubdq0kdWrV7t6t8gWp0/rOyeULKmvOkUAV6OGyJIlIocP63udMoAjIiIf5fZB3ObNm6Vdu3ZSuHBh8fPzk+XLlydbZ+7cuVKyZEkJCQmRWrVqyRYtN5gqxLmsAjhN0aJF5dKlSxm2/+QABGgYfL5cOX3pW2ysSMOGIitWiOzdqx/bNCCAby0REfk0tw/iHj58KOHh4TIb7Z4sWLx4sQwdOlRGjx4tUVFR0rhxY2ndurWcP39eLddpQywZQTBIbmj3bpHnntMn48XYpgkJIq1aIZLXj7zQujWHxyIiIvKUNnEIyDBZM336dOnTp4/07dtXPZ45c6aqLp03b55MmjRJlcIZl7xdvHhR6qYw3FJMTIyaNPfu3VO3cXFxakqNto4t63obh45dpxO/zZvFf8oU8V+3Tj/Lz090HTpIAjoq1KypbVzcGc+7b17zwHPvm+ee5903z3tGnHt7tuuns1RU5aZQghYZGSkdOnRQj2NjYyVLliyyZMkSeQ4lOP8ZMmSI7N+/XzZt2qQ6NlSsWFE2btxo6NiwY8cOyZs3r8XXGDt2rIwbNy7Z/EWLFqnXIifR6aTAnj1S7pdfJM/x42pWor+/XGzaVE507CgPihXjW01ERD4nOjpaunfvLnfv3lVxi0eXxKXkxo0bkpCQIAUKFDCZj8dXr15V9wMDA+WTTz6RZs2aSWJioowYMcJqAAejRo1SvVmNS+KKFSsmLVu2TPXN1CLotWvXSosWLSTIxxrd23TsCQnit3SpBEyZIn6HDqlZuuBgSezVSxKHD5dCJUpIIfE8PO++ec0Dz71vnnued9887xlx7rUaQFt4dBBnrY0bCheN5z377LNqskVwcLCazOFE2XOy7F3fm1g8dnRO+P57kSlTRE6c0M/Llk0l5/UbPlwCChYUb+iqwPPum9c88Nz75rnneffN856e596ebXp0EBcaGioBAQGGUjfNtWvXkpXO2WvOnDlqQkkfpUF0tAgSLE+bhgaJ+nnI0TdkiMigQfr7RERE5H29U1OSKVMmlVIExZrG8LhBgwZp2vbAgQPlyJEjshs9Jsl+d+/qB6QvUUIfsCGAK1RI5OOP9eOcvv8+AzgiIqI0cPuSuAcPHsjJkycNj8+cOaM6LWDEheLFi6v2az169JDatWtL/fr1ZcGCBSq9SD8kiaUMl+nuXfEfM0Y/tqlWr49kvehp2rOnSEgIzwoREZEvBHF79uxRnRI0WqeDnj17ysKFC6Vbt25y8+ZNGT9+vFy5ckWqVKkiK1askLCwsDS9LqtT7XThgvhPmyYt5s+XALR/g0qV0FNE5Pnn0cMkTeeDiIiITLn9L2tERITFhL3GBgwYoCZnQnUqJvQSyZkzp1O37VXQSQGdFb77TgL+y22TWKuW+L/3HnqUiPh7dI09ERGR23L7II7c1MGD+jZvP/8skpioZiU2bSo7mjWTOqNGiX+mTK7eQyIiIq/GYhKyz/btIu3aiYSHi/z0kz6Aa9tW5K+/JGHtWrlevTqHxiIiIsoALImzgm3ijKA6+88/RT76SGTDBv085OHr2lVk5EgRBG7go0OwEBERuQJL4qxgihHUjyaKLF8ugrFmW7TQB3DooNC7t8ixY/qSOC2AIyIiogzFkjhKLj5eZPFifZu3w4f18zJnFnn1VZE33xQpXpzvGhERkYsxiKMkjx+LfPutvrfpmTP6eRgvFiMrIGFv/vx8t4iIiNwEgzhCRmWRBQv0oylcuaJ/R0JDRYYNQ/4WkVy5+C4RERG5GQZxvtyx4fZtkc8+E/n0U5Fbt/TzihYVefttkb59RbJkcfUeEhERkRUM4nwx2e/VqyIzZojMnasvhYMyZfQ9TXv0wKC0rt5DIiIiSgWDOF+CgeenThX56iuRmBj9vKpVRd59V6RLF5GAAFfvIREREdmIQZwvQDqQyZNFfvhB3/MU6tUTGT1an6gXOd+IiIjIozCI82b79ukT9C5bpk/YC82b60veIiIYvBEREXkwBnGe1rEB+7Nli74XaaFCIo0bJ68GxXIEb6tWJc3r0EFk1CiRJ57I8F0mIiIi5+OIDZ40YgNK1EqUEGnWTKR7d/0tHmslbQjaENQ1aaK/7+8v8uKLIocOiURGMoAjIiLyIiyJ8xQI1Dp3TqoW1Vy6JNKpk0jJkkkJetG7tFcvfaqQ0qVdsrtERESUvhjEeQJUoWLEBPMADrR5COAwNFb//iLDh4sUKZLhu0lEREQZh0GcJ0Abt4sXU1/vxx9F2rfPiD0iIiIiF2ObOE+gDYWVmujo9N4TIiIichMM4jwBeqE6cz0iIiLyeAzirEB6kUqVKkmdOnXE5dDjFGOaWoNkvcWK6dcjIiIin8AgzhNSjCAPHDo2WKKNtjBzJofNIiIi8iEM4jxBbKzId9/p76MHqjGU0P3yi0jHji7ZNSIiInIN9k71BB9+qE/YGxqqv8VYqCmN2EBERERej0Gcp4x/CnPnihQsqJ+IiIjIp7E61d2rUTHyApL9dumin4iIiIgYxLm5iRNFDh7UV6POnu3qvSEiIiI3wpI4dxUVlVSNOmeOSP78rt4jIiIiciMM4twxT5xWjRofrx/0vmvXjN8HIiIicmsM4twxTxxK4A4cEMmbV18KR0RERGSGQZy72b9f3xYOWI1KREREVjCIcydxcSKvvKKvRu3UidWoREREZBXzxLkSUods2ZKUuHfDBtNqVG1ILSIiIiIzDOJcZdky/XioFy8mX4Z0IgUKuGKviIiIyEMwiHNVAIdepzqd5eVBQRm9R0RERORh2CbOFVWoKIGzFsChCnXYMP16RERERFYwiMtoaANnqQpVg+DuwgX9ekRERERWMIjLaOjE4Mz1iIiIyCcxiMto6IXqzPWIiIjIJzGIy2iNG4sULWo9fQjmFyumX4+IiIjICgZxGT12akCAyKef6u+bB3La45kz9esREREROTPFyNmzZ2XLli3qNjo6WvLlyyc1atSQ+vXrS0hIiHjL2KmY7t27Jzlz5nTuxjt2FPnll+R54lBChwAOy4mIiIicFcQtWrRIZs2aJbt27ZL8+fNLkSJFJHPmzHLr1i05deqUCuBefPFFeeeddyQsLMyeTfseBGrt25uO2IAqVJbAERERkTODuJo1a4q/v7+88sor8vPPP0vx4sVNlsfExMj27dvlp59+ktq1a8vcuXOlS5cutm7eNyFgi4hw9V4QERGRNwdxEyZMkLZt21pdHhwcLBEREWr68MMP5cyZM87aRyIiIiJyNIhLKYAzFxoaqiYiIiIicqPeqfv27ZNDhw4ZHv/666/SoUMHeffddyU2NtaZ+0dEREREzgriXn/9dfnnn3/U/dOnT8vzzz8vWbJkkSVLlsiIESMc2SQRERERpXcQhwCuevXq6j4CtyZNmqieqwsXLpSlS5c6skkiIiIiSu8gTqfTSWJiorq/bt06adOmjbpfrFgxuXHjhiObJCIiIqL0DuKQQgQ9UL///nvZtGmTodMDeqQWKFDAkU0SERERUXoHcTNnzlSdGwYNGiSjR4+WMmXKqPm//PKLNGjQwJFNEhEREVF6D7tVrVo1k96pmmnTpkkARxwgIiIics8gzhpvGTeViIiIyGuCuNy5c4ufn59N62IsVSIiIiJygyAO7eA0N2/eVB0bWrVqJfXr11fzMG7q6tWrZcyYMeJunnvuOdm4caM89dRTqt0eERERkc8EcT179jTc79Spk4wfP151bNAMHjxYZs+erVKODBs2TNwJ9q13797y7bffunpXiIiIiFzXOxUlbk8//XSy+SiZQxDnbpo1aybZs2d39W4QERERuTaIy5s3r0RGRiabv3z5crXMHps3b5Z27dpJ4cKFVZs7bMPc3LlzpWTJkqrjRK1atWTLli2O7DYRERGRb/dOHTdunPTp00e1M9PaxO3YsUNWrVolX375pV3bevjwoYSHh0uvXr1UNa25xYsXy9ChQ1Ug17BhQ5k/f760bt1ajhw5IsWLF1frILCLiYlJ9tw1a9ao4NAe2I7xtu7du6du4+Li1JQabR1b1vU2PHaed1/E657Xva/x5Ws+I47fnu366TCGlgN27twps2bNkqNHj6phuCpVqqTantWtW9eRzel3xs9PlfB16NDBMA/bq1mzpsybN88wr2LFimqdSZMm2bxtBJxos5dax4axY8eqINUcxobNkiWLza9HREREZK/o6Gjp3r273L17V3LkyJE+eeIQXP3www+SnmJjY2Xv3r0ycuRIk/ktW7aUbdu2pctrjho1SoYPH25SEocxYfGaqb2ZWgS9du1aadGihQQFBYkv4bHzvPvaNQ+87nnd+9p178vXfEYcv1YDaAuHg7jExEQ5efKkXLt2Td031qRJE3GGGzduSEJCQrLxWPH46tWrNm8HHS4wTBiqbosWLapK++rUqWNx3eDgYDWZw4my52TZu7434bHzvPsiXve87n2NL1/z6Xn89mzToSAO7d9Q1Hfu3DlVlWpeJYrAy5nMkwzjNW1NPKz1piUiIiLyJg4Fcf369ZPatWvLH3/8IYUKFbIroLJHaGioGovVvNQNpX/mpXPONmfOHDU5OyAlIiIiclmKkRMnTshHH32kOhjkypVLcubMaTI5S6ZMmVTPU9Q9G8PjBg0aSHoaOHCg6gG7e/fudH0dIiIiogwriUOnBrSHK1OmjKTVgwcP1LY0Z86ckf3790uePHlUChF0MujRo4cq+UM6kwULFsj58+dVaSARERGRr3IoiHvjjTfkzTffVNWcVatWTdYIr1q1ajZva8+ePWpEBY3WMxTDfC1cuFC6deumxmrFMF9XrlyRKlWqyIoVKyQsLEzSE6tTiYiIyOuCOC0pL8Yj1aBdnNbhwJ52ZBEREck6R5gbMGCAmjISqlMxoauvM6uIiYiIiFwWxKHKk4iIiIg8LIhL76pMIiIiIkqnZL+nTp2SmTNnqmG3UIWKnqpDhgyR0qVLizdgmzgiIiLyuhQjSJ6LsVJ37dqlOjGgswHGUq1cuXKydCCeiilGiIiIyOtK4jCW6bBhw2Ty5MnJ5r/zzjtqPDEiIiIicrOSOFSh9unTJ9l89FZFglwiIiIicsMgLl++fCohrznMy58/vzP2i4iIiIicXZ366quvymuvvSanT59Ww1+hY8PWrVtlypQpKgmwN2DHBiIiIvK6IG7MmDGSPXt2+eSTT2TUqFFqXuHChWXs2LEyePBg8QZM9ktEREReF8Sh5A0dGzDdv39fzUNQR0RERERuPmJDfHy8lC1b1iR4O3HihBpHtUSJEs7cRyIiIiJyRseGV155RbZt25ZsPnLFYRkRERERuWEQFxUVJQ0bNkw2v169ehZ7rXpqxwYkNK5Tp46rd4WIiIjIOUEc2sRpbeGM3b17VxISEsQbcMQGIiIi8rogrnHjxjJp0iSTgA33Ma9Ro0bO3D8iIiIiclbHhqlTp0qTJk2kfPnyKqCDLVu2yL1792T9+vWObJKIiIiI0rskDm3FDh48KF27dpVr166pqtWXX35Zjh07JlWqVHFkk0RERESU3iVxWnLfjz76yNGnExEREVFGl8Rp1acvvfSSGnbr0qVLat7333+vht/yBuydSkRERF4XxC1dulRatWolmTNnln379klMTIyaj2pVbymdY+9UIiIi8rog7sMPP5TPP/9cvvjiCzVCgwalcgjqiIiIiMgNg7jjx4+r3qnmcuTIIXfu3HHGfhERERGRs4O4QoUKycmTJ5PNR3u4UqVKObJJIiIiIkrvIO7111+XIUOGqLFSMXrD5cuX5YcffpC33npLBgwY4MgmiYiIiCi9U4yMGDFCDbHVrFkzefz4sapaDQ4OVkHcoEGDHNkkEREREWVEnriJEyfK6NGj5ciRI5KYmKgSAGfLls3RzRERERFRRuSJgyxZskjt2rWlQoUKsm7dOjl69GhaNkdERERE6RnEYbit2bNnq/uPHj2SOnXqqHnVqlVTOeS8AZP9EhERkdcFcZs3bzYMfB8ZGamqU5FaZNasWSqHnDdgsl8iIiLyuiAOnRry5Mmj7q9atUo6deqkqlbbtm0rJ06ccPY+EhEREZEzgrhixYrJ9u3b5eHDhyqIa9mypZp/+/ZtCQkJcWSTRERERJTevVOHDh0qL774ouqNGhYWJhEREYZq1qpVqzqySSIiIiJK7yAOCX3r1q0r58+flxYtWoi/v75AD6M1eEubOCIiIiKvzBNXq1YtNRlDmzgiIiIicqM2cZMnT5bo6Gib1sVwXH/88Uda9ouIiIiInBHEYWSG4sWLS//+/WXlypVy/fp1w7L4+Hg5ePCgzJ07Vxo0aCDPP/+85MiRw9ZNExEREVF6Vad+9913KlBDElx0akCakYCAADVmqlZCV6NGDXnttdekZ8+eaj4RERERuUGbOIzIMH/+fPn8889VQHf27Fk1YkNoaKhUr15d3RIRERGRm3Zs8PPzk/DwcDURERERkYck+/UFHDuViIiI3BmDOCs4dioRERG5MwZxRERERB6IQRwRERGRrwVxJ0+elNWrV6seqqDT6Zy1X0RERETk7CDu5s2b0rx5cylXrpy0adNGrly5oub37dtX3nzzTUc2SURERETpHcQNGzZMAgMD5fz585IlSxbD/G7dusmqVasc2SQRERERpXeeuDVr1qhq1KJFi5rML1u2rJw7d86RTRIRERFRepfEPXz40KQETnPjxg0Ot0VERETkrkFckyZN1FiqxiM4JCYmyrRp06RZs2bO3D8iIiIiclZ1KoK1iIgI2bNnj8TGxsqIESPk8OHDcuvWLfnrr78c2SQRERERpXdJXKVKleTgwYPyxBNPSIsWLVT1aseOHSUqKkpKly7tyCaJiIiIKL1L4qBgwYIybtw4R59ORERERK4I4h4/fqxK465du6bawxl79tln07JPRERERJQeQRxywb388suqN6o5dHJISEgQd3HhwgXp0aOHCjaR227MmDHSpUsXV+8WERERUca3iRs0aJAKhDBSA0rhjCd3CuAAgdvMmTPlyJEjsm7dOpWoGG34iIiIiHyuJA6lWsOHD5cCBQqIuytUqJCaIH/+/JInTx7VizZr1qyu3jUiIiKijC2J69y5s2zcuFGcYfPmzdKuXTspXLiwqopdvnx5snXmzp0rJUuWlJCQEKlVq5Zs2bLFoddCShSUFhYrVswJe05ERES+YOzGsTJh0wSLyzAfyz2mJG727NmqOhXBVNWqVSUoKMhk+eDBg23eFqo2w8PDpVevXtKpU6dkyxcvXixDhw5VgVzDhg1l/vz50rp1a1U9Wrx4cbUOAruYmBiLw4MhOISbN2+qdnxffvmlA0dMREREvirAL0De3/i+uj+ywUiTAA7zx0eM95wgbtGiRWrs1MyZM6sSOZSgaXDfniAOARkma6ZPny59+vSRvn37qsdo34bXnjdvnkyaNEnN27t3b4qvgQDvueeek1GjRkmDBg1SXdc4ILx37566jYuLU1NqtHVsWdfb8Nh53n0Rr3te977Gk6/5+MR4iYmPkdiEWIlJiNFP8fpbzFPz/3tsvCx/lvzSpkwbFbBtOLNB6vjVkb2b9sqEvybIB00+UIGds94Pe7bjp9PpdI7kiEOgNnLkSPH3d6hG1vLO+PlJZGSkdOjQQT3GaBAYo3XJkiUqCNMMGTJE9u/fL5s2bUp1mzi87t27S/ny5WXs2NSLO7GOpfx3CFwtjRdLREREyX9743XxaorTxUlcYpz+9r/72nx1a7TM+LGty+LNXkNbZphv9JqJYpoSzVF+4ic60ckLBV+QbgW7OfX0R0dHq7jl7t27kiNHDueXxCG46tatm1MDOEuQwgS9Xc07UODx1atXbdoGhgFDlWy1atUM7e2+//57VQ1sCUrr0GnDuCQObehatmyZ6pupRdBr165VI1mYVzN7Ox47z7uvXfPA657Xvauv+0RdYlLpkVEpUkolS9aWGeabbQv3EQjh9nH8Y7l265qEZA2R2MRYiUuIs/ja7s5P/CQ4MFiCA4IlU0AmdYvHxve1Zcbzfj7ys3rPMe/b3t86fb+0GkBbOBTE9ezZUwVG7777rmQE4+paLcI3n2dNo0aNkiUjTklwcLCazOFDas8H1d71vQmPnefdF/G6D/KN0iVUxyXEyIO4B3Ir7pZcfHhRdH460yDGKFBKFlyltMyR58THSILORam9om1fNdA/MFlwZHxrbZnDzwkMTnUZ9snWWMK4DRwCuEC/QHU+Jm+bLGOajhFnsid2cCiIQ+nY1KlTVds0lHCZvyDasTlDaGioBAQEJCt1Q4qT9E5vMmfOHDW5W947InI99ERDQ2dLX974kseP6tgI1/RW8xb4oTQPWpKVEKUS3Fhb36Hn/LcMVWgmDovbsTe4Maxv43MCJEAO7T8kDeo2kKzBWVMNrvA4wD9APN2E/zoxoA1cjXs1JCpHlKGzg7MDuXQN4g4dOiQ1atRQ9//++2+TZfZGtSnJlCmT6nmK6knjNnF43L59e0lPAwcOVBOKNXPmzJmur0VEnsVde6qltbG3vSVB0bHRsu/6Pjmx64Rqb2Rx/RQCopReA1V37s5f/PWBir2lQ04uUTK+DfIPcurvsLUmBJnPZJaWpVr6TI3TBKPPNj7zK1askNGNRqvg1JWBnENB3IYNG5y2Aw8ePJCTJ08aHp85c0Z1WkBSXqQQQfs0DJtVu3ZtqV+/vixYsEDOnz8v/fr1c9o+EBHZQ/uyxpd3QmKC1JAaMnHrRBm3eZz6krf2ZY7qOC14cbQkKNXgyoHqPJR6pcml9L9+EJzYXKJkvsyR56QSXPnr/GXNqjXSpk0bnwlkfFmCLsHw2TbuPap91l1Vpe1QEOdMSMDbrFkzw2OtUwHa3S1cuFB1oECOt/Hjx6thvqpUqaIi4LCwMBfuNRH5spvRN+WJIk/IUyWfUoGb1lOtSPYisvToUln09yKLQZcnNfa2pXQIgdXt67clrGiYZA7K7NQSJfOG5v5+6duRzl6emF6DHJdS8whXVaXaFcR17NhRBVXooYn7KVm2bJnNOxAREaH+naZkwIABaspIbBNHRHA/5r7su7JP9lzeI7sv71bT6dunTd4crZ3UpfuX1GRPtazDpUNOKlEyn2dPY28EMvhTzdIoIjcP4tAuTPtgI5BL7zp3V2ObOCLfg9QJB64eUIGaFrQdvX40eWN2ESmdu7Qqffr72t+qoXeCJEj3Kt3l5fCXbQ6gvKGxNxF5QBD3zTffGO6jRI6IyJOhMf/ha4dNArZD/x6y2KAe1aR1itSROoX1U63CtWTOrjnJeqqharVCaAWXVq8Qke9wqE3ck08+qapMc+XKZTIfPTkx2sL69eudtX9ERGmGhvsnbp4wCdiirkTJo/hHydbNmzmvScBWu3BtKZS9kEf0VCMi3+JQEIfxUjFqg7nHjx/Lli1bxBuwTRyRZ0Ib2/N3z+vbr13aLXuu7JG9l/fK3Zi7ydbNnim7KlXTAjYEb2E5w1JtLuKuPdWIyLfYFcQdPHjQcP/IkSMmSXiRFHfVqlVSpEgR8QZsE0fkGf598K9JwIbb69HXk60XEhgi1QtWNwnYyuUt51CvR3ftqUZEvsWuIK569erqHyomVKmay5w5s3z22WfO3D8iIoM7j+/oq0Mv6XuJ4v6FexeSvUPoYVk1f1VVFaoFbJXzVZagAObzIiIfDeKQiBdVFaVKlZJdu3ZJvnz5TEZXyJ8/vxomi4gorR7GPpSoq1EmAduJWycs5jVDZwIEarUL1Va34QXCVc9RIiJvZlcQpyXYtWdAeU/FNnFEGQdJcA/+e9AkYDt8/bDFkQRK5ippErDVLFRTcgTn4OkiIp/j8IgN//zzj+rggMHozYO699/X987yZGwTR5Q+MEzV0RtHTQK2A/8esDiaQaFshUwCNlSPhmYJ5akhInI0iPviiy+kf//+EhoaKgULFjTpyYX73hDEEVHaofnFqdunDAEbJox+EB0XnWzd3CG5Dak9tLZsRXJ4R0cpIiK3CeI+/PBDmThxorzzzjvO3yMi8tiA7eK9iyYBG0rZ0BnBXNagrCapPRC0lcpdyutHgiEicnkQd/v2benSpYtTd4SIPMv1h9dVkLbjwg5ZcXqF9JvVT64+TEo7pMHwUsapPRCwoSMCh5wiInJBEIcAbs2aNdKvX780vjwReYJ7MfdUwlythA2lbefunrM4oHvl/JVNAraqBaqqQI6IiNwgiCtTpoyMGTNGduzYIVWrVpWgINPcS4MHDxZPx96p5KsexT2S/Vf3mwRsx28et7gukuXWKlhLstzJIi8/9bLULlpbsgRlyfB9JiLyRQ4FcQsWLJBs2bLJpk2b1GQMbVq8IYhj71TyBXEJcfL3tb8NwRpu8djSsFHFcxY3Ge0AqT1yheRSw05h7ND6Resn+0NHRERuFsQh6S8ReV5qj39u/mMSsKHELSYhJtm6+bPmNwnYUC2KeURE5AV54ojIvXuKnr1z1iRg23tlrzyIfZBs3ZzBOU2Gp8Jt0RxF2VOUiMgbg7jevXunuPzrr792dH+IyAGX719ONqbozUc3k62XOTCzqgY1DthK5ynt0CDwRETkoSlGjKFNzN9//y137tyRJ5980ln7RkQW3Iy+qYI0FbT91/kAQZy5IP8gqVagmknAVjFfRTU4PBEReT6Hvs0jIyOTzcPQWwMGDJBSpUqJN2DvVHIH92PuqxEOjAO207dPJ1sPJWmV8lVKqhYtXEcFcMGBwS7ZbyIiSn9O+0vu7+8vw4YNk4iICBkxYoR4OvZOpYz2OP6xHLh6wCRgO3r9qOhEl2zdMnnKmAxPVaNQDcmWKRtPGhGRD3FqvcqpU6ckPj7emZskcltjN45VyW3HNB2TbNmETRNUmo6xEWMtPjc+MV4OXztsaL+G20P/HpK4xLhk66KTgXHAhtvcmXOnyzEREZGXB3HDhw9P1hPuypUr8scff0jPnj2dtW9Ebg0B3Psb31f3RzYYaRLAYf74iPHqcaIuUU7cPGESsEVdiZJH8Y+SbTM0S6hJwIa2bAWzFczAoyIiIq8O4qKiopJVpebLl08++eSTVHuuEnkLrQQOARtysNWQGjJxy0QZt2WcdKvcTR7GPZSnvntKDVd1N+Zusudnz5TdpHQNAVtYzjCm9iAiovQL4jZs2GB12aVLl6RIkSKObJbIIwM5VIGO2zxO/MTP0H5t8eHFJuuFBIZIjYI1TAI2DFnF1B5EROTyNnFXr16ViRMnypdffimPHiWvJiLyNpfuXZI5u+fI/L3z1WMtgEMKj6r5q5qMdlA5X2UJCuCQVERE5KIgDnng0GtzzZo1aozEkSNHyqBBg2Ts2LHy8ccfS+XKlZnol7zerku75NOdn8rPh39WHRQ0/uIviZIooxqNkvHN9O3hiIiI3CKIe/fdd2Xz5s2q88KqVatUShHcPn78WFauXClNmzZNtx0lciUEa5FHI2Xmzpmy7cI2w3y0YTt395y83/h9qXm/pkTliFJVq0i0a6nXKhERkUuCOPQ+/eabb6R58+YqsW+ZMmWkXLlyMnPmTK87I0z2S3D70W35Yt8XMnvXbLlw74KahwDthaovSJagLPL5ns9VL1T0Tl2xYoWMbjRaAvyTeq0ykCMiIrcI4i5fviyVKlVS9zEyQ0hIiPTt21e8EZP9+rZjN47JrJ2z5NsD30p0XLSaly9LPulfu7/0r9Nfpf1AnjgEcKpzQ1xSfjctcEOeOCIi8nznz4vcuKG/j3S4p07lFCTqCPwvigoNFSle3M2DOAythbZwmoCAAMmaNWt67BdRhkO+w7Wn18rMHTNl5cmVhvkYvmpo3aGq9A29TDXWEvkCS+CIiLwngCtfXuTxY20O4qAIk3VCQkSOH8/4QC7Q3h+5V155RYKD9eMxoi1cv379kgVyy5Ytc+5eEqUjlLT97+D/VGeFI9ePqHlIF9KufDsVvEWUiGDuNiIiH3XjhnEAZxmWYz23DuLMR2N46aWXnL0/RC5JEXLr0S01D+OP9q7eW96o+4Yan5SIiMhd2RXEoVMDkTekCEGV6ZIjSwwpQkrmKimD6w6WXtV7Sc6QnK7eRSIiSkc6nUh0tMi9eyL376d8e+qUDyT7JXJnCNaWHV2mgrftF7cb5jcNaypD6w2VduXaqV6lRETkvoEXxhIwDrDu2RCEWbrFlJgoHo9BHPlsipAhdYdIzUI1Xb2LREReH3g5EmhZunV24OXvL5I9u0iOHNZvHz4U+eorcUsM4sinUoQMqDNA+tXup1KEEBGR5cALDfWtBVJ37vjLrl1lZNcufxXgpFYqluDkbEt+fkkBVo4Ugi9bbrNk0W8vJfv2MYgjcmmKkGH1hsnzVZ43SRFCRORNgVdMTPIgytFSL+RCsw5NTyo7FHilJeDSbpEQI7XAy1ewJI68NkXIs+WfVe3d0O7Nj594InJDCLycUc2IW6Oc405jKfDKmjVR7t+/KBUqFJFcuQJSDbwwocQLVZeeKDRUnwcupTQjWI71MhqDOPK6FCF9avSRN554Q0rnKe3qXSQiLxQbK3Lzpsi//2aRAwf0P+72BFzG99Mj8MqWLfUSLVtKvVDiZSnwiotLkBUroqRNm0ISFOT9HcKKF9cn8k0asSFOtm79Sxo1aiiBgUGeM2KDL+HYqe6LKUKIyJHAS+uVmFpgldottqXP2t/CaScCAZMjgZb5LQI4Ty3xcmfFiycFaQi8r1y5KzVqiBgNYuUSDOKs4Nip7oUpQoh8D34sndWrEdWWzhYcHC+5c6M60S9N7bwQeAV4f4EWpQMGceTWUE365b4vTVKEZArIJC9U0acIqVGohqt3kYiMoEF8WgMu7X5qQx05InPmtDWs1+4HB8fJmjUrpE2bNiZjihNlJAZx5DEpQvJnzS/9a/dnihByiwGxk9rHIKN7TomKEgn87xvVVe1jHIUUEPa040qaFyAXLzaVt94KNMxHTjBnQ6NxewIsa7eYtHOUVunRlo3IXgziyO1ThIQXCFe9TJkihNwlgCtf3riUCKUwEcmCDjSETs9ATgu8nFHdiOGHHIPGV7ksLgkOdrxBvXngxYIuIssYxJHbpAhB8Hb0xlE1jylCyF2hBC61aj4sx3rmQRwCrwcPnBN4IcmqsyHwsi9RarwcO7ZbnnqqjuTOHWgSeGXK5Pz9IyJTDOLIZS7euyhzd89lihDySq+/rr81Dr7SI/BCKVVaM9dr9+0NvOLidLJixTVp0EDH0jIiF2AQRxmOKULIU925I7J+vW3r7tljfRnaZdkbeFlbhtIzIvJNDOIoQ8QlxMmyo8vUqArbL243zMdoCmjv1q5cOwnwZx97ci9ovL5rl8iaNfoJ920dgHviRJHwcOuBFwcRIaK0YhBH6Z4i5Iu9X8js3bNV9SkwRQi58/iTJ0/qA7a1a/WlbqgKNVaihMjZs6lv6+mnRWrWTLddJSJiEEfplyLk0x2fqhQhj+L1OQeYIoTc0e3bIn/+qQ/aELyZB2h584o0by7SsqVIixYi16+L1Krlqr0lIkrCkjhyaoqQqHtRMu+nebL69GrDfKYIIXerIt2xI6m0bfdu0ypSdBRo1EgfsCFww9A6xsMYIYgjInIHDOLIKSlCvj/wvUoRcuzmMUOKkPYV2svQukOlSVgT8WMDIHJhFemJE0nt2jZuTF5FWqlSUklb06b6cSytQSJf5IFLKc0IlmM9IqL0xCCOHIY2bnN2zZEF+xaotm+Q2T+zvFrrVRlcb7CUzlOa7y65xK1b+ipSLXBDgl5jCLAQsGlT0aK2bxu535DIN2nEhjjZuvUvadSooQQGBnnkiA1E5Jm8Poi7f/++PPnkkxIXFycJCQkyePBgefXVV129Wx5t58WdMnPnTFlyeIkk6BLUvFK5S8nAWgOl0L+FpHOLzhxLkDJUbGxSFSkmpPdACZwG+c9QRaqVtlWvblpFai8EaFqQhurZK1fuqmpXjixARBnJ64O4LFmyyKZNm9RtdHS0VKlSRTp27Ch50VqZ7E4RguBtx8UdhvkRJSJUlekz5Z6RxIREWbFiBd9VSncI0FAapnVG2LAheSLdypX1QRumxo1TriIlIvJEXh/EBQQEqAAOHj9+rErj0ACf0pYipHvV7jKk7hCpXrC6YV0EcUTp5eZN0yrSCxdMl+fLl9QZAb1JixThuSAi7+byIG7z5s0ybdo02bt3r1y5ckUiIyOlQ4cOJuvMnTtXrYPllStXlpkzZ0pj/LW20Z07d6Rp06Zy4sQJtZ1QtjhO1dHrR2XWzlnJUoQMqD1A+tXuJwWyFbD/ZBPZWUW6bVtSadvevaZVpEiYq1WRYqpWLW1VpEREnsblQdzDhw8lPDxcevXqJZ06dUq2fPHixTJ06FAVyDVs2FDmz58vrVu3liNHjkjx/xql1KpVS2JiYpI9d82aNVK4cGHJlSuXHDhwQP79919Vldq5c2cpUIBBiDmUUK45tUZVma46ucowH6VtqDJ9vsrzEhzIMX4ofSBAO3YsKfUHepGaV5FWrZpU2ob/cf8VshMR+SSXB3EIyDBZM336dOnTp4/07dtXPUYp3OrVq2XevHkyadIkNQ+leLZA4FatWjVV+telSxeL6yAYNA4I72HUatV4OU5NqdHWsWVdd0oR8sOhH+Sz3Z+ZpAjBUFiD6wyWxsUb61OE6FI+Lk88dmfhsTt23tHD888//WTdOn91e/Gin8ny/Pl18tRTOmnePFHdFi5s/r6Ly/Hc8zPva3z5ms+I47dnu346N2oghkDBuDo1NjZWtWdbsmSJPPfcc4b1hgwZIvv371cdFlKD0rfMmTNLjhw5VEBWv359+fHHH1UwZ8nYsWNl3LhxyeYvWrTI0LbOW9yIvSErb6yUNTfXyP2E+4YUIc3zNpe2oW2lYHBBV+8ieZm4OH85diyP7N+fT/bvzy+nT+cUnS4pcAsKSpBKlW5K9erXpXr1axIWdo9VpETkU6Kjo6V79+5y9+5dFbu4dUlcSm7cuKE6IphXfeLx1atXbdrGxYsXVUkeYlVMgwYNshrAwahRo2T48OGGxwj8ihUrJi1btkz1zdQi6LVr10qLFi3cNs3Grku7ZNbuWbL06NKkFCG5SsnA2gOlZ3hPyRGc+nF66rGnFx675fOOv4hHj4oqaVu3zk82b/aT6GjT0raqVXXSooW+pK1RI51kzpxbRDCVE0/Ac8/PPL/vfEtcOv/WaTWAtnDrIE5jnu0fwZitIwCgvRxK7WwVHBysJnM4UfacLHvXd4cUIQH+AU55LXc79ozEYw9Sw1KtW5fUi/TyZdP3CP/JtHxt6EVaqBA+y8659lyJ556feV/jy9d8eh6/Pdt06yAOvUiRIsS81O3atWvp3jFhzpw5akJJoK+kCCFyBIafOnAgVLZuRbs2kaio5ENQNWmSFLihcwJHYSMiSju3DuIyZcqkStJQbGncJg6P27dvn66vPXDgQDWhWDNnzpziaZgihNILqkgPH05K/bFpU6A8etTQZJ3w8KSgDWlAMmfm+SAi8rog7sGDB3Ly5EnD4zNnzqjqzzx58qgUImif1qNHD6ldu7bqlLBgwQI5f/689OvXz6X77Y6YIoTSy7//6qtItcDtyhXjpX6SO/djads2kzz9tL+qImUGHyIiHwji9uzZI82aNTM81joV9OzZUxYuXCjdunWTmzdvyvjx41WyXwybhaGdwsLCfKo6dezGsRLgFyBjmo5Jtuz9De/Lviv75PTt03L0xlFDipD2Fdqr9m5NwprY3IaQSKsi3bo1KWebebNSlKxpVaTNmsXJuXOrpW3bNhIUxGy7REQ+E8RFRESkOgzWgAED1JSR3K06FQHc+xvfV/e1QA5t3Lov7S5bzm8xrJc9U3bpU6OPvFH3DTUoPZEt8BH8+++koA3ZexDIGcMA71qi3YYN9W3dACmNzp/n+0xE5HNBHNlGC9wQyJ29c1ai46Nl8d+LRYcMvEgRkruUDH5isPSq0cvhFCHkW9BfSOtFisDNPGsPEusaj0WaP7+r9pSIiCxhEOcBYhNiZcOZDXLh3gXJEpRFvt7/tWFZyVwlZUarGU5NEULe6dGjpCpSTAcPJq8ijYhICtwqVWIvUiIid8YgzgVt4lJq3zZh0wSVgHdEwxFqHFMk5P3t+G9yN+ZusnWD/IPk9JDTTt8/8p4q0kOHkoK2LVuSV5HWrJnUixRVpBZSJBIRkZtiEOeCNnGW2rfBe+vfk4lbJkql0Eoybds0NaappkDWAvJchefUvO8OfqdyvaGEDkGfpWCQfBN6jRpXkaJXqbEiRfRBG6annhLJl89Ve0pERGnFIM7F7dsQlJXNW1ambJ0i/9z6R80/cuOIug3LGSYdK3aUThU7Sb2i9eSjLR+p54yPGK+2gQDOUjBIviM6Wl/CpqX+QMmbMQz3iypSrbStYkVWkRIReQsGcW4QyBkrn7e8Cto6VeokNQrWMKQG0QI2LYCztA0Gct4vMVHflk0raUMAFxOTtByXi1ZFiql+fVaREhF5KwZxLoSga/zm8RKfGK+qWA/1PyQV81W0uC7ayRkHcMbb0JaTd8LYo1pJG6pKr10zXV60qGkVaWioq/aUiIgyEoM4Fyb7RekaAjitfdsvR36xWpo2NmKs1e2wBM77qkg3b04qbUP+NmNZsyZVkWIqX55VpEREvohBnIuS/ZpXj7J9m29XkR44kNSLFGlAYmNNq0hr105K/YEq0kyZXLnHRETkDhjEuQDbt3kHjFJw44b+fny8yKlTOSUqSiTwv08VqjWLF7f83EuXTKtIr183XV6smEirVvrADVWkefOm88EQEZHHYRDnAmzf5h0BHKoxk/KuBWEQOZN1MCzV8eP6QO7hw6QqUkxH9B2QDbJlwxikSaVt5cqxipSIiFLGIM4F2L7N86EEzjxxrjksnzZN5PBhkb/+Sl5FWqdOUuqPevVYRUpERPZhEOfCjg3k/WbPTrofFpbUGeHJJ0Xy5HHlnhERkadjEOeijg3kG5o0EenaVR+4lSnDKlIiInIeBnFE6WjGDH3yXSIiImfzd/oWibzcuXMiY62n7SMiIsoQDOKIbISREoYO1fcc/e03vm1ERORaDOKIUnHvnr7krXRpkU8/1fcyRfJdIiIiV2KbOKIUUoTMmycycaLIzZv6ebVqiUyapC+Nq1Ah5TQjyBPHcUyJHIfsAHFxcW75FmK/AgMD5fHjxz6XxcCXj91Zx58pUybx9097ORqDOCuYYsR3YfSF777Tl75duKCfh6ANwVynTkk9TJHIN2nEhjjZuvUvadSooQQGBqU6YgMRWafT6eTq1aty584dt97HggULyoULF8RP+1LwEb587M46fgRwJUuWVMFcWjCIs4IpRnyPTieybJnIe++JHDumn1e0qD6Y69kzaTgtDQI0LUhDYcGVK3elRg2RIH0MR0QO0gK4/PnzS5YsWdwyUEhMTJQHDx5ItmzZnFKi4kl8+didcfx4/uXLl+XKlStSvHjxNF3fDOKIRD9+6ahRInv26N8OjFWKxwMGiGTOzLeIKKOgekoL4PK68aDB+CGOjY2VkJAQnwtkfPnYnXX8+fLlU4FcfHy8BKXhnz+DOPJpu3frg7U//9Q/zppVZPhwkTffFGGOZ6KMp7WBQwkckbfK9F81Kv60MIgjstPRo/pqU1Sf6j9QIv36iYweLZI/P99OIldzxypUIne7vlkSRz7l/Hl9G7dvv0WROBqXivTooZ9XooSr946IiMh2vleZTT7p+nWRYcNEypYV+eYbfQDXoYPIwYMiCxcygCPyOkj9sHGjyI8/6m+9NBXG2LFjpXr16uLpzp49q0qn9u/fb9fz1q9fLxUqVFDt1GD27Nny7LPPiq9gEEc+kai3VCmRmTP1iXojIkS2bxeJjBSpXNnVe0hETod2Eihab9ZMpHt3/S0ea+0n0sErr7yighBMaONUqlQpeeutt+Thw4fp9pokMmLECBk9erShg8Grr74qu3fvlq1bt/rE28MgLoU8cZUqVZI6depk7Bkhp0ASXgw+j1EWxo0TefBAn6h39Wr8cxOpV49vNJFXQqDWubPIxYum8y9d0s9Px0Du6aefVmkjTp8+LR9++KHMnTtXBXKUPrZt2yYnTpyQLl26GOYFBwdL9+7d5bPPPvOJt51BXAp54o4cOaIievKsRL1ff61PzotepkjGi/tLluh7orZsmZSsl4g8JIEjSrNsmVD0Pniw/jmWtgNDhujXs2V7lraTAgQQSAJbrFgxFUi8+OKLsnz5crXsf//7n9SuXVuyZ8+u1sHyaxiQ+T8bN25UpXh//vmnWg+9cxs0aCDHkVXcyOTJk6VAgQJqO3369FGjBhjDb1aLFi0kNDRUcubMKU2bNpV9+/Ylq4JFfjLsb+HChWUw3jMrTp06Je3bt1evibxoKNhYh5xMRkqUKCETJkxQx4R1sE3zIArHNm/ePGndurVkzpxZJbpdgi9mK8l0y5QpIx9//LHJ/L///luVuGGf4KeffpKWLVuqVB/GUJ2K9/3Ro0fi7RjEkVfAd+3SpSJVq4r06aMfaaFIEZEvvhA5fFj/B5zBG5EHio4WyZbNtgl5gVDiltIXBUrosJ4t28NrpwGCFS1lCvKKIdA5cOCACjDOnDmjqmDNoWrwk08+kT179qihnXr37m1Y9vPPP8sHH3wgEydOVMsLFSqkSvuM3b9/X3r27ClbtmyRHTt2SNmyZaVNmzZqPvzyyy8yY8YMmT9/virFwr5UxRenFUhqi+cjcIuKipJWrVqpoA6jFRibNm2aVKtWTQWMo0aNkmHDhsnatWtN1hkzZox06tRJvQcvvfSSvPDCC3IUqQLMIODDcX+DBsxGvv76a2ncuLGURhWLiGzevFkFvOYwD+/7rl27xOvpKEV3797FXzF1a4vY2Fjd8uXL1a2vcdWxr1un09Wpg29n/ZQnj0738cc6XXR0xu0Dz7tvXvPAc+/cc//o0SPdkSNH1K3y4EHShzujJ7y2FQkJCbrbt2+rW+jZs6euffv2huU7d+7U5c2bV9e1a1eLz9+1a5f6bbl//756vGHDBvV4Hb7Q/vPHH3+oedp7Ub9+fV2/fv1MtlO3bl1deHi41f2Mj4/XZc+eXffbb7+px5988omuXLlyaTpnlSpV0k2ZMsVw7GFhYbqnn37aZJ1u3brpWrdubXiM47C07/3791f3z5w5o9aJiopSjy9fvqwLCAhQ7yNgf/Ply6dbuHCh4fk5c+bUfffddxb3MXfu3CbrOpP5uXfKde5g3MGSOPJYqB5t3lw/4T4S9Y4ZI3L6tD5ZL0daIPICSPqLRq22TCtW2LZNrGfL9uxMOPz777+r6kRU79WvX1+aNGliqFZEKRZKsMLCwlRVaAR6WKm0R+dNtoHSLA1K2kCrdkWpFbZrzPwx1u3Xr5+UK1dOVadiQmma9jpoP4ZqRnS8QCeAyMhINWqANeiYgc4DaCOeK1cudXzHjh2Ti2ZtDi3tl3kpmy3rGB9727ZtVemb9t6i6ti4/dujR4+SVaUal4JGp7Ek1RMwTxx5fKJejFjSv7/Iu++KFCjg6r0jIqdCOwj8Q7MFGr1iwGNUqVpqz4ZtYTnWCwhw+olq1qyZaveF3qloF6Zl4kcghLZbmNA2DkMuIahC1SSqWY0ZZ+/XEsJq6TNsgSra69evy8yZM1XAiHZvCJa010F7PbSzQ1UnqkgHDBigqkI3bdpkceSAt99+W1avXq3ap6GdGoKjzp07G6qJ05rQNqV1+vbtKz169FDVv6ha7datm8lIHqGhoXL79m2Lz71165Z6n70dS+LIY+CPJJqHVKmiD+Dw2cfA9P/8I/LppwzgiHweAjN8GYB5cKA9Rq6hdAjgIGvWrCrQQfBkHBCh5OrGjRuqUwLadCGvmXGnBltVrFhRtXMzZv4YbeHQUQHt2CpXrqyCOLy2MQRiaPw/a9Ys1aFi+/btcujQIYuvie0hMHzuuedU2zl0ykBON3OW9gvHae86xnAMeE8RGK9cudKkfSDUqFFDdUA0h44PKLXDcm/HkjjyiES9H30kgva72p9WJOr98EPmeSMiMx07ovW+vheqcZUfSuAQwGF5BkNPUIyViapVVHWilyU6OdhryJAhqtMCGu43atRIfvjhBzl8+LCqGtUgiPz+++/VOvfu3VMlaQjaNAsXLlTjddatW1eVamFdLEfgaQm2t2zZMmnXrp0qNUPnBEslg3/99ZdMnTpVOnTooEr50PP0jz/+MFkH84z3HR0PvvrqK6vHGxAQoAJIdJTAfphXx7Zq1Uq+xfA7FgJPvCdaBwhvxpI4cltM1EtEDkGghtKiDRtEFi3S354545IADlCth+AJQQzalqFEzjx9hi1Qnfj+++/LO++8I7Vq1ZJz585Jf7QlMYI2ZKhiRCkUqiJRKpffaEBotGv74osvpGHDhqr9HVKa/Pbbb5I3b16Lr4mqzNy5c6t0JwjkEDjVrFkz2Xpvvvmm7N27V70uAlT0sMW6xsaNG6fSguB1EXwhkMP7kRKkUUFVsHkpHLz00kuqJM48DcuPP/6o2vv5BIe7VvgI9k7N+F566KwzY4ZOFxqa1EmsZk2dbvVqnS4xUeeW2EORvVN9sXduelz3KfXacyfO6KHoqcyPHb1TZ+BLOwUINyIjI+1+ra1bt+oCAwN1V69etbj87bff1r322muGx4cOHdLlz59fd+fOHV16Ye9UIgvQQQppgZCcF+Ocaol6f/6ZiXqJiHxJTEyMnDx5UlXfdu3aVSUbtmT06NGqKhhVxHD58mX57rvvVK9cX8A2ceRy+I+GcUxHj0YDYP08JOrFmKfIhRnIq5SIyKegShRVqdWrV1ft9qzJmTOnvIvUBP9BD2Bfwp/HFMZOxaRF95Q+/vxTZNQofUkb5MmjfzxwIPO8ERF5Aku9Vc3pa1Rthw4Nlka0IFPs2GAFx07N+ES9yP2GRL0YL5qJeomIiFLGkjjKUKguRbCGcU4BqZT69dNXpTJRLxERke0YxFGGJeodNw45ipB9XJ93s0cP/bwSJXgSiIiI7MUgjtI9Ue+kSWhjmJSot317faJejLxAREREjmEQR+ni/n2R6dNFkM8S40hD06YikyeL1KvHN52IiCitGMSRU8XG+susWf4qWNOG60NybwybhZ7fNoyHTERERDZgEEdOS9T77bd+8u67T8n16/rBpcuW1Vebdu4s4s9+0ERERE7Fn1ZKE6T+WbZMpFo1kVdfDZTr17NI4cI6WbBA5PBhka5dGcARUcYZu3GsTNhkeXB5zMfy9IK8ZhgkHmOjGlu+fLmaT+RsDOIoTYl60b6tUyeRo0eRqFcnr7zytxw9Gi8YexjpQ4iIMlKAX4C8v/H9ZIEcHmM+lqenkJAQmTJlihqEnii9MYgjuyE5b4sW+kS9u3aJZMmiz/12/Hi8dOhwiol6ichpkOn/YexDm6fh9YfLe43fUwHbmPVj1Dzc4jHmY7mt27J3lAFo3ry5FCxYUCahW74FY8eOVUNJGZs5c6aUMMq1hBK9Dh06yEcffaTGDM2VK5eMGzdO4uPj5e2335Y8efJI0aJF5euvvzYZNQGlfT/99JM0aNBABZOVK1eWjRs3Gt7HMmXKyMfobWbk77//Fn9/fzl16pTdx0quxzZx5LREvXFxfDOJyLmi46Il26RsDj33wy0fqsna49Q8GPVAsmbKatdrBgQEqOCre/fuMnjwYBVsOWL9+vXquZs3b5a//vpLjSO6fft2adKkiezcuVMWL14s/fr1kxYtWkixYsUMz0OQh6CwUqVKMn36dHn22WflzJkzkjdvXundu7d888038haGxfkPAsHGjRtL6dKlHdpPci2WxJFNiXr79BGpXFkfwKFpx8svo+RNZNYsjrRARGTsueeeU6VtH3zwgcNvDErbZs2aJeXLl1fBF26jo6PVYO9ly5aVUaNGSaZMmVSAZ2zQoEHSqVMnqVixosybN08NEP/VV1+pZb169ZLjx4/LLlShCP54x8n//vc/tX3yTCyJI6uQIgSpQebOFYmJ0c9jol4iykhZgrKoEjF7Td46WZW6ZQrIJLEJsaoqdWSjkXa/tqPQLu7JJ5+UN99806HnoyoU1ZwaVKtWMcqQjhI/lK5du3bN5Hn169c33A8MDJTatWvLUTRaFpFChQpJ27ZtVenbE088Ib///rs8fvxYunTp4tA+kuuxJI4sJurFcFilSonMmKEP4JCod9s29LLiSAtElHHQzgtVmvZM07dPVwHc+IjxEvNejLrFY8y3Zztp6VGKas9WrVqpkjNjCMzM29qhRMxckFnPMOyLpXmJGMcwFcbH0bdvX9Vu7tGjR6pqtVu3bpIFDZvJI/lMEIdi6LCwMJO2AGQKwdqnn+qDt7Fj9cFcjRoiq1aJbNiAf3h8x4jIvWm9UBG4jWk6Rs3DLR5b6rWanpBq5LfffpNt+Af8n3z58snVq1dNArn9+/c77TV37NhhuI+OEHv37pUKFSoY5rVp00ayZs2qqlpXrlzJqlQP5zPVqRMnTpS6deu6ejfcNlHv99/rAze0f9MS9U6YIIJSdibqJSJPkaBLMAngNNpjLM8oVatWlRdffFE+++wzw7yIiAi5fv26TJ06VTp37iyrVq1SwVSOHDmc8ppz5sxRbebQJm7GjBkq1YlxmzdUw6L3K9rUobeqcfUreR6fKIk7ceKEHDt2TP0DoST4IxgZqU/Ui884ArjChcWQqLdbNwZwRORZxkaMTRbAaTAfyzPShAkTTErdEFzNnTtXBVvh4eGqk4Eza4hQ+of2eNj2li1b5Ndff5XQ0FCTddDTNTY2lqVwXsDlJXHoPj1t2jRV5HvlyhWJjIxU+XGM4YLHOliOxp7oPo0u0bbCBwTPNy7S9nXr14uMGqXP8wa5c+sfDxokzPNGROSAhQsXJpuHZjzoPGAMqUEwGTNuO2dpO1q+N2PIDWcOQaJxlaol+C1Fp4eXkWaAPJrLg7iHDx+qfwzo+oxu0eaQC2fo0KEqkGvYsKHMnz9fWrduLUeOHJHixYurdWrVqiUxWvdJI2vWrJHdu3dLuXLl1MQgTmTPHn2wtm6d/j1Ce9ZhwxDoiuTKlf7nm4iIXAO/kxcuXJAxY8ZI165dVY9X8mwuD+IQkGGyBskKUfSLHjWAUrjVq1erRplaRmyU4lmDfyToibNkyRJ58OCB6gWEtgfvv/++1YvcOCC8d++eusXzLPUgMqetY8u6GZ2o94MPAiQyUl+DHhSkk1dfTZSRIxOlYEH9OmndZXc99ozAY/fN8w48984999gWqh/R69KWnpeuolWRavvqato+pPS+/fDDD/Lqq6+qHHbffvutw/vtbsee0Zxx/Hgeno/rHe0UjdnzefLTOTKuSDpBN2jj6lTU2aPrMwIwJE/UDBkyRPXm2bRpk13bRxE1hhgxH3bEfEgUDG9ibtGiRR7ZDfv69RBZvLiCrF9fXBIT/cTPTydNm16UF144JgUKRLt694iITKCaD8NWYRQCJLMl8kaxsbGqVBQ9ldGL2DybBkb8uHv3bqodXlxeEpeSGzduSEJCQrIiXzzGgacH9NgZPny4SUkcvkxatmxpU+8hRNBr165VQ6GY5/TJ6ES9U6f6y7x5/hITo88R9MwziTJuXIJUrYqit/+K35zIXY7dFXjsvnnegefeuece7cfw45YtWzY1/qe7QvnH/fv3JXv27GnKJ+eJfPnYnXX8uM4zZ86s8gmaX+daDaAt3DqI05i/SXgDHXnj0K06NcHBwWoyhy8oe76k7F3fWZDbDQl6UdiI+9CkCXosIc+bf4Z0SHbVsbsDHrtvnnfguXfOuccfd3y/Iymu8YgF7karRtP21Zf48rE76/jxPC2Bs/nvpT2/n24dxKFbNOqKzUvdMMxIejfIRPdvTPhCcQdI/4HSNWuyZxdZsQL58FCFqp+HRL0YNqtVK/14p0REROQ93DqIQ3sI9DxFFZ1xmzg8bo9BPNPRwIED1YRiTQwg7OoArnx5FL/atj4T9RIREXk/lwdx6DF68uRJw+MzZ86oTgt58uRRKUTQPq1Hjx5qEF9kll6wYIGcP38+WY4db4YSOFsCOORzRElcr14ojs2IPSMiIiKfDeL27NkjzZo1MzzWOhX07NlT9SbF4Lw3b96U8ePHqwSFVapUkRUrVqgEir5UnWqLX38VadDA1XtBREREPhHEYRy51LKcDBgwQE0ZyZ2qU23lxh25iIjcov0waiz+yxPvVTB6Q8mSJSUqKkrlgfMmJUqUUEn/MXmKsxl0PnyvW4kHMkshQ0REKbQfrlXL+oTlWM/ZkP0AvQ0xdqmx5cuX+2QaDk909uxZda7QpMtTMIhzc5s3i3Tv7uq9ICLyjvbDWJ5SSV1aIN8XBp+/fft2+rwAOSTOi0eTYRBnBdrDVapUSerUqeP0Nx3/Avftsz5hObKq9Ogh0rSpyKlTTt8FIiKPgNY2Dx/aNj16ZNs2sZ4t27N3PKPmzZur0Sa0ISGtjQpkXr2G4SRRZWhcqoeRiz766COVTitXrlxqJCFk9n/77bdVx7+iRYvK119/nWz7x44dkwYNGqiAsnLlyrJx40bDMrTxxjCWqOZDotny5cvLp59+muIxWXrOrFmzkq2HfcHrIc9qoUKFZNCgQYZld+7ckddee00dC/YLbdt///13w3KMa46kt9g+kusPHjxYjatuDUYywPby58+vkvA/+eSTcuDAgWTvMfapVKlSap/QbGvVqlXSqFEj9X7mzZtXnnnmGTll9AOLY4QaNWqoEjk099J88803UrFiRbX/iA2+/PJLk33atWuXeh6WoyMmqlF9ok2cu0qvNnG2pAsJDNS3b3vwQJ/fDdlVli1z2i4QEXmM6GiRbNmcu81GjWxbD9/BWbPavl3kNUXghSGTEIgg0HLU+vXr1fM3b94sf/31lwqktm/froKdnTt3yuLFi1WWBoyWgcBHgyAPQSECDYw9/uyzz6qsDwhakKQW2/z5559VHlYETwiGEHR17drV4n5Yew5+F9EBETCWOToloioZY6EjyMI+a8/HPIxw8L///U9Kly4tR44cMYwXeujQIWnVqpVMmDBBvvrqK7l+/boKADEhcDKHYKxt27YqkF2xYoXaj/nz58tTTz0l//zzj5oPyHqBfV66dKnhtRAYYj+rVq2q7mMMdaQvQ/Upku8iEHviiSdk3bp1KiDVhn374osv5IMPPpDZs2erQA3jteM9wHvaq1cvtS0EhAgmcYx4vzE8aIbA2Klk3d27d/FfTN3aIjY2Vrd8+XJ1a8nevfhvZ9tUu7ZOt2uXTnfunE4XEpLyuliO9VwptWP3Zjx23zzvwHPv3HP/6NEj3ZEjR9QtPHhg+3emsye8tjUJCQm627dvq1vo2bOnrn379up+vXr1dL1791b3IyMj1W+I5oMPPtCFh4ebbGvGjBm6sLAww2NsC4+1bUP58uV1jRs3NjyOj4/XZc2aVffjjz+qx2fOnFGvM3nyZMM6cXFxuqJFi+qmTJli9TgGDBig69Spk84e/fv31z377LOG/StcuLBu9OjRFtddvXq1zt/fX3f8+HGLy3v06KF77bXXTOZt2bJFPUe7BvBe4D2CP//8U5cjRw7d48ePTZ5TunRp3fz58w3vcVBQkO7atWspHgeW4z07dOiQyXsYFRVlsl6xYsV0ixYtMjzGceN469evrx7jdfPkyaN7+PChYZ158+ZZ3Ja169zRuIMlcW5q9GiRcePwz07/+Phx3+xxRUS+LUsWfYmYLdAe3ZZStq1bRWzpMIjXdgTaxaFU5s0333RsAyKqJMh4SCdURaIaUoPSJZQEYQQjY8inqgkMDFRVe0ePHjXM+/zzz1VV4Llz5+TRo0dqIPbUek9aeg5KswCvf/nyZVUSZglKuVCSV65cOYvLUaqFUrMffvjBpLQNJXgo0UIVpvn6yC+LYzeG/TKuGkUasnz58pmsg+VjxoyRHTt2qLHZteGzkHvW+L01hpJBjOWLktBXX33VMB9V21otHd7f8PBwyWJ0wRifh/TEIM5NdeyYFMABAjQGaUTka9CkxNYqzcyZbV/PnmpSe6HKE1WE7777brIxuxGYmafVstTw3nz8TG2cTfN5WiCSEq13LKoXhw0bJp988okKMjCA+7Rp01T1rDWWnjN16lRVtQtox5aS1JZj/19//XVV/WwOCf8trY/qX+O2fhq0ddNktXCC27Vrp6qeUT1auHBhtS0EbwhKrdHeXzynbt26hnkIJLUgLrU0aemJQZwXJfslIiL3gPZhKOEyL4FC6RDGA8cPvxZcOTOlBUqZEERqpUUoudI6GWzZskV1ejDOu2pcemWJpeecPn3acB9BHTpl/PnnnyaJ+zXVqlWTixcvqvZqlkrjatasKYcPH5YyZcrYdHxYH+8fShlLGHUGSQ0GDUCJGdrPNW7cWM3biiJZI1obOOPffZSAFilSRB3ziy++aAji0F4enSoA7Q+///57VRqoBa04DxmBvVOtQKcGNL7cvXt3hpwIIiJKGzQrSS3pOZZjvfSG6kb86H/22Wcm89HjEVV0KM1CAIXCgpUrVzrtdbG9yMhI1UsVv2NId9K7d2+1DIESRklavXq1CqpQtZjab5wtz0FvUJTUodfqiRMnZN++fYbjbtq0qQoqO3XqpMY9RxUpjhc9ReGdd95RpXrYVwSzeP7//d//yRtvvGG1BzBKBNF7d/Xq1Sq3GzpbvPfee2o/rcmdO7eqgsXQnai+RccRbYQoDXq7IgjDvv3777+qg4Z2fOhxjJ68eA/QGQPVvzNmzFDL0ZEFJayockXcgA4XH3/8sWQEBnFEROQVUPuG9sN791qfsDyjmqagx6V5VRvaeM2dO1cFW2hHhR6Rb731llNLANEmD9tGKdqvv/6qepUCerN27NhRDWeJqkGUTqU2GpKl5/Tv399kHfRSRY9YHBfa8qGnJoIxDXqIIl3XCy+8oEqtRowYYSjtQkndpk2b1PooIUPvTwSKqDK1BKWXCJIQGPbu3VuV7j3//PMqmEOpmTUIsn766SdVMokqVFQRoyrZGEr3EIiitA7Vre3bt1fz+/btq9oEYihQBOcocVy0aJGhJDBbtmzy22+/qQAO+z969Gh1DjKCH3o3ZMgreSgtxQgicq3oNCVo24ALrE2bNsnaLwDywCFreGrwZVOzpniU1I7dm/HYffO8A8+9c8/948ePVWkNcnYh55a7Mq5SM+6A4At8+diddfwpXef2xB2+9+67mDsV9xMREZHnYseGDO7YoBX3M10IERERpQWDuAwesQGYLoSIiIjSitWpRERERB6IQRwREbkd9rkjb6ZzUp9SBnFEROQ2tF6u0Rj5nshLxf43SgSGT0sLtokjIiK3gR81DJ+kjQmK8Si1kQ3cLc0EfoiRKsLX0mz48rE74/jxfCR8xrWN3HRpwSCOiIjcSsGCBdWt+eDu7lYdpg2z5I5BZnry5WN31vEj+MPYsGl9/xjEWcGxU4mIXAM/bMjYj2GQLA0O7w6wX5s3b1YjB/hakmtfPnZnHT/GaXVGKSaDOBekGCEiItuqVtPaZii9YL8wwDyy7ftaIOPLx+5ux+97ldlEREREXoBBHBEREZEHYhBHRERE5IHYJs7GhHxoG2drg0fkN8L6rq4rz2g8dp53X7vmgdc9r3tfu+59+ZrPiOPX4g1bEgIziEvF/fv31W2xYsWccW6IiIiIbIo/UutY6afj2CapJuW7fPmyZM+e3aZ8LoigEfBduHBBcuTIIb6Ex87z7mvXPPC653Xva9e9L1/zGXH8CMsQwBUuXDjVNCQsiUsF3sCiRYvafRJwYn3x4gYeO8+7L+J1z+ve1/jyNZ/ex29rajN2bCAiIiLyQAziiIiIiDwQgzgnCw4Olg8++EDd+hoeO8+7L+J1z+ve1/jyNe9ux8+ODUREREQeiCVxRERERB6IQRwRERGRB2IQR0REROSBGMQREREReSAGcamYO3eulCxZUkJCQqRWrVqyZcuWFNfftGmTWg/rlypVSj7//PNk6yxdulQqVaqkerbgNjIyUjz92JctWyYtWrSQfPnyqeSH9evXl9WrV5uss3DhQjXqhfn0+PFj8fTj37hxo8VjO3bsmNef+1deecXisVeuXNnjzv3mzZulXbt2KlM69m/58uWpPsdbPvP2Hrs3febtPXZv+rzbe+ze9HmfNGmS1KlTR43IlD9/funQoYMcP37coz7zDOJSsHjxYhk6dKiMHj1aoqKipHHjxtK6dWs5f/68xfXPnDkjbdq0Ueth/XfffVcGDx6sTqZm+/bt0q1bN+nRo4ccOHBA3Xbt2lV27twpnnzs+CLAF/qKFStk79690qxZM/XFgOcaw5f9lStXTCZ8ENyNvcevwReA8bGVLVvW68/9p59+anLMGIomT5480qVLF4879w8fPpTw8HCZPXu2Tet702fe3mP3ps+8vcfuTZ93e4/dmz7vmzZtkoEDB8qOHTtk7dq1Eh8fLy1btlTvicd85jF2Kln2xBNP6Pr162cyr0KFCrqRI0daXH/EiBFqubHXX39dV69ePcPjrl276p5++mmTdVq1aqV7/vnnPfrYLalUqZJu3LhxhsfffPONLmfOnDpPYO/xb9iwQYeP0+3bt61u01fOfWRkpM7Pz0939uxZjzz3GpxPHEtKvOkzb++xe9tn3p5j96bPe1rPu7d83uHatWvqPdi0aZPOUz7zLImzIjY2Vv27RFRuDI+3bdtm8TmIvs3Xb9WqlezZs0fi4uJSXMfaNj3l2M0lJiaqAXzxD83YgwcPJCwsTI1H+8wzzyT71+7px1+jRg0pVKiQPPXUU7JhwwaTZb5y7r/66itp3ry5Os+edu7t5S2feWfw5M+8ozz98+4M3vR5v3v3rro1v4bd+TPPIM6KGzduSEJCghQoUMBkPh5fvXrV4nMw39L6KKLF9lJax9o2PeXYzX3yySeqSBpFyJoKFSqothL/93//Jz/++KMqWm/YsKGcOHFC3Ikjx48v8gULFqgidbQVKl++vPpiR5WTxhfOPapMVq5cKX379jWZ7ynn3l7e8pl3Bk/+zNvLWz7vaeVNn3edTifDhw+XRo0aSZUqVTzmMx/o9C16GTTGND/R5vNSW998vr3bdBVH9xMf2rFjx8qvv/6qGotq6tWrpyYNPtQ1a9aUzz77TGbNmiWefPz4EsekQSNvtBX5+OOPpUmTJg5t05Uc3U98cefKlUs1EDbmaefeHt70mXeUt3zmbeVtn3dHedPnfdCgQXLw4EHZunWrR33mWRJnRWhoqAQEBCSLnK9du5YswtYULFjQ4vqBgYGSN2/eFNextk1POXbjRvF9+vSRn3/+WRWxp8Tf31/1DHK3f2dpOX5j+BIzPjZvP/f4kvr6669VI95MmTJ55Lm3l7d85tPCGz7zzuCJn/e08KbP+xtvvKFKDVEljupfT/rMM4izAhcluhCjx4oxPG7QoIHF5+DfmPn6a9askdq1a0tQUFCK61jbpqccu/ZvHN3PFy1aJG3btrXpS2D//v2qasKdOHr85tAGxPjYvPncaz29Tp48qX7QPfXc28tbPvOO8pbPvDN44uc9Lbzh867T6VQJHKrE169fr9Iqedxn3uldJbzITz/9pAsKCtJ99dVXuiNHjuiGDh2qy5o1q6EXDnrr9ejRw7D+6dOndVmyZNENGzZMrY/n4fm//PKLYZ2//vpLFxAQoJs8ebLu6NGj6jYwMFC3Y8cOnScf+6JFi9RxzJkzR3flyhXDdOfOHcM6Y8eO1a1atUp36tQpXVRUlK5Xr17qOTt37tS5G3uPf8aMGaqX1j///KP7+++/1XJ8vJYuXer1517z0ksv6erWrWtxm55y7u/fv6/2DxPO3/Tp09X9c+fOef1n3t5j96bPvL3H7k2fd3uP3Zs+7/3791e9aDdu3GhyDUdHRxvWcffPPIO4VOALKiwsTJcpUyZdzZo1Tboe9+zZU9e0aVOT9XEx1KhRQ61fokQJ3bx585Jtc8mSJbry5curE4+uysYffE89dtzHF4D5hPU0CAaKFy+utpcvXz5dy5Ytddu2bdO5K3uOf8qUKbrSpUvrQkJCdLlz59Y1atRI98cff/jEuQf8cGfOnFm3YMECi9vzlHOvpY6wdh1782fe3mP3ps+8vcfuTZ93R655b/m8i4XjxoQUKRp3/8z7/XcgRERERORB2CaOiIiIyAMxiCMiIiLyQAziiIiIiDwQgzgiIiIiD8QgjoiIiMgDMYgjIiIi8kAM4oiIiIg8EIM4IvJZZ8+eVYNSY0ggd3Hs2DE1DmdISIhUr17d1btDRBZs3rxZ2rVrJ4ULF1bfIcuXLxd7IU3vxx9/LOXKlZPg4GApVqyYfPTRR3Ztg0EcEbkMxt3EF+DkyZNN5uMLEfN90QcffCBZs2aV48ePy59//pni+4YJA28XL15c+vfvL7dv387w/SXyRQ8fPpTw8HCZPXu2w9sYMmSIfPnllyqQw5+33377TZ544gm7thHo8KsTETkBSpymTJkir7/+uuTOndsr3tPY2FjJlCmTQ889deqUGkw+LCwsxfWefvpp+eabbyQ+Pl6OHDkivXv3ljt37qhB6YkofbVu3VpNKX0HvPfee/LDDz+oz2WVKlXU91xERIRafvToUZk3b578/fffUr58eYf3gyVxRORSzZs3l4IFC8qkSZOsrjN27NhkVYszZ86UEiVKmJROdejQQVVHFChQQHLlyiXjxo1TQc7bb78tefLkkaJFi8rXX3+dbPv4F9ygQQMVUFauXFk2btxoshxBUps2bSRbtmxq2z169JAbN24YluOLedCgQTJ8+HAJDQ2VFi1aWDyOxMREGT9+vNoPVJ/gmFatWmVYjpK1vXv3qnVwH8dtDZ6P9w3batmypXTr1k3WrFlj82t16tRJ3njjDcPjoUOHqtc8fPiweoz3LXv27LJ69Wr1+JdffpGqVatK5syZJW/evOq8oTSCiJLr1auX/PXXX/LTTz/JwYMHpUuXLuqP14kTJ9RylLqVKlVKfv/9dylZsqT6Luvbt6/cunVL7MEgjohcKiAgQAVen332mVy8eDFN21q/fr1cvnxZtVeZPn26CoKeeeYZVcK3c+dO6devn5ouXLhg8jwEeW+++aZERUWpYO7ZZ5+VmzdvqmVXrlyRpk2bqiBoz549KhD6999/pWvXribb+Pbbb1XVJr6458+fb3H/Pv30U/nkk09U9Qm+2Fu1aqVeS/tix2shiMS+4P5bb71l03GfPn1a7VdQUJDNr4XA0zhY3bRpkwpAcQu7d++Wx48fS8OGDdW+vPDCC6q0DyUIeF7Hjh1Vmx4iSl6ajhLxJUuWSOPGjaV06dLqs9yoUSNVeq59Zs+dO6fW+e6772ThwoXqD1znzp3FLjoiIhfp2bOnrn379up+vXr1dL1791b3IyMjER0Y1vvggw904eHhJs+dMWOGLiwszGRbeJyQkGCYV758eV3jxo0Nj+Pj43VZs2bV/fjjj+rxmTNn1OtMnjzZsE5cXJyuaNGiuilTpqjHY8aM0bVs2dLktS9cuKCed/z4cfW4adOmuurVq6d6vIULF9ZNnDjRZF6dOnV0AwYMMDzGceJ4U4JjDQgIUMcSEhKi9gXT9OnTbX6tgwcP6vz8/HTXr1/X3bp1SxcUFKT78MMPdV26dFHLP/roI13dunXV/b1796rtnz17NtVjJPI1IqK+szQ///yzmofPp/EUGBio69q1q1rn1VdfNfkOMf6cHTt2zObXZps4InILaC/y5JNPqlIoR6EUy98/qYIBVZ9oi2Jc6oeqwGvXrpk8r379+ob7KE2rXbu2KnEC/DvesGGDqkq19I8bPcsAz0nJvXv3VCkhSraM4fGBAwfsPtZmzZqpNjXR0dGqcfQ///xjqB615bXwvuC9QMkbSvDQSBsldbNmzVLLUdqGEkjAsqeeekpVp6JED9W3KDHwljaMRM6Epgz4rsF3B26Nad8jhQoVUt812vcHVKxYUd2eP3/e5nZyrE4lIrfQpEkTFSC8++67yZYhMDOvuouLi0u2nnF1IqCNl6V5+JJNjdY7FusilQDSkBhPqJbEPmvQo9QW5r1ucVyO9MTF65UpU0aqVaumAq+YmBjVBtDW18It9h/BGgI5VK8isEtISJBDhw7Jtm3bDI2w8UO0du1aWblypVSqVElVfeNH5syZM3bvN5G3q1Gjhvoc4c8iPqPGE9qxan+o0O4UfwQ1+CMGqXVqMsYgjojcBlKNoMEvAghj+fLlk6tXr5oEcs7M7bZjxw7DfXyx4h90hQoV1OOaNWuqxv5oeGz+hWxr4AY5cuRQOaW2bt1qMh/Hqv0DT2tqErR/Qwmcra+ltYvDhPsI7NCGB9t59OiRSUkeluExAkW0HUTv28jIyDTvN5EnevDggeEPHeAPDe6jFA2lay+++KK8/PLLsmzZMrUMbUxR27BixQq1PjoG4bsF7UzxecJ3Dnroo1OUcelcahjEEZHbQHUdvvxQ0mMMAcb169dl6tSp6p/rnDlzVKmQs2B7CEjQS3XgwIEq3xq+XAGP0WMMDft37dqlGiSjFyiW49+2PdCBAl/kixcvVnngRo4cqb74kS8qrfAeoTpZSxZqy2vhOQhQUfKG4E2bh7QI+IFBMAjoFILtomMHfqTww4Tz4Yzgk8gT7dmzR5W4YQL0TMf9999/Xz1GBwYEcWgeglJrNFXA5wgJfbXaBfxhRWcilIgjrRA+T+jNag+2iSMitzJhwgT5+eefTebhy23u3LkqkMBypMdAb68FCxY4rQQQAQ/+EaMn2a+//qq+XAElWuhx+s4776jqXlRboroD6QKM29/ZYvDgwaq9Gr7YUdWCqsn/+7//k7JlyzrlOPBDgtQG2FdbXgvVpzhOHI8WsKEdHIJTrT0cYBl6/CKtC7aJ9dHzNaU8WUTeLCIiIsXe2WjGgVJr8yYOxvDdsnTp0jTth99/PSuIiIiIyIOwOpWIiIjIAzGIIyIiIvJADOKIiIiIPBCDOCIiIiIPxCCOiIiIyAMxiCMiIiLyQAziiIiIiDwQgzgiIiIiD8QgjoiIiMgDMYgjIiIi8kAM4oiIiIg8EIM4IiIiIvE8/w9mUl1QT936UgAAAABJRU5ErkJggg==",
+      "text/plain": [
+       "<Figure size 700x500 with 1 Axes>"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "sizes = [50_000, 100_000, 500_000, 1_000_000, 2_000_000]\n",
+    "times_apply, times_numpy, times_numba = [], [], []\n",
+    "\n",
+    "for size in sizes:\n",
+    "    df = pd.DataFrame({\n",
+    "        \"x\": np.random.rand(size),\n",
+    "        \"y\": np.random.rand(size)\n",
+    "    })\n",
+    "    \n",
+    "    start = time.time()\n",
+    "    df.apply(lambda row: np.sqrt(row['x']**2 + row['y']**2), axis=1)\n",
+    "    times_apply.append(time.time() - start)\n",
+    "    \n",
+    "    start = time.time()\n",
+    "    np.sqrt(df['x']**2 + df['y']**2)\n",
+    "    times_numpy.append(time.time() - start)\n",
+    "    \n",
+    "    score_numba(df['x'].values, df['y'].values)  # warm-up compile\n",
+    "    start = time.time()\n",
+    "    score_numba(df['x'].values, df['y'].values)\n",
+    "    times_numba.append(time.time() - start)\n",
+    "\n",
+    "plt.figure(figsize=(7,5))\n",
+    "plt.plot(sizes, times_apply, \"o-r\", label=\"Pandas apply()\")\n",
+    "plt.plot(sizes, times_numpy, \"x-g\", label=\"Numpy\")\n",
+    "plt.plot(sizes, times_numba, \"s-b\", label=\"Numba accelerated\")\n",
+    "plt.xlabel(\"Number of Rows\")\n",
+    "plt.ylabel(\"Runtime (seconds)\")\n",
+    "plt.yscale('log')\n",
+    "plt.legend()\n",
+    "plt.grid(True)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "3e37e637-a4e5-4422-b769-4de985926a46",
+   "metadata": {},
+   "source": [
+    "It is clear that numba can significantly speedup computations that rely on function that are called repeatedly."
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.13.9"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}

From 6f444ec10ff358c468f7a30c49d6b1c591700865 Mon Sep 17 00:00:00 2001
From: Geert Jan Bex <geertjan.bex@uhasselt.be>
Date: Mon, 24 Nov 2025 18:56:18 +0100
Subject: [PATCH 08/10] Add DuckDB examples

---
 source-code/README.md             |    1 +
 source-code/duckdb/README.md      |   14 +
 source-code/duckdb/patients.ipynb | 1386 +++++++++++++++++++++++++----
 3 files changed, 1250 insertions(+), 151 deletions(-)
 create mode 100644 source-code/duckdb/README.md

diff --git a/source-code/README.md b/source-code/README.md
index 4f9bfdc..177a58c 100644
--- a/source-code/README.md
+++ b/source-code/README.md
@@ -15,6 +15,7 @@ to create it.  There is some material not covered in the presentation as well.
   representation and algorithms.
 * [`pandas`](pandas): illustrations of using pandas and seaborn.
 * [`polars`](polars): Kllustrations of using polars.
+* [`duckdb`](duckdb): illustrations of using DuckDB for SQL queries.
 * [`regexes`](regexes): illustrations of using regular expressions for
   validation and information extraction from textual data.
 * [`seaborn`](seaborn): illustrations of using Seaborn to create plots.
diff --git a/source-code/duckdb/README.md b/source-code/duckdb/README.md
new file mode 100644
index 0000000..c4b0e68
--- /dev/null
+++ b/source-code/duckdb/README.md
@@ -0,0 +1,14 @@
+# DuckDB
+
+DuckDB is an in-process SQL OLAP database management system. It is designed to
+support analytical query workloads and is optimized for fast query performance
+on large datasets. DuckDB can be embedded directly into applications, making it
+a popular choice for data analysis tasks in various programming environments.
+
+
+## What is it?
+
+1. `patients.ipynb`: A Jupyter notebook that demonstrates how to use DuckDB for
+   analyzing patient data. It includes examples of loading data and executing
+   SQL queries.
+1. `data/`: CSV files to use with the notebook.
diff --git a/source-code/duckdb/patients.ipynb b/source-code/duckdb/patients.ipynb
index 380233b..853801e 100644
--- a/source-code/duckdb/patients.ipynb
+++ b/source-code/duckdb/patients.ipynb
@@ -1,31 +1,946 @@
 {
  "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "9b23ccda-f524-41bc-975b-568da36a4493",
+   "metadata": {},
+   "source": [
+    "## Requirements"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "4c0d0975-71ce-4e9a-986c-ac6cbfb251bb",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import duckdb\n",
+    "import pandas as pd"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "d46cb701-62c6-4279-bf61-36935a0a53a9",
+   "metadata": {},
+   "source": [
+    "## Database connection"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "6a0df994-ac76-4c42-904a-a6113ea419f9",
+   "metadata": {},
+   "source": [
+    "Create a connection to the database, and query metadata."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "861daf66-0810-48d9-968c-18e1dabe0e4f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "conn = duckdb.connect('data/patient_experiment.csv')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "843f9d0f-8384-4977-916e-49ef59e5cbad",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "┌─────────────┬─────────────┬─────────┬─────────┬─────────┬─────────┐\n",
+       "│ column_name │ column_type │  null   │   key   │ default │  extra  │\n",
+       "│   varchar   │   varchar   │ varchar │ varchar │ varchar │ varchar │\n",
+       "├─────────────┼─────────────┼─────────┼─────────┼─────────┼─────────┤\n",
+       "│ column0     │ BIGINT      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+       "│ patient     │ BIGINT      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+       "│ dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+       "│ date        │ TIMESTAMP   │ YES     │ NULL    │ NULL    │ NULL    │\n",
+       "│ temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+       "└─────────────┴─────────────┴─────────┴─────────┴─────────┴─────────┘"
+      ]
+     },
+     "execution_count": 3,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.sql('''\n",
+    "    DESCRIBE patient_experiment;\n",
+    "''')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "62195da0-ca79-4f65-b3f8-780783518d98",
+   "metadata": {},
+   "source": [
+    "Create a function to show the tables/views in the database."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "a3effca9-7353-435b-b7b5-01a487034314",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def show_tables(conn):\n",
+    "    conn.sql('''\n",
+    "        SELECT table_schema, table_name, table_type\n",
+    "          FROM information_schema.tables\n",
+    "          WHERE table_schema NOT IN ('information_schema', 'pg_catalog');\n",
+    "    ''').show()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "66400c5a-ca95-4104-a537-7a29dbdb001b",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "┌──────────────┬────────────────────┬────────────┐\n",
+      "│ table_schema │     table_name     │ table_type │\n",
+      "│   varchar    │      varchar       │  varchar   │\n",
+      "├──────────────┼────────────────────┼────────────┤\n",
+      "│ main         │ file               │ VIEW       │\n",
+      "│ main         │ patient_experiment │ VIEW       │\n",
+      "└──────────────┴────────────────────┴────────────┘\n",
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "show_tables(conn)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "5bc72abf-863b-4516-bc42-14784d7a40b0",
+   "metadata": {},
+   "source": [
+    "## Queries"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "bff175ad-cbe7-4a5d-91db-7d6eada3b695",
+   "metadata": {},
+   "source": [
+    "Select all the data for patient 6 and convert it to a pandas dataframe."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 18,
+   "id": "d4607877-270b-48c5-ba91-6aa19a8a24cf",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>patient</th>\n",
+       "      <th>date</th>\n",
+       "      <th>temperature</th>\n",
+       "      <th>dose</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>6</td>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>37.5</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>6</td>\n",
+       "      <td>2012-10-02 11:00:00</td>\n",
+       "      <td>38.1</td>\n",
+       "      <td>2.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>6</td>\n",
+       "      <td>2012-10-02 12:00:00</td>\n",
+       "      <td>37.9</td>\n",
+       "      <td>3.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>6</td>\n",
+       "      <td>2012-10-02 13:00:00</td>\n",
+       "      <td>37.7</td>\n",
+       "      <td>2.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>6</td>\n",
+       "      <td>2012-10-02 14:00:00</td>\n",
+       "      <td>37.2</td>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>6</td>\n",
+       "      <td>2012-10-02 15:00:00</td>\n",
+       "      <td>36.8</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "   patient                date  temperature  dose\n",
+       "0        6 2012-10-02 10:00:00         37.5   0.0\n",
+       "1        6 2012-10-02 11:00:00         38.1   2.0\n",
+       "2        6 2012-10-02 12:00:00         37.9   3.0\n",
+       "3        6 2012-10-02 13:00:00         37.7   2.0\n",
+       "4        6 2012-10-02 14:00:00         37.2   1.0\n",
+       "5        6 2012-10-02 15:00:00         36.8   0.0"
+      ]
+     },
+     "execution_count": 18,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.execute('''\n",
+    "    SELECT patient, date, temperature, dose\n",
+    "      FROM patient_experiment\n",
+    "      WHERE patient == 6;\n",
+    "''').df()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "02af9a7f-84d2-4cb9-a705-441b4eff526a",
+   "metadata": {},
+   "source": [
+    "For the patients with a high fever, count the number of timepoints they had a temperature above $39.5\\textdegree C$ as well as their maximum temperature."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "262b2ad4-05c0-445e-8005-f07307f88947",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>patient</th>\n",
+       "      <th>high_fever_count</th>\n",
+       "      <th>max_temperature</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>7</td>\n",
+       "      <td>3</td>\n",
+       "      <td>40.7</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>9</td>\n",
+       "      <td>1</td>\n",
+       "      <td>40.2</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "   patient  high_fever_count  max_temperature\n",
+       "0        7                 3             40.7\n",
+       "1        9                 1             40.2"
+      ]
+     },
+     "execution_count": 10,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.execute('''\n",
+    "    SELECT\n",
+    "        patient,\n",
+    "        COUNT(temperature) AS high_fever_count,\n",
+    "        MAX(temperature) AS max_temperature\n",
+    "      FROM patient_experiment\n",
+    "      WHERE temperature > 39.5\n",
+    "      GROUP BY patient\n",
+    "      ORDER BY patient;\n",
+    "''').df()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "98ef7ed5-23d1-4591-ab8a-405248f98a3a",
+   "metadata": {},
+   "source": [
+    "For each patient, compute the total dose administered, as well as the maximum temperature, and order by descending maximum temperature."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 18,
+   "id": "7df98e50-5ab8-4813-a3ad-d3796aa35c48",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>patient</th>\n",
+       "      <th>max_temperature</th>\n",
+       "      <th>total_dose</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>7</td>\n",
+       "      <td>40.7</td>\n",
+       "      <td>30.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>9</td>\n",
+       "      <td>40.2</td>\n",
+       "      <td>30.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>5</td>\n",
+       "      <td>39.5</td>\n",
+       "      <td>27.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>3</td>\n",
+       "      <td>39.5</td>\n",
+       "      <td>13.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>2</td>\n",
+       "      <td>39.4</td>\n",
+       "      <td>15.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>1</td>\n",
+       "      <td>38.5</td>\n",
+       "      <td>6.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>6</td>\n",
+       "      <td>38.1</td>\n",
+       "      <td>8.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7</th>\n",
+       "      <td>4</td>\n",
+       "      <td>38.1</td>\n",
+       "      <td>10.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8</th>\n",
+       "      <td>8</td>\n",
+       "      <td>37.9</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "   patient  max_temperature  total_dose\n",
+       "0        7             40.7        30.0\n",
+       "1        9             40.2        30.0\n",
+       "2        5             39.5        27.0\n",
+       "3        3             39.5        13.0\n",
+       "4        2             39.4        15.0\n",
+       "5        1             38.5         6.0\n",
+       "6        6             38.1         8.0\n",
+       "7        4             38.1        10.0\n",
+       "8        8             37.9         0.0"
+      ]
+     },
+     "execution_count": 18,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.execute('''\n",
+    "    SELECT\n",
+    "        patient,\n",
+    "        MAX(temperature) AS 'max_temperature',\n",
+    "        SUM(dose) AS 'total_dose'\n",
+    "      FROM patient_experiment\n",
+    "      GROUP BY patient\n",
+    "      ORDER BY max_temperature DESC;\n",
+    "''').df()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "d3d6fcbf-9bc5-40fb-9e4f-046def5249db",
+   "metadata": {},
+   "source": [
+    "If you want to query the result of such a query, you can create a view, `'hypothesis'` in this example."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "id": "6b8694e2-5e9f-4d15-b2c3-609ab762d7b4",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "conn.execute('''\n",
+    "    CREATE VIEW hypothesis AS SELECT\n",
+    "        patient,\n",
+    "        MAX(temperature) AS 'max_temperature',\n",
+    "        SUM(dose) AS 'total_dose'\n",
+    "      FROM patient_experiment\n",
+    "      GROUP BY patient\n",
+    "      ORDER BY max_temperature DESC;\n",
+    "''');"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "id": "7c755e2b-d781-435e-a878-9b29b6374670",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "┌──────────────┬────────────────────┬────────────┐\n",
+      "│ table_schema │     table_name     │ table_type │\n",
+      "│   varchar    │      varchar       │  varchar   │\n",
+      "├──────────────┼────────────────────┼────────────┤\n",
+      "│ main         │ file               │ VIEW       │\n",
+      "│ main         │ hypothesis         │ VIEW       │\n",
+      "│ main         │ patient_experiment │ VIEW       │\n",
+      "└──────────────┴────────────────────┴────────────┘\n",
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "show_tables(conn)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "96617d94-da47-4604-9c27-3375058cbd86",
+   "metadata": {},
+   "source": [
+    "Get the maximum dose administered to a patient."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 35,
+   "id": "d1a405c8-05e4-4d27-bd1c-3d1fe61c5e43",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>max(total_dose)</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>30.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "   max(total_dose)\n",
+       "0             30.0"
+      ]
+     },
+     "execution_count": 35,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.execute('''\n",
+    "    SELECT MAX(total_dose)\n",
+    "      FROM hypothesis;\n",
+    "''').df()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "2718eb2c-1e3a-4f90-a1f6-bb27e9d4a332",
+   "metadata": {},
+   "source": [
+    "Although DuckDB has an extension to perform a pivot (this is not standard SQL), it is not as elegant as the pandas counterpart as multi-level columns are not suppported by DuckDB."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "id": "0c4e1ad8-a9ae-4808-901b-c036e4e0ee17",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "<_duckdb.DuckDBPyConnection at 0x739eb95f72b0>"
+      ]
+     },
+     "execution_count": 14,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.execute('''\n",
+    "    CREATE TABLE time_series AS\n",
+    "      PIVOT patient_experiment\n",
+    "      ON patient\n",
+    "      USING\n",
+    "        first(temperature) AS temperature,\n",
+    "        first(dose) AS dose\n",
+    "      GROUP BY date;\n",
+    "''');"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 17,
+   "id": "b4b38844-e6d2-4df1-8f6c-21e4daf77d48",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "┌───────────────┬─────────────┬─────────┬─────────┬─────────┬─────────┐\n",
+      "│  column_name  │ column_type │  null   │   key   │ default │  extra  │\n",
+      "│    varchar    │   varchar   │ varchar │ varchar │ varchar │ varchar │\n",
+      "├───────────────┼─────────────┼─────────┼─────────┼─────────┼─────────┤\n",
+      "│ date          │ TIMESTAMP   │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 1_temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 1_dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 2_temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 2_dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 3_temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 3_dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 4_temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 4_dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 5_temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 5_dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 6_temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 6_dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 7_temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 7_dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 8_temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 8_dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 9_temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "│ 9_dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
+      "├───────────────┴─────────────┴─────────┴─────────┴─────────┴─────────┤\n",
+      "│ 19 rows                                                   6 columns │\n",
+      "└─────────────────────────────────────────────────────────────────────┘\n",
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "conn.sql('DESCRIBE time_series;').show()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 26,
+   "id": "95b029d4-0329-4462-8737-94f036dc8147",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>date</th>\n",
+       "      <th>temperature</th>\n",
+       "      <th>dose</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>37.5</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>2012-10-02 11:00:00</td>\n",
+       "      <td>38.1</td>\n",
+       "      <td>2.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>2012-10-02 12:00:00</td>\n",
+       "      <td>37.9</td>\n",
+       "      <td>3.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>2012-10-02 13:00:00</td>\n",
+       "      <td>37.7</td>\n",
+       "      <td>2.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>2012-10-02 14:00:00</td>\n",
+       "      <td>37.2</td>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>2012-10-02 15:00:00</td>\n",
+       "      <td>36.8</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                 date  temperature  dose\n",
+       "0 2012-10-02 10:00:00         37.5   0.0\n",
+       "1 2012-10-02 11:00:00         38.1   2.0\n",
+       "2 2012-10-02 12:00:00         37.9   3.0\n",
+       "3 2012-10-02 13:00:00         37.7   2.0\n",
+       "4 2012-10-02 14:00:00         37.2   1.0\n",
+       "5 2012-10-02 15:00:00         36.8   0.0\n",
+       "6 2012-10-02 16:00:00          NaN   NaN"
+      ]
+     },
+     "execution_count": 26,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.execute('''\n",
+    "    SELECT\n",
+    "      date,\n",
+    "      \"6_temperature\" AS temperature,\n",
+    "      \"6_dose\" AS dose\n",
+    "    FROM time_series\n",
+    "    ORDER BY date;\n",
+    "''').df()"
+   ]
+  },
   {
    "cell_type": "code",
-   "execution_count": 1,
-   "id": "4c0d0975-71ce-4e9a-986c-ac6cbfb251bb",
+   "execution_count": 27,
+   "id": "78a996cf-4bc2-40dc-8bce-27bcc6731b7b",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "┌────────────────────┐\n",
+      "│        name        │\n",
+      "│      varchar       │\n",
+      "├────────────────────┤\n",
+      "│ file               │\n",
+      "│ hypothesis         │\n",
+      "│ patient_experiment │\n",
+      "│ time_series        │\n",
+      "└────────────────────┘\n",
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "conn.sql('SHOW TABLES;').show()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "8637dcab-93f4-4d69-9fec-0bc840b03598",
    "metadata": {},
+   "source": [
+    "Create a view on a second CSV file."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 40,
+   "id": "8570b365-09d5-4993-908e-4eaac974204d",
+   "metadata": {
+    "scrolled": true
+   },
    "outputs": [],
    "source": [
-    "import duckdb\n",
-    "import pandas as pd"
+    "conn.execute('''\n",
+    "   CREATE VIEW patient_metadata AS\n",
+    "       SELECT *\n",
+    "         FROM read_csv_auto('data/patient_metadata.csv', filename=true);\n",
+    "''');"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
-   "id": "861daf66-0810-48d9-968c-18e1dabe0e4f",
+   "execution_count": 41,
+   "id": "022db70e-64a2-40ad-920f-463f465b274c",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "┌──────────────┬────────────────────┬────────────┐\n",
+      "│ table_schema │     table_name     │ table_type │\n",
+      "│   varchar    │      varchar       │  varchar   │\n",
+      "├──────────────┼────────────────────┼────────────┤\n",
+      "│ main         │ time_series        │ BASE TABLE │\n",
+      "│ main         │ file               │ VIEW       │\n",
+      "│ main         │ hypothesis         │ VIEW       │\n",
+      "│ main         │ metadata           │ VIEW       │\n",
+      "│ main         │ patient_experiment │ VIEW       │\n",
+      "│ main         │ patient_metadata   │ VIEW       │\n",
+      "└──────────────┴────────────────────┴────────────┘\n",
+      "\n"
+     ]
+    }
+   ],
    "source": [
-    "conn = duckdb.connect('data/patient_experiment.csv')"
+    "show_tables(conn)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "8ae2a578-6849-4a22-ad2e-b770de3ff44e",
+   "metadata": {},
+   "source": [
+    "Determine the patient IDs that are either in `patient_experiment`, or in `patient_metadata`, but not in both.  Note that a full outer join is used to combine the informantion in both tables."
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 25,
-   "id": "c0f56de5-2351-4473-b768-234a89a705ac",
+   "execution_count": 45,
+   "id": "6482c2b6-4896-4c30-9bb4-b5a278626364",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>patient</th>\n",
+       "      <th>present</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>4</td>\n",
+       "      <td>only in experiment</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>10</td>\n",
+       "      <td>only in metadata</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>11</td>\n",
+       "      <td>only in metadata</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "   patient             present\n",
+       "0        4  only in experiment\n",
+       "1       10    only in metadata\n",
+       "2       11    only in metadata"
+      ]
+     },
+     "execution_count": 45,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "conn.execute('''\n",
+    "    SELECT\n",
+    "      DISTINCT COALESCE(exp.patient, mt.patient) AS patient,\n",
+    "      CASE\n",
+    "        WHEN exp.patient IS NOT NULL AND mt.patient IS NULL\n",
+    "          THEN 'only in experiment'\n",
+    "        WHEN exp.patient IS NULL and mt.patient IS NOT NULL\n",
+    "          THEN 'only in metadata'\n",
+    "        ELSE 'in both'\n",
+    "      END AS present\n",
+    "      FROM patient_experiment AS exp FULL OUTER JOIN patient_metadata AS mt\n",
+    "        USING (patient)\n",
+    "      WHERE NOT present = 'in both'\n",
+    "      ORDER BY exp.patient, mt.patient;\n",
+    "''').df()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "9cf58cd3-0804-4472-bfd2-72f5afd82166",
    "metadata": {},
+   "source": [
+    "You can do an inner join between the tables `patient_experiment` and `patient_metadata` to get the maximum temperature, the condition and gender for each patient that occurs in both tables."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 50,
+   "id": "1639aeaa-b33a-4889-869d-93500242980b",
+   "metadata": {
+    "scrolled": true
+   },
    "outputs": [
     {
      "data": {
@@ -49,114 +964,115 @@
        "    <tr style=\"text-align: right;\">\n",
        "      <th></th>\n",
        "      <th>patient</th>\n",
+       "      <th>max_temperature</th>\n",
+       "      <th>condition</th>\n",
+       "      <th>gender</th>\n",
        "    </tr>\n",
        "  </thead>\n",
        "  <tbody>\n",
        "    <tr>\n",
        "      <th>0</th>\n",
        "      <td>1</td>\n",
+       "      <td>38.5</td>\n",
+       "      <td>A</td>\n",
+       "      <td>M</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>1</th>\n",
-       "      <td>3</td>\n",
+       "      <td>2</td>\n",
+       "      <td>39.4</td>\n",
+       "      <td>A</td>\n",
+       "      <td>F</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>2</th>\n",
-       "      <td>6</td>\n",
+       "      <td>3</td>\n",
+       "      <td>39.5</td>\n",
+       "      <td>A</td>\n",
+       "      <td>M</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>3</th>\n",
-       "      <td>7</td>\n",
+       "      <td>5</td>\n",
+       "      <td>39.5</td>\n",
+       "      <td>A</td>\n",
+       "      <td>M</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>4</th>\n",
-       "      <td>8</td>\n",
+       "      <td>6</td>\n",
+       "      <td>38.1</td>\n",
+       "      <td>B</td>\n",
+       "      <td>F</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>5</th>\n",
-       "      <td>5</td>\n",
+       "      <td>7</td>\n",
+       "      <td>40.7</td>\n",
+       "      <td>B</td>\n",
+       "      <td>M</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>6</th>\n",
-       "      <td>9</td>\n",
+       "      <td>8</td>\n",
+       "      <td>37.9</td>\n",
+       "      <td>B</td>\n",
+       "      <td>F</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>7</th>\n",
-       "      <td>2</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>4</td>\n",
+       "      <td>9</td>\n",
+       "      <td>40.2</td>\n",
+       "      <td>B</td>\n",
+       "      <td>M</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
        "</div>"
       ],
       "text/plain": [
-       "   patient\n",
-       "0        1\n",
-       "1        3\n",
-       "2        6\n",
-       "3        7\n",
-       "4        8\n",
-       "5        5\n",
-       "6        9\n",
-       "7        2\n",
-       "8        4"
+       "   patient  max_temperature condition gender\n",
+       "0        1             38.5         A      M\n",
+       "1        2             39.4         A      F\n",
+       "2        3             39.5         A      M\n",
+       "3        5             39.5         A      M\n",
+       "4        6             38.1         B      F\n",
+       "5        7             40.7         B      M\n",
+       "6        8             37.9         B      F\n",
+       "7        9             40.2         B      M"
       ]
      },
-     "execution_count": 25,
+     "execution_count": 50,
      "metadata": {},
      "output_type": "execute_result"
     }
    ],
    "source": [
-    "conn.execute('SELECT DISTINCT patient FROM \"patient_experiment\";').df()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 15,
-   "id": "0c4e1ad8-a9ae-4808-901b-c036e4e0ee17",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "sql_pivot = '''\n",
-    "CREATE TABLE time_series AS\n",
-    "  PIVOT \"data/patient_experiment.csv\"\n",
-    "  ON patient\n",
-    "  USING\n",
-    "    first(temperature) AS temperature,\n",
-    "    first(dose) AS dose\n",
-    "  GROUP BY date;\n",
-    "'''"
+    "conn.execute('''\n",
+    "    SELECT\n",
+    "      COALESCE(exp.patient, mt.patient) AS patient,\n",
+    "      MAX(exp.temperature) AS max_temperature,\n",
+    "      ANY_VALUE(mt.condition) AS condition,\n",
+    "      ANY_VALUE(mt.gender) AS gender\n",
+    "    FROM patient_experiment AS exp INNER JOIN patient_metadata AS mt\n",
+    "      USING (patient)\n",
+    "    GROUP BY exp.patient, mt.patient\n",
+    "    ORDER BY exp.patient, mt.patient\n",
+    "''').df()"
    ]
   },
   {
-   "cell_type": "code",
-   "execution_count": 16,
-   "id": "6ff65df2-1997-4983-b3c8-1753034c3218",
+   "cell_type": "markdown",
+   "id": "b2afc510-6340-4c59-aeec-e245d8358a0e",
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/plain": [
-       "<duckdb.duckdb.DuckDBPyConnection at 0x762650c61bf0>"
-      ]
-     },
-     "execution_count": 16,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
-    "conn.execute(sql_pivot)"
+    "## New style versus classic style"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 18,
-   "id": "95b029d4-0329-4462-8737-94f036dc8147",
+   "execution_count": 51,
+   "id": "397405b0-756c-461a-81f1-e7af99b98d0c",
    "metadata": {},
    "outputs": [
     {
@@ -180,66 +1096,128 @@
        "  <thead>\n",
        "    <tr style=\"text-align: right;\">\n",
        "      <th></th>\n",
+       "      <th>patient</th>\n",
        "      <th>date</th>\n",
+       "      <th>temperature</th>\n",
+       "      <th>dose</th>\n",
        "    </tr>\n",
        "  </thead>\n",
        "  <tbody>\n",
        "    <tr>\n",
        "      <th>0</th>\n",
-       "      <td>2012-10-02 14:00:00</td>\n",
+       "      <td>6</td>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>37.5</td>\n",
+       "      <td>0.0</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>1</th>\n",
+       "      <td>6</td>\n",
        "      <td>2012-10-02 11:00:00</td>\n",
+       "      <td>38.1</td>\n",
+       "      <td>2.0</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>2</th>\n",
-       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>6</td>\n",
+       "      <td>2012-10-02 12:00:00</td>\n",
+       "      <td>37.9</td>\n",
+       "      <td>3.0</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>3</th>\n",
+       "      <td>6</td>\n",
        "      <td>2012-10-02 13:00:00</td>\n",
+       "      <td>37.7</td>\n",
+       "      <td>2.0</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>4</th>\n",
-       "      <td>2012-10-02 12:00:00</td>\n",
+       "      <td>6</td>\n",
+       "      <td>2012-10-02 14:00:00</td>\n",
+       "      <td>37.2</td>\n",
+       "      <td>1.0</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>5</th>\n",
+       "      <td>6</td>\n",
        "      <td>2012-10-02 15:00:00</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>36.8</td>\n",
+       "      <td>0.0</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
        "</div>"
       ],
       "text/plain": [
-       "                 date\n",
-       "0 2012-10-02 14:00:00\n",
-       "1 2012-10-02 11:00:00\n",
-       "2 2012-10-02 10:00:00\n",
-       "3 2012-10-02 13:00:00\n",
-       "4 2012-10-02 12:00:00\n",
-       "5 2012-10-02 15:00:00\n",
-       "6 2012-10-02 16:00:00"
+       "   patient                date  temperature  dose\n",
+       "0        6 2012-10-02 10:00:00         37.5   0.0\n",
+       "1        6 2012-10-02 11:00:00         38.1   2.0\n",
+       "2        6 2012-10-02 12:00:00         37.9   3.0\n",
+       "3        6 2012-10-02 13:00:00         37.7   2.0\n",
+       "4        6 2012-10-02 14:00:00         37.2   1.0\n",
+       "5        6 2012-10-02 15:00:00         36.8   0.0"
       ]
      },
-     "execution_count": 18,
+     "execution_count": 51,
      "metadata": {},
      "output_type": "execute_result"
     }
    ],
    "source": [
-    "conn.execute('SELECT date FROM time_series;').df()"
+    "conn.execute('''\n",
+    "    SELECT patient, date, temperature, dose\n",
+    "      FROM patient_experiment\n",
+    "      WHERE patient == 6;\n",
+    "''').df()"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 23,
-   "id": "78a996cf-4bc2-40dc-8bce-27bcc6731b7b",
+   "execution_count": 52,
+   "id": "3f06bf99-ead9-4eec-8251-b834f5c2eb69",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "┌─────────┬─────────────────────┬─────────────┬────────┐\n",
+      "│ patient │        date         │ temperature │  dose  │\n",
+      "│  int64  │      timestamp      │   double    │ double │\n",
+      "├─────────┼─────────────────────┼─────────────┼────────┤\n",
+      "│       6 │ 2012-10-02 10:00:00 │        37.5 │    0.0 │\n",
+      "│       6 │ 2012-10-02 11:00:00 │        38.1 │    2.0 │\n",
+      "│       6 │ 2012-10-02 12:00:00 │        37.9 │    3.0 │\n",
+      "│       6 │ 2012-10-02 13:00:00 │        37.7 │    2.0 │\n",
+      "│       6 │ 2012-10-02 14:00:00 │        37.2 │    1.0 │\n",
+      "│       6 │ 2012-10-02 15:00:00 │        36.8 │    0.0 │\n",
+      "└─────────┴─────────────────────┴─────────────┴────────┘\n",
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "conn.sql('''\n",
+    "    SELECT patient, date, temperature, dose\n",
+    "      FROM patient_experiment\n",
+    "''').filter('patient = 6').show()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "cd9dee70-4c1c-4445-9b6c-f957791210fc",
+   "metadata": {},
+   "source": [
+    "For the patients with a high fever, count the number of timepoints they had a temperature above $39.5\\textdegree C$ as well as their maximum temperature."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "0f29e357-5c17-4aca-92dc-ceaecf959023",
    "metadata": {},
    "outputs": [
     {
@@ -263,46 +1241,96 @@
        "  <thead>\n",
        "    <tr style=\"text-align: right;\">\n",
        "      <th></th>\n",
-       "      <th>name</th>\n",
+       "      <th>patient</th>\n",
+       "      <th>high_fever_count</th>\n",
+       "      <th>max_temperature</th>\n",
        "    </tr>\n",
        "  </thead>\n",
        "  <tbody>\n",
        "    <tr>\n",
        "      <th>0</th>\n",
-       "      <td>file</td>\n",
+       "      <td>7</td>\n",
+       "      <td>3</td>\n",
+       "      <td>40.7</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>1</th>\n",
-       "      <td>patient_experiment</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>time_series</td>\n",
+       "      <td>9</td>\n",
+       "      <td>1</td>\n",
+       "      <td>40.2</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
        "</div>"
       ],
       "text/plain": [
-       "                 name\n",
-       "0                file\n",
-       "1  patient_experiment\n",
-       "2         time_series"
+       "   patient  high_fever_count  max_temperature\n",
+       "0        7                 3             40.7\n",
+       "1        9                 1             40.2"
       ]
      },
-     "execution_count": 23,
+     "execution_count": 10,
      "metadata": {},
      "output_type": "execute_result"
     }
    ],
    "source": [
-    "conn.execute('show tables;').df()"
+    "conn.execute('''\n",
+    "    SELECT\n",
+    "        patient,\n",
+    "        COUNT(temperature) AS high_fever_count,\n",
+    "        MAX(temperature) AS max_temperature\n",
+    "      FROM patient_experiment\n",
+    "      WHERE temperature > 39.5\n",
+    "      GROUP BY patient\n",
+    "      ORDER BY patient;\n",
+    "''').df()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 73,
+   "id": "d07c6fff-b72d-49c0-a0f7-f545e4013331",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "┌─────────┬──────────────────┬─────────────────┐\n",
+      "│ patient │ high_fever_count │ max_temperature │\n",
+      "│  int64  │      int64       │     double      │\n",
+      "├─────────┼──────────────────┼─────────────────┤\n",
+      "│       7 │                3 │            40.7 │\n",
+      "│       9 │                1 │            40.2 │\n",
+      "└─────────┴──────────────────┴─────────────────┘\n",
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "conn.sql('SELECT patient, temperature FROM patient_experiment') \\\n",
+    "    .filter('temperature > 39.5') \\\n",
+    "    .aggregate(\n",
+    "        'patient, '\n",
+    "        'COUNT(temperature) AS high_fever_count, '\n",
+    "        'MAX(temperature) AS max_temperature',\n",
+    "        group_expr='patient') \\\n",
+    "    .show()     "
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "65ab2e40-bbf8-4537-a41b-e2321568fb98",
+   "metadata": {},
+   "source": [
+    "For each patient, compute the total dose administered, as well as the maximum temperature, and order by descending maximum temperature."
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 24,
-   "id": "ea5cf7e3-1b67-45fd-bdde-1ee294575149",
+   "execution_count": 18,
+   "id": "27f12e02-c92a-459a-a469-e733ba17052f",
    "metadata": {},
    "outputs": [
     {
@@ -326,91 +1354,147 @@
        "  <thead>\n",
        "    <tr style=\"text-align: right;\">\n",
        "      <th></th>\n",
-       "      <th>table_schema</th>\n",
-       "      <th>table_name</th>\n",
-       "      <th>table_type</th>\n",
+       "      <th>patient</th>\n",
+       "      <th>max_temperature</th>\n",
+       "      <th>total_dose</th>\n",
        "    </tr>\n",
        "  </thead>\n",
        "  <tbody>\n",
        "    <tr>\n",
        "      <th>0</th>\n",
-       "      <td>main</td>\n",
-       "      <td>time_series</td>\n",
-       "      <td>BASE TABLE</td>\n",
+       "      <td>7</td>\n",
+       "      <td>40.7</td>\n",
+       "      <td>30.0</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>1</th>\n",
-       "      <td>main</td>\n",
-       "      <td>file</td>\n",
-       "      <td>VIEW</td>\n",
+       "      <td>9</td>\n",
+       "      <td>40.2</td>\n",
+       "      <td>30.0</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>2</th>\n",
-       "      <td>main</td>\n",
-       "      <td>patient_experiment</td>\n",
-       "      <td>VIEW</td>\n",
+       "      <td>5</td>\n",
+       "      <td>39.5</td>\n",
+       "      <td>27.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>3</td>\n",
+       "      <td>39.5</td>\n",
+       "      <td>13.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>2</td>\n",
+       "      <td>39.4</td>\n",
+       "      <td>15.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>1</td>\n",
+       "      <td>38.5</td>\n",
+       "      <td>6.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>6</td>\n",
+       "      <td>38.1</td>\n",
+       "      <td>8.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7</th>\n",
+       "      <td>4</td>\n",
+       "      <td>38.1</td>\n",
+       "      <td>10.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8</th>\n",
+       "      <td>8</td>\n",
+       "      <td>37.9</td>\n",
+       "      <td>0.0</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
        "</div>"
       ],
       "text/plain": [
-       "  table_schema          table_name  table_type\n",
-       "0         main         time_series  BASE TABLE\n",
-       "1         main                file        VIEW\n",
-       "2         main  patient_experiment        VIEW"
+       "   patient  max_temperature  total_dose\n",
+       "0        7             40.7        30.0\n",
+       "1        9             40.2        30.0\n",
+       "2        5             39.5        27.0\n",
+       "3        3             39.5        13.0\n",
+       "4        2             39.4        15.0\n",
+       "5        1             38.5         6.0\n",
+       "6        6             38.1         8.0\n",
+       "7        4             38.1        10.0\n",
+       "8        8             37.9         0.0"
       ]
      },
-     "execution_count": 24,
+     "execution_count": 18,
      "metadata": {},
      "output_type": "execute_result"
     }
    ],
    "source": [
-    "conn.sql(\"\"\"\n",
-    "    SELECT table_schema, table_name, table_type\n",
-    "    FROM information_schema.tables\n",
-    "    WHERE table_schema NOT IN ('information_schema', 'pg_catalog')\n",
-    "\"\"\").df()"
+    "conn.execute('''\n",
+    "    SELECT\n",
+    "        patient,\n",
+    "        MAX(temperature) AS 'max_temperature',\n",
+    "        SUM(dose) AS 'total_dose'\n",
+    "      FROM patient_experiment\n",
+    "      GROUP BY patient\n",
+    "      ORDER BY max_temperature DESC;\n",
+    "''').df()"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 28,
-   "id": "843f9d0f-8384-4977-916e-49ef59e5cbad",
+   "execution_count": 77,
+   "id": "5f83cde9-129a-4f76-b199-3ae7adf3f08c",
    "metadata": {},
    "outputs": [
     {
-     "data": {
-      "text/plain": [
-       "┌─────────────┬─────────────┬─────────┬─────────┬─────────┬─────────┐\n",
-       "│ column_name │ column_type │  null   │   key   │ default │  extra  │\n",
-       "│   varchar   │   varchar   │ varchar │ varchar │ varchar │ varchar │\n",
-       "├─────────────┼─────────────┼─────────┼─────────┼─────────┼─────────┤\n",
-       "│ column0     │ BIGINT      │ YES     │ NULL    │ NULL    │ NULL    │\n",
-       "│ patient     │ BIGINT      │ YES     │ NULL    │ NULL    │ NULL    │\n",
-       "│ dose        │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
-       "│ date        │ TIMESTAMP   │ YES     │ NULL    │ NULL    │ NULL    │\n",
-       "│ temperature │ DOUBLE      │ YES     │ NULL    │ NULL    │ NULL    │\n",
-       "└─────────────┴─────────────┴─────────┴─────────┴─────────┴─────────┘"
-      ]
-     },
-     "execution_count": 28,
-     "metadata": {},
-     "output_type": "execute_result"
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "┌─────────┬─────────────────┬────────────┐\n",
+      "│ patient │ max_temperature │ total_dose │\n",
+      "│  int64  │     double      │   double   │\n",
+      "├─────────┼─────────────────┼────────────┤\n",
+      "│       7 │            40.7 │       30.0 │\n",
+      "│       9 │            40.2 │       30.0 │\n",
+      "│       5 │            39.5 │       27.0 │\n",
+      "│       3 │            39.5 │       13.0 │\n",
+      "│       2 │            39.4 │       15.0 │\n",
+      "│       1 │            38.5 │        6.0 │\n",
+      "│       4 │            38.1 │       10.0 │\n",
+      "│       6 │            38.1 │        8.0 │\n",
+      "│       8 │            37.9 │        0.0 │\n",
+      "└─────────┴─────────────────┴────────────┘\n",
+      "\n"
+     ]
     }
    ],
    "source": [
-    "conn.sql('''dESCRIBE patient_experiment;''')"
+    "conn.sql('SELECT patient, temperature, dose from patient_experiment') \\\n",
+    "    .aggregate(\n",
+    "        'patient, '\n",
+    "        'MAX(temperature) AS max_temperature, '\n",
+    "        'SUM(dose) AS total_dose',\n",
+    "        group_expr='patient'\n",
+    "    ) \\\n",
+    "    .order('max_temperature DESC') \\\n",
+    "    .show()"
    ]
   },
   {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "8570b365-09d5-4993-908e-4eaac974204d",
+   "cell_type": "markdown",
+   "id": "ddf5f25c-b0c1-48c9-9031-5fd8a813649b",
    "metadata": {},
-   "outputs": [],
-   "source": []
+   "source": [
+    "The new-style queries allow for lazy evaluation, while the classic-style queries are evaluated immediately."
+   ]
   }
  ],
  "metadata": {
@@ -429,7 +1513,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.12.11"
+   "version": "3.12.12"
   }
  },
  "nbformat": 4,

From d6fddbb3cc085b3fc48a211036b6c59132892688 Mon Sep 17 00:00:00 2001
From: Geert Jan Bex <geertjan.bex@uhasselt.be>
Date: Tue, 25 Nov 2025 08:16:36 +0100
Subject: [PATCH 09/10] Add illustration long to wide to long

---
 source-code/pandas/README.md                  |    2 +
 .../from_long_to_wide_and_back_again.ipynb    | 1078 +++++++++++++++++
 2 files changed, 1080 insertions(+)
 create mode 100644 source-code/pandas/from_long_to_wide_and_back_again.ipynb

diff --git a/source-code/pandas/README.md b/source-code/pandas/README.md
index 1bb6cf9..80881e6 100644
--- a/source-code/pandas/README.md
+++ b/source-code/pandas/README.md
@@ -34,3 +34,5 @@ easy to use.
    a comparison of performance between using `apply` and vectorized operations.
 1. `numba_and_pandas.ipynb`: Jupyter notebook that demonstrates how to use Numba
    to optimize performance of operations on pandas dataframes.
+1. `from_long_to_wide_and_back_again.ipynb`: Jupyter notebook that illustrates
+   how to reshape data using `stack` and `pivot` methods in pandas.
diff --git a/source-code/pandas/from_long_to_wide_and_back_again.ipynb b/source-code/pandas/from_long_to_wide_and_back_again.ipynb
new file mode 100644
index 0000000..a3610d4
--- /dev/null
+++ b/source-code/pandas/from_long_to_wide_and_back_again.ipynb
@@ -0,0 +1,1078 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "4773bfbd-a3d3-4683-b51e-c80a649a7caf",
+   "metadata": {},
+   "source": [
+    "## Requirements"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "d7ab15e7-4fd2-4e81-a9ae-8469b05ec45c",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import numpy as np\n",
+    "import pandas as pd"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "ee9056b1-0b76-4cbb-ad68-049b0095b62d",
+   "metadata": {},
+   "source": [
+    "## Original dataframe"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 39,
+   "id": "2c1acc53-9064-4589-9e88-541175d3deb0",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "df_orig = pd.read_excel('data/patient_experiment.xlsx',\n",
+    "                        dtype={'dose': np.float32,\n",
+    "                        'temperature': np.float32})"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 40,
+   "id": "b64f834e-b044-422c-830f-112868864269",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "<class 'pandas.core.frame.DataFrame'>\n",
+      "RangeIndex: 62 entries, 0 to 61\n",
+      "Data columns (total 4 columns):\n",
+      " #   Column       Non-Null Count  Dtype         \n",
+      "---  ------       --------------  -----         \n",
+      " 0   patient      62 non-null     int64         \n",
+      " 1   dose         61 non-null     float32       \n",
+      " 2   date         62 non-null     datetime64[ns]\n",
+      " 3   temperature  61 non-null     float32       \n",
+      "dtypes: datetime64[ns](1), float32(2), int64(1)\n",
+      "memory usage: 1.6 KB\n"
+     ]
+    }
+   ],
+   "source": [
+    "df_orig.info()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 41,
+   "id": "df59f8e2-0cb6-4dae-b2b2-71a89a5a894a",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>patient</th>\n",
+       "      <th>dose</th>\n",
+       "      <th>date</th>\n",
+       "      <th>temperature</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>1</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>38.299999</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>1</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2012-10-02 11:00:00</td>\n",
+       "      <td>38.500000</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>1</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2012-10-02 12:00:00</td>\n",
+       "      <td>38.099998</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>1</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>2012-10-02 13:00:00</td>\n",
+       "      <td>37.299999</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>1</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>2012-10-02 14:00:00</td>\n",
+       "      <td>37.500000</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "   patient  dose                date  temperature\n",
+       "0        1   0.0 2012-10-02 10:00:00    38.299999\n",
+       "1        1   2.0 2012-10-02 11:00:00    38.500000\n",
+       "2        1   2.0 2012-10-02 12:00:00    38.099998\n",
+       "3        1   2.0 2012-10-02 13:00:00    37.299999\n",
+       "4        1   0.0 2012-10-02 14:00:00    37.500000"
+      ]
+     },
+     "execution_count": 41,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_orig.head()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "115ce86f-4e2f-4ea3-a240-2cc68d5721d8",
+   "metadata": {},
+   "source": [
+    "## To wide format: pivot"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 42,
+   "id": "1adfa94d-dbb6-41cc-af21-9ca6d1e97226",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "df_wide = df_orig.pivot(\n",
+    "    index='date',\n",
+    "    values=['temperature', 'dose'],\n",
+    "    columns=['patient']\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 43,
+   "id": "18c3ba13-5949-4c14-95f2-1577466313b3",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "<class 'pandas.core.frame.DataFrame'>\n",
+      "DatetimeIndex: 7 entries, 2012-10-02 10:00:00 to 2012-10-02 16:00:00\n",
+      "Data columns (total 18 columns):\n",
+      " #   Column            Non-Null Count  Dtype  \n",
+      "---  ------            --------------  -----  \n",
+      " 0   (temperature, 1)  7 non-null      float32\n",
+      " 1   (temperature, 2)  7 non-null      float32\n",
+      " 2   (temperature, 3)  6 non-null      float32\n",
+      " 3   (temperature, 4)  7 non-null      float32\n",
+      " 4   (temperature, 5)  7 non-null      float32\n",
+      " 5   (temperature, 6)  6 non-null      float32\n",
+      " 6   (temperature, 7)  7 non-null      float32\n",
+      " 7   (temperature, 8)  7 non-null      float32\n",
+      " 8   (temperature, 9)  7 non-null      float32\n",
+      " 9   (dose, 1)         7 non-null      float32\n",
+      " 10  (dose, 2)         7 non-null      float32\n",
+      " 11  (dose, 3)         7 non-null      float32\n",
+      " 12  (dose, 4)         6 non-null      float32\n",
+      " 13  (dose, 5)         7 non-null      float32\n",
+      " 14  (dose, 6)         6 non-null      float32\n",
+      " 15  (dose, 7)         7 non-null      float32\n",
+      " 16  (dose, 8)         7 non-null      float32\n",
+      " 17  (dose, 9)         7 non-null      float32\n",
+      "dtypes: float32(18)\n",
+      "memory usage: 560.0 bytes\n"
+     ]
+    }
+   ],
+   "source": [
+    "df_wide.info()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "ea3a9d6b-fd0a-474d-8c42-df7a1f7d7e08",
+   "metadata": {},
+   "source": [
+    "Now you have a dataframe with the date as index, and multi-level columns.  The top-level is the temerature and the dose, but next level is the patient ID."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 44,
+   "id": "a41a59d3-1d12-4aee-a7c1-3b85a9950b07",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead tr th {\n",
+       "        text-align: left;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead tr:last-of-type th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr>\n",
+       "      <th></th>\n",
+       "      <th colspan=\"9\" halign=\"left\">temperature</th>\n",
+       "      <th colspan=\"9\" halign=\"left\">dose</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>patient</th>\n",
+       "      <th>1</th>\n",
+       "      <th>2</th>\n",
+       "      <th>3</th>\n",
+       "      <th>4</th>\n",
+       "      <th>5</th>\n",
+       "      <th>6</th>\n",
+       "      <th>7</th>\n",
+       "      <th>8</th>\n",
+       "      <th>9</th>\n",
+       "      <th>1</th>\n",
+       "      <th>2</th>\n",
+       "      <th>3</th>\n",
+       "      <th>4</th>\n",
+       "      <th>5</th>\n",
+       "      <th>6</th>\n",
+       "      <th>7</th>\n",
+       "      <th>8</th>\n",
+       "      <th>9</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>date</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>2012-10-02 10:00:00</th>\n",
+       "      <td>38.299999</td>\n",
+       "      <td>39.299999</td>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>38.099998</td>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>37.500000</td>\n",
+       "      <td>39.500000</td>\n",
+       "      <td>37.799999</td>\n",
+       "      <td>38.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2012-10-02 11:00:00</th>\n",
+       "      <td>38.500000</td>\n",
+       "      <td>39.400002</td>\n",
+       "      <td>39.500000</td>\n",
+       "      <td>37.200001</td>\n",
+       "      <td>39.500000</td>\n",
+       "      <td>38.099998</td>\n",
+       "      <td>40.700001</td>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>39.500000</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>3.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>10.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>10.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2012-10-02 12:00:00</th>\n",
+       "      <td>38.099998</td>\n",
+       "      <td>38.099998</td>\n",
+       "      <td>38.299999</td>\n",
+       "      <td>36.099998</td>\n",
+       "      <td>38.299999</td>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>39.799999</td>\n",
+       "      <td>37.400002</td>\n",
+       "      <td>40.200001</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>7.0</td>\n",
+       "      <td>3.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>12.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2012-10-02 13:00:00</th>\n",
+       "      <td>37.299999</td>\n",
+       "      <td>37.299999</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>35.900002</td>\n",
+       "      <td>38.500000</td>\n",
+       "      <td>37.700001</td>\n",
+       "      <td>40.200001</td>\n",
+       "      <td>37.599998</td>\n",
+       "      <td>39.099998</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>5.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>8.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>4.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2012-10-02 14:00:00</th>\n",
+       "      <td>37.500000</td>\n",
+       "      <td>36.799999</td>\n",
+       "      <td>37.700001</td>\n",
+       "      <td>36.299999</td>\n",
+       "      <td>39.400002</td>\n",
+       "      <td>37.200001</td>\n",
+       "      <td>38.299999</td>\n",
+       "      <td>37.299999</td>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>2.0</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>9.0</td>\n",
+       "      <td>1.0</td>\n",
+       "      <td>3.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>4.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                    temperature                                              \\\n",
+       "patient                       1          2          3          4          5   \n",
+       "date                                                                          \n",
+       "2012-10-02 10:00:00   38.299999  39.299999  37.900002  38.099998  37.900002   \n",
+       "2012-10-02 11:00:00   38.500000  39.400002  39.500000  37.200001  39.500000   \n",
+       "2012-10-02 12:00:00   38.099998  38.099998  38.299999  36.099998  38.299999   \n",
+       "2012-10-02 13:00:00   37.299999  37.299999        NaN  35.900002  38.500000   \n",
+       "2012-10-02 14:00:00   37.500000  36.799999  37.700001  36.299999  39.400002   \n",
+       "\n",
+       "                                                                dose       \\\n",
+       "patient                      6          7          8          9    1    2   \n",
+       "date                                                                        \n",
+       "2012-10-02 10:00:00  37.500000  39.500000  37.799999  38.299999  0.0  0.0   \n",
+       "2012-10-02 11:00:00  38.099998  40.700001  37.900002  39.500000  2.0  5.0   \n",
+       "2012-10-02 12:00:00  37.900002  39.799999  37.400002  40.200001  2.0  5.0   \n",
+       "2012-10-02 13:00:00  37.700001  40.200001  37.599998  39.099998  2.0  5.0   \n",
+       "2012-10-02 14:00:00  37.200001  38.299999  37.299999  37.900002  0.0  0.0   \n",
+       "\n",
+       "                                                          \n",
+       "patient                3    4    5    6     7    8     9  \n",
+       "date                                                      \n",
+       "2012-10-02 10:00:00  0.0  0.0  0.0  0.0   0.0  0.0   0.0  \n",
+       "2012-10-02 11:00:00  2.0  5.0  3.0  2.0  10.0  0.0  10.0  \n",
+       "2012-10-02 12:00:00  5.0  5.0  7.0  3.0   5.0  0.0  12.0  \n",
+       "2012-10-02 13:00:00  2.0  0.0  5.0  2.0   8.0  0.0   4.0  \n",
+       "2012-10-02 14:00:00  2.0  NaN  9.0  1.0   3.0  0.0   4.0  "
+      ]
+     },
+     "execution_count": 44,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_wide.head()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "fd0c0272-d182-47c4-bf41-81c869b06932",
+   "metadata": {},
+   "source": [
+    "## And back again: stack + reset index"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 45,
+   "id": "81d18cc4-0451-4fd2-ac0a-56e868a31df0",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "df_long = df_wide \\\n",
+    "    .stack('patient', future_stack=True)                        \\\n",
+    "    .reset_index()   "
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 46,
+   "id": "3a0b4e1f-560e-4639-bcc1-330bdf82c6d2",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "<class 'pandas.core.frame.DataFrame'>\n",
+      "RangeIndex: 63 entries, 0 to 62\n",
+      "Data columns (total 4 columns):\n",
+      " #   Column       Non-Null Count  Dtype         \n",
+      "---  ------       --------------  -----         \n",
+      " 0   date         63 non-null     datetime64[ns]\n",
+      " 1   patient      63 non-null     int64         \n",
+      " 2   temperature  61 non-null     float32       \n",
+      " 3   dose         61 non-null     float32       \n",
+      "dtypes: datetime64[ns](1), float32(2), int64(1)\n",
+      "memory usage: 1.6 KB\n"
+     ]
+    }
+   ],
+   "source": [
+    "df_long.info()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 47,
+   "id": "551264e3-967b-43a2-b8c3-494095f88f87",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>date</th>\n",
+       "      <th>patient</th>\n",
+       "      <th>temperature</th>\n",
+       "      <th>dose</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>1</td>\n",
+       "      <td>38.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>2</td>\n",
+       "      <td>39.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>3</td>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>4</td>\n",
+       "      <td>38.099998</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>5</td>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                 date  patient  temperature  dose\n",
+       "0 2012-10-02 10:00:00        1    38.299999   0.0\n",
+       "1 2012-10-02 10:00:00        2    39.299999   0.0\n",
+       "2 2012-10-02 10:00:00        3    37.900002   0.0\n",
+       "3 2012-10-02 10:00:00        4    38.099998   0.0\n",
+       "4 2012-10-02 10:00:00        5    37.900002   0.0"
+      ]
+     },
+     "execution_count": 47,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_long.head()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "00be5fc1-e40d-4091-b0d6-4019a412f1e0",
+   "metadata": {},
+   "source": [
+    "Breaking it down into two steps, first the `stack()` method:"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 48,
+   "id": "507b3ec3-6780-40e7-a7b8-c2345c3efa61",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "      <th>temperature</th>\n",
+       "      <th>dose</th>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>date</th>\n",
+       "      <th>patient</th>\n",
+       "      <th></th>\n",
+       "      <th></th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">2012-10-02 10:00:00</th>\n",
+       "      <th>1</th>\n",
+       "      <td>38.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>39.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>38.099998</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5</th>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th rowspan=\"5\" valign=\"top\">2012-10-02 16:00:00</th>\n",
+       "      <th>5</th>\n",
+       "      <td>37.200001</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6</th>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>7</th>\n",
+       "      <td>37.299999</td>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>8</th>\n",
+       "      <td>36.799999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>9</th>\n",
+       "      <td>37.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>63 rows × 2 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                             temperature  dose\n",
+       "date                patient                   \n",
+       "2012-10-02 10:00:00 1          38.299999   0.0\n",
+       "                    2          39.299999   0.0\n",
+       "                    3          37.900002   0.0\n",
+       "                    4          38.099998   0.0\n",
+       "                    5          37.900002   0.0\n",
+       "...                                  ...   ...\n",
+       "2012-10-02 16:00:00 5          37.200001   0.0\n",
+       "                    6                NaN   NaN\n",
+       "                    7          37.299999   1.0\n",
+       "                    8          36.799999   0.0\n",
+       "                    9          37.299999   0.0\n",
+       "\n",
+       "[63 rows x 2 columns]"
+      ]
+     },
+     "execution_count": 48,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_wide.stack(\"patient\", future_stack=True)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "57e15671-7a85-41b0-bcb5-fe2e089efdc6",
+   "metadata": {},
+   "source": [
+    "As you can see, this has created a dataframe that has only two columns, but a multi-level index.  The top-level index is the date, the sublevel is the patient."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 51,
+   "id": "4e351540-2f48-4ef3-aa47-e8929cb1c4e4",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>date</th>\n",
+       "      <th>patient</th>\n",
+       "      <th>temperature</th>\n",
+       "      <th>dose</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>1</td>\n",
+       "      <td>38.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>2</td>\n",
+       "      <td>39.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>3</td>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>4</td>\n",
+       "      <td>38.099998</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>5</td>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>58</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>5</td>\n",
+       "      <td>37.200001</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>59</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>60</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>7</td>\n",
+       "      <td>37.299999</td>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>61</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>8</td>\n",
+       "      <td>36.799999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>62</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>9</td>\n",
+       "      <td>37.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>63 rows × 4 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                  date  patient  temperature  dose\n",
+       "0  2012-10-02 10:00:00        1    38.299999   0.0\n",
+       "1  2012-10-02 10:00:00        2    39.299999   0.0\n",
+       "2  2012-10-02 10:00:00        3    37.900002   0.0\n",
+       "3  2012-10-02 10:00:00        4    38.099998   0.0\n",
+       "4  2012-10-02 10:00:00        5    37.900002   0.0\n",
+       "..                 ...      ...          ...   ...\n",
+       "58 2012-10-02 16:00:00        5    37.200001   0.0\n",
+       "59 2012-10-02 16:00:00        6          NaN   NaN\n",
+       "60 2012-10-02 16:00:00        7    37.299999   1.0\n",
+       "61 2012-10-02 16:00:00        8    36.799999   0.0\n",
+       "62 2012-10-02 16:00:00        9    37.299999   0.0\n",
+       "\n",
+       "[63 rows x 4 columns]"
+      ]
+     },
+     "execution_count": 51,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_long = df_wide.stack(\"patient\", future_stack=True).reset_index()\n",
+    "df_long"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "23489994-b08f-4aed-a49e-daa0908015b4",
+   "metadata": {},
+   "source": [
+    "Resetting the index will create columns out of the multi-level index, so one for the date, a second for the patient ID."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "e7030ce2-291e-45fa-a791-05b7eaa8f1b2",
+   "metadata": {},
+   "source": [
+    "If you prefer to get rid of the column name, simply set it to `None`."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 52,
+   "id": "ca46e4f1-407a-4e64-ba85-837e0ec4997e",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>date</th>\n",
+       "      <th>patient</th>\n",
+       "      <th>temperature</th>\n",
+       "      <th>dose</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>1</td>\n",
+       "      <td>38.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>2</td>\n",
+       "      <td>39.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>3</td>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>4</td>\n",
+       "      <td>38.099998</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>2012-10-02 10:00:00</td>\n",
+       "      <td>5</td>\n",
+       "      <td>37.900002</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>58</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>5</td>\n",
+       "      <td>37.200001</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>59</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>6</td>\n",
+       "      <td>NaN</td>\n",
+       "      <td>NaN</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>60</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>7</td>\n",
+       "      <td>37.299999</td>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>61</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>8</td>\n",
+       "      <td>36.799999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>62</th>\n",
+       "      <td>2012-10-02 16:00:00</td>\n",
+       "      <td>9</td>\n",
+       "      <td>37.299999</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>63 rows × 4 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                  date  patient  temperature  dose\n",
+       "0  2012-10-02 10:00:00        1    38.299999   0.0\n",
+       "1  2012-10-02 10:00:00        2    39.299999   0.0\n",
+       "2  2012-10-02 10:00:00        3    37.900002   0.0\n",
+       "3  2012-10-02 10:00:00        4    38.099998   0.0\n",
+       "4  2012-10-02 10:00:00        5    37.900002   0.0\n",
+       "..                 ...      ...          ...   ...\n",
+       "58 2012-10-02 16:00:00        5    37.200001   0.0\n",
+       "59 2012-10-02 16:00:00        6          NaN   NaN\n",
+       "60 2012-10-02 16:00:00        7    37.299999   1.0\n",
+       "61 2012-10-02 16:00:00        8    36.799999   0.0\n",
+       "62 2012-10-02 16:00:00        9    37.299999   0.0\n",
+       "\n",
+       "[63 rows x 4 columns]"
+      ]
+     },
+     "execution_count": 52,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "df_long.columns.name = None\n",
+    "df_long"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "7447a0bd-fe9e-4976-9c22-0e3c73674def",
+   "metadata": {},
+   "source": [
+    "Except for the order of the columns, and the sorting of the rows, you are back to the original data format."
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.12"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}

From 4579ffa065940742758b2b789c19f1c24befee63 Mon Sep 17 00:00:00 2001
From: Geert Jan Bex <geertjan.bex@uhasselt.be>
Date: Tue, 25 Nov 2025 08:20:33 +0100
Subject: [PATCH 10/10] Delete double entry

---
 source-code/README.md | 2 --
 1 file changed, 2 deletions(-)

diff --git a/source-code/README.md b/source-code/README.md
index 177a58c..3f0175d 100644
--- a/source-code/README.md
+++ b/source-code/README.md
@@ -23,8 +23,6 @@ to create it.  There is some material not covered in the presentation as well.
   soup and graph representation using networkx.
 * [`xarray`](xarray): illustrates the xarray library for pandas-like operations
   on multi-dimensional arrays.
-* [`duckdb`](duckdb): illustrates the DuckDB library for SQL-like operations
-  on dataframes, including integration with pandas and polars.
 
 **Note:** material on dashboards has been moved to a [dedicated
 repository](https://github.com/gjbex/Python-dashboards).