In [None]:
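# Optional: uncomment the next line to install the required packages into the kernel's environment.
# %pip install boto3 duckdb 'pyiceberg[glue]' pyarrow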

In [1]:
# Import the setup function from gen_tables.py
from gen_tables import setup_notebook_environment

# Set up all necessary components in a single call. Per this notebook's own
# description the three returned values are a DuckDB connection (cn), a
# PyIceberg catalog (catalog) and a Glue client (glue_client).
# Later cells pass all three to create_duckdb_view_from_glue_table and run
# queries through cn.sql(), so this cell must be executed first.
cn, catalog, glue_client = setup_notebook_environment()

In [3]:
# Import query functions and create views for all table types
from query_glue_table import create_duckdb_view_from_glue_table

# Source database and the tables in it that should each get a DuckDB view.
db_name = "icebox1"
tables = [
    "iceberg_test",
    "parquet_test",
    "csv_test",
]

# Build one view per table. Each attempt is isolated: if a table fails, the
# error is printed and the loop carries on with the remaining tables.
for table in tables:
    try:
        view_name = create_duckdb_view_from_glue_table(
            db_name=db_name, table_name=table, glue_client=glue_client, catalog=catalog, cn=cn
        )
    except Exception as exc:
        print(f"❌ Failed to create view for {table}: {exc}")

In [4]:
# Names of the views to preview (listed explicitly here rather than taken
# from the view-creation loop).
view_names = ["v_iceberg_test", "v_parquet_test", "v_csv_test"]

# Print the first three rows of every view. A view that cannot be queried is
# reported and skipped so the remaining previews still run.
for view_name in view_names:
    preview_query = f"SELECT * FROM {view_name} LIMIT 3"
    try:
        print(f"Sample from {view_name}:")
        sample = cn.sql(preview_query)
        # Rendering the relation is what actually surfaces query errors, so it
        # stays inside the try; the extra newline leaves a blank separator line.
        print(sample, end="\n\n")
    except Exception as exc:
        print(f"❌ Could not query {view_name}: {exc}")

Sample from v_iceberg_test:
┌────────┬──────────────────────────────────────┬────────────┬──────────┐
│ row_id │               txn_key                │   rpt_dt   │ some_val │
│ int64  │               varchar                │    date    │  double  │
├────────┼──────────────────────────────────────┼────────────┼──────────┤
│      1 │ 03724388-b7d8-4999-8589-1031a3562f48 │ 2025-09-20 │     4.89 │
│      2 │ 348ce2e6-13b6-489d-8a51-0716f3ce309c │ 2025-09-20 │    91.06 │
│      3 │ e18bb457-ebe0-44e7-81a6-e4c1cae31328 │ 2025-09-20 │     3.87 │
└────────┴──────────────────────────────────────┴────────────┴──────────┘


Sample from v_parquet_test:
┌────────┬──────────────────────────────────────┬────────────┬──────────┐
│ row_id │               txn_key                │   rpt_dt   │ some_val │
│ int64  │               varchar                │    date    │  double  │
├────────┼──────────────────────────────────────┼────────────┼──────────┤
│      1 │ f551e547-9eb7-417a-b37c-deb9b9a7226a │ 2025