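# Check Data Warehouse

Sanity check of the DuckDB warehouse file: list the available tables and preview a few rows of each, first via the `%sql` magic and then via the project's `DuckDBContext` helper.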

### Import


In [1]:
from lib.duckdbcontext import DuckDBContext
import duckdb

In [3]:
# Path to the DuckDB database file inspected by this notebook.
# It is a relative path, so it resolves against the kernel's working directory.
duckdb_database = "../orchestration/db/bigdata.duckdb"

#### Using SQL Magic Cells


In [7]:
# Load the `sql` extension so the `%sql` line magic used below is available.
%load_ext sql
# Open a connection to the database file configured in `duckdb_database`.
conn = duckdb.connect(duckdb_database)
# Hand the open connection to the %sql magic, registered under the alias "duckdb".
%sql conn --alias duckdb

The sql extension is already loaded. To reload it, use:
  %reload_ext sql


In [8]:
%sql SHOW ALL TABLES; # shows all available tables

database,schema,name,column_names,column_types,temporary
bigdata,main,extra_name_basics,"['nconst', 'primaryName', 'birthYear', 'deathYear', 'primaryProfession', 'knownForTitles', 'tconst']","['VARCHAR', 'VARCHAR', 'INTEGER', 'INTEGER', 'VARCHAR', 'VARCHAR', 'VARCHAR']",False
bigdata,main,extra_title_akas,"['ordering', 'title', 'region', 'language', 'types', 'attributes', 'isOriginalTitle', 'tconst']","['INTEGER', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'INTEGER', 'VARCHAR']",False
bigdata,main,extra_title_basics,"['tconst', 'titleType', 'primaryTitle', 'originalTitle', 'isAdult', 'startYear', 'endYear', 'runtimeMinutes', 'genres']","['VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'INTEGER', 'INTEGER', 'INTEGER', 'VARCHAR', 'VARCHAR']",False
bigdata,main,extra_title_crew,"['tconst', 'directors', 'writers']","['VARCHAR', 'VARCHAR', 'VARCHAR']",False
bigdata,main,extra_title_principals,"['tconst', 'ordering', 'nconst', 'category', 'job', 'characters']","['VARCHAR', 'INTEGER', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR']",False
bigdata,main,extra_title_ratings,"['tconst', 'averageRating', 'numVotes']","['VARCHAR', 'DOUBLE', 'INTEGER']",False
bigdata,main,imdb_directors,"['movie', 'director']","['VARCHAR', 'VARCHAR']",False
bigdata,main,imdb_train,"['tconst', 'primaryTitle', 'originalTitle', 'startYear', 'endYear', 'runtimeMinutes', 'numVotes', 'label']","['VARCHAR', 'VARCHAR', 'VARCHAR', 'INTEGER', 'INTEGER', 'INTEGER', 'DOUBLE', 'BOOLEAN']",False
bigdata,main,imdb_writing,"['movie', 'writer']","['VARCHAR', 'VARCHAR']",False
bigdata,main,letterboxd_movie_ratings_data,"['_id', 'movie_id', 'movie_title', 'original_language', 'popularity', 'release_date', 'runtime', 'vote_average', 'vote_count', 'year_released', 'tconst', 'genre', 'production_countrie', 'spoken_language']","['VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR', 'VARCHAR']",False


In [10]:
# Close the connection that was opened for the %sql magic.
# NOTE(review): presumably done so the context manager in the next section can
# open the same database file on its own — confirm.
conn.close()

#### Using Custom Context Manager


In [9]:
# Open the same database through the project's DuckDBContext context manager and
# print information for each table; the output below shows a "Table: <name>"
# header followed by a handful of sample rows per table.
# NOTE(review): as_dataframe=True presumably selects the DataFrame-style
# rendering seen in the output — confirm in lib.duckdbcontext.
with DuckDBContext(duckdb_database) as ctx:
    ctx.show_tables_info(as_dataframe=True)

Table: extra_name_basics


nconst,primaryName,birthYear,deathYear,primaryProfession,knownForTitles,tconst
str,str,i32,i32,str,str,str
"""nm0000115""","""Nicolas Cage""",1964,,"""actor,producer…","""tt0113627""","""tt0113627"""
"""nm0000147""","""Colin Firth""",1960,,"""actor,producer…","""tt2802144""","""tt2802144"""
"""nm0000223""","""Elisabeth Shue…",1963,,"""actress,produc…","""tt0113627""","""tt0113627"""
"""nm0000508""","""Carey Lowell""",1961,,"""actress""","""tt0113627""","""tt0113627"""
"""nm0000629""","""Claudia Schiff…",1970,,"""actress,produc…","""tt2802144""","""tt2802144"""


Table: extra_title_akas


ordering,title,region,language,types,attributes,isOriginalTitle,tconst
i32,str,str,str,str,str,i32,str
10,"""Les nuits de C…","""CA""","""fr""","""imdbDisplay""",,0,"""tt0018526"""
11,"""Moderne Apache…","""AT""",,"""alternative""",,0,"""tt0018526"""
12,"""Underworld""","""GB""",,"""imdbDisplay""",,0,"""tt0018526"""
13,"""Underworld""","""AU""",,"""imdbDisplay""",,0,"""tt0018526"""
14,"""Ludzie podziem…","""PL""",,"""imdbDisplay""",,0,"""tt0018526"""


Table: extra_title_basics


tconst,titleType,primaryTitle,originalTitle,isAdult,startYear,endYear,runtimeMinutes,genres
str,str,str,str,i32,i32,i32,str,str
"""tt0018526""","""movie""","""Underworld""","""Underworld""",0,1927,,"""80""","""Crime,Drama,Fi…"
"""tt0039305""","""movie""","""Dead Reckoning…","""Dead Reckoning…",0,1946,,"""100""","""Crime,Drama,Fi…"
"""tt0044008""","""movie""","""A Christmas Ca…","""Scrooge""",0,1951,,"""86""","""Drama,Family,F…"
"""tt0054412""","""movie""","""Tunes of Glory…","""Tunes of Glory…",0,1960,,"""107""","""Drama"""
"""tt0059538""","""movie""","""Old Surehand""","""Old Surehand, …",0,1965,,"""90""","""Adventure,West…"


Table: extra_title_crew


tconst,directors,writers
str,str,str
"""tt0018526""","""nm0903049,nm07…","""nm0299153,nm00…"
"""tt0039305""","""nm0188669""","""nm0308177,nm02…"
"""tt0044008""","""nm0221423""","""nm0002042,nm04…"
"""tt0054412""","""nm0623768""","""nm0447860"""
"""tt0059538""","""nm0901138""","""nm0562015,nm02…"


Table: extra_title_principals


tconst,ordering,nconst,category,job,characters
str,i32,str,str,str,str
"""tt0018526""",10,"""nm0498133""","""writer""","""adaptation""",
"""tt0018526""",1,"""nm0051628""","""actor""",,"""[""'Bull' Weed""…"
"""tt0018526""",2,"""nm0111612""","""actor""",,"""[""Rolls Royce …"
"""tt0018526""",3,"""nm0107574""","""actress""",,"""[""'Feathers' M…"
"""tt0018526""",4,"""nm0463264""","""actor""",,"""[""'Buck' Mulli…"


Table: extra_title_ratings


tconst,averageRating,numVotes
str,f64,i32
"""tt0014109""",7.0,1371
"""tt0015064""",8.0,15123
"""tt0015841""",7.5,6039
"""tt0017271""",7.6,1229
"""tt0018451""",7.6,1657


Table: imdb_directors


movie,director
str,str
"""tt0003740""","""nm0665163"""
"""tt0008663""","""nm0803705"""
"""tt0009369""","""nm0428059"""
"""tt0009369""","""nm0949648"""
"""tt0010307""","""nm0304098"""


Table: imdb_train


tconst,primaryTitle,originalTitle,startYear,endYear,runtimeMinutes,numVotes,label
str,str,str,i32,i32,i32,f64,bool
"""tt0014109""","""The Saga of Gö…",,1924.0,,183,1231.0,True
"""tt0015064""","""The Last Laugh…","""Der letzte Man…",1924.0,,77,,True
"""tt0015841""","""The Freshman""","""The Freshman""",1925.0,,77,5374.0,True
"""tt0017271""","""By the Law""",,,1926.0,80,1057.0,True
"""tt0018451""","""The Student Pr…",,1927.0,,106,1459.0,True


Table: imdb_writing


movie,writer
str,str
"""tt0003740""","""nm0195339"""
"""tt0003740""","""nm0515385"""
"""tt0003740""","""nm0665163"""
"""tt0003740""","""nm0758215"""
"""tt0008663""","""nm0406585"""


Table: letterboxd_movie_ratings_data


_id,movie_id,movie_title,original_language,popularity,release_date,runtime,vote_average,vote_count,year_released,tconst,genre,production_countrie,spoken_language
str,str,str,str,str,str,str,str,str,str,str,str,str,str
"""5fc86a3d6758f6…","""the-trump-prop…","""The Trump Prop…","""en""","""2.025""","""2018-10-02""","""120""","""4""","""7""","""2018""","""tt8235296""","""Drama""","""United States …","""English"""
"""5fc8708a6758f6…","""nothing-funny""","""Nothing Funny""","""pl""","""4.192""","""1996-02-02""","""95""","""7.2""","""39""","""1996""","""tt0113971""","""Comedy""","""Poland""","""Polski"""
"""5fc8738e6758f6…","""whose-streets""","""Whose Streets?…","""en""","""2.919""","""2017-08-11""","""90""","""5.8""","""19""","""2017""","""tt6176928""","""Documentary""","""United States …","""English"""
"""5fc879006758f6…","""tunes-of-glory…","""Tunes of Glory…","""en""","""2.941""","""1960-09-17""","""106""","""7.1""","""38""","""1960""","""tt0054412""","""Drama""","""United Kingdom…","""English"""
"""5fc87a246758f6…","""baaghi-2""","""Baaghi 2""","""hi""","""4.897""","""2018-03-30""","""145""","""5.8""","""40""","""2018""","""tt6843812""","""Action""","""India""","""हिन्दी"""


Table: movie_data


_id,genres,image_url,imdb_id,imdb_link,movie_id,movie_title,original_language,overview,popularity,production_countries,release_date,runtime,spoken_languages,tmdb_id,tmdb_link,vote_average,vote_count,year_released
str,str,str,str,str,str,str,str,str,str,str,str,str,str,str,str,str,str,str
"""5fc85f606758f6…","""""[""""Music""""""","""""""Animation""""]…","""film-poster/4/…",,,"""football-freak…","""Football Freak…","""en""","""Football crazy…","""0.6""","""""[""""United Kin…","""1971-12-05""","""0""","""[]""","""535272""","""https://www.th…","""0""","""0"""
"""5fc85ff26758f6…","""[]""","""film-poster/2/…","""tt0586129""","""http://www.imd…","""aftermath-1960…","""Aftermath""","""en""","""Aftermath was …","""0.6""","""[]""","""1960-04-17""","""22""","""[]""","""318331""","""https://www.th…","""8""","""1""","""1960"""
"""5fc85f606758f6…","""""[""""Drama""""]""""","""film-poster/9/…","""tt0045731""","""http://www.imd…","""where-chimneys…","""Where Chimneys…","""ja""","""Gosho’s most c…","""1.568""","""""[""""Japan""""]""""","""1953-03-05""","""108""","""""[""""日本語""""]""""","""117779""","""https://www.th…","""6.6""","""10""","""1953"""
"""5fc85f606758f6…","""""[""""Drama""""]""""",,"""tt0187327""","""http://www.imd…","""the-musicians-…","""The Musician's…","""en""","""Carl Wagner's …","""0.6""","""""[""""United Sta…","""1911-12-12""","""15""","""[]""","""560377""","""https://www.th…","""0""","""0""","""1911"""
"""5fc85f606758f6…","""""[""""Documentar…","""film-poster/4/…","""tt4769914""","""http://www.imd…","""50-years-of-fa…","""50 Years of Fa…","""en""","""50 Years of Fa…","""0.6""","""[]""","""2018-05-17""","""75""","""[]""","""525187""","""https://www.th…","""0""","""0""","""2018"""


Table: the_oscar_award


year_film,year_ceremony,ceremony,category,name,film,winner
i32,i32,i32,str,str,str,str
1927,1928,1,"""ACTOR""","""Richard Barthe…","""The Noose""","""False"""
1927,1928,1,"""ACTOR""","""Emil Jannings""","""The Last Comma…","""True"""
1927,1928,1,"""ACTRESS""","""Louise Dresser…","""A Ship Comes I…","""False"""
1927,1928,1,"""ACTRESS""","""Janet Gaynor""","""7th Heaven""","""True"""
1927,1928,1,"""ACTRESS""","""Gloria Swanson…","""Sadie Thompson…","""False"""


Table: users_export


display_name,num_ratings_pages,num_reviews,username,imdb_id
str,i32,i32,str,str
"""Lucy""",32,1650,"""deathproof""",
"""karsten""",20,1147,"""kurstboy""",
"""davidehrlich""",33,2113,"""davidehrlich""",
"""adrianbalboa""",1,975,"""adrianbalboa""",
"""matt lynch""",73,5278,"""colonelmortime…",


### Create Features


In [2]:
# JOIN SOME TABLES TOGETHER