In [0]:
-- Make sure the movie_bronze schema exists; every table in this notebook is created inside it.
CREATE SCHEMA IF NOT EXISTS movie_bronze;

## Crear tablas para archivos CSV

### Crear la tabla "movies"

In [0]:
-- (Re)define the "movies" table over the movie CSV file.
-- The table is dropped first so that a changed column list takes effect on re-run.
-- "header true" marks the first line of the file as a header row.
DROP TABLE IF EXISTS movie_bronze.movies;

CREATE TABLE IF NOT EXISTS movie_bronze.movies (
  movieId         INT,
  title           STRING,
  budget          DOUBLE,
  homePage        STRING,
  overview        STRING,
  popularity      DOUBLE,
  yearReleaseDate INT,
  releaseDate     DATE,
  revenue         DOUBLE,
  durationTime    INT,
  movieStatus     STRING,
  tagline         STRING,
  voteAverage     DOUBLE,
  voteCount       INT
)
USING CSV
OPTIONS (
  path "/mnt/moviehistory07/bronze/movie.csv",
  header true
);

In [0]:
-- Preview: return every column and row of the movies table defined above.
SELECT *
FROM movie_bronze.movies;

### Crear la tabla "languages"

In [0]:
-- (Re)define the "languages" table over the language CSV file.
-- "header true" marks the first line of the file as a header row.
DROP TABLE IF EXISTS movie_bronze.languages;

CREATE TABLE IF NOT EXISTS movie_bronze.languages (
  languageId   INT,
  languageCode STRING,
  languageName STRING
)
USING CSV
OPTIONS (
  path "/mnt/moviehistory07/bronze/language.csv",
  header true
);

In [0]:
-- Preview: return every column and row of the languages table.
SELECT *
FROM movie_bronze.languages;

### Crear la tabla "genres"

In [0]:
-- (Re)define the "genres" table over the genre CSV file.
-- "header true" marks the first line of the file as a header row.
DROP TABLE IF EXISTS movie_bronze.genres;

CREATE TABLE IF NOT EXISTS movie_bronze.genres (
  genreId   INT,
  genreName STRING
)
USING CSV
OPTIONS (
  path "/mnt/moviehistory07/bronze/genre.csv",
  header true
);

In [0]:
-- Preview: return every column and row of the genres table.
SELECT *
FROM movie_bronze.genres;

## Crear tablas para archivos JSON

### Crear la tabla "countries"
- JSON en una sola línea
- Estructura Simple

In [0]:
-- (Re)define the "countries" table over the country JSON file.
-- No multiLine option is set, so the JSON reader's default parsing mode applies.
DROP TABLE IF EXISTS movie_bronze.countries;

CREATE TABLE IF NOT EXISTS movie_bronze.countries (
  countryId   INT,
  countryCode STRING,
  countryName STRING
)
USING JSON
OPTIONS (
  path "/mnt/moviehistory07/bronze/country.json"
);

### Crear la tabla "persons"
- JSON en una sola línea
- Estructura Compleja

In [0]:

-- (Re)define the "persons" table over the person JSON file.
-- personName is a nested object, mapped to a STRUCT with forename and surname fields.
DROP TABLE IF EXISTS movie_bronze.persons;

CREATE TABLE IF NOT EXISTS movie_bronze.persons (
  personId   INT,
  personName STRUCT<forename: STRING, surname: STRING>
)
USING JSON
OPTIONS (
  path "/mnt/moviehistory07/bronze/person.json"
);

In [0]:
-- Preview: return every column and row of the persons table.
SELECT *
FROM movie_bronze.persons;

### Crear la tabla "movies_genres"
- JSON en una sola línea
- Estructura Simple

In [0]:
-- (Re)define the "movies_genres" table (movieId / genreId pairs) over the movie_genre JSON file.
-- No multiLine option is set, so the JSON reader's default parsing mode applies.
DROP TABLE IF EXISTS movie_bronze.movies_genres;

CREATE TABLE IF NOT EXISTS movie_bronze.movies_genres (
  movieId INT,
  genreId INT
)
USING JSON
OPTIONS (
  path "/mnt/moviehistory07/bronze/movie_genre.json"
);

In [0]:
-- Preview: return every column and row of the movies_genres table.
SELECT *
FROM movie_bronze.movies_genres;

### Crear la tabla "movie_casts"
- JSON Multilínea
- Estructura Simple

In [0]:
-- (Re)define the "movie_casts" table over the movie_cast JSON file.
-- "multiLine true" lets a single JSON record span several lines of the file.
DROP TABLE IF EXISTS movie_bronze.movie_casts;

CREATE TABLE IF NOT EXISTS movie_bronze.movie_casts (
  movieId       INT,
  personId      INT,
  characterName STRING,
  genderId      INT,
  castOrder     INT
)
USING JSON
OPTIONS (
  path "/mnt/moviehistory07/bronze/movie_cast.json",
  multiLine true
);

In [0]:
-- Preview: return every column and row of the movie_casts table.
SELECT *
FROM movie_bronze.movie_casts;

### Crear la tabla "languages_roles"
- JSON Multilínea
- Estructura Simple

In [0]:
-- (Re)define the "languages_roles" table over the language_role JSON file.
-- "multiLine true" lets a single JSON record span several lines of the file.
DROP TABLE IF EXISTS movie_bronze.languages_roles;

CREATE TABLE IF NOT EXISTS movie_bronze.languages_roles (
  roleId       INT,
  languageRole STRING
)
USING JSON
OPTIONS (
  path "/mnt/moviehistory07/bronze/language_role.json",
  multiLine true
);

In [0]:
-- Preview: return every column and row of the languages_roles table.
SELECT *
FROM movie_bronze.languages_roles;

## Crear tablas para la lista de Archivos (CSVs y JSONs)

#### Crear la tabla "productions_companies"
- Archivo CSV
- Múltiples archivos

In [0]:
-- (Re)define the "productions_companies" table over the production_company path.
-- The path has no file extension; presumably a folder holding several CSV files.
-- NOTE(review): no header option is set, so the CSV reader default applies.
--               Confirm the files really have no header row.
DROP TABLE IF EXISTS movie_bronze.productions_companies;

CREATE TABLE IF NOT EXISTS movie_bronze.productions_companies (
  companyId   INT,
  companyName STRING
)
USING CSV
OPTIONS (
  path "/mnt/moviehistory07/bronze/production_company"
);

In [0]:
-- Preview: return every column and row of the productions_companies table.
SELECT *
FROM movie_bronze.productions_companies;

#### Crear la tabla "movies_companies"
- Archivo CSV
- Múltiples archivos

In [0]:
-- (Re)define the "movies_companies" table (movieId / companyId pairs) over the movie_company path.
-- The path has no file extension; presumably a folder holding several CSV files.
-- NOTE(review): no header option is set, so the CSV reader default applies.
--               Confirm the files really have no header row.
DROP TABLE IF EXISTS movie_bronze.movies_companies;

CREATE TABLE IF NOT EXISTS movie_bronze.movies_companies (
  movieId   INT,
  companyId INT
)
USING CSV
OPTIONS (
  path "/mnt/moviehistory07/bronze/movie_company"
);

In [0]:
-- Preview: return every column and row of the movies_companies table.
SELECT *
FROM movie_bronze.movies_companies;

#### Crear la tabla "movies_languages"
- Archivo JSON Multilínea
- Múltiples archivos

In [0]:
-- (Re)define the "movies_languages" table over the movie_language path.
-- The path has no file extension; presumably a folder holding several JSON files.
-- "multiLine true" lets a single JSON record span several lines of a file.
DROP TABLE IF EXISTS movie_bronze.movies_languages;

CREATE TABLE IF NOT EXISTS movie_bronze.movies_languages (
  movieId        INT,
  languageId     INT,
  languageRoleId INT
)
USING JSON
OPTIONS (
  path "/mnt/moviehistory07/bronze/movie_language",
  multiLine true
);

In [0]:
-- Preview: return every column and row of the movies_languages table.
SELECT *
FROM movie_bronze.movies_languages;

#### Crear la tabla "productions_countries"
- Archivo JSON Multilínea
- Múltiples archivos

In [0]:
-- (Re)define the "productions_countries" table (movieId / countryId pairs) over the production_country path.
-- The path has no file extension; presumably a folder holding several JSON files.
-- "multiLine true" lets a single JSON record span several lines of a file.
DROP TABLE IF EXISTS movie_bronze.productions_countries;

CREATE TABLE IF NOT EXISTS movie_bronze.productions_countries (
  movieId   INT,
  countryId INT
)
USING JSON
OPTIONS (
  path "/mnt/moviehistory07/bronze/production_country",
  multiLine true
);

In [0]:
-- Preview: return every column and row of the productions_countries table.
SELECT *
FROM movie_bronze.productions_countries;