In [0]:
-- Create the movie_bronze schema used by the table definitions below.
-- IF NOT EXISTS makes this a no-op when the schema is already present.
CREATE SCHEMA IF NOT EXISTS movie_bronze;

In [0]:
-- List the available schemas (e.g. to check that movie_bronze is present).
-- SCHEMAS and DATABASES are interchangeable keywords in Spark SQL.
SHOW SCHEMAS;

### Crear tablas para archivos CSV

#### Crear la tabla "movies"

In [0]:
-- Remove any previous definition of movie_bronze.movies so the CREATE in the
-- next cell starts from a clean state. No-op if the table does not exist.
DROP TABLE IF EXISTS movie_bronze.movies;

In [0]:
-- movie_bronze.movies: table defined over the CSV file movie.csv.
-- The schema is declared explicitly; header = true makes the CSV reader treat
-- the file's first line as a header rather than as a data row.
-- NOTE(review): budget and revenue are DOUBLE (approximate floating point);
-- confirm that is acceptable if these hold monetary amounts.
CREATE TABLE IF NOT EXISTS movie_bronze.movies (
  movieId         INT,
  title           STRING,
  budget          DOUBLE,
  homePage        STRING,
  overview        STRING,
  popularity      DOUBLE,
  yearReleaseDate INT,
  releaseDate     DATE,
  revenue         DOUBLE,
  durationTime    INT,
  movieStatus     STRING,
  tagline         STRING,
  voteAverage     DOUBLE,
  voteCount       INT
)
USING CSV
OPTIONS (
  path = "/mnt/moviehistory/bronze/movie.csv",
  header = true
);

#### Crear la tabla "languages"

In [0]:
-- movie_bronze.languages: table defined over the CSV file language.csv
-- (first line of the file is treated as a header).
-- The table is dropped first so this definition always replaces any earlier one.
DROP TABLE IF EXISTS movie_bronze.languages;

CREATE TABLE IF NOT EXISTS movie_bronze.languages (
  languageId   INT,
  languageCode STRING,
  languageName STRING
)
USING CSV
OPTIONS (
  path = "/mnt/moviehistory/bronze/language.csv",
  header = true
);

#### Crear la tabla "genres"

In [0]:
-- movie_bronze.genres: table defined over the CSV file genre.csv
-- (first line of the file is treated as a header).
-- The table is dropped first so this definition always replaces any earlier one.
DROP TABLE IF EXISTS movie_bronze.genres;

CREATE TABLE IF NOT EXISTS movie_bronze.genres (
  genreId   INT,
  genreName STRING
)
USING CSV
OPTIONS (
  path = "/mnt/moviehistory/bronze/genre.csv",
  header = true
);

### Crear tablas para archivos JSON

#### Crear la tabla "countries"

- JSON de una sola línea
- Estructura Simple

In [0]:
-- movie_bronze.countries: table defined over the JSON file country.json.
-- No multiLine option is set, so the reader's default applies; the notebook
-- notes describe this file as single-line JSON with a flat structure.
-- The table is dropped first so this definition always replaces any earlier one.
DROP TABLE IF EXISTS movie_bronze.countries;

CREATE TABLE IF NOT EXISTS movie_bronze.countries (
  countryId      INT,
  countryIsoCode STRING,
  countryName    STRING
)
USING JSON
OPTIONS (
  path = "/mnt/moviehistory/bronze/country.json"
);

In [0]:

-- Preview movie_bronze.countries; columns are listed explicitly in declared order.
SELECT
  countryId,
  countryIsoCode,
  countryName
FROM movie_bronze.countries;

#### Crear la tabla "persons"
- JSON de una sola línea
- Estructura anidada (`personName` es un STRUCT)

In [0]:
-- movie_bronze.persons: table defined over the JSON file person.json.
-- personName is a nested object with forename and surname fields, declared
-- here as a STRUCT. No multiLine option is set, so the reader's default applies.
-- The table is dropped first so this definition always replaces any earlier one.
DROP TABLE IF EXISTS movie_bronze.persons;

CREATE TABLE IF NOT EXISTS movie_bronze.persons (
  personId   INT,
  personName STRUCT<forename: STRING, surname: STRING>
)
USING JSON
OPTIONS (
  path = "/mnt/moviehistory/bronze/person.json"
);

In [0]:
-- Preview movie_bronze.persons; columns are listed explicitly in declared order.
SELECT
  personId,
  personName
FROM movie_bronze.persons;

#### Crear la tabla "movies_genres"
- JSON de una sola línea
- Estructura Simple

In [0]:
-- movie_bronze.movies_genres: table defined over the JSON file movie_genre.json,
-- pairing a movieId with a genreId.
-- No multiLine option is set, so the reader's default applies; the notebook
-- notes describe this file as single-line JSON with a flat structure.
-- The table is dropped first so this definition always replaces any earlier one.
DROP TABLE IF EXISTS movie_bronze.movies_genres;

CREATE TABLE IF NOT EXISTS movie_bronze.movies_genres (
  movieId INT,
  genreId INT
)
USING JSON
OPTIONS (
  path = "/mnt/moviehistory/bronze/movie_genre.json"
);

In [0]:
-- Preview movie_bronze.movies_genres; columns are listed explicitly in declared order.
SELECT
  movieId,
  genreId
FROM movie_bronze.movies_genres;

#### Crear la tabla "movies_cats"

- JSON Multilínea
- Estructura Simple

In [0]:
-- movie_bronze.movies_cats: table defined over the JSON file movie_cast.json.
-- multiLine = true lets a single JSON record span several lines of the file.
-- NOTE(review): the table name "movies_cats" looks like a typo for
-- "movies_casts" (the source file is movie_cast.json); confirm before renaming,
-- since other notebooks may already reference this name.
-- The table is dropped first so this definition always replaces any earlier one.
DROP TABLE IF EXISTS movie_bronze.movies_cats;

CREATE TABLE IF NOT EXISTS movie_bronze.movies_cats (
  movieId       INT,
  personId      INT,
  characterName STRING,
  genderId      INT,
  castOrder     INT
)
USING JSON
OPTIONS (
  path = "/mnt/moviehistory/bronze/movie_cast.json",
  multiLine = true
);

In [0]:
-- Preview movie_bronze.movies_cats; columns are listed explicitly in declared order.
SELECT
  movieId,
  personId,
  characterName,
  genderId,
  castOrder
FROM movie_bronze.movies_cats;

#### Crear la tabla "languages_roles"
- JSON Multilínea
- Estructura Simple

In [0]:
-- movie_bronze.languages_roles: table defined over the JSON file language_role.json.
-- multiLine = true lets a single JSON record span several lines of the file.
-- The table is dropped first so this definition always replaces any earlier one.
DROP TABLE IF EXISTS movie_bronze.languages_roles;

CREATE TABLE IF NOT EXISTS movie_bronze.languages_roles (
  roleId       INT,
  languageRole STRING
)
USING JSON
OPTIONS (
  path = "/mnt/moviehistory/bronze/language_role.json",
  multiLine = true
);

In [0]:
-- Preview movie_bronze.languages_roles; columns are listed explicitly in declared order.
SELECT
  roleId,
  languageRole
FROM movie_bronze.languages_roles;

### Crear tablas para listas de archivos (CSVs y JSONs)

#### Crear la tabla "productions_companies"
- Archivo CSV
- Múltiples Archivos

In [0]:
-- movie_bronze.productions_companies: table defined over the path
-- production_company, which the notebook notes describe as multiple CSV files.
-- NOTE(review): no header option is set, so the CSV reader's default applies;
-- confirm the files carry no header row.
-- The table is dropped first so this definition always replaces any earlier one.
DROP TABLE IF EXISTS movie_bronze.productions_companies;

CREATE TABLE IF NOT EXISTS movie_bronze.productions_companies (
  companyId   INT,
  companyName STRING
)
USING CSV
OPTIONS (
  path = "/mnt/moviehistory/bronze/production_company"
);

In [0]:
-- Preview movie_bronze.productions_companies; columns are listed explicitly in declared order.
SELECT
  companyId,
  companyName
FROM movie_bronze.productions_companies;

#### Crear la tabla "movies_companies"
- Archivo CSV
- Múltiples Archivos

In [0]:
-- movie_bronze.movies_companies: table defined over the path movie_company,
-- which the notebook notes describe as multiple CSV files; pairs a movieId
-- with a companyId.
-- NOTE(review): no header option is set, so the CSV reader's default applies;
-- confirm the files carry no header row.
-- The table is dropped first so this definition always replaces any earlier one.
DROP TABLE IF EXISTS movie_bronze.movies_companies;

CREATE TABLE IF NOT EXISTS movie_bronze.movies_companies (
  movieId   INT,
  companyId INT
)
USING CSV
OPTIONS (
  path = "/mnt/moviehistory/bronze/movie_company"
);

In [0]:
-- Preview movie_bronze.movies_companies; columns are listed explicitly in declared order.
SELECT
  movieId,
  companyId
FROM movie_bronze.movies_companies;

#### Crear la tabla "movies_languages"
- Archivo JSON Multilínea
- Múltiples Archivos

In [0]:
-- movie_bronze.movies_languages: table defined over the path movie_language,
-- which the notebook notes describe as multiple multi-line JSON files; pairs a
-- movieId with a languageId.
-- multiLine = true lets a single JSON record span several lines of a file.
-- The table is dropped first so this definition always replaces any earlier one.
DROP TABLE IF EXISTS movie_bronze.movies_languages;

CREATE TABLE IF NOT EXISTS movie_bronze.movies_languages (
  movieId    INT,
  languageId INT
)
USING JSON
OPTIONS (
  path = "/mnt/moviehistory/bronze/movie_language",
  multiLine = true
);

In [0]:
-- Preview movie_bronze.movies_languages; columns are listed explicitly in declared order.
SELECT
  movieId,
  languageId
FROM movie_bronze.movies_languages;

#### Crear la tabla "productions_countries"
- Archivo JSON Multilínea
- Múltiples Archivos

In [0]:
-- movie_bronze.productions_countries: table defined over the path
-- production_country, which the notebook notes describe as multiple multi-line
-- JSON files; pairs a movieId with a countryId.
-- multiLine = true lets a single JSON record span several lines of a file.
-- The table is dropped first so this definition always replaces any earlier one.
DROP TABLE IF EXISTS movie_bronze.productions_countries;

CREATE TABLE IF NOT EXISTS movie_bronze.productions_countries (
  movieId   INT,
  countryId INT
)
USING JSON
OPTIONS (
  path = "/mnt/moviehistory/bronze/production_country",
  multiLine = true
);

In [0]:
-- Preview movie_bronze.productions_countries; columns are listed explicitly in declared order.
SELECT
  movieId,
  countryId
FROM movie_bronze.productions_countries;