Yellow Trips Silver DDL

In [0]:
-- Silver-layer Delta table for yellow taxi trips.
-- Data is stored at the S3 LOCATION below and partitioned by (year, month).
-- NOTE(review): OR REPLACE replaces an existing table of the same name together
-- with its contents -- confirm that re-running this cell is intended.
-- NOTE(review): PRIMARY KEY constraints on Databricks are informational (not
-- enforced); uniqueness of trip_id has to be guaranteed by the load job -- confirm.
CREATE OR REPLACE TABLE nyc_taxi.silver.yellow_taxi_trips (
    -- Key and partition columns
    trip_id                STRING         PRIMARY KEY COMMENT 'Hash of vendor_id,pickup_datetime, dropoff_datetime, pickup_location_id, dropoff_location_id,rate_code_id,payment_type_id',
    year                   INT            COMMENT 'Partition Key',
    month                  INT            COMMENT 'Partition Key',

    -- Trip attributes
    vendor_id              INT,
    pickup_datetime        TIMESTAMP_NTZ,
    dropoff_datetime       TIMESTAMP_NTZ,
    trip_distance          DOUBLE,
    trip_duration          INT            COMMENT 'Dropoff Time - Pickup Time in seconds',
    passenger_count        INT,
    rate_code_id           INT,
    pickup_location_id     INT,
    dropoff_location_id    INT,
    payment_type_id        INT,

    -- Monetary amounts
    fare_amount            DOUBLE,
    extra_charge           DOUBLE,
    mta_tax                DOUBLE,
    tip_amount             DOUBLE,
    tolls_amount           DOUBLE,
    improvement_surcharge  DOUBLE,
    congestion_surcharge   DOUBLE,
    cbd_congestion_fee     DOUBLE,
    airport_fee            DOUBLE,
    total_amount           DOUBLE,
    driver_pay             DOUBLE         COMMENT 'Fare Amount + Tip Amount',

    store_and_fwd_flag     BOOLEAN,

    -- Load metadata
    run_id                 STRING         COMMENT 'Unique id for run',
    bronze_id              STRING         COMMENT 'Bronze batch run id',
    ingest_ts              TIMESTAMP      COMMENT 'Timestamp when record was ingested'
)
USING DELTA
PARTITIONED BY (year, month)
LOCATION 's3://nyc-tlc-data-398563707364/silver/yellow_taxi_trips/';

Green Trips Silver DDL

In [0]:
-- Silver-layer Delta table for green taxi trips.
-- Data is stored at the S3 LOCATION below and partitioned by (year, month).
-- NOTE(review): OR REPLACE replaces an existing table of the same name together
-- with its contents -- confirm that re-running this cell is intended.
-- NOTE(review): PRIMARY KEY constraints on Databricks are informational (not
-- enforced); uniqueness of trip_id has to be guaranteed by the load job -- confirm.
CREATE OR REPLACE TABLE nyc_taxi.silver.green_taxi_trips (
    -- Key and partition columns
    trip_id                STRING         PRIMARY KEY COMMENT 'Hash of vendor_id,pickup_datetime, dropoff_datetime, pickup_location_id, dropoff_location_id,rate_code_id,payment_type_id,trip_type',
    year                   INT            COMMENT 'Partition Key',
    month                  INT            COMMENT 'Partition Key',

    -- Trip attributes
    vendor_id              INT,
    pickup_datetime        TIMESTAMP_NTZ,
    dropoff_datetime       TIMESTAMP_NTZ,
    trip_distance          DOUBLE,
    trip_duration          INT            COMMENT 'Dropoff Time - Pickup Time in seconds',
    rate_code_id           INT,
    pickup_location_id     INT,
    dropoff_location_id    INT,
    payment_type_id        INT,

    -- Monetary amounts
    fare_amount            DOUBLE,
    extra_charge           DOUBLE,
    mta_tax                DOUBLE,
    tip_amount             DOUBLE,
    tolls_amount           DOUBLE,
    improvement_surcharge  DOUBLE,
    congestion_surcharge   DOUBLE,
    cbd_congestion_fee     DOUBLE,
    total_amount           DOUBLE,
    -- Comment text names the tip_amount column (was 'Tips Amount').
    driver_pay             DOUBLE         COMMENT 'Fare Amount + Tip Amount',

    -- Green-taxi specific columns
    trip_type              INT,
    ehail_fee              DOUBLE,

    store_and_fwd_flag     BOOLEAN,

    -- Load metadata
    run_id                 STRING         COMMENT 'Unique id for run',
    bronze_id              STRING         COMMENT 'Bronze batch run id',
    ingest_ts              TIMESTAMP      COMMENT 'Timestamp when record was ingested'
)
USING DELTA
PARTITIONED BY (year, month)
LOCATION 's3://nyc-tlc-data-398563707364/silver/green_taxi_trips/'

For Hire Vehicles Silver DDL

In [0]:
-- Silver-layer Delta table for For-Hire Vehicle (FHV) trips.
-- Data is stored at the S3 LOCATION below and partitioned by (year, month).
-- NOTE(review): OR REPLACE replaces an existing table of the same name together
-- with its contents -- confirm that re-running this cell is intended.
-- NOTE(review): PRIMARY KEY constraints on Databricks are informational (not
-- enforced); uniqueness of trip_id has to be guaranteed by the load job -- confirm.
CREATE OR REPLACE TABLE nyc_taxi.silver.fhv_trips (
    -- Key and partition columns
    trip_id               STRING         PRIMARY KEY COMMENT 'Hash of dispatching_base_num, pickup_datetime, dropoff_datetime, pickup_location_id, dropoff_location_id ',
    -- year/month are the PARTITIONED BY columns; labelled the same way as in
    -- the yellow and green trip tables.
    year                  INT            COMMENT 'Partition Key',
    month                 INT            COMMENT 'Partition Key',

    -- Trip attributes
    dispatching_base_num  STRING,
    affiliated_base_num   STRING,
    pickup_datetime       TIMESTAMP_NTZ,
    dropoff_datetime      TIMESTAMP_NTZ,
    pickup_location_id    INT,
    dropoff_location_id   INT,
    shared_ride_flag      BOOLEAN,

    -- Load metadata
    run_id                STRING         COMMENT 'Unique id for run',
    bronze_id             STRING         COMMENT 'Bronze batch run id',
    ingest_ts             TIMESTAMP      COMMENT 'Timestamp when record was ingested'
)
USING DELTA
PARTITIONED BY (year, month)
LOCATION 's3://nyc-tlc-data-398563707364/silver/fhv_trips/'

High-Volume For Hire Vehicles Silver DDL

In [0]:
-- Silver-layer Delta table for High-Volume For-Hire Vehicle (HVFHV) trips.
-- Data is stored at the S3 LOCATION below and partitioned by (year, month).
-- NOTE(review): OR REPLACE replaces an existing table of the same name together
-- with its contents -- confirm that re-running this cell is intended.
-- NOTE(review): PRIMARY KEY constraints on Databricks are informational (not
-- enforced); uniqueness of trip_id has to be guaranteed by the load job -- confirm.
CREATE OR REPLACE TABLE nyc_taxi.silver.hvfhv_trips (
    -- Key and partition columns
    trip_id               STRING         PRIMARY KEY COMMENT 'Hash of license_number,dispatching_base_num,originating_base_num,request_datetime,on_scene_datetime,pickup_datetime,dropoff_datetime,pickup_location_id,dropoff_location_id',
    -- year/month are the PARTITIONED BY columns; labelled the same way as in
    -- the yellow and green trip tables.
    year                  INT            COMMENT 'Partition Key',
    month                 INT            COMMENT 'Partition Key',

    -- Trip attributes
    license_number        STRING,
    dispatching_base_num  STRING,
    originating_base_num  STRING,
    request_datetime      TIMESTAMP_NTZ,
    on_scene_datetime     TIMESTAMP_NTZ,
    pickup_datetime       TIMESTAMP_NTZ,
    dropoff_datetime      TIMESTAMP_NTZ,
    pickup_location_id    INT,
    dropoff_location_id   INT,
    trip_distance         DOUBLE,
    -- NOTE(review): trip_duration carries no COMMENT in this table; add one
    -- once its unit and derivation for HVFHV data are confirmed.
    trip_duration         INT,

    -- Monetary amounts
    fare_amount           DOUBLE,
    tolls_amount          DOUBLE,
    bcf_amount            DOUBLE,
    sales_tax             DOUBLE,
    congestion_surcharge  DOUBLE,
    airport_fee           DOUBLE,
    cbd_congestion_fee    DOUBLE,
    total_amount          DOUBLE         COMMENT 'Total Amount = Fare + Fees + Charges',

    -- Boolean flags
    shared_request_flag   BOOLEAN,
    shared_match_flag     BOOLEAN,
    access_a_ride_flag    BOOLEAN,
    wav_request_flag      BOOLEAN,

    -- Load metadata
    run_id                STRING         COMMENT 'Unique id for run',
    bronze_id             STRING         COMMENT 'Bronze batch run id',
    ingest_ts             TIMESTAMP      COMMENT 'Timestamp when record was ingested'
)
USING DELTA
PARTITIONED BY (year, month)
LOCATION 's3://nyc-tlc-data-398563707364/silver/hvfhv_trips/'

Taxi Zones Silver DDL

In [0]:
-- Silver-layer Delta lookup table for taxi zones (unpartitioned).
-- Data is stored at the S3 LOCATION below.
-- NOTE(review): OR REPLACE replaces an existing table of the same name together
-- with its contents -- confirm that re-running this cell is intended.
CREATE OR REPLACE TABLE nyc_taxi.silver.taxi_zone_lookup (
    -- Zone attributes
    location_id   INT,
    borough       STRING,
    zone          STRING,
    service_zone  STRING,

    -- Load metadata
    run_id        STRING     COMMENT 'Unique id for run',
    bronze_id     STRING     COMMENT 'Bronze batch run id',
    ingest_ts     TIMESTAMP  COMMENT 'Timestamp when record was ingested'
)
USING DELTA
LOCATION 's3://nyc-tlc-data-398563707364/silver/taxi_zone_lookup/'

License Mapping Silver DDL

In [0]:
-- Silver-layer Delta lookup table for license mappings (unpartitioned).
-- Data is stored at the S3 LOCATION below.
-- NOTE(review): OR REPLACE replaces an existing table of the same name together
-- with its contents -- confirm that re-running this cell is intended.
CREATE OR REPLACE TABLE nyc_taxi.silver.license_mapping_lookup (
    -- License attributes
    high_volume_license_number  STRING,
    license_number              STRING,
    base_name                   STRING,
    app_company_affiliation     STRING,

    -- Load metadata
    run_id                      STRING     COMMENT 'Unique id for run',
    bronze_id                   STRING     COMMENT 'Bronze batch run id',
    ingest_ts                   TIMESTAMP  COMMENT 'Timestamp when record was ingested'
)
USING DELTA
LOCATION 's3://nyc-tlc-data-398563707364/silver/license_mapping_lookup/'