# Load Airport Data

The data was sourced from the <a href="https://www.transtats.bts.gov/Data_Elements.aspx?Data=4">Bureau of Transportation Statistics</a>.

In [1]:
import pandas as pd

# Source CSV with the aggregated airport figures.
airport_csv = '~/jupyter/sp22Capstone_01_Group02/data/COAggregateAirportData.csv'

# Snake_case labels applied positionally; they replace whatever header the
# file carries, so the order here must match the column order in the CSV.
airport_columns = [
    'year',
    'month',
    'airport_city',
    'domestic_passengers',
    'international_passengers',
    'total_passengers',
    'domestic_flights',
    'international_flights',
    'total_flights',
]

# Load data
airport_data = pd.read_csv(airport_csv)
airport_data.columns = airport_columns

# Preview the first rows to confirm the relabelled columns.
airport_data.head()

Unnamed: 0,year,month,airport_city,domestic_passengers,international_passengers,total_passengers,domestic_flights,international_flights,total_flights
0,2002,10,Alamosa,387,0,387,81,0,81
1,2002,11,Alamosa,252,0,252,66,0,66
2,2002,12,Alamosa,298,0,298,75,0,75
3,2003,1,Alamosa,257,0,257,78,0,78
4,2003,2,Alamosa,248,0,248,70,0,70


In [9]:
# Show the dtype pandas inferred for each column of the loaded frame.
airport_data.dtypes

year                         int64
month                        int64
airport_city                object
domestic_passengers          int64
international_passengers     int64
total_passengers             int64
domestic_flights             int64
international_flights        int64
total_flights                int64
dtype: object

# Connect to the Database and Create the Table

In [4]:
import getpass
from sqlalchemy.engine.url import URL
from sqlalchemy import create_engine
%reload_ext sql

mypasswd = getpass.getpass()
username = 'nnfd2' # Replace with your pawprint
host = 'pgsql.dsa.lan'
database = 'caponl_22g2'

postgres_db = {'drivername': 'postgres',
               'username': username,
               'password': mypasswd,
               'host': host,
               'database': database}
engine = create_engine(URL(**postgres_db), echo=False)


connection_string = f'postgres://{username}:{mypasswd}@{host}/{database}'
%sql $connection_string
del mypasswd

········


In [12]:
%%sql

-- Start from a clean slate so this cell can be re-run.
-- CASCADE also drops objects that depend on the table.
DROP TABLE IF EXISTS airport_data CASCADE;

-- One row per (year, month, airport_city), enforced by the primary key.
CREATE TABLE airport_data (
    year                     INTEGER,
    month                    INTEGER,
    airport_city             VARCHAR(100),
    domestic_passengers      INTEGER,
    international_passengers INTEGER,
    total_passengers         INTEGER,
    domestic_flights         INTEGER,
    international_flights    INTEGER,
    total_flights            INTEGER,
    CONSTRAINT pk_airport_data PRIMARY KEY (year, month, airport_city)
);

-- Give the listed roles full access to the new table.
GRANT ALL PRIVILEGES ON airport_data TO nnfd2, dgyw5, jwcp64, gfdbq

 * postgres://nnfd2:***@pgsql.dsa.lan/caponl_22g2
Done.
Done.
Done.


[]

# Load Data into the Database

In [13]:
# Bulk-insert the DataFrame rows into the airport_data table.
airport_data.to_sql(
    name='airport_data',
    con=engine,
    if_exists='append',   # insert into the existing table instead of replacing it
    index=False,          # do not write the DataFrame index as a column
    method='multi',       # pass multiple rows per INSERT statement
    chunksize=1000,       # rows written per batch
)

In [19]:
%%sql

-- Yearly passenger and flight totals for each airport city.
-- Rows are sorted by year only, so the order of cities within a year is unspecified.
SELECT
    year,
    airport_city,
    SUM(total_passengers),
    SUM(total_flights)
FROM airport_data
GROUP BY
    year,
    airport_city
ORDER BY year

 * postgres://nnfd2:***@pgsql.dsa.lan/caponl_22g2
239 rows affected.


year,airport_city,sum,sum_1
2002,Alamosa,937,222
2002,Eagle,30267,449
2002,Colorado Springs,247775,4937
2002,Denver,4042504,57206
2002,Telluride,2899,350
2002,Gunnison,7174,323
2002,Durango,22110,1126
2002,Grand Junction,32729,1558
2002,Hayden,19574,387
2002,Cortez,1634,233
