In [1]:
import pandas as pd
import datetime as dt

In [2]:
#The goal of this file is to create a dataset of reservations for the 2016-2020 camping seasons (May 1 - September 30)
#for the US West Coast states (Washington, Oregon, California)

#Because of the large size of the dataset (it exceeds the limits of a GitHub repo), cleaning and merging were done on a local computer

In [3]:
#Load the raw 2016 reservation export and display it
data2016 = pd.read_csv(
    "../../Resources/data/reservations2016.csv",
    encoding="unicode_escape",
)
data2016

Unnamed: 0,HistoricalReservationID,OrderNumber,Agency,OrgID,CodeHierarchy,RegionCode,RegionDescription,ParentLocationID,ParentLocation,LegacyFacilityID,...,Truck,Bus,Bicycle,Snowmobile,OffRoadlAllTerrainVehicle,PowerBoat,PickupCamper,LargeTentOver9x12,SmallTent,Marinaboat
0,2078081704,2-32732134,USACE,130,|1|70902|74304|74350|74559|71075|,CH3013280,OLD HICKORY LAKE,74350,NASHVILLE DISTRICT,71075,...,,,,,,,,,,
1,2078083331,2-32732551,USFS,131,|1|70903|72602|74411|74812|70392|,F50755,OJAI RD - FS,74411,LOS PADRES NF -FS,70392,...,,,,,,,,,,
2,2078083497,2-32732552,USFS,131,|1|70903|72602|74416|72724|75429|,F51753,YUBA RIVER RD -FS,74416,TAHOE NF - FS,75429,...,,,,,,,,,,
3,2078083555,4-3155416,NPS,128,|1|70904|74324|77803|77813|,CAVE-7170,Carlsbad Caverns National Park,74324,Intermountain Region,77813,...,,,,,,,,,,
4,2078083581,2-32732553,USFS,131,|1|70903|74311|74387|72667|70468|,F30406,RED ROCK RD -FS,74387,COCONINO NF - FS,70468,...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2980709,2434322908,6-3050956,NPS,128,|1|70904|74325|74274|70853|,CAHA-5190,Cape Hatteras National Seashore,74325,Southeast Region,70853,...,,,,,,,,,,
2980710,2434323098,4-3698992,NPS,128,|1|70904|74327|74292|135840|,SEKI-8550,Sequoia and Kings Canyon National Park,74327,Pacific West Region,135840,...,,,,,,,,,,
2980711,2434324894,2-36683621,NPS,128,|1|70904|74324|74297|70923|,ZION-1590,Zion National Park,74324,Intermountain Region,70923,...,,,,,,,,,,
2980712,2434324927,2-36683622,NPS,128,|1|70904|74324|74282|70971|,GRCA-8210,Grand Canyon National Park,74324,Intermountain Region,70971,...,,,,,,,,,,


In [4]:
#List the column names of the raw 2016 frame to decide which ones to keep
data2016.columns

Index(['HistoricalReservationID', 'OrderNumber', 'Agency', 'OrgID',
       'CodeHierarchy', 'RegionCode', 'RegionDescription', 'ParentLocationID',
       'ParentLocation', 'LegacyFacilityID', 'Park', 'SiteType', 'UseType',
       'ProductID', 'EntityType', 'EntityID', 'FacilityID', 'FacilityZIP',
       'FacilityState', 'FacilityLongitude', 'FacilityLatitude', 'CustomerZIP',
       'CustomerState', 'CustomerCountry', 'Tax', 'UseFee', 'TranFee',
       'AttrFee', 'TotalBeforeTax', 'TotalPaid', 'StartDate', 'EndDate',
       'OrderDate', 'NumberOfPeople', 'Tent', 'Popup', 'Trailer',
       'RVMotorhome', 'Boat', 'HorseTrailer', 'Car', 'FifthWheel', 'Van',
       'CanoeKayak', 'BoatTrailer', 'Motorcycle', 'Truck', 'Bus', 'Bicycle',
       'Snowmobile', 'OffRoadlAllTerrainVehicle', 'PowerBoat', 'PickupCamper',
       'LargeTentOver9x12', 'SmallTent', 'Marinaboat'],
      dtype='object')

In [6]:
#Keep only facilities in Oregon, Washington or California
#(the filter accepts both the full state name and the two-letter code)
data2016_WestCoast = data2016.loc[
    data2016["FacilityState"].isin(
        ["Oregon", "OR", "Washington", "WA", "California", "CA"]
    )
]

In [7]:
#For the purposes of the project we are interested only in reservable overnight campsites,
#but the reservation data also includes other types of campground services.
#List the distinct EntityType values to see which one identifies campsites.

data2016_WestCoast["EntityType"].unique()

array(['Site', 'Entrance', 'Tour', 'POS'], dtype=object)

In [8]:
#List the distinct UseType values to see which one identifies overnight stays
data2016_WestCoast["UseType"].unique()

array(['Overnight', 'Day', 'None'], dtype=object)

In [9]:
#Keep only rows that are overnight stays at a site (reservable overnight campsites)
data2016_WestCoast_clean = data2016_WestCoast.loc[
    data2016_WestCoast["UseType"].eq("Overnight")
    & data2016_WestCoast["EntityType"].eq("Site")
]


In [10]:
#Remove the columns that are not needed for the analysis
data2016_WestCoast_clean = data2016_WestCoast_clean.drop(
    labels=[
        #identifiers and category columns
        "HistoricalReservationID", "OrderNumber", "OrgID", "CodeHierarchy",
        "RegionCode", "ParentLocationID", "LegacyFacilityID", "UseType",
        "ProductID", "EntityType", "EntityID",
        #facility coordinates
        "FacilityLongitude", "FacilityLatitude",
        #fee breakdown
        "Tax", "UseFee", "TranFee", "AttrFee", "TotalPaid",
        #equipment columns
        "Tent", "Popup", "Trailer", "RVMotorhome", "Boat", "HorseTrailer",
        "Car", "FifthWheel", "Van", "CanoeKayak", "BoatTrailer", "Motorcycle",
        "Truck", "Bus", "Bicycle", "Snowmobile", "OffRoadlAllTerrainVehicle",
        "PowerBoat", "PickupCamper", "LargeTentOver9x12", "SmallTent",
        "Marinaboat",
    ],
    axis="columns",
)


In [11]:
#Inspect the column dtypes before further manipulation
#(the date columns must be datetime to filter on the camping season)
data2016_WestCoast_clean.dtypes

Agency                object
RegionDescription     object
ParentLocation        object
Park                  object
SiteType              object
FacilityID           float64
FacilityZIP           object
FacilityState         object
CustomerZIP           object
CustomerState         object
CustomerCountry       object
TotalBeforeTax       float64
StartDate             object
EndDate               object
OrderDate             object
NumberOfPeople         int64
dtype: object

In [12]:
#Parse the three date columns as datetimes so the camping season
#(May 1 - September 30) can be selected by date comparison
data2016_WestCoast_clean = data2016_WestCoast_clean.assign(
    StartDate=lambda frame: pd.to_datetime(frame["StartDate"]),
    EndDate=lambda frame: pd.to_datetime(frame["EndDate"]),
    OrderDate=lambda frame: pd.to_datetime(frame["OrderDate"]),
)

In [13]:
#Re-check the dtypes to confirm that StartDate, EndDate and OrderDate were converted to datetime
data2016_WestCoast_clean.dtypes

Agency                       object
RegionDescription            object
ParentLocation               object
Park                         object
SiteType                     object
FacilityID                  float64
FacilityZIP                  object
FacilityState                object
CustomerZIP                  object
CustomerState                object
CustomerCountry              object
TotalBeforeTax              float64
StartDate            datetime64[ns]
EndDate              datetime64[ns]
OrderDate            datetime64[ns]
NumberOfPeople                int64
dtype: object

In [14]:
#Keep reservations that start on or after May 1 and end on or before September 30, 2016,
#then display the result
data2016_WestCoast_clean = data2016_WestCoast_clean.loc[
    data2016_WestCoast_clean["StartDate"].ge("2016-05-01")
    & data2016_WestCoast_clean["EndDate"].le("2016-09-30")
]
data2016_WestCoast_clean

Unnamed: 0,Agency,RegionDescription,ParentLocation,Park,SiteType,FacilityID,FacilityZIP,FacilityState,CustomerZIP,CustomerState,CustomerCountry,TotalBeforeTax,StartDate,EndDate,OrderDate,NumberOfPeople
48,NPS,Joshua Tree National Park,Pacific West Region,SHEEP PASS GROUP,GROUP TENT ONLY AREA NONELECTRIC,232470.0,92277-3597,CA,90027,CA,USA,100.00,2016-09-03,2016-09-05,2015-10-01,20
96,USFS,MAMMOTH RD - FS,INYO NF - FS,PUMICE FLAT GROUP CAMP,GROUP STANDARD NONELECTRIC,231957.0,94301,CA,92301,CA,USA,313.05,2016-06-30,2016-07-03,2015-10-01,30
99,USFS,LOS ANGELES RIVER RD - FS,ANGELES NF - FS,MEADOW GROUP CAMPGROUND,GROUP STANDARD NONELECTRIC,233366.0,,CA,91701,CA,USA,81.00,2016-06-24,2016-06-26,2015-10-01,24
243,USFS,NACHES RD - FS,OKANOGAN - WENATCHEE NF -FS,SALMON COVE GROUP SITE,GROUP STANDARD AREA NONELECTRIC,234498.0,98937,WA,98942,WA,USA,159.00,2016-09-08,2016-09-11,2015-10-01,27
274,USACE,LAKE MENDOCINO,SAN FRANCISCO DIST,BUSHAY RECREATION AREA,GROUP STANDARD NONELECTRIC,233437.0,95482-9404,CA,94565,CA,USA,705.00,2016-09-02,2016-09-05,2015-10-01,40
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2976217,USACE,LAKE KAWEAH,SACRAMENTO DIST.,HORSE CREEK,STANDARD NONELECTRIC,233692.0,93244-4270,CA,93244,CA,USA,10.00,2016-09-23,2016-09-24,2016-09-30,2
2976234,USACE,SUCCESS LAKE,SACRAMENTO DIST.,TULE,STANDARD ELECTRIC,233655.0,,CA,unknown,CA,USA,15.00,2016-09-26,2016-09-27,2016-09-30,2
2976244,USACE,SUCCESS LAKE,SACRAMENTO DIST.,TULE,STANDARD ELECTRIC,233655.0,,CA,unknown,CA,USA,15.00,2016-09-27,2016-09-28,2016-09-30,2
2976246,USACE,LAKE KAWEAH,SACRAMENTO DIST.,HORSE CREEK,STANDARD NONELECTRIC,233692.0,93244-4270,CA,93292,CA,USA,0.00,2016-09-27,2016-09-28,2016-09-30,3


In [15]:
#Load the raw 2017 reservation export and display it
data2017 = pd.read_csv(
    "../../Resources/data/reservations2017.csv",
    encoding="unicode_escape",
)
data2017

Unnamed: 0,HistoricalReservationID,OrderNumber,Agency,OrgID,CodeHierarchy,RegionCode,RegionDescription,ParentLocationID,ParentLocation,LegacyFacilityID,...,Truck,Bus,Bicycle,Snowmobile,OffRoadlAllTerrainVehicle,PowerBoat,PickupCamper,LargeTentOver9x12,SmallTent,Marinaboat
0,2434304548,2-36681755,USFS,131,|1|70903|72601|72630|72684|71879|,F00531,SITKA RD - FS,72630,TONGASS NF - FS,71879,...,,,,,,,,,,
1,2434322404,4-3699000,NPS,128,|1|70904|74268|77805|77815|,INDE-4450,Independence National Historical Park,74268,Northeast Region,77815,...,,,,,,,,,,
2,2434322425,4-3699001,NPS,128,|1|70904|74327|72368|72369|,VALR,World War II Valor in the Pacific,74327,Pacific West Region,72369,...,,,,,,,,,,
3,2434322473,4-3699002,NPS,128,|1|70904|74327|74292|135840|,SEKI-8550,Sequoia and Kings Canyon National Park,74327,Pacific West Region,135840,...,,,,,,,,,,
4,2434322626,2-36683841,NPS,128,|1|70904|74324|74282|70971|,GRCA-8210,Grand Canyon National Park,74324,Intermountain Region,70971,...,,,,,,,,1.0,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3303548,2830803631,4-4180361,NPS,128,|1|70904|74327|72368|72369|,VALR,World War II Valor in the Pacific,74327,Pacific West Region,72369,...,,,,,,,,,,
3303549,2830803653,4-4180362,NPS,128,|1|70904|74327|72368|72369|,VALR,World War II Valor in the Pacific,74327,Pacific West Region,72369,...,,,,,,,,,,
3303550,2830803670,2-39280451,NPS,128,|1|70904|74324|74282|70971|,GRCA-8210,Grand Canyon National Park,74324,Intermountain Region,70971,...,,,,,,,,,,
3303551,2830803705,2-39280452,USACE,130,|1|70902|74306|74358|74590|73251|,CL3004990,LAKE SONOMA,74358,SAN FRANCISCO DIST,73251,...,,,,,,,,,,


In [18]:
#List the column names of the raw 2017 frame to decide which ones to keep
data2017.columns

Index(['HistoricalReservationID', 'OrderNumber', 'Agency', 'OrgID',
       'CodeHierarchy', 'RegionCode', 'RegionDescription', 'ParentLocationID',
       'ParentLocation', 'LegacyFacilityID', 'Park', 'SiteType', 'UseType',
       'ProductID', 'EntityType', 'EntityID', 'FacilityID', 'FacilityZIP',
       'FacilityState', 'FacilityLongitude', 'FacilityLatitude', 'CustomerZIP',
       'CustomerState', 'CustomerCountry', 'Tax', 'UseFee', 'TranFee',
       'AttrFee', 'TotalBeforeTax', 'TotalPaid', 'StartDate', 'EndDate',
       'OrderDate', 'NumberOfPeople', 'Tent', 'Popup', 'Trailer',
       'RVMotorhome', 'Boat', 'HorseTrailer', 'Car', 'FifthWheel', 'Van',
       'CanoeKayak', 'BoatTrailer', 'Motorcycle', 'Truck', 'Bus', 'Bicycle',
       'Snowmobile', 'OffRoadlAllTerrainVehicle', 'PowerBoat', 'PickupCamper',
       'LargeTentOver9x12', 'SmallTent', 'Marinaboat'],
      dtype='object')

In [17]:
#Keep only facilities in Oregon, Washington or California
#(the filter accepts both the full state name and the two-letter code)
data2017_WestCoast = data2017.loc[
    data2017["FacilityState"].isin(
        ["Oregon", "OR", "Washington", "WA", "California", "CA"]
    )
]

In [19]:
#For the purposes of the project we are interested only in reservable overnight campsites,
#but the reservation data also includes other types of campground services.
#List the distinct UseType values to see which one identifies overnight stays.
data2017_WestCoast["UseType"].unique()

array(['Overnight', 'None', 'Day'], dtype=object)

In [20]:
#List the distinct EntityType values to see which one identifies campsites
data2017_WestCoast["EntityType"].unique()

array(['Tour', 'Site', 'POS', 'Entrance'], dtype=object)

In [21]:
#Keep only rows that are overnight stays at a site (reservable overnight campsites)
data2017_WestCoast_clean = data2017_WestCoast.loc[
    data2017_WestCoast["UseType"].eq("Overnight")
    & data2017_WestCoast["EntityType"].eq("Site")
]

In [22]:
#Remove the columns that are not needed for the analysis
data2017_WestCoast_clean = data2017_WestCoast_clean.drop(
    labels=[
        #identifiers and category columns
        "HistoricalReservationID", "OrderNumber", "OrgID", "CodeHierarchy",
        "RegionCode", "ParentLocationID", "LegacyFacilityID", "UseType",
        "ProductID", "EntityType", "EntityID",
        #facility coordinates
        "FacilityLongitude", "FacilityLatitude",
        #fee breakdown
        "Tax", "UseFee", "TranFee", "AttrFee", "TotalPaid",
        #equipment columns
        "Tent", "Popup", "Trailer", "RVMotorhome", "Boat", "HorseTrailer",
        "Car", "FifthWheel", "Van", "CanoeKayak", "BoatTrailer", "Motorcycle",
        "Truck", "Bus", "Bicycle", "Snowmobile", "OffRoadlAllTerrainVehicle",
        "PowerBoat", "PickupCamper", "LargeTentOver9x12", "SmallTent",
        "Marinaboat",
    ],
    axis="columns",
)


In [23]:
#Inspect the column dtypes before further manipulation
#(the date columns must be datetime to filter on the camping season)
data2017_WestCoast_clean.dtypes

Agency                object
RegionDescription     object
ParentLocation        object
Park                  object
SiteType              object
FacilityID           float64
FacilityZIP           object
FacilityState         object
CustomerZIP           object
CustomerState         object
CustomerCountry       object
TotalBeforeTax       float64
StartDate             object
EndDate               object
OrderDate             object
NumberOfPeople         int64
dtype: object

In [24]:
#Parse the three date columns as datetimes so the camping season
#(May 1 - September 30) can be selected by date comparison
data2017_WestCoast_clean = data2017_WestCoast_clean.assign(
    StartDate=lambda frame: pd.to_datetime(frame["StartDate"]),
    EndDate=lambda frame: pd.to_datetime(frame["EndDate"]),
    OrderDate=lambda frame: pd.to_datetime(frame["OrderDate"]),
)

In [25]:
#Re-check the dtypes to confirm that StartDate, EndDate and OrderDate were converted to datetime
data2017_WestCoast_clean.dtypes

Agency                       object
RegionDescription            object
ParentLocation               object
Park                         object
SiteType                     object
FacilityID                  float64
FacilityZIP                  object
FacilityState                object
CustomerZIP                  object
CustomerState                object
CustomerCountry              object
TotalBeforeTax              float64
StartDate            datetime64[ns]
EndDate              datetime64[ns]
OrderDate            datetime64[ns]
NumberOfPeople                int64
dtype: object

In [27]:
#Keep reservations that start on or after May 1 and end on or before September 30, 2017,
#then display the result
data2017_WestCoast_clean = data2017_WestCoast_clean.loc[
    data2017_WestCoast_clean["StartDate"].ge("2017-05-01")
    & data2017_WestCoast_clean["EndDate"].le("2017-09-30")
]
data2017_WestCoast_clean

Unnamed: 0,Agency,RegionDescription,ParentLocation,Park,SiteType,FacilityID,FacilityZIP,FacilityState,CustomerZIP,CustomerState,CustomerCountry,TotalBeforeTax,StartDate,EndDate,OrderDate,NumberOfPeople
55,NPS,Olympic National Park,Pacific West Region,SOL DUC HOT SPRINGS RESORT CAMPGROUND,STANDARD NONELECTRIC,251906.0,,WA,97202,OR,USA,69.00,2017-07-01,2017-07-04,2016-10-01,8
109,USFS,MONTEREY RD - FS,LOS PADRES NF -FS,ARROYO SECO,GROUP STANDARD NONELECTRIC,231958.0,,CA,93907,CA,USA,159.00,2017-07-14,2017-07-16,2016-10-01,20
234,USFS,MT ADAMS RD - FS,GIFFORD PINCHOT NF - FS,Beaver Campground,GROUP STANDARD NONELECTRIC,232864.0,,WA,98606,WA,USA,19.00,2017-08-03,2017-08-06,2016-10-01,40
286,NPS,Joshua Tree National Park,Pacific West Region,SHEEP PASS GROUP,GROUP TENT ONLY AREA NONELECTRIC,232470.0,92277-3597,CA,92694,CA,USA,60.00,2017-09-01,2017-09-04,2016-10-01,8
764,NPS,Joshua Tree National Park,Pacific West Region,INDIAN COVE CAMPGROUND,GROUP TENT ONLY AREA NONELECTRIC,232472.0,92277-3597,CA,90065,CA,USA,100.00,2017-09-22,2017-09-24,2016-10-01,20
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3299676,USFS,HIGH SIERRA RD -FS,SIERRA NF - FS,DINKEY CREEK,TENT ONLY NONELECTRIC,232136.0,94301,CA,93727,CA,USA,31.50,2017-09-29,2017-09-30,2017-09-30,5
3300287,USACE,HENSLEY LAKE,SACRAMENTO DIST.,HIDDEN VIEW,STANDARD NONELECTRIC,233509.0,,CA,93635,CA,USA,20.00,2017-09-29,2017-09-30,2017-09-30,8
3300326,USACE,HENSLEY LAKE,SACRAMENTO DIST.,HIDDEN VIEW,STANDARD ELECTRIC,233509.0,,CA,95348,CA,USA,15.00,2017-09-29,2017-09-30,2017-09-30,1
3300335,USACE,HENSLEY LAKE,SACRAMENTO DIST.,HIDDEN VIEW,STANDARD NONELECTRIC,233509.0,,CA,93653,CA,USA,20.00,2017-09-29,2017-09-30,2017-09-30,8


In [28]:
#Load the raw 2018 reservation export and display it.
#low_memory=False makes pandas infer each column's dtype from the whole file
#instead of chunk by chunk; the chunked default appears to trigger a
#mixed-type DtypeWarning on this file. The trade-off is higher memory use
#while parsing.
data2018 = pd.read_csv(
    "../../Resources/data/reservations2018.csv",
    encoding="unicode_escape",
    low_memory=False,
)
data2018

  interactivity=interactivity, compiler=compiler, result=result)


Unnamed: 0,HistoricalReservationID,OrderNumber,Agency,OrgID,CodeHierarchy,RegionCode,RegionDescription,ParentLocationID,ParentLocation,LegacyFacilityID,...,Bus,Bicycle,Snowmobile,OffRoadlAllTerrainVehicle,PowerBoat,PickupCamper,LargeTentOver9x12,SmallTent,Marinaboat,LatLongPoint
0,2976269875,4-4358197,NPS,128.0,|1|70904|74265|70710|70711|,KLGO-9825,Klondike Gold Rush National Historical Park,74265,Alaska Region,70711,...,,,,,,,,,,<e6100000 010cabaa aaaaaaba 4d40610b b6600bea ...
1,2976269875,4-4358197,NPS,128.0,|1|70904|74265|70710|70711|,KLGO-9825,Klondike Gold Rush National Historical Park,74265,Alaska Region,70711,...,,,,,,,,,,<e6100000 010cabaa aaaaaaba 4d40610b b6600bea ...
2,2976269875,4-4358197,NPS,128.0,|1|70904|74265|70710|70711|,KLGO-9825,Klondike Gold Rush National Historical Park,74265,Alaska Region,70711,...,,,,,,,,,,<e6100000 010cabaa aaaaaaba 4d40610b b6600bea ...
3,2976371845,4-4358345,NPS,128.0,|1|70904|74265|70710|70711|,KLGO-9825,Klondike Gold Rush National Historical Park,74265,Alaska Region,70711,...,,,,,,,,,,<e6100000 010cabaa aaaaaaba 4d40610b b6600bea ...
4,2976358486,4-4358374,NPS,128.0,|1|70904|74265|70710|70711|,KLGO-9825,Klondike Gold Rush National Historical Park,74265,Alaska Region,70711,...,,,,,,,,,,<e6100000 010cabaa aaaaaaba 4d40610b b6600bea ...
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3299800,3221486652,6-3833254,NPS,128.0,|1|70904|74322|74995|74996|,APIS-6140,Apostle Islands National Lakeshore,74322,Midwest Region,74996,...,,,,,,,,,,<e6100000 010c8888 88888878 47403a6d a0d306be ...
3299801,3221486652,6-3833254,NPS,128.0,|1|70904|74322|74995|74996|,APIS-6140,Apostle Islands National Lakeshore,74322,Midwest Region,74996,...,,,,,,,,,,<e6100000 010c8888 88888878 47403a6d a0d306be ...
3299802,3221486652,6-3833254,NPS,128.0,|1|70904|74322|74995|74996|,APIS-6140,Apostle Islands National Lakeshore,74322,Midwest Region,74996,...,,,,,,,,,,<e6100000 010c8888 88888878 47403a6d a0d306be ...
3299803,3221486652,6-3833254,NPS,128.0,|1|70904|74322|74995|74996|,APIS-6140,Apostle Islands National Lakeshore,74322,Midwest Region,74996,...,,,,,,,,,,<e6100000 010c8888 88888878 47403a6d a0d306be ...


In [29]:
#List the column names of the raw 2018 frame to decide which ones to keep
data2018.columns

Index(['HistoricalReservationID', 'OrderNumber', 'Agency', 'OrgID',
       'CodeHierarchy', 'RegionCode', 'RegionDescription', 'ParentLocationID',
       'ParentLocation', 'LegacyFacilityID', 'Park', 'SiteType', 'UseType',
       'ProductID', 'EntityType', 'EntityID', 'FacilityID', 'FacilityZIP',
       'FacilityState', 'FacilityLongitude', 'FacilityLatitude', 'CustomerZIP',
       'CustomerState', 'CustomerCountry', 'Tax', 'UseFee', 'TranFee',
       'AttrFee', 'TotalBeforeTax', 'TotalPaid', 'StartDate', 'EndDate',
       'OrderDate', 'NumberOfPeople', 'Tent', 'Popup', 'Trailer',
       'RVMotorhome', 'Boat', 'HorseTrailer', 'Car', 'FifthWheel', 'Van',
       'CanoeKayak', 'BoatTrailer', 'Motorcycle', 'Truck', 'Bus', 'Bicycle',
       'Snowmobile', 'OffRoadlAllTerrainVehicle', 'PowerBoat', 'PickupCamper',
       'LargeTentOver9x12', 'SmallTent', 'Marinaboat', 'LatLongPoint'],
      dtype='object')

In [30]:
#Keep only facilities in Oregon, Washington or California
#(the filter accepts both the full state name and the two-letter code)
data2018_WestCoast = data2018.loc[
    data2018["FacilityState"].isin(
        ["Oregon", "OR", "Washington", "WA", "California", "CA"]
    )
]

In [31]:
#For the purposes of the project we are interested only in reservable overnight campsites,
#but the reservation data also includes other types of campground services.
#List the distinct UseType values to see which ones identify overnight stays.
data2018_WestCoast["UseType"].unique()

array(['Overnight', 'Day', nan, 'OverNight'], dtype=object)

In [32]:
#List the distinct EntityType values to see which one identifies campsites
data2018_WestCoast["EntityType"].unique()

array(['Site', 'ERR', 'Tour'], dtype=object)

In [33]:
#Keep only rows that are overnight stays at a site (reservable overnight campsites).
#Both spellings of the overnight label ("Overnight" and "OverNight") are accepted.
data2018_WestCoast_clean = data2018_WestCoast.loc[
    data2018_WestCoast["UseType"].isin(["Overnight", "OverNight"])
    & data2018_WestCoast["EntityType"].eq("Site")
]


In [34]:
#Remove the columns that are not needed for the analysis
data2018_WestCoast_clean = data2018_WestCoast_clean.drop(
    labels=[
        #identifiers and category columns
        "HistoricalReservationID", "OrderNumber", "OrgID", "CodeHierarchy",
        "RegionCode", "ParentLocationID", "LegacyFacilityID", "UseType",
        "ProductID", "EntityType", "EntityID",
        #facility coordinates
        "FacilityLongitude", "FacilityLatitude",
        #fee breakdown
        "Tax", "UseFee", "TranFee", "AttrFee", "TotalPaid",
        #equipment columns
        "Tent", "Popup", "Trailer", "RVMotorhome", "Boat", "HorseTrailer",
        "Car", "FifthWheel", "Van", "CanoeKayak", "BoatTrailer", "Motorcycle",
        "Truck", "Bus", "Bicycle", "Snowmobile", "OffRoadlAllTerrainVehicle",
        "PowerBoat", "PickupCamper", "LargeTentOver9x12", "SmallTent",
        "Marinaboat",
        #extra column present only in the 2018 export
        "LatLongPoint",
    ],
    axis="columns",
)


In [35]:
#Inspect the column dtypes before further manipulation
#(the date columns must be datetime to filter on the camping season)
data2018_WestCoast_clean.dtypes

Agency                object
RegionDescription     object
ParentLocation        object
Park                  object
SiteType              object
FacilityID           float64
FacilityZIP           object
FacilityState         object
CustomerZIP           object
CustomerState         object
CustomerCountry       object
TotalBeforeTax       float64
StartDate             object
EndDate               object
OrderDate             object
NumberOfPeople       float64
dtype: object

In [36]:
#Parse the three date columns as datetimes so the camping season
#(May 1 - September 30) can be selected by date comparison
data2018_WestCoast_clean = data2018_WestCoast_clean.assign(
    StartDate=lambda frame: pd.to_datetime(frame["StartDate"]),
    EndDate=lambda frame: pd.to_datetime(frame["EndDate"]),
    OrderDate=lambda frame: pd.to_datetime(frame["OrderDate"]),
)

In [39]:
#Re-check the dtypes to confirm that StartDate, EndDate and OrderDate were converted to datetime
data2018_WestCoast_clean.dtypes

Agency                       object
RegionDescription            object
ParentLocation               object
Park                         object
SiteType                     object
FacilityID                  float64
FacilityZIP                  object
FacilityState                object
CustomerZIP                  object
CustomerState                object
CustomerCountry              object
TotalBeforeTax              float64
StartDate            datetime64[ns]
EndDate              datetime64[ns]
OrderDate            datetime64[ns]
NumberOfPeople              float64
dtype: object

In [40]:
#Keep reservations that start on or after May 1 and end on or before September 30, 2018,
#then display the result
data2018_WestCoast_clean = data2018_WestCoast_clean.loc[
    data2018_WestCoast_clean["StartDate"].ge("2018-05-01")
    & data2018_WestCoast_clean["EndDate"].le("2018-09-30")
]
data2018_WestCoast_clean

Unnamed: 0,Agency,RegionDescription,ParentLocation,Park,SiteType,FacilityID,FacilityZIP,FacilityState,CustomerZIP,CustomerState,CustomerCountry,TotalBeforeTax,StartDate,EndDate,OrderDate,NumberOfPeople
3200,USFS,GEORGETOWN RD -FS,ELDORADO NF - FS,Middle Meadows --- FPIN151,GROUP STANDARD NONELECTRIC,231953.0,95634,CA,89521,NV,USA,135.0,2018-07-04,2018-07-09,2017-10-02,50.0
3201,USFS,GEORGETOWN RD -FS,ELDORADO NF - FS,Middle Meadows --- FPIN151,GROUP STANDARD NONELECTRIC,231953.0,95634,CA,95616,CA,USA,20.0,2018-05-11,2018-05-13,2017-11-11,50.0
3202,USFS,GEORGETOWN RD -FS,ELDORADO NF - FS,Middle Meadows --- FPIN151,GROUP STANDARD NONELECTRIC,231953.0,95634,CA,95823,CA,USA,20.0,2018-06-22,2018-06-24,2017-11-15,50.0
3203,USFS,GEORGETOWN RD -FS,ELDORADO NF - FS,Middle Meadows --- FPIN151,GROUP STANDARD NONELECTRIC,231953.0,95634,CA,93245,CA,USA,185.0,2018-06-24,2018-07-01,2017-11-24,50.0
3204,USFS,GEORGETOWN RD -FS,ELDORADO NF - FS,Middle Meadows --- FPIN151,GROUP STANDARD NONELECTRIC,231953.0,95634,CA,95660-4137,CA,USA,85.0,2018-06-15,2018-06-18,2017-12-13,50.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3299469,USFS,HOOD CANAL RD - FS,OLYMPIC NF - FS,Coho Campground --- FPIN2427,YURT,233384.0,98376,WA,98166,WA,USA,80.0,2018-08-09,2018-08-10,2018-08-04,4.0
3299470,USFS,HOOD CANAL RD - FS,OLYMPIC NF - FS,Coho Campground --- FPIN2427,YURT,233384.0,98376,WA,98509,WA,USA,80.0,2018-08-15,2018-08-16,2018-08-09,2.0
3299471,USFS,HOOD CANAL RD - FS,OLYMPIC NF - FS,Coho Campground --- FPIN2427,YURT,233384.0,98376,WA,59602,MT,USA,80.0,2018-08-19,2018-08-20,2018-08-12,6.0
3299472,USFS,HOOD CANAL RD - FS,OLYMPIC NF - FS,Coho Campground --- FPIN2427,YURT,233384.0,98376,WA,98109,WA,USA,80.0,2018-09-02,2018-09-03,2018-08-17,2.0


In [41]:
#Load the raw 2019 reservation export and display it.
#low_memory=False makes pandas infer each column's dtype from the whole file
#instead of chunk by chunk; the chunked default appears to trigger a
#mixed-type DtypeWarning on this file. The trade-off is higher memory use
#while parsing.
data2019 = pd.read_csv(
    "../../Resources/data/reservations2019.csv",
    encoding="unicode_escape",
    low_memory=False,
)
data2019

  interactivity=interactivity, compiler=compiler, result=result)


Unnamed: 0,historicalreservationid,ordernumber,agency,orgid,codehierarchy,regioncode,regiondescription,parentlocationid,parentlocation,legacyfacilityid,...,attrfee,totalbeforetax,discount,totalpaid,startdate,enddate,orderdate,numberofpeople,equipmentdescription,equipmentlength
0,9c4a5398-4b50-4aa6-92fe-9a32699e49f9,0100084620-1,BLM,126.0,|1|70901|72193|72194|146090,AK,Alaska (BLM),72195,White Mountains National Recreation Area,146090.0,...,,33.0,0.0,33.0,2019-01-26 00:00:00,2019-01-27 00:00:00,2018-12-27 20:54:55.233,4.0,,0.0
1,4018a5bb-7e8a-49a1-bea2-f86be53b16e0,0100162496-1,BLM,126.0,|1|70901|72193|72194|146090,AK,Alaska (BLM),72195,White Mountains National Recreation Area,146090.0,...,,18.0,0.0,18.0,2019-03-26 00:00:00,2019-03-27 00:00:00,2019-02-24 15:00:45.718,1.0,,0.0
2,6458d681-584b-4e2b-b3f9-f398fa28f9eb,0100328335-1,BLM,126.0,|1|70901|72193|72194|146090,AK,Alaska (BLM),72195,White Mountains National Recreation Area,146090.0,...,,33.0,0.0,33.0,2019-08-26 00:00:00,2019-08-27 00:00:00,2019-08-26 17:06:23.052,2.0,,0.0
3,c4b1f737-44b8-46ca-ada4-523fe74a199c,0100404611-1,BLM,126.0,|1|70901|72193|72194|146090,AK,Alaska (BLM),72195,White Mountains National Recreation Area,146090.0,...,,58.0,0.0,58.0,2018-11-23 00:00:00,2018-11-25 00:00:00,2018-10-23 00:23:58.275,5.0,,0.0
4,e4f54fd0-2739-44a1-b807-bba4e3584e4a,0100444692-1,BLM,126.0,|1|70901|72193|72194|146090,AK,Alaska (BLM),72195,White Mountains National Recreation Area,146090.0,...,,33.0,0.0,33.0,2019-08-28 00:00:00,2019-08-29 00:00:00,2019-08-15 18:33:22.488,2.0,,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3479638,4-4609121-1,4-4609121-1,,,,,,,,,...,,6.0,0.0,6.0,2018-11-02 00:00:00,,2019-10-01 00:00:00,6.0,,
3479639,4-4618681-1,4-4618681-1,,,,,,,,,...,,4.0,0.0,4.0,2018-11-04 00:00:00,,2019-10-01 00:00:00,4.0,,
3479640,4-4626415-1,4-4626415-1,,,,,,,,,...,,4.0,0.0,4.0,2018-11-20 00:00:00,,2019-10-01 00:00:00,4.0,,
3479641,4-4628875-1,4-4628875-1,,,,,,,,,...,,47.0,0.0,47.0,2018-12-08 00:00:00,,2019-10-01 00:00:00,47.0,,


In [42]:
#List the column names of the raw 2019 frame to decide which ones to keep
#(this export uses lowercase column names)
data2019.columns

Index(['historicalreservationid', 'ordernumber', 'agency', 'orgid',
       'codehierarchy', 'regioncode', 'regiondescription', 'parentlocationid',
       'parentlocation', 'legacyfacilityid', 'park', 'sitetype', 'usetype',
       'productid', 'inventorytype', 'facilityid', 'facilityzip',
       'facilitystate', 'facilitylongitude', 'facilitylatitude', 'customerzip',
       'customerstate', 'customercountry', 'tax', 'usefee', 'tranfee',
       'attrfee', 'totalbeforetax', 'discount', 'totalpaid', 'startdate',
       'enddate', 'orderdate', 'numberofpeople', 'equipmentdescription',
       'equipmentlength'],
      dtype='object')

In [43]:
#Keep only facilities in Oregon, Washington or California
#(the filter accepts both the full state name and the two-letter code)
data2019_WestCoast = data2019.loc[
    data2019["facilitystate"].isin(
        ["Oregon", "OR", "Washington", "WA", "California", "CA"]
    )
]

In [44]:
#For the purposes of the project we are interested only in reservable overnight campsites,
#but the reservation data also includes other types of campground services.
#List the distinct usetype values to see which one identifies overnight stays.
data2019_WestCoast["usetype"].unique()

array([nan, 'Overnight', 'Day'], dtype=object)

In [45]:
#List the distinct inventorytype values to see which ones identify camping reservations
data2019_WestCoast["inventorytype"].unique()

array(['TICKET', 'VEHICLE_PERMIT', 'PERMIT', 'CAMPING', 'LOTTERY_PERMIT',
       'LOTTERY_CAMPING'], dtype=object)

In [46]:
#Choosing only reservable overnight campsites.
#Every mask is built from data2019_WestCoast (not the unfiltered data2019), so
#the boolean indexer has exactly the same index as the frame being filtered
#and does not rely on implicit index alignment.
#Accepted values: usetype "Overnight" or "Multi"; inventorytype "CAMPING" or "LOTTERY_CAMPING".
data2019_WestCoast_clean = data2019_WestCoast.loc[
    data2019_WestCoast["usetype"].isin(["Overnight", "Multi"])
    & data2019_WestCoast["inventorytype"].isin(["CAMPING", "LOTTERY_CAMPING"])
]


In [47]:
#Remove the columns that are not needed for the analysis
data2019_WestCoast_clean = data2019_WestCoast_clean.drop(
    labels=[
        #identifiers and category columns
        "historicalreservationid", "ordernumber", "orgid", "codehierarchy",
        "regioncode", "parentlocationid", "legacyfacilityid", "usetype",
        "productid", "inventorytype",
        #facility coordinates
        "facilitylongitude", "facilitylatitude",
        #fee breakdown
        "tax", "usefee", "tranfee", "attrfee", "discount", "totalpaid",
        #equipment columns
        "equipmentdescription", "equipmentlength",
    ],
    axis="columns",
)



In [48]:
#Inspect the column dtypes before further manipulation
#(the date columns must be datetime to filter on the camping season)
data2019_WestCoast_clean.dtypes

agency                object
regiondescription     object
parentlocation        object
park                  object
sitetype              object
facilityid             int64
facilityzip          float64
facilitystate         object
customerzip           object
customerstate         object
customercountry       object
totalbeforetax       float64
startdate             object
enddate               object
orderdate             object
numberofpeople       float64
dtype: object

In [49]:
#Parse the three date columns as datetimes so the camping season
#(May 1 - September 30) can be selected by date comparison
data2019_WestCoast_clean = data2019_WestCoast_clean.assign(
    startdate=lambda frame: pd.to_datetime(frame["startdate"]),
    enddate=lambda frame: pd.to_datetime(frame["enddate"]),
    orderdate=lambda frame: pd.to_datetime(frame["orderdate"]),
)

In [50]:
#Re-check the dtypes to confirm that startdate, enddate and orderdate were converted to datetime
data2019_WestCoast_clean.dtypes

agency                       object
regiondescription            object
parentlocation               object
park                         object
sitetype                     object
facilityid                    int64
facilityzip                 float64
facilitystate                object
customerzip                  object
customerstate                object
customercountry              object
totalbeforetax              float64
startdate            datetime64[ns]
enddate              datetime64[ns]
orderdate            datetime64[ns]
numberofpeople              float64
dtype: object

In [51]:
#Keeping only 2019 camping season stays: the stay starts on or after May 1 and ends on or before September 30
starts_in_season_2019 = data2019_WestCoast_clean["startdate"] >= "2019-05-01"
ends_in_season_2019 = data2019_WestCoast_clean["enddate"] <= "2019-09-30"
data2019_WestCoast_clean = data2019_WestCoast_clean.loc[starts_in_season_2019 & ends_in_season_2019]
data2019_WestCoast_clean

Unnamed: 0,agency,regiondescription,parentlocation,park,sitetype,facilityid,facilityzip,facilitystate,customerzip,customerstate,customercountry,totalbeforetax,startdate,enddate,orderdate,numberofpeople
14540,BLM,Oregon (BLM),North Umpqua Wild and Scenic River,Eagleview Group Campground (Reservation),GROUP PICNIC AREA,233153,97462.0,Oregon,,,,0.0,2019-05-31,2019-06-02,2019-01-02 02:34:22.705,75.0
14541,BLM,Oregon (BLM),North Umpqua Wild and Scenic River,Eagleview Group Campground (Reservation),GROUP PICNIC AREA,233153,97462.0,Oregon,97321,OR,USA,153.0,2019-07-28,2019-07-29,2019-01-26 19:44:15.325,100.0
14542,BLM,Oregon (BLM),North Umpqua Wild and Scenic River,Eagleview Group Campground (Reservation),GROUP PICNIC AREA,233153,97462.0,Oregon,,,,8.0,2019-09-13,2019-09-16,2018-10-31 19:47:28.666,100.0
14543,BLM,Oregon (BLM),North Umpqua Wild and Scenic River,Eagleview Group Campground (Reservation),GROUP PICNIC AREA,233153,97462.0,Oregon,,,,598.0,2019-09-02,2019-09-24,2019-02-21 05:51:32.858,50.0
14544,BLM,Oregon (BLM),North Umpqua Wild and Scenic River,Eagleview Group Campground (Reservation),GROUP PICNIC AREA,233153,97462.0,Oregon,97210,OR,USA,298.0,2019-08-04,2019-08-06,2019-02-26 01:06:30.684,20.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3479460,USFS,,,HAYSTACK CAMPGROUND (EAST SHORE),STANDARD NONELECTRIC,234779,97734.0,Oregon,97471,,,53.0,2019-07-25,2019-07-28,2019-04-26 02:36:20.224,6.0
3479461,USFS,,,HAYSTACK CAMPGROUND (EAST SHORE),STANDARD NONELECTRIC,234779,97734.0,Oregon,97471,,,53.0,2019-07-25,2019-07-28,2019-04-26 02:36:20.224,6.0
3479462,USFS,,,HAYSTACK CAMPGROUND (EAST SHORE),STANDARD NONELECTRIC,234779,97734.0,Oregon,,,,38.0,2019-07-12,2019-07-14,2019-05-13 04:25:42.686,3.0
3479463,USFS,,,HAYSTACK CAMPGROUND (EAST SHORE),STANDARD NONELECTRIC,234779,97734.0,Oregon,98446,WA,USA,23.0,2019-08-30,2019-08-31,2019-04-10 02:28:52.698,3.0


In [52]:
#Reading the data for 2020
#low_memory=False makes pandas infer each column's dtype from the whole file instead of chunk by chunk,
#which avoids the mixed-type DtypeWarning and columns that end up holding a mix of numbers and strings
data2020 = pd.read_csv("../../Resources/data/reservations2020.csv", encoding= 'unicode_escape', low_memory=False)
data2020

  interactivity=interactivity, compiler=compiler, result=result)


Unnamed: 0,historicalreservationid,ordernumber,agency,orgid,codehierarchy,regioncode,regiondescription,parentlocationid,parentlocation,legacyfacilityid,...,totalbeforetax,discount,totalpaid,startdate,enddate,orderdate,nights,numberofpeople,equipmentdescription,equipmentlength
0,fa50401c-f08a-4738-b576-56335cc19cb7,0121072064-1,BLM,126,|1|70901|72193|72194|146090,AK,Alaska (BLM),72195,White Mountains National Recreation Area,146090.0,...,33.0,0.0,33.0,2019-10-17 00:00:00,2019-10-18 00:00:00,2019-09-18 16:25:42.28,1 day,6.0,,0.0
1,09c37303-cf15-49d9-9b0c-ccc120328bbb,0200063847-1,BLM,126,|1|70901|72193|72194|146090,AK,Alaska (BLM),72195,White Mountains National Recreation Area,146090.0,...,33.0,0.0,33.0,2020-04-11 00:00:00,2020-04-12 00:00:00,2020-03-13 16:35:11.612,1 day,1.0,,0.0
2,f1f5c841-46b1-4ff8-a6dc-fcac2e76ae1c,0200087454-1,BLM,126,|1|70901|72193|72194|146090,AK,Alaska (BLM),72195,White Mountains National Recreation Area,146090.0,...,83.0,0.0,83.0,2020-09-07 00:00:00,2020-09-10 00:00:00,2020-08-17 05:19:08.159,3 days,2.0,,0.0
3,619f4394-1cac-4a64-8f0c-eae6e7f6bf3b,0200102788-1,BLM,126,|1|70901|72193|72194|146090,AK,Alaska (BLM),72195,White Mountains National Recreation Area,146090.0,...,33.0,0.0,33.0,2020-03-21 00:00:00,2020-03-22 00:00:00,2020-02-20 15:01:33.904,1 day,3.0,,0.0
4,82674243-7f31-41e6-b3db-d0690513cad3,0200147542-1,BLM,126,|1|70901|72193|72194|146090,AK,Alaska (BLM),72195,White Mountains National Recreation Area,146090.0,...,0.0,0.0,0.0,2019-12-07 00:00:00,2019-12-08 00:00:00,2019-11-07 17:54:01.448,1 day,2.0,,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5114784,3dc6db19-e935-11ea-b093-0a4663ab7691,0299936603-1,USFS,131,|1|70903|300017,,,14487,El Yunque National Forest,,...,4.0,0.0,4.0,2020-09-05 00:00:00,2020-09-05 00:00:00,2020-08-28 13:49:44.115,00:00:00,2.0,,
5114785,31aa3a26-bf9f-11ea-9be3-ae918ba7a17b,0299948467-1,USFS,131,|1|70903|300017,,,14487,El Yunque National Forest,,...,2.0,0.0,2.0,2020-07-17 00:00:00,2020-07-17 00:00:00,2020-07-06 15:43:44.14,00:00:00,1.0,,
5114786,abdea1e5-bfd3-11ea-b504-127b1cc19b77,0299955580-1,USFS,131,|1|70903|300017,,,14487,El Yunque National Forest,,...,2.0,0.0,2.0,2020-07-12 00:00:00,2020-07-12 00:00:00,2020-07-06 22:00:34.837,00:00:00,1.0,,
5114787,8a06cee8-cd58-11ea-a075-5eeb99748ba8,0299963410-1,USFS,131,|1|70903|300017,,,14487,El Yunque National Forest,,...,2.0,0.0,2.0,2020-07-30 00:00:00,2020-07-30 00:00:00,2020-07-24 02:52:17.583,00:00:00,0.0,,


In [53]:
#Checking the column names available in the 2020 file
data2020.columns

Index(['historicalreservationid', 'ordernumber', 'agency', 'orgid',
       'codehierarchy', 'regioncode', 'regiondescription', 'parentlocationid',
       'parentlocation', 'legacyfacilityid', 'park', 'sitetype', 'usetype',
       'productid', 'inventorytype', 'facilityid', 'facilityzip',
       'facilitystate', 'facilitylongitude', 'facilitylatitude', 'customerzip',
       'customerstate', 'customercountry', 'tax', 'usefee', 'tranfee',
       'attrfee', 'totalbeforetax', 'discount', 'totalpaid', 'startdate',
       'enddate', 'orderdate', 'nights', 'numberofpeople',
       'equipmentdescription', 'equipmentlength'],
      dtype='object')

In [54]:
#Choosing only West Coast states data, accepting both the full state name and its two-letter code
west_coast_states = ["Oregon", "OR", "Washington", "WA", "California", "CA"]
data2020_WestCoast = data2020.loc[data2020["facilitystate"].isin(west_coast_states)]

In [57]:
#For the purposes of the project we are interested only in reservable overnight campsites, but the reservation data
#also includes other types of campground services, so we inspect the distinct values of usetype
data2020_WestCoast["usetype"].unique()

array([nan, 'Overnight', 'Day'], dtype=object)

In [58]:
#Listing the distinct inventory types to find the one that identifies campsite reservations
data2020_WestCoast["inventorytype"].unique()

array(['TICKET', 'VEHICLE_PERMIT', 'PERMIT', 'CAMPING', 'LOTTERY_PERMIT'],
      dtype=object)

In [59]:
#Keeping only reservable overnight campsites: usetype must be "Overnight" and inventorytype must be "CAMPING"
is_overnight = data2020_WestCoast["usetype"] == "Overnight"
is_camping = data2020_WestCoast["inventorytype"] == "CAMPING"
data2020_WestCoast_clean = data2020_WestCoast.loc[is_overnight & is_camping]
                                                 


In [60]:
#Removing the columns that are not needed for the combined dataset
data2020_WestCoast_clean = data2020_WestCoast_clean.drop(
    columns=[
        #reservation, organisation and location identifiers
        'historicalreservationid', 'ordernumber', 'orgid', 'codehierarchy',
        'regioncode', 'parentlocationid', 'legacyfacilityid',
        #product classification (already used for filtering)
        'usetype', 'productid', 'inventorytype',
        #facility coordinates
        'facilitylongitude', 'facilitylatitude',
        #fee and payment breakdown (totalbeforetax is kept)
        'tax', 'usefee', 'tranfee', 'attrfee', 'discount', 'totalpaid',
        #stay length
        'nights',
        #equipment details
        'equipmentdescription', 'equipmentlength',
    ]
)


In [61]:
#Checking datatypes before further manipulation; startdate, enddate and orderdate still need converting to datetime
data2020_WestCoast_clean.dtypes

agency                object
regiondescription     object
parentlocation        object
park                  object
sitetype              object
facilityid            object
facilityzip          float64
facilitystate         object
customerzip           object
customerstate         object
customercountry       object
totalbeforetax       float64
startdate             object
enddate               object
orderdate             object
numberofpeople       float64
dtype: object

In [62]:
#Parsing the three date columns into datetimes so that the camping season (May 1 - September 30) can be selected
for date_column in ("startdate", "enddate", "orderdate"):
    data2020_WestCoast_clean[date_column] = pd.to_datetime(data2020_WestCoast_clean[date_column])

In [63]:
#Confirming the conversion worked: startdate, enddate and orderdate should now be reported as datetime64[ns]
data2020_WestCoast_clean.dtypes

agency                       object
regiondescription            object
parentlocation               object
park                         object
sitetype                     object
facilityid                   object
facilityzip                 float64
facilitystate                object
customerzip                  object
customerstate                object
customercountry              object
totalbeforetax              float64
startdate            datetime64[ns]
enddate              datetime64[ns]
orderdate            datetime64[ns]
numberofpeople              float64
dtype: object

In [65]:
#Keeping only 2020 camping season stays: the stay starts on or after May 1 and ends on or before September 30
starts_in_season_2020 = data2020_WestCoast_clean["startdate"] >= "2020-05-01"
ends_in_season_2020 = data2020_WestCoast_clean["enddate"] <= "2020-09-30"
data2020_WestCoast_clean = data2020_WestCoast_clean.loc[starts_in_season_2020 & ends_in_season_2020]
data2020_WestCoast_clean

Unnamed: 0,agency,regiondescription,parentlocation,park,sitetype,facilityid,facilityzip,facilitystate,customerzip,customerstate,customercountry,totalbeforetax,startdate,enddate,orderdate,numberofpeople
22636,BLM,Oregon (BLM),North Umpqua Wild and Scenic River,Eagleview Group Campground (Reservation),GROUP PICNIC AREA,233153,97462.0,Oregon,,,,0.0,2020-07-23,2020-07-29,2019-07-23 14:01:57.903,15.0
22637,BLM,Oregon (BLM),North Umpqua Wild and Scenic River,Eagleview Group Campground (Reservation),GROUP PICNIC AREA,233153,97462.0,Oregon,97477,OR,USA,0.0,2020-07-19,2020-07-23,2019-07-20 02:08:30.961,22.0
22638,BLM,Oregon (BLM),North Umpqua Wild and Scenic River,Eagleview Group Campground (Reservation),GROUP PICNIC AREA,233153,97462.0,Oregon,97420,OR,USA,0.0,2020-08-09,2020-08-17,2019-08-10 00:16:02.951,100.0
22639,BLM,Oregon (BLM),North Umpqua Wild and Scenic River,Eagleview Group Campground (Reservation),GROUP PICNIC AREA,233153,97462.0,Oregon,,,,0.0,2020-08-01,2020-08-06,2019-08-27 19:39:13.162,30.0
22640,BLM,Oregon (BLM),North Umpqua Wild and Scenic River,Eagleview Group Campground (Reservation),GROUP PICNIC AREA,233153,97462.0,Oregon,,,,18.0,2020-08-20,2020-08-24,2019-08-21 06:02:41.910,100.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
4712272,USFS,Pacific Northwest,Okanogan-Wenatchee National Forest,Lake Creek Campground - Entiat River,STANDARD NONELECTRIC,273975,98822.0,Washington,98117,WA,USA,28.0,2020-08-14,2020-08-16,2020-08-10 18:14:43.334,2.0
4712273,USFS,Pacific Northwest,Okanogan-Wenatchee National Forest,Lake Creek Campground - Entiat River,STANDARD NONELECTRIC,273975,98822.0,Washington,,,,18.0,2020-07-02,2020-07-03,2020-06-30 06:08:40.328,1.0
4712274,USFS,Pacific Northwest,Okanogan-Wenatchee National Forest,Lake Creek Campground - Entiat River,STANDARD NONELECTRIC,273975,98822.0,Washington,98801,WA,USA,108.0,2020-07-07,2020-07-17,2020-07-02 16:31:16.374,2.0
4712275,USFS,Pacific Northwest,Okanogan-Wenatchee National Forest,Lake Creek Campground - Entiat River,STANDARD NONELECTRIC,273975,98822.0,Washington,98006,WA,USA,38.0,2020-08-06,2020-08-09,2020-07-20 23:16:45.644,8.0


In [66]:
#Stacking the 2016, 2017 and 2018 frames first; the combined frame's column names are listed to prepare the renaming
frames_2016_2018 = [data2016_WestCoast_clean, data2017_WestCoast_clean, data2018_WestCoast_clean]
data2016_2018 = pd.concat(frames_2016_2018)
data2016_2018.columns

Index(['Agency', 'RegionDescription', 'ParentLocation', 'Park', 'SiteType',
       'FacilityID', 'FacilityZIP', 'FacilityState', 'CustomerZIP',
       'CustomerState', 'CustomerCountry', 'TotalBeforeTax', 'StartDate',
       'EndDate', 'OrderDate', 'NumberOfPeople'],
      dtype='object')

In [67]:
#Lower-casing the 2016-2018 column names so they line up with the lowercase names used by the 2019 and 2020 frames
data2016_2018 = data2016_2018.rename(columns=str.lower)

In [68]:
#Appending the 2019 and 2020 frames to the 2016-2018 frame to obtain the full 2016-2020 dataset.
#Each frame keeps its original row labels, so labels may repeat across years.
#NOTE(review): in the output, facilitystate holds two-letter codes in the 2016 rows and full state names in the
#2020 rows - confirm that downstream code handles both encodings.
yearly_frames = [data2016_2018, data2019_WestCoast_clean, data2020_WestCoast_clean]
data2016_2020 = pd.concat(yearly_frames)
data2016_2020

Unnamed: 0,agency,regiondescription,parentlocation,park,sitetype,facilityid,facilityzip,facilitystate,customerzip,customerstate,customercountry,totalbeforetax,startdate,enddate,orderdate,numberofpeople
48,NPS,Joshua Tree National Park,Pacific West Region,SHEEP PASS GROUP,GROUP TENT ONLY AREA NONELECTRIC,232470,92277-3597,CA,90027,CA,USA,100.00,2016-09-03,2016-09-05,2015-10-01 00:00:00.000,20.0
96,USFS,MAMMOTH RD - FS,INYO NF - FS,PUMICE FLAT GROUP CAMP,GROUP STANDARD NONELECTRIC,231957,94301,CA,92301,CA,USA,313.05,2016-06-30,2016-07-03,2015-10-01 00:00:00.000,30.0
99,USFS,LOS ANGELES RIVER RD - FS,ANGELES NF - FS,MEADOW GROUP CAMPGROUND,GROUP STANDARD NONELECTRIC,233366,,CA,91701,CA,USA,81.00,2016-06-24,2016-06-26,2015-10-01 00:00:00.000,24.0
243,USFS,NACHES RD - FS,OKANOGAN - WENATCHEE NF -FS,SALMON COVE GROUP SITE,GROUP STANDARD AREA NONELECTRIC,234498,98937,WA,98942,WA,USA,159.00,2016-09-08,2016-09-11,2015-10-01 00:00:00.000,27.0
274,USACE,LAKE MENDOCINO,SAN FRANCISCO DIST,BUSHAY RECREATION AREA,GROUP STANDARD NONELECTRIC,233437,95482-9404,CA,94565,CA,USA,705.00,2016-09-02,2016-09-05,2015-10-01 00:00:00.000,40.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
4712272,USFS,Pacific Northwest,Okanogan-Wenatchee National Forest,Lake Creek Campground - Entiat River,STANDARD NONELECTRIC,273975,98822,Washington,98117,WA,USA,28.00,2020-08-14,2020-08-16,2020-08-10 18:14:43.334,2.0
4712273,USFS,Pacific Northwest,Okanogan-Wenatchee National Forest,Lake Creek Campground - Entiat River,STANDARD NONELECTRIC,273975,98822,Washington,,,,18.00,2020-07-02,2020-07-03,2020-06-30 06:08:40.328,1.0
4712274,USFS,Pacific Northwest,Okanogan-Wenatchee National Forest,Lake Creek Campground - Entiat River,STANDARD NONELECTRIC,273975,98822,Washington,98801,WA,USA,108.00,2020-07-07,2020-07-17,2020-07-02 16:31:16.374,2.0
4712275,USFS,Pacific Northwest,Okanogan-Wenatchee National Forest,Lake Creek Campground - Entiat River,STANDARD NONELECTRIC,273975,98822,Washington,98006,WA,USA,38.00,2020-08-06,2020-08-09,2020-07-20 23:16:45.644,8.0


In [69]:
#Saving the combined 2016-2020 West Coast reservations; the header row is written, the row index is not
data2016_2020.to_csv(
    "../../Resources/data/reservations_West_Coast.csv",
    index=False,
    header=True,
)