In [1]:
%matplotlib inline
import matplotlib.pyplot as plt
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.tree import DecisionTreeRegressor
import numpy as np
import datetime

In [2]:
# Read the avocado data set into a DataFrame and preview the first rows
avodatafile = pd.read_csv(filepath_or_buffer='avo_geo_data_final.csv')
avodatafile.head(n=5)

Unnamed: 0.1,Unnamed: 0,date,average_price,total_volume,type_4046,type_4225,type_4770,total_bags,small_bags,large_bags,xlarge_bags,type,year,city,state,region,city_state,latitude,longitude
0,0,12/27/2015,1.33,64236.62,1036.74,54454.85,48.16,8696.87,8603.62,93.25,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
1,1,12/20/2015,1.35,54876.98,674.28,44638.81,58.33,9505.56,9408.07,97.49,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
2,2,12/13/2015,0.93,118220.22,794.7,109149.67,130.5,8145.35,8042.21,103.14,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
3,3,12/6/2015,1.08,78992.15,1132.0,71976.41,72.58,5811.16,5677.4,133.76,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
4,4,11/29/2015,1.28,51039.6,941.48,43838.39,75.78,6183.95,5986.26,197.69,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987


In [3]:
# The file carries an extra 'Unnamed: 0' column (it looks like a row index
# that was written out when the CSV was saved - TODO confirm). It is not
# needed, so remove it.
#
# errors='ignore' keeps this cell safe to re-run: because the result is
# assigned back to the same name, a second run would otherwise raise KeyError
# on the already-removed column.
avodatafile = avodatafile.drop(columns=['Unnamed: 0'], errors='ignore')
avodatafile.head()

Unnamed: 0,date,average_price,total_volume,type_4046,type_4225,type_4770,total_bags,small_bags,large_bags,xlarge_bags,type,year,city,state,region,city_state,latitude,longitude
0,12/27/2015,1.33,64236.62,1036.74,54454.85,48.16,8696.87,8603.62,93.25,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
1,12/20/2015,1.35,54876.98,674.28,44638.81,58.33,9505.56,9408.07,97.49,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
2,12/13/2015,0.93,118220.22,794.7,109149.67,130.5,8145.35,8042.21,103.14,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
3,12/6/2015,1.08,78992.15,1132.0,71976.41,72.58,5811.16,5677.4,133.76,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
4,11/29/2015,1.28,51039.6,941.48,43838.39,75.78,6183.95,5986.26,197.69,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987


In [4]:
# The data runs from 2015 through March 2018. Everything older than 2018 is
# separated out here to train the model.

# Turn the date column into real datetimes so it can be range-filtered
avodatafile['date'] = pd.to_datetime(avodatafile['date'])

# Keep 2015-01-01 through 2017-12-31 (both ends inclusive)
is_training_period = avodatafile['date'].between('2015-1-1', '2017-12-31')
oldavodata = avodatafile[is_training_period]
oldavodata.head()

Unnamed: 0,date,average_price,total_volume,type_4046,type_4225,type_4770,total_bags,small_bags,large_bags,xlarge_bags,type,year,city,state,region,city_state,latitude,longitude
0,2015-12-27,1.33,64236.62,1036.74,54454.85,48.16,8696.87,8603.62,93.25,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
1,2015-12-20,1.35,54876.98,674.28,44638.81,58.33,9505.56,9408.07,97.49,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
2,2015-12-13,0.93,118220.22,794.7,109149.67,130.5,8145.35,8042.21,103.14,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
3,2015-12-06,1.08,78992.15,1132.0,71976.41,72.58,5811.16,5677.4,133.76,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
4,2015-11-29,1.28,51039.6,941.48,43838.39,75.78,6183.95,5986.26,197.69,0.0,conventional,2015,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987


In [5]:
# Set the 2018 rows aside for later (both ends of the range are inclusive)

is_2018 = avodatafile['date'].between('2018-1-1', '2018-12-31')
avo2018 = avodatafile[is_2018]
avo2018

Unnamed: 0,date,average_price,total_volume,type_4046,type_4225,type_4770,total_bags,small_bags,large_bags,xlarge_bags,type,year,city,state,region,city_state,latitude,longitude
6437,2018-03-25,1.57,149396.50,16361.69,109045.03,65.45,23924.33,19273.80,4270.53,380.00,conventional,2018,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
6438,2018-03-18,1.35,105304.65,13234.86,61037.58,55.00,30977.21,26755.90,3721.31,500.00,conventional,2018,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
6439,2018-03-11,1.12,144648.75,15823.35,110950.68,70.00,17804.72,14480.52,3033.09,291.11,conventional,2018,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
6440,2018-03-04,1.08,139520.60,12002.12,105069.57,95.62,22353.29,16128.51,5941.45,283.33,conventional,2018,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
6441,2018-02-25,1.28,104278.89,10368.77,59723.32,48.00,34138.80,30126.31,3702.49,310.00,conventional,2018,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
13853,2018-02-04,1.32,7363.56,89.59,440.31,0.00,6833.66,6827.78,5.88,0.00,organic,2018,Tampa,FL,Southeast,"Tampa, FL",27.9942,-82.4451
13854,2018-01-28,1.61,7695.89,156.01,859.20,0.00,6680.68,5567.39,1113.29,0.00,organic,2018,Tampa,FL,Southeast,"Tampa, FL",27.9942,-82.4451
13855,2018-01-21,1.52,6871.05,76.66,407.09,0.00,6387.30,6375.55,11.75,0.00,organic,2018,Tampa,FL,Southeast,"Tampa, FL",27.9942,-82.4451
13856,2018-01-14,1.53,7238.04,106.98,496.61,0.00,6634.45,6634.45,0.00,0.00,organic,2018,Tampa,FL,Southeast,"Tampa, FL",27.9942,-82.4451


In [6]:
## To give the machine learning model the best chance of predicting avocado
## prices, the training data is broken up per city, and each city is split
## again into conventional and organic avocados. Every slice is put in
## date order.
##
## The filter + sort is identical for every city/type pair, so it lives in one
## helper. The individual variable names are kept because later cells refer
## to them.


def _city_type_history(frame, city, avocado_type):
    """Return the rows of ``frame`` for one city and avocado type, oldest first.

    Parameters
    ----------
    frame : pandas.DataFrame
        Table that has 'city', 'type' and 'date' columns.
    city : str
        Value to match exactly in the 'city' column (e.g. 'Grand Rapids').
    avocado_type : str
        Value to match exactly in the 'type' column; this notebook uses
        'conventional' and 'organic'.

    Returns
    -------
    pandas.DataFrame
        The matching rows sorted by 'date' ascending. Empty when nothing
        matches.
    """
    matches = (frame['city'] == city) & (frame['type'] == avocado_type)
    return frame.loc[matches].sort_values(by=['date'])


## Conventional data

Albany_conv_data = _city_type_history(oldavodata, 'Albany', 'conventional')
Atlanta_conv_data = _city_type_history(oldavodata, 'Atlanta', 'conventional')
Baltimore_conv_data = _city_type_history(oldavodata, 'Baltimore', 'conventional')
Boise_conv_data = _city_type_history(oldavodata, 'Boise', 'conventional')
Boston_conv_data = _city_type_history(oldavodata, 'Boston', 'conventional')
Buffalo_conv_data = _city_type_history(oldavodata, 'Buffalo', 'conventional')
Charlotte_conv_data = _city_type_history(oldavodata, 'Charlotte', 'conventional')
Chicago_conv_data = _city_type_history(oldavodata, 'Chicago', 'conventional')
Cincinnati_conv_data = _city_type_history(oldavodata, 'Cincinnati', 'conventional')
Columbus_conv_data = _city_type_history(oldavodata, 'Columbus', 'conventional')
Dallas_conv_data = _city_type_history(oldavodata, 'Dallas', 'conventional')
Denver_conv_data = _city_type_history(oldavodata, 'Denver', 'conventional')
Detroit_conv_data = _city_type_history(oldavodata, 'Detroit', 'conventional')
Grand_Rapids_conv_data = _city_type_history(oldavodata, 'Grand Rapids', 'conventional')
Harrisburg_conv_data = _city_type_history(oldavodata, 'Harrisburg', 'conventional')
Hartford_conv_data = _city_type_history(oldavodata, 'Hartford', 'conventional')
Houston_conv_data = _city_type_history(oldavodata, 'Houston', 'conventional')
Indianapolis_conv_data = _city_type_history(oldavodata, 'Indianapolis', 'conventional')
Jacksonville_conv_data = _city_type_history(oldavodata, 'Jacksonville', 'conventional')
Las_Vegas_conv_data = _city_type_history(oldavodata, 'Las Vegas', 'conventional')
Los_Angeles_conv_data = _city_type_history(oldavodata, 'Los Angeles', 'conventional')
Louisville_conv_data = _city_type_history(oldavodata, 'Louisville', 'conventional')
Miami_conv_data = _city_type_history(oldavodata, 'Miami', 'conventional')
Nashville_conv_data = _city_type_history(oldavodata, 'Nashville', 'conventional')
New_Orleans_conv_data = _city_type_history(oldavodata, 'New Orleans', 'conventional')
New_York_conv_data = _city_type_history(oldavodata, 'New York', 'conventional')
Orlando_conv_data = _city_type_history(oldavodata, 'Orlando', 'conventional')
Philadelphia_conv_data = _city_type_history(oldavodata, 'Philadelphia', 'conventional')
Phoenix_conv_data = _city_type_history(oldavodata, 'Phoenix', 'conventional')
Pittsburgh_conv_data = _city_type_history(oldavodata, 'Pittsburgh', 'conventional')
Portland_conv_data = _city_type_history(oldavodata, 'Portland', 'conventional')
Raleigh_conv_data = _city_type_history(oldavodata, 'Raleigh', 'conventional')
Richmond_conv_data = _city_type_history(oldavodata, 'Richmond', 'conventional')
Roanoke_conv_data = _city_type_history(oldavodata, 'Roanoke', 'conventional')
Sacramento_conv_data = _city_type_history(oldavodata, 'Sacramento', 'conventional')
San_Diego_conv_data = _city_type_history(oldavodata, 'San Diego', 'conventional')
San_Francisco_conv_data = _city_type_history(oldavodata, 'San Francisco', 'conventional')
Seattle_conv_data = _city_type_history(oldavodata, 'Seattle', 'conventional')
Spokane_conv_data = _city_type_history(oldavodata, 'Spokane', 'conventional')
Syracuse_conv_data = _city_type_history(oldavodata, 'Syracuse', 'conventional')
Tampa_conv_data = _city_type_history(oldavodata, 'Tampa', 'conventional')

## Organic Data

Albany_org_data = _city_type_history(oldavodata, 'Albany', 'organic')
Atlanta_org_data = _city_type_history(oldavodata, 'Atlanta', 'organic')
Baltimore_org_data = _city_type_history(oldavodata, 'Baltimore', 'organic')
Boise_org_data = _city_type_history(oldavodata, 'Boise', 'organic')
Boston_org_data = _city_type_history(oldavodata, 'Boston', 'organic')
Buffalo_org_data = _city_type_history(oldavodata, 'Buffalo', 'organic')
Charlotte_org_data = _city_type_history(oldavodata, 'Charlotte', 'organic')
Chicago_org_data = _city_type_history(oldavodata, 'Chicago', 'organic')
Cincinnati_org_data = _city_type_history(oldavodata, 'Cincinnati', 'organic')
Columbus_org_data = _city_type_history(oldavodata, 'Columbus', 'organic')
Dallas_org_data = _city_type_history(oldavodata, 'Dallas', 'organic')
Denver_org_data = _city_type_history(oldavodata, 'Denver', 'organic')
Detroit_org_data = _city_type_history(oldavodata, 'Detroit', 'organic')
Grand_Rapids_org_data = _city_type_history(oldavodata, 'Grand Rapids', 'organic')
Harrisburg_org_data = _city_type_history(oldavodata, 'Harrisburg', 'organic')
Hartford_org_data = _city_type_history(oldavodata, 'Hartford', 'organic')
Houston_org_data = _city_type_history(oldavodata, 'Houston', 'organic')
Indianapolis_org_data = _city_type_history(oldavodata, 'Indianapolis', 'organic')
Jacksonville_org_data = _city_type_history(oldavodata, 'Jacksonville', 'organic')
Las_Vegas_org_data = _city_type_history(oldavodata, 'Las Vegas', 'organic')
Los_Angeles_org_data = _city_type_history(oldavodata, 'Los Angeles', 'organic')
Louisville_org_data = _city_type_history(oldavodata, 'Louisville', 'organic')
Miami_org_data = _city_type_history(oldavodata, 'Miami', 'organic')
Nashville_org_data = _city_type_history(oldavodata, 'Nashville', 'organic')
New_Orleans_org_data = _city_type_history(oldavodata, 'New Orleans', 'organic')
New_York_org_data = _city_type_history(oldavodata, 'New York', 'organic')
Orlando_org_data = _city_type_history(oldavodata, 'Orlando', 'organic')
Philadelphia_org_data = _city_type_history(oldavodata, 'Philadelphia', 'organic')
Phoenix_org_data = _city_type_history(oldavodata, 'Phoenix', 'organic')
Pittsburgh_org_data = _city_type_history(oldavodata, 'Pittsburgh', 'organic')
Portland_org_data = _city_type_history(oldavodata, 'Portland', 'organic')
Raleigh_org_data = _city_type_history(oldavodata, 'Raleigh', 'organic')
Richmond_org_data = _city_type_history(oldavodata, 'Richmond', 'organic')
Roanoke_org_data = _city_type_history(oldavodata, 'Roanoke', 'organic')
Sacramento_org_data = _city_type_history(oldavodata, 'Sacramento', 'organic')
San_Diego_org_data = _city_type_history(oldavodata, 'San Diego', 'organic')
San_Francisco_org_data = _city_type_history(oldavodata, 'San Francisco', 'organic')
Seattle_org_data = _city_type_history(oldavodata, 'Seattle', 'organic')
Spokane_org_data = _city_type_history(oldavodata, 'Spokane', 'organic')
Syracuse_org_data = _city_type_history(oldavodata, 'Syracuse', 'organic')
Tampa_org_data = _city_type_history(oldavodata, 'Tampa', 'organic')


In [7]:
# To prepare the data for machine learning, remove the columns that will not
# be fed to the model from every city data set: date, type, year, city, state,
# region, city_state, latitude and longitude. (Note that year, latitude and
# longitude are numeric; they are dropped along with the text columns.)
#
# The column list and the drop are the same for every data set, so they are
# defined once here. The individual variable names are kept because later
# cells refer to them.

_NON_MODEL_COLUMNS = ['date', 'type', 'year', 'city', 'state', 'region',
                      'city_state', 'latitude', 'longitude']


def _drop_non_model_columns(city_data):
    """Return a copy of ``city_data`` without the columns in ``_NON_MODEL_COLUMNS``.

    Parameters
    ----------
    city_data : pandas.DataFrame
        One city/type slice. It must contain every column listed in
        ``_NON_MODEL_COLUMNS``; a missing column raises ``KeyError``.

    Returns
    -------
    pandas.DataFrame
        A new frame with those columns removed; the input is not modified.
    """
    return city_data.drop(columns=_NON_MODEL_COLUMNS)


# Conventional Data

Albany_conv_cleandata = _drop_non_model_columns(Albany_conv_data)
Atlanta_conv_cleandata = _drop_non_model_columns(Atlanta_conv_data)
Baltimore_conv_cleandata = _drop_non_model_columns(Baltimore_conv_data)
Boise_conv_cleandata = _drop_non_model_columns(Boise_conv_data)
Boston_conv_cleandata = _drop_non_model_columns(Boston_conv_data)
Buffalo_conv_cleandata = _drop_non_model_columns(Buffalo_conv_data)
Charlotte_conv_cleandata = _drop_non_model_columns(Charlotte_conv_data)
Chicago_conv_cleandata = _drop_non_model_columns(Chicago_conv_data)
Cincinnati_conv_cleandata = _drop_non_model_columns(Cincinnati_conv_data)
Columbus_conv_cleandata = _drop_non_model_columns(Columbus_conv_data)
Dallas_conv_cleandata = _drop_non_model_columns(Dallas_conv_data)
Denver_conv_cleandata = _drop_non_model_columns(Denver_conv_data)
Detroit_conv_cleandata = _drop_non_model_columns(Detroit_conv_data)
Grand_Rapids_conv_cleandata = _drop_non_model_columns(Grand_Rapids_conv_data)
Harrisburg_conv_cleandata = _drop_non_model_columns(Harrisburg_conv_data)
Hartford_conv_cleandata = _drop_non_model_columns(Hartford_conv_data)
Houston_conv_cleandata = _drop_non_model_columns(Houston_conv_data)
Indianapolis_conv_cleandata = _drop_non_model_columns(Indianapolis_conv_data)
Jacksonville_conv_cleandata = _drop_non_model_columns(Jacksonville_conv_data)
Las_Vegas_conv_cleandata = _drop_non_model_columns(Las_Vegas_conv_data)
Los_Angeles_conv_cleandata = _drop_non_model_columns(Los_Angeles_conv_data)
Louisville_conv_cleandata = _drop_non_model_columns(Louisville_conv_data)
Miami_conv_cleandata = _drop_non_model_columns(Miami_conv_data)
Nashville_conv_cleandata = _drop_non_model_columns(Nashville_conv_data)
New_Orleans_conv_cleandata = _drop_non_model_columns(New_Orleans_conv_data)
New_York_conv_cleandata = _drop_non_model_columns(New_York_conv_data)
Orlando_conv_cleandata = _drop_non_model_columns(Orlando_conv_data)
Philadelphia_conv_cleandata = _drop_non_model_columns(Philadelphia_conv_data)
Phoenix_conv_cleandata = _drop_non_model_columns(Phoenix_conv_data)
Pittsburgh_conv_cleandata = _drop_non_model_columns(Pittsburgh_conv_data)
Portland_conv_cleandata = _drop_non_model_columns(Portland_conv_data)
Raleigh_conv_cleandata = _drop_non_model_columns(Raleigh_conv_data)
Richmond_conv_cleandata = _drop_non_model_columns(Richmond_conv_data)
Roanoke_conv_cleandata = _drop_non_model_columns(Roanoke_conv_data)
Sacramento_conv_cleandata = _drop_non_model_columns(Sacramento_conv_data)
San_Diego_conv_cleandata = _drop_non_model_columns(San_Diego_conv_data)
San_Francisco_conv_cleandata = _drop_non_model_columns(San_Francisco_conv_data)
Seattle_conv_cleandata = _drop_non_model_columns(Seattle_conv_data)
Spokane_conv_cleandata = _drop_non_model_columns(Spokane_conv_data)
Syracuse_conv_cleandata = _drop_non_model_columns(Syracuse_conv_data)
Tampa_conv_cleandata = _drop_non_model_columns(Tampa_conv_data)

# Organic Data

Albany_org_cleandata = _drop_non_model_columns(Albany_org_data)
Atlanta_org_cleandata = _drop_non_model_columns(Atlanta_org_data)
Baltimore_org_cleandata = _drop_non_model_columns(Baltimore_org_data)
Boise_org_cleandata = _drop_non_model_columns(Boise_org_data)
Boston_org_cleandata = _drop_non_model_columns(Boston_org_data)
Buffalo_org_cleandata = _drop_non_model_columns(Buffalo_org_data)
Charlotte_org_cleandata = _drop_non_model_columns(Charlotte_org_data)
Chicago_org_cleandata = _drop_non_model_columns(Chicago_org_data)
Cincinnati_org_cleandata = _drop_non_model_columns(Cincinnati_org_data)
Columbus_org_cleandata = _drop_non_model_columns(Columbus_org_data)
Dallas_org_cleandata = _drop_non_model_columns(Dallas_org_data)
Denver_org_cleandata = _drop_non_model_columns(Denver_org_data)
Detroit_org_cleandata = _drop_non_model_columns(Detroit_org_data)
Grand_Rapids_org_cleandata = _drop_non_model_columns(Grand_Rapids_org_data)
Harrisburg_org_cleandata = _drop_non_model_columns(Harrisburg_org_data)
Hartford_org_cleandata = _drop_non_model_columns(Hartford_org_data)
Houston_org_cleandata = _drop_non_model_columns(Houston_org_data)
Indianapolis_org_cleandata = _drop_non_model_columns(Indianapolis_org_data)
Jacksonville_org_cleandata = _drop_non_model_columns(Jacksonville_org_data)
Las_Vegas_org_cleandata = _drop_non_model_columns(Las_Vegas_org_data)
Los_Angeles_org_cleandata = _drop_non_model_columns(Los_Angeles_org_data)
Louisville_org_cleandata = _drop_non_model_columns(Louisville_org_data)
Miami_org_cleandata = _drop_non_model_columns(Miami_org_data)
Nashville_org_cleandata = _drop_non_model_columns(Nashville_org_data)
New_Orleans_org_cleandata = _drop_non_model_columns(New_Orleans_org_data)
New_York_org_cleandata = _drop_non_model_columns(New_York_org_data)
Orlando_org_cleandata = _drop_non_model_columns(Orlando_org_data)
Philadelphia_org_cleandata = _drop_non_model_columns(Philadelphia_org_data)
Phoenix_org_cleandata = _drop_non_model_columns(Phoenix_org_data)
Pittsburgh_org_cleandata = _drop_non_model_columns(Pittsburgh_org_data)
Portland_org_cleandata = _drop_non_model_columns(Portland_org_data)
Raleigh_org_cleandata = _drop_non_model_columns(Raleigh_org_data)
Richmond_org_cleandata = _drop_non_model_columns(Richmond_org_data)
Roanoke_org_cleandata = _drop_non_model_columns(Roanoke_org_data)
Sacramento_org_cleandata = _drop_non_model_columns(Sacramento_org_data)
San_Diego_org_cleandata = _drop_non_model_columns(San_Diego_org_data)
San_Francisco_org_cleandata = _drop_non_model_columns(San_Francisco_org_data)
Seattle_org_cleandata = _drop_non_model_columns(Seattle_org_data)
Spokane_org_cleandata = _drop_non_model_columns(Spokane_org_data)
Syracuse_org_cleandata = _drop_non_model_columns(Syracuse_org_data)
Tampa_org_cleandata = _drop_non_model_columns(Tampa_org_data)


In [8]:
# Now that our data is prepared, we just need to separate what we want
# the machine learning model to predict (called the target) from the other
# data properties it will use to make the prediction (called the features).
# Looking at our data, it makes the most sense to try to predict the
# average price of avocados, because all the other columns are just totals
# of how many were sold.

# Conventional Data Features

Albany_conv_feature_data = Albany_conv_cleandata[['total_volume','type_4046',
                                                  'type_4225','type_4770',
                                                  'total_bags','small_bags',
                                                  'large_bags','xlarge_bags'
                                                 ]]
# Columns used as model inputs for each conventional city frame below:
# total volume, the three type_* volumes and the four bag-count columns.
# NOTE(review): in the rows previewed at the top of the notebook,
# total_volume equals type_4046 + type_4225 + type_4770 + total_bags and
# total_bags equals small_bags + large_bags + xlarge_bags. If the cleaned
# frames keep that relationship the inputs are linearly dependent, so the
# individual regression coefficients should not be interpreted -- confirm.
CONV_FEATURE_COLUMNS = [
    'total_volume', 'type_4046', 'type_4225', 'type_4770',
    'total_bags', 'small_bags', 'large_bags', 'xlarge_bags',
]

Atlanta_conv_feature_data = Atlanta_conv_cleandata[CONV_FEATURE_COLUMNS]
Baltimore_conv_feature_data = Baltimore_conv_cleandata[CONV_FEATURE_COLUMNS]
Boise_conv_feature_data = Boise_conv_cleandata[CONV_FEATURE_COLUMNS]
Boston_conv_feature_data = Boston_conv_cleandata[CONV_FEATURE_COLUMNS]
Buffalo_conv_feature_data = Buffalo_conv_cleandata[CONV_FEATURE_COLUMNS]
Charlotte_conv_feature_data = Charlotte_conv_cleandata[CONV_FEATURE_COLUMNS]
Chicago_conv_feature_data = Chicago_conv_cleandata[CONV_FEATURE_COLUMNS]
Cincinnati_conv_feature_data = Cincinnati_conv_cleandata[CONV_FEATURE_COLUMNS]
Columbus_conv_feature_data = Columbus_conv_cleandata[CONV_FEATURE_COLUMNS]
Dallas_conv_feature_data = Dallas_conv_cleandata[CONV_FEATURE_COLUMNS]
Denver_conv_feature_data = Denver_conv_cleandata[CONV_FEATURE_COLUMNS]
Detroit_conv_feature_data = Detroit_conv_cleandata[CONV_FEATURE_COLUMNS]
Grand_Rapids_conv_feature_data = Grand_Rapids_conv_cleandata[CONV_FEATURE_COLUMNS]
Harrisburg_conv_feature_data = Harrisburg_conv_cleandata[CONV_FEATURE_COLUMNS]
Hartford_conv_feature_data = Hartford_conv_cleandata[CONV_FEATURE_COLUMNS]
Houston_conv_feature_data = Houston_conv_cleandata[CONV_FEATURE_COLUMNS]
Indianapolis_conv_feature_data = Indianapolis_conv_cleandata[CONV_FEATURE_COLUMNS]
Jacksonville_conv_feature_data = Jacksonville_conv_cleandata[CONV_FEATURE_COLUMNS]
Las_Vegas_conv_feature_data = Las_Vegas_conv_cleandata[CONV_FEATURE_COLUMNS]
Los_Angeles_conv_feature_data = Los_Angeles_conv_cleandata[CONV_FEATURE_COLUMNS]
Louisville_conv_feature_data = Louisville_conv_cleandata[CONV_FEATURE_COLUMNS]
Miami_conv_feature_data = Miami_conv_cleandata[CONV_FEATURE_COLUMNS]
Nashville_conv_feature_data = Nashville_conv_cleandata[CONV_FEATURE_COLUMNS]
New_Orleans_conv_feature_data = New_Orleans_conv_cleandata[CONV_FEATURE_COLUMNS]
New_York_conv_feature_data = New_York_conv_cleandata[CONV_FEATURE_COLUMNS]
Orlando_conv_feature_data = Orlando_conv_cleandata[CONV_FEATURE_COLUMNS]
Philadelphia_conv_feature_data = Philadelphia_conv_cleandata[CONV_FEATURE_COLUMNS]
Phoenix_conv_feature_data = Phoenix_conv_cleandata[CONV_FEATURE_COLUMNS]
Pittsburgh_conv_feature_data = Pittsburgh_conv_cleandata[CONV_FEATURE_COLUMNS]
Portland_conv_feature_data = Portland_conv_cleandata[CONV_FEATURE_COLUMNS]
Raleigh_conv_feature_data = Raleigh_conv_cleandata[CONV_FEATURE_COLUMNS]
Richmond_conv_feature_data = Richmond_conv_cleandata[CONV_FEATURE_COLUMNS]
Roanoke_conv_feature_data = Roanoke_conv_cleandata[CONV_FEATURE_COLUMNS]
Sacramento_conv_feature_data = Sacramento_conv_cleandata[CONV_FEATURE_COLUMNS]
San_Diego_conv_feature_data = San_Diego_conv_cleandata[CONV_FEATURE_COLUMNS]
San_Francisco_conv_feature_data = San_Francisco_conv_cleandata[CONV_FEATURE_COLUMNS]
Seattle_conv_feature_data = Seattle_conv_cleandata[CONV_FEATURE_COLUMNS]
Spokane_conv_feature_data = Spokane_conv_cleandata[CONV_FEATURE_COLUMNS]
Syracuse_conv_feature_data = Syracuse_conv_cleandata[CONV_FEATURE_COLUMNS]
Tampa_conv_feature_data = Tampa_conv_cleandata[CONV_FEATURE_COLUMNS]

# Conventional Data Targets
# Original note: "per month per city per year" -- presumably the granularity
# of the rows in each *_conv_cleandata frame; TODO confirm against the
# cleaning cell.

# A one-element list (not a bare column name) is used as the selector, so
# every target stays a single-column DataFrame rather than a Series.
CONV_TARGET_COLUMNS = ['average_price']

Albany_conv_target_data = Albany_conv_cleandata[CONV_TARGET_COLUMNS]
Atlanta_conv_target_data = Atlanta_conv_cleandata[CONV_TARGET_COLUMNS]
Baltimore_conv_target_data = Baltimore_conv_cleandata[CONV_TARGET_COLUMNS]
Boise_conv_target_data = Boise_conv_cleandata[CONV_TARGET_COLUMNS]
Boston_conv_target_data = Boston_conv_cleandata[CONV_TARGET_COLUMNS]
Buffalo_conv_target_data = Buffalo_conv_cleandata[CONV_TARGET_COLUMNS]
Charlotte_conv_target_data = Charlotte_conv_cleandata[CONV_TARGET_COLUMNS]
Chicago_conv_target_data = Chicago_conv_cleandata[CONV_TARGET_COLUMNS]
Cincinnati_conv_target_data = Cincinnati_conv_cleandata[CONV_TARGET_COLUMNS]
Columbus_conv_target_data = Columbus_conv_cleandata[CONV_TARGET_COLUMNS]
Dallas_conv_target_data = Dallas_conv_cleandata[CONV_TARGET_COLUMNS]
Denver_conv_target_data = Denver_conv_cleandata[CONV_TARGET_COLUMNS]
Detroit_conv_target_data = Detroit_conv_cleandata[CONV_TARGET_COLUMNS]
Grand_Rapids_conv_target_data = Grand_Rapids_conv_cleandata[CONV_TARGET_COLUMNS]
Harrisburg_conv_target_data = Harrisburg_conv_cleandata[CONV_TARGET_COLUMNS]
Hartford_conv_target_data = Hartford_conv_cleandata[CONV_TARGET_COLUMNS]
Houston_conv_target_data = Houston_conv_cleandata[CONV_TARGET_COLUMNS]
Indianapolis_conv_target_data = Indianapolis_conv_cleandata[CONV_TARGET_COLUMNS]
Jacksonville_conv_target_data = Jacksonville_conv_cleandata[CONV_TARGET_COLUMNS]
Las_Vegas_conv_target_data = Las_Vegas_conv_cleandata[CONV_TARGET_COLUMNS]
Los_Angeles_conv_target_data = Los_Angeles_conv_cleandata[CONV_TARGET_COLUMNS]
Louisville_conv_target_data = Louisville_conv_cleandata[CONV_TARGET_COLUMNS]
Miami_conv_target_data = Miami_conv_cleandata[CONV_TARGET_COLUMNS]
Nashville_conv_target_data = Nashville_conv_cleandata[CONV_TARGET_COLUMNS]
New_Orleans_conv_target_data = New_Orleans_conv_cleandata[CONV_TARGET_COLUMNS]
New_York_conv_target_data = New_York_conv_cleandata[CONV_TARGET_COLUMNS]
Orlando_conv_target_data = Orlando_conv_cleandata[CONV_TARGET_COLUMNS]
Philadelphia_conv_target_data = Philadelphia_conv_cleandata[CONV_TARGET_COLUMNS]
Phoenix_conv_target_data = Phoenix_conv_cleandata[CONV_TARGET_COLUMNS]
Pittsburgh_conv_target_data = Pittsburgh_conv_cleandata[CONV_TARGET_COLUMNS]
Portland_conv_target_data = Portland_conv_cleandata[CONV_TARGET_COLUMNS]
Raleigh_conv_target_data = Raleigh_conv_cleandata[CONV_TARGET_COLUMNS]
Richmond_conv_target_data = Richmond_conv_cleandata[CONV_TARGET_COLUMNS]
Roanoke_conv_target_data = Roanoke_conv_cleandata[CONV_TARGET_COLUMNS]
Sacramento_conv_target_data = Sacramento_conv_cleandata[CONV_TARGET_COLUMNS]
San_Diego_conv_target_data = San_Diego_conv_cleandata[CONV_TARGET_COLUMNS]
San_Francisco_conv_target_data = San_Francisco_conv_cleandata[CONV_TARGET_COLUMNS]
Seattle_conv_target_data = Seattle_conv_cleandata[CONV_TARGET_COLUMNS]
Spokane_conv_target_data = Spokane_conv_cleandata[CONV_TARGET_COLUMNS]
Syracuse_conv_target_data = Syracuse_conv_cleandata[CONV_TARGET_COLUMNS]
Tampa_conv_target_data = Tampa_conv_cleandata[CONV_TARGET_COLUMNS]

# Organic Data Features

# Columns used as model inputs for every organic city frame: total volume,
# the three type_* volumes and the four bag-count columns.
# NOTE(review): in the rows previewed at the top of the notebook,
# total_volume equals type_4046 + type_4225 + type_4770 + total_bags and
# total_bags equals small_bags + large_bags + xlarge_bags. If the cleaned
# frames keep that relationship the inputs are linearly dependent, so the
# individual regression coefficients should not be interpreted -- confirm.
ORG_FEATURE_COLUMNS = [
    'total_volume', 'type_4046', 'type_4225', 'type_4770',
    'total_bags', 'small_bags', 'large_bags', 'xlarge_bags',
]

Albany_org_feature_data = Albany_org_cleandata[ORG_FEATURE_COLUMNS]
Atlanta_org_feature_data = Atlanta_org_cleandata[ORG_FEATURE_COLUMNS]
Baltimore_org_feature_data = Baltimore_org_cleandata[ORG_FEATURE_COLUMNS]
Boise_org_feature_data = Boise_org_cleandata[ORG_FEATURE_COLUMNS]
Boston_org_feature_data = Boston_org_cleandata[ORG_FEATURE_COLUMNS]
Buffalo_org_feature_data = Buffalo_org_cleandata[ORG_FEATURE_COLUMNS]
Charlotte_org_feature_data = Charlotte_org_cleandata[ORG_FEATURE_COLUMNS]
Chicago_org_feature_data = Chicago_org_cleandata[ORG_FEATURE_COLUMNS]
Cincinnati_org_feature_data = Cincinnati_org_cleandata[ORG_FEATURE_COLUMNS]
Columbus_org_feature_data = Columbus_org_cleandata[ORG_FEATURE_COLUMNS]
Dallas_org_feature_data = Dallas_org_cleandata[ORG_FEATURE_COLUMNS]
Denver_org_feature_data = Denver_org_cleandata[ORG_FEATURE_COLUMNS]
Detroit_org_feature_data = Detroit_org_cleandata[ORG_FEATURE_COLUMNS]
Grand_Rapids_org_feature_data = Grand_Rapids_org_cleandata[ORG_FEATURE_COLUMNS]
Harrisburg_org_feature_data = Harrisburg_org_cleandata[ORG_FEATURE_COLUMNS]
Hartford_org_feature_data = Hartford_org_cleandata[ORG_FEATURE_COLUMNS]
Houston_org_feature_data = Houston_org_cleandata[ORG_FEATURE_COLUMNS]
Indianapolis_org_feature_data = Indianapolis_org_cleandata[ORG_FEATURE_COLUMNS]
Jacksonville_org_feature_data = Jacksonville_org_cleandata[ORG_FEATURE_COLUMNS]
Las_Vegas_org_feature_data = Las_Vegas_org_cleandata[ORG_FEATURE_COLUMNS]
Los_Angeles_org_feature_data = Los_Angeles_org_cleandata[ORG_FEATURE_COLUMNS]
Louisville_org_feature_data = Louisville_org_cleandata[ORG_FEATURE_COLUMNS]
Miami_org_feature_data = Miami_org_cleandata[ORG_FEATURE_COLUMNS]
Nashville_org_feature_data = Nashville_org_cleandata[ORG_FEATURE_COLUMNS]
New_Orleans_org_feature_data = New_Orleans_org_cleandata[ORG_FEATURE_COLUMNS]
New_York_org_feature_data = New_York_org_cleandata[ORG_FEATURE_COLUMNS]
Orlando_org_feature_data = Orlando_org_cleandata[ORG_FEATURE_COLUMNS]
Philadelphia_org_feature_data = Philadelphia_org_cleandata[ORG_FEATURE_COLUMNS]
Phoenix_org_feature_data = Phoenix_org_cleandata[ORG_FEATURE_COLUMNS]
Pittsburgh_org_feature_data = Pittsburgh_org_cleandata[ORG_FEATURE_COLUMNS]
Portland_org_feature_data = Portland_org_cleandata[ORG_FEATURE_COLUMNS]
Raleigh_org_feature_data = Raleigh_org_cleandata[ORG_FEATURE_COLUMNS]
Richmond_org_feature_data = Richmond_org_cleandata[ORG_FEATURE_COLUMNS]
Roanoke_org_feature_data = Roanoke_org_cleandata[ORG_FEATURE_COLUMNS]
Sacramento_org_feature_data = Sacramento_org_cleandata[ORG_FEATURE_COLUMNS]
San_Diego_org_feature_data = San_Diego_org_cleandata[ORG_FEATURE_COLUMNS]
San_Francisco_org_feature_data = San_Francisco_org_cleandata[ORG_FEATURE_COLUMNS]
Seattle_org_feature_data = Seattle_org_cleandata[ORG_FEATURE_COLUMNS]
Spokane_org_feature_data = Spokane_org_cleandata[ORG_FEATURE_COLUMNS]
Syracuse_org_feature_data = Syracuse_org_cleandata[ORG_FEATURE_COLUMNS]
Tampa_org_feature_data = Tampa_org_cleandata[ORG_FEATURE_COLUMNS]

# Organic Data Targets

# A one-element list (not a bare column name) is used as the selector, so
# every target stays a single-column DataFrame rather than a Series.
ORG_TARGET_COLUMNS = ['average_price']

Albany_org_target_data = Albany_org_cleandata[ORG_TARGET_COLUMNS]
Atlanta_org_target_data = Atlanta_org_cleandata[ORG_TARGET_COLUMNS]
Baltimore_org_target_data = Baltimore_org_cleandata[ORG_TARGET_COLUMNS]
Boise_org_target_data = Boise_org_cleandata[ORG_TARGET_COLUMNS]
Boston_org_target_data = Boston_org_cleandata[ORG_TARGET_COLUMNS]
Buffalo_org_target_data = Buffalo_org_cleandata[ORG_TARGET_COLUMNS]
Charlotte_org_target_data = Charlotte_org_cleandata[ORG_TARGET_COLUMNS]
Chicago_org_target_data = Chicago_org_cleandata[ORG_TARGET_COLUMNS]
Cincinnati_org_target_data = Cincinnati_org_cleandata[ORG_TARGET_COLUMNS]
Columbus_org_target_data = Columbus_org_cleandata[ORG_TARGET_COLUMNS]
Dallas_org_target_data = Dallas_org_cleandata[ORG_TARGET_COLUMNS]
Denver_org_target_data = Denver_org_cleandata[ORG_TARGET_COLUMNS]
Detroit_org_target_data = Detroit_org_cleandata[ORG_TARGET_COLUMNS]
Grand_Rapids_org_target_data = Grand_Rapids_org_cleandata[ORG_TARGET_COLUMNS]
Harrisburg_org_target_data = Harrisburg_org_cleandata[ORG_TARGET_COLUMNS]
Hartford_org_target_data = Hartford_org_cleandata[ORG_TARGET_COLUMNS]
Houston_org_target_data = Houston_org_cleandata[ORG_TARGET_COLUMNS]
Indianapolis_org_target_data = Indianapolis_org_cleandata[ORG_TARGET_COLUMNS]
Jacksonville_org_target_data = Jacksonville_org_cleandata[ORG_TARGET_COLUMNS]
Las_Vegas_org_target_data = Las_Vegas_org_cleandata[ORG_TARGET_COLUMNS]
Los_Angeles_org_target_data = Los_Angeles_org_cleandata[ORG_TARGET_COLUMNS]
Louisville_org_target_data = Louisville_org_cleandata[ORG_TARGET_COLUMNS]
Miami_org_target_data = Miami_org_cleandata[ORG_TARGET_COLUMNS]
Nashville_org_target_data = Nashville_org_cleandata[ORG_TARGET_COLUMNS]
New_Orleans_org_target_data = New_Orleans_org_cleandata[ORG_TARGET_COLUMNS]
New_York_org_target_data = New_York_org_cleandata[ORG_TARGET_COLUMNS]
Orlando_org_target_data = Orlando_org_cleandata[ORG_TARGET_COLUMNS]
Philadelphia_org_target_data = Philadelphia_org_cleandata[ORG_TARGET_COLUMNS]
Phoenix_org_target_data = Phoenix_org_cleandata[ORG_TARGET_COLUMNS]
Pittsburgh_org_target_data = Pittsburgh_org_cleandata[ORG_TARGET_COLUMNS]
Portland_org_target_data = Portland_org_cleandata[ORG_TARGET_COLUMNS]
Raleigh_org_target_data = Raleigh_org_cleandata[ORG_TARGET_COLUMNS]
Richmond_org_target_data = Richmond_org_cleandata[ORG_TARGET_COLUMNS]
Roanoke_org_target_data = Roanoke_org_cleandata[ORG_TARGET_COLUMNS]
Sacramento_org_target_data = Sacramento_org_cleandata[ORG_TARGET_COLUMNS]
San_Diego_org_target_data = San_Diego_org_cleandata[ORG_TARGET_COLUMNS]
San_Francisco_org_target_data = San_Francisco_org_cleandata[ORG_TARGET_COLUMNS]
Seattle_org_target_data = Seattle_org_cleandata[ORG_TARGET_COLUMNS]
Spokane_org_target_data = Spokane_org_cleandata[ORG_TARGET_COLUMNS]
Syracuse_org_target_data = Syracuse_org_cleandata[ORG_TARGET_COLUMNS]
Tampa_org_target_data = Tampa_org_cleandata[ORG_TARGET_COLUMNS]

In [9]:
# Now that we have our features and our targets, split each city's frames
# into training and test groups.

# Single seed shared by every split so a Restart & Run All reproduces the
# same partitions; change it here instead of on 82 separate lines.
SPLIT_SEED = 42


def split_city_data(features, targets, seed=SPLIT_SEED):
    """Split one city's feature and target frames into train/test subsets.

    Thin wrapper around scikit-learn's ``train_test_split`` that pins the
    random seed in one place. No ``test_size``/``train_size`` is passed, so
    scikit-learn's default proportions apply.

    Parameters
    ----------
    features : DataFrame of model inputs for one city.
    targets : DataFrame of the matching target values (same row order).
    seed : value forwarded as ``random_state``; defaults to ``SPLIT_SEED``.

    Returns
    -------
    list
        ``[feature_train, feature_test, target_train, target_test]``, in the
        order ``train_test_split`` returns them.

    NOTE(review): ``train_test_split`` shuffles rows by default. The raw data
    carries a ``date`` column, so if the cleaned frames are time-ordered this
    mixes earlier and later periods across train and test -- confirm that is
    intended.
    """
    return train_test_split(features, targets, random_state=seed)


# Conventional Data

Albany_conv_feature_train, Albany_conv_feature_test, Albany_conv_target_train, Albany_conv_target_test = split_city_data(Albany_conv_feature_data, Albany_conv_target_data)
Atlanta_conv_feature_train, Atlanta_conv_feature_test, Atlanta_conv_target_train, Atlanta_conv_target_test = split_city_data(Atlanta_conv_feature_data, Atlanta_conv_target_data)
Baltimore_conv_feature_train, Baltimore_conv_feature_test, Baltimore_conv_target_train, Baltimore_conv_target_test = split_city_data(Baltimore_conv_feature_data, Baltimore_conv_target_data)
Boise_conv_feature_train, Boise_conv_feature_test, Boise_conv_target_train, Boise_conv_target_test = split_city_data(Boise_conv_feature_data, Boise_conv_target_data)
Boston_conv_feature_train, Boston_conv_feature_test, Boston_conv_target_train, Boston_conv_target_test = split_city_data(Boston_conv_feature_data, Boston_conv_target_data)
Buffalo_conv_feature_train, Buffalo_conv_feature_test, Buffalo_conv_target_train, Buffalo_conv_target_test = split_city_data(Buffalo_conv_feature_data, Buffalo_conv_target_data)
Charlotte_conv_feature_train, Charlotte_conv_feature_test, Charlotte_conv_target_train, Charlotte_conv_target_test = split_city_data(Charlotte_conv_feature_data, Charlotte_conv_target_data)
Chicago_conv_feature_train, Chicago_conv_feature_test, Chicago_conv_target_train, Chicago_conv_target_test = split_city_data(Chicago_conv_feature_data, Chicago_conv_target_data)
Cincinnati_conv_feature_train, Cincinnati_conv_feature_test, Cincinnati_conv_target_train, Cincinnati_conv_target_test = split_city_data(Cincinnati_conv_feature_data, Cincinnati_conv_target_data)
Columbus_conv_feature_train, Columbus_conv_feature_test, Columbus_conv_target_train, Columbus_conv_target_test = split_city_data(Columbus_conv_feature_data, Columbus_conv_target_data)
Dallas_conv_feature_train, Dallas_conv_feature_test, Dallas_conv_target_train, Dallas_conv_target_test = split_city_data(Dallas_conv_feature_data, Dallas_conv_target_data)
Denver_conv_feature_train, Denver_conv_feature_test, Denver_conv_target_train, Denver_conv_target_test = split_city_data(Denver_conv_feature_data, Denver_conv_target_data)
Detroit_conv_feature_train, Detroit_conv_feature_test, Detroit_conv_target_train, Detroit_conv_target_test = split_city_data(Detroit_conv_feature_data, Detroit_conv_target_data)
Grand_Rapids_conv_feature_train, Grand_Rapids_conv_feature_test, Grand_Rapids_conv_target_train, Grand_Rapids_conv_target_test = split_city_data(Grand_Rapids_conv_feature_data, Grand_Rapids_conv_target_data)
Harrisburg_conv_feature_train, Harrisburg_conv_feature_test, Harrisburg_conv_target_train, Harrisburg_conv_target_test = split_city_data(Harrisburg_conv_feature_data, Harrisburg_conv_target_data)
Hartford_conv_feature_train, Hartford_conv_feature_test, Hartford_conv_target_train, Hartford_conv_target_test = split_city_data(Hartford_conv_feature_data, Hartford_conv_target_data)
Houston_conv_feature_train, Houston_conv_feature_test, Houston_conv_target_train, Houston_conv_target_test = split_city_data(Houston_conv_feature_data, Houston_conv_target_data)
Indianapolis_conv_feature_train, Indianapolis_conv_feature_test, Indianapolis_conv_target_train, Indianapolis_conv_target_test = split_city_data(Indianapolis_conv_feature_data, Indianapolis_conv_target_data)
Jacksonville_conv_feature_train, Jacksonville_conv_feature_test, Jacksonville_conv_target_train, Jacksonville_conv_target_test = split_city_data(Jacksonville_conv_feature_data, Jacksonville_conv_target_data)
Las_Vegas_conv_feature_train, Las_Vegas_conv_feature_test, Las_Vegas_conv_target_train, Las_Vegas_conv_target_test = split_city_data(Las_Vegas_conv_feature_data, Las_Vegas_conv_target_data)
Los_Angeles_conv_feature_train, Los_Angeles_conv_feature_test, Los_Angeles_conv_target_train, Los_Angeles_conv_target_test = split_city_data(Los_Angeles_conv_feature_data, Los_Angeles_conv_target_data)
Louisville_conv_feature_train, Louisville_conv_feature_test, Louisville_conv_target_train, Louisville_conv_target_test = split_city_data(Louisville_conv_feature_data, Louisville_conv_target_data)
Miami_conv_feature_train, Miami_conv_feature_test, Miami_conv_target_train, Miami_conv_target_test = split_city_data(Miami_conv_feature_data, Miami_conv_target_data)
Nashville_conv_feature_train, Nashville_conv_feature_test, Nashville_conv_target_train, Nashville_conv_target_test = split_city_data(Nashville_conv_feature_data, Nashville_conv_target_data)
New_Orleans_conv_feature_train, New_Orleans_conv_feature_test, New_Orleans_conv_target_train, New_Orleans_conv_target_test = split_city_data(New_Orleans_conv_feature_data, New_Orleans_conv_target_data)
New_York_conv_feature_train, New_York_conv_feature_test, New_York_conv_target_train, New_York_conv_target_test = split_city_data(New_York_conv_feature_data, New_York_conv_target_data)
Orlando_conv_feature_train, Orlando_conv_feature_test, Orlando_conv_target_train, Orlando_conv_target_test = split_city_data(Orlando_conv_feature_data, Orlando_conv_target_data)
Philadelphia_conv_feature_train, Philadelphia_conv_feature_test, Philadelphia_conv_target_train, Philadelphia_conv_target_test = split_city_data(Philadelphia_conv_feature_data, Philadelphia_conv_target_data)
Phoenix_conv_feature_train, Phoenix_conv_feature_test, Phoenix_conv_target_train, Phoenix_conv_target_test = split_city_data(Phoenix_conv_feature_data, Phoenix_conv_target_data)
Pittsburgh_conv_feature_train, Pittsburgh_conv_feature_test, Pittsburgh_conv_target_train, Pittsburgh_conv_target_test = split_city_data(Pittsburgh_conv_feature_data, Pittsburgh_conv_target_data)
Portland_conv_feature_train, Portland_conv_feature_test, Portland_conv_target_train, Portland_conv_target_test = split_city_data(Portland_conv_feature_data, Portland_conv_target_data)
Raleigh_conv_feature_train, Raleigh_conv_feature_test, Raleigh_conv_target_train, Raleigh_conv_target_test = split_city_data(Raleigh_conv_feature_data, Raleigh_conv_target_data)
Richmond_conv_feature_train, Richmond_conv_feature_test, Richmond_conv_target_train, Richmond_conv_target_test = split_city_data(Richmond_conv_feature_data, Richmond_conv_target_data)
Roanoke_conv_feature_train, Roanoke_conv_feature_test, Roanoke_conv_target_train, Roanoke_conv_target_test = split_city_data(Roanoke_conv_feature_data, Roanoke_conv_target_data)
Sacramento_conv_feature_train, Sacramento_conv_feature_test, Sacramento_conv_target_train, Sacramento_conv_target_test = split_city_data(Sacramento_conv_feature_data, Sacramento_conv_target_data)
San_Diego_conv_feature_train, San_Diego_conv_feature_test, San_Diego_conv_target_train, San_Diego_conv_target_test = split_city_data(San_Diego_conv_feature_data, San_Diego_conv_target_data)
San_Francisco_conv_feature_train, San_Francisco_conv_feature_test, San_Francisco_conv_target_train, San_Francisco_conv_target_test = split_city_data(San_Francisco_conv_feature_data, San_Francisco_conv_target_data)
Seattle_conv_feature_train, Seattle_conv_feature_test, Seattle_conv_target_train, Seattle_conv_target_test = split_city_data(Seattle_conv_feature_data, Seattle_conv_target_data)
Spokane_conv_feature_train, Spokane_conv_feature_test, Spokane_conv_target_train, Spokane_conv_target_test = split_city_data(Spokane_conv_feature_data, Spokane_conv_target_data)
Syracuse_conv_feature_train, Syracuse_conv_feature_test, Syracuse_conv_target_train, Syracuse_conv_target_test = split_city_data(Syracuse_conv_feature_data, Syracuse_conv_target_data)
Tampa_conv_feature_train, Tampa_conv_feature_test, Tampa_conv_target_train, Tampa_conv_target_test = split_city_data(Tampa_conv_feature_data, Tampa_conv_target_data)

# Organic Data

Albany_org_feature_train, Albany_org_feature_test, Albany_org_target_train, Albany_org_target_test = split_city_data(Albany_org_feature_data, Albany_org_target_data)
Atlanta_org_feature_train, Atlanta_org_feature_test, Atlanta_org_target_train, Atlanta_org_target_test = split_city_data(Atlanta_org_feature_data, Atlanta_org_target_data)
Baltimore_org_feature_train, Baltimore_org_feature_test, Baltimore_org_target_train, Baltimore_org_target_test = split_city_data(Baltimore_org_feature_data, Baltimore_org_target_data)
Boise_org_feature_train, Boise_org_feature_test, Boise_org_target_train, Boise_org_target_test = split_city_data(Boise_org_feature_data, Boise_org_target_data)
Boston_org_feature_train, Boston_org_feature_test, Boston_org_target_train, Boston_org_target_test = split_city_data(Boston_org_feature_data, Boston_org_target_data)
Buffalo_org_feature_train, Buffalo_org_feature_test, Buffalo_org_target_train, Buffalo_org_target_test = split_city_data(Buffalo_org_feature_data, Buffalo_org_target_data)
Charlotte_org_feature_train, Charlotte_org_feature_test, Charlotte_org_target_train, Charlotte_org_target_test = split_city_data(Charlotte_org_feature_data, Charlotte_org_target_data)
Chicago_org_feature_train, Chicago_org_feature_test, Chicago_org_target_train, Chicago_org_target_test = split_city_data(Chicago_org_feature_data, Chicago_org_target_data)
Cincinnati_org_feature_train, Cincinnati_org_feature_test, Cincinnati_org_target_train, Cincinnati_org_target_test = split_city_data(Cincinnati_org_feature_data, Cincinnati_org_target_data)
Columbus_org_feature_train, Columbus_org_feature_test, Columbus_org_target_train, Columbus_org_target_test = split_city_data(Columbus_org_feature_data, Columbus_org_target_data)
Dallas_org_feature_train, Dallas_org_feature_test, Dallas_org_target_train, Dallas_org_target_test = split_city_data(Dallas_org_feature_data, Dallas_org_target_data)
Denver_org_feature_train, Denver_org_feature_test, Denver_org_target_train, Denver_org_target_test = split_city_data(Denver_org_feature_data, Denver_org_target_data)
Detroit_org_feature_train, Detroit_org_feature_test, Detroit_org_target_train, Detroit_org_target_test = split_city_data(Detroit_org_feature_data, Detroit_org_target_data)
Grand_Rapids_org_feature_train, Grand_Rapids_org_feature_test, Grand_Rapids_org_target_train, Grand_Rapids_org_target_test = split_city_data(Grand_Rapids_org_feature_data, Grand_Rapids_org_target_data)
Harrisburg_org_feature_train, Harrisburg_org_feature_test, Harrisburg_org_target_train, Harrisburg_org_target_test = split_city_data(Harrisburg_org_feature_data, Harrisburg_org_target_data)
Hartford_org_feature_train, Hartford_org_feature_test, Hartford_org_target_train, Hartford_org_target_test = split_city_data(Hartford_org_feature_data, Hartford_org_target_data)
Houston_org_feature_train, Houston_org_feature_test, Houston_org_target_train, Houston_org_target_test = split_city_data(Houston_org_feature_data, Houston_org_target_data)
Indianapolis_org_feature_train, Indianapolis_org_feature_test, Indianapolis_org_target_train, Indianapolis_org_target_test = split_city_data(Indianapolis_org_feature_data, Indianapolis_org_target_data)
Jacksonville_org_feature_train, Jacksonville_org_feature_test, Jacksonville_org_target_train, Jacksonville_org_target_test = split_city_data(Jacksonville_org_feature_data, Jacksonville_org_target_data)
Las_Vegas_org_feature_train, Las_Vegas_org_feature_test, Las_Vegas_org_target_train, Las_Vegas_org_target_test = split_city_data(Las_Vegas_org_feature_data, Las_Vegas_org_target_data)
Los_Angeles_org_feature_train, Los_Angeles_org_feature_test, Los_Angeles_org_target_train, Los_Angeles_org_target_test = split_city_data(Los_Angeles_org_feature_data, Los_Angeles_org_target_data)
Louisville_org_feature_train, Louisville_org_feature_test, Louisville_org_target_train, Louisville_org_target_test = split_city_data(Louisville_org_feature_data, Louisville_org_target_data)
Miami_org_feature_train, Miami_org_feature_test, Miami_org_target_train, Miami_org_target_test = split_city_data(Miami_org_feature_data, Miami_org_target_data)
Nashville_org_feature_train, Nashville_org_feature_test, Nashville_org_target_train, Nashville_org_target_test = split_city_data(Nashville_org_feature_data, Nashville_org_target_data)
New_Orleans_org_feature_train, New_Orleans_org_feature_test, New_Orleans_org_target_train, New_Orleans_org_target_test = split_city_data(New_Orleans_org_feature_data, New_Orleans_org_target_data)
New_York_org_feature_train, New_York_org_feature_test, New_York_org_target_train, New_York_org_target_test = split_city_data(New_York_org_feature_data, New_York_org_target_data)
Orlando_org_feature_train, Orlando_org_feature_test, Orlando_org_target_train, Orlando_org_target_test = split_city_data(Orlando_org_feature_data, Orlando_org_target_data)
Philadelphia_org_feature_train, Philadelphia_org_feature_test, Philadelphia_org_target_train, Philadelphia_org_target_test = split_city_data(Philadelphia_org_feature_data, Philadelphia_org_target_data)
Phoenix_org_feature_train, Phoenix_org_feature_test, Phoenix_org_target_train, Phoenix_org_target_test = split_city_data(Phoenix_org_feature_data, Phoenix_org_target_data)
Pittsburgh_org_feature_train, Pittsburgh_org_feature_test, Pittsburgh_org_target_train, Pittsburgh_org_target_test = split_city_data(Pittsburgh_org_feature_data, Pittsburgh_org_target_data)
Portland_org_feature_train, Portland_org_feature_test, Portland_org_target_train, Portland_org_target_test = split_city_data(Portland_org_feature_data, Portland_org_target_data)
Raleigh_org_feature_train, Raleigh_org_feature_test, Raleigh_org_target_train, Raleigh_org_target_test = split_city_data(Raleigh_org_feature_data, Raleigh_org_target_data)
Richmond_org_feature_train, Richmond_org_feature_test, Richmond_org_target_train, Richmond_org_target_test = split_city_data(Richmond_org_feature_data, Richmond_org_target_data)
Roanoke_org_feature_train, Roanoke_org_feature_test, Roanoke_org_target_train, Roanoke_org_target_test = split_city_data(Roanoke_org_feature_data, Roanoke_org_target_data)
Sacramento_org_feature_train, Sacramento_org_feature_test, Sacramento_org_target_train, Sacramento_org_target_test = split_city_data(Sacramento_org_feature_data, Sacramento_org_target_data)
San_Diego_org_feature_train, San_Diego_org_feature_test, San_Diego_org_target_train, San_Diego_org_target_test = split_city_data(San_Diego_org_feature_data, San_Diego_org_target_data)
San_Francisco_org_feature_train, San_Francisco_org_feature_test, San_Francisco_org_target_train, San_Francisco_org_target_test = split_city_data(San_Francisco_org_feature_data, San_Francisco_org_target_data)
Seattle_org_feature_train, Seattle_org_feature_test, Seattle_org_target_train, Seattle_org_target_test = split_city_data(Seattle_org_feature_data, Seattle_org_target_data)
Spokane_org_feature_train, Spokane_org_feature_test, Spokane_org_target_train, Spokane_org_target_test = split_city_data(Spokane_org_feature_data, Spokane_org_target_data)
Syracuse_org_feature_train, Syracuse_org_feature_test, Syracuse_org_target_train, Syracuse_org_target_test = split_city_data(Syracuse_org_feature_data, Syracuse_org_target_data)
Tampa_org_feature_train, Tampa_org_feature_test, Tampa_org_target_train, Tampa_org_target_test = split_city_data(Tampa_org_feature_data, Tampa_org_target_data)


In [10]:
# Now we just need to train our models using the training split of the sample data.
#
# One LinearRegression is fitted per city and per avocado type (conventional /
# organic). The fits are driven by a single city list instead of one
# hand-written statement per model, so a mistyped identifier can no longer pair
# a model with another city's training data.

# Cities that have their own model. Spaces become underscores in variable names
# (e.g. 'Grand Rapids' -> Grand_Rapids_lr_conv).
_CITY_NAMES = (
    'Albany', 'Atlanta', 'Baltimore', 'Boise', 'Boston', 'Buffalo',
    'Charlotte', 'Chicago', 'Cincinnati', 'Columbus', 'Dallas', 'Denver',
    'Detroit', 'Grand Rapids', 'Harrisburg', 'Hartford', 'Houston',
    'Indianapolis', 'Jacksonville', 'Las Vegas', 'Los Angeles', 'Louisville',
    'Miami', 'Nashville', 'New Orleans', 'New York', 'Orlando',
    'Philadelphia', 'Phoenix', 'Pittsburgh', 'Portland', 'Raleigh',
    'Richmond', 'Roanoke', 'Sacramento', 'San Diego', 'San Francisco',
    'Seattle', 'Spokane', 'Syracuse', 'Tampa',
)


def _fit_city_models(kind, namespace):
    """Fit one LinearRegression per city for a single avocado type.

    Parameters
    ----------
    kind : str
        'conv' or 'org'. Selects which `<City>_<kind>_feature_train` and
        `<City>_<kind>_target_train` variables are read.
    namespace : dict
        Mapping that holds those variables (the notebook's ``globals()``).

    Returns
    -------
    dict
        Maps the variable-name prefix of each city (e.g. 'New_York') to its
        fitted LinearRegression.

    Raises
    ------
    KeyError
        If a city's training split is not present in `namespace`.
    """
    fitted = {}
    for city in _CITY_NAMES:
        prefix = city.replace(' ', '_')
        features = namespace['{}_{}_feature_train'.format(prefix, kind)]
        target = namespace['{}_{}_target_train'.format(prefix, kind)]
        fitted[prefix] = LinearRegression().fit(features, target)
    return fitted


# Conventional Data
lr_conv_models = _fit_city_models('conv', globals())

# Organic
lr_org_models = _fit_city_models('org', globals())

# Keep the flat per-city names (Albany_lr_conv, Albany_lr_org, ...) bound,
# because the prediction cell refers to the models by those names.
globals().update({prefix + '_lr_conv': model for prefix, model in lr_conv_models.items()})
globals().update({prefix + '_lr_org': model for prefix, model in lr_org_models.items()})


In [11]:
# Now that our model is trained we will clean up the 2018 data
# We need to split the 2018 data by city and then by conventional and organic
#
# The slices are produced from a single city list instead of one hand-written
# filter per city/type, so the city literal and the variable name cannot drift
# apart.
#
# NOTE(review): each slice is sorted by the 'date' column. If that column is
# still a string in M/D/YYYY form (as in the raw CSV), the sort is
# lexicographic rather than chronological - confirm it was converted to
# datetime before avo2018 was built.

# Cities as they appear in avo2018['city']. Spaces become underscores in
# variable names (e.g. 'Grand Rapids' -> Grand_Rapids_conv_data18).
_CITY_NAMES = (
    'Albany', 'Atlanta', 'Baltimore', 'Boise', 'Boston', 'Buffalo',
    'Charlotte', 'Chicago', 'Cincinnati', 'Columbus', 'Dallas', 'Denver',
    'Detroit', 'Grand Rapids', 'Harrisburg', 'Hartford', 'Houston',
    'Indianapolis', 'Jacksonville', 'Las Vegas', 'Los Angeles', 'Louisville',
    'Miami', 'Nashville', 'New Orleans', 'New York', 'Orlando',
    'Philadelphia', 'Phoenix', 'Pittsburgh', 'Portland', 'Raleigh',
    'Richmond', 'Roanoke', 'Sacramento', 'San Diego', 'San Francisco',
    'Seattle', 'Spokane', 'Syracuse', 'Tampa',
)


def _split_2018_by_city(frame, avocado_type, suffix):
    """Slice `frame` into one date-sorted DataFrame per city for one type.

    Parameters
    ----------
    frame : pandas.DataFrame
        Data with at least 'city', 'type' and 'date' columns.
    avocado_type : str
        Value matched against the 'type' column ('conventional' or 'organic').
    suffix : str
        Appended to the city prefix to form each key, e.g. '_conv_data18'.

    Returns
    -------
    dict
        Maps '<City_prefix><suffix>' to the rows of `frame` for that city and
        type, sorted by 'date'. A city with no matching rows gets an empty
        DataFrame.
    """
    # The type mask is identical for every city, so compute it once.
    type_mask = frame['type'] == avocado_type
    slices = {}
    for city in _CITY_NAMES:
        rows = frame.loc[(frame['city'] == city) & type_mask]
        slices[city.replace(' ', '_') + suffix] = rows.sort_values(by=['date'])
    return slices


# Conventional: binds Albany_conv_data18 ... Tampa_conv_data18
globals().update(_split_2018_by_city(avo2018, 'conventional', '_conv_data18'))

# Organic: binds Albany_org_data18 ... Tampa_org_data18
globals().update(_split_2018_by_city(avo2018, 'organic', '_org_data18'))


In [12]:
# Then we just need to create our feature data sets
#
# Every city/type frame is reduced to the same eight feature columns. The
# column list is written once and applied in a loop, so all 82 feature frames
# are guaranteed to share the same columns in the same order.
#
# NOTE(review): these columns presumably have to match (names and order) the
# ones the models were trained on - confirm against the cell that builds the
# training feature data.

# Cities that have 2018 slices. Spaces become underscores in variable names
# (e.g. 'Grand Rapids' -> Grand_Rapids_conv_feature_data18).
_CITY_NAMES = (
    'Albany', 'Atlanta', 'Baltimore', 'Boise', 'Boston', 'Buffalo',
    'Charlotte', 'Chicago', 'Cincinnati', 'Columbus', 'Dallas', 'Denver',
    'Detroit', 'Grand Rapids', 'Harrisburg', 'Hartford', 'Houston',
    'Indianapolis', 'Jacksonville', 'Las Vegas', 'Los Angeles', 'Louisville',
    'Miami', 'Nashville', 'New Orleans', 'New York', 'Orlando',
    'Philadelphia', 'Phoenix', 'Pittsburgh', 'Portland', 'Raleigh',
    'Richmond', 'Roanoke', 'Sacramento', 'San Diego', 'San Francisco',
    'Seattle', 'Spokane', 'Syracuse', 'Tampa',
)

# Feature columns selected from every 2018 slice.
_FEATURE_COLUMNS = ['total_volume', 'type_4046', 'type_4225', 'type_4770',
                    'total_bags', 'small_bags', 'large_bags', 'xlarge_bags']


def _select_2018_features(kind, namespace):
    """Build the 2018 feature frame of every city for one avocado type.

    Parameters
    ----------
    kind : str
        'conv' or 'org'. Selects which `<City>_<kind>_data18` frames are read.
    namespace : dict
        Mapping that holds those frames (the notebook's ``globals()``).

    Returns
    -------
    dict
        Maps '<City>_<kind>_feature_data18' to the corresponding 2018 frame
        restricted to `_FEATURE_COLUMNS`.

    Raises
    ------
    KeyError
        If a city's 2018 frame is missing from `namespace`, or a feature
        column is missing from a frame.
    """
    selected = {}
    for city in _CITY_NAMES:
        prefix = city.replace(' ', '_')
        data18 = namespace['{}_{}_data18'.format(prefix, kind)]
        selected['{}_{}_feature_data18'.format(prefix, kind)] = data18[_FEATURE_COLUMNS]
    return selected


# Conventional: binds Albany_conv_feature_data18 ... Tampa_conv_feature_data18
globals().update(_select_2018_features('conv', globals()))

# Organic: binds Albany_org_feature_data18 ... Tampa_org_feature_data18
globals().update(_select_2018_features('org', globals()))


In [13]:
# Now we can run our predictions against each city.
#
# For every city and avocado type, the city's linear-regression model
# (<City>_lr_<kind>) predicts on that city's 2018 feature frame
# (<City>_<kind>_feature_data18); both are defined in earlier cells.
# Each result is published back to the notebook namespace as
# <City>_<kind>_lr_prediction, where <kind> is 'conv' or 'org'.

_prediction_cities = [
    'Albany', 'Atlanta', 'Baltimore', 'Boise', 'Boston', 'Buffalo',
    'Charlotte', 'Chicago', 'Cincinnati', 'Columbus', 'Dallas', 'Denver',
    'Detroit', 'Grand_Rapids', 'Harrisburg', 'Hartford', 'Houston',
    'Indianapolis', 'Jacksonville', 'Las_Vegas', 'Los_Angeles', 'Louisville',
    'Miami', 'Nashville', 'New_Orleans', 'New_York', 'Orlando',
    'Philadelphia', 'Phoenix', 'Pittsburgh', 'Portland', 'Raleigh',
    'Richmond', 'Roanoke', 'Sacramento', 'San_Diego', 'San_Francisco',
    'Seattle', 'Spokane', 'Syracuse', 'Tampa',
]


def _predict_2018(kind):
    """Run every city's model for one avocado type and store the predictions.

    kind -- the tag used in the per-city variable names: 'conv' or 'org'.
    """
    notebook_vars = globals()
    for city in _prediction_cities:
        model = notebook_vars['{}_lr_{}'.format(city, kind)]
        features = notebook_vars['{}_{}_feature_data18'.format(city, kind)]
        # Same variable name the later cells read the predictions from.
        notebook_vars['{}_{}_lr_prediction'.format(city, kind)] = model.predict(features)


# Conventional
_predict_2018('conv')

# Organic
_predict_2018('org')

In [14]:
# Now we can see how they did.
#
# Store each city's predictions next to the actual values by adding them to
# the city's 2018 frame (<City>_<kind>_data18) as a 'LinearRegression' column.
# The frames are modified in place.
#
# NOTE(review): if the *_data18 frames were created as slices of a larger
# frame, this assignment can raise SettingWithCopyWarning -- confirm they
# were built with .copy().

_scored_cities = [
    'Albany', 'Atlanta', 'Baltimore', 'Boise', 'Boston', 'Buffalo',
    'Charlotte', 'Chicago', 'Cincinnati', 'Columbus', 'Dallas', 'Denver',
    'Detroit', 'Grand_Rapids', 'Harrisburg', 'Hartford', 'Houston',
    'Indianapolis', 'Jacksonville', 'Las_Vegas', 'Los_Angeles', 'Louisville',
    'Miami', 'Nashville', 'New_Orleans', 'New_York', 'Orlando',
    'Philadelphia', 'Phoenix', 'Pittsburgh', 'Portland', 'Raleigh',
    'Richmond', 'Roanoke', 'Sacramento', 'San_Diego', 'San_Francisco',
    'Seattle', 'Spokane', 'Syracuse', 'Tampa',
]


def _attach_predictions(kind):
    """Add the 'LinearRegression' column to every city's 2018 frame.

    kind -- the tag used in the per-city variable names: 'conv' or 'org'.
    """
    notebook_vars = globals()
    for city in _scored_cities:
        frame_2018 = notebook_vars['{}_{}_data18'.format(city, kind)]
        frame_2018['LinearRegression'] = notebook_vars['{}_{}_lr_prediction'.format(city, kind)]


# Conventional
_attach_predictions('conv')

# Organic
_attach_predictions('org')

In [15]:
# Spot check on one market: actual average price next to the
# LinearRegression prediction for organic avocados in Tampa

Tampa_org_data18.loc[:, ['date', 'average_price', 'LinearRegression']]

Unnamed: 0,date,average_price,LinearRegression
13857,2018-01-07,1.51,1.381491
13856,2018-01-14,1.53,1.434361
13855,2018-01-21,1.52,1.422363
13854,2018-01-28,1.61,1.595862
13853,2018-02-04,1.32,1.402296
13852,2018-02-11,1.34,1.357151
13851,2018-02-18,1.5,1.507428
13850,2018-02-25,1.37,1.352212
13849,2018-03-04,1.51,1.461235
13848,2018-03-11,1.31,1.338164


In [16]:
# Now we just need to combine all 2018 data into a single data set:
# every organic city frame first, then every conventional one, in city order.
# The index is reset so the stacked rows are numbered 0..n-1 instead of keeping
# each frame's original labels; drop=True avoids adding a new column holding
# the old index values.

_combined_cities = [
    'Albany', 'Atlanta', 'Baltimore', 'Boise', 'Boston', 'Buffalo',
    'Charlotte', 'Chicago', 'Cincinnati', 'Columbus', 'Dallas', 'Denver',
    'Detroit', 'Grand_Rapids', 'Harrisburg', 'Hartford', 'Houston',
    'Indianapolis', 'Jacksonville', 'Las_Vegas', 'Los_Angeles', 'Louisville',
    'Miami', 'Nashville', 'New_Orleans', 'New_York', 'Orlando',
    'Philadelphia', 'Phoenix', 'Pittsburgh', 'Portland', 'Raleigh',
    'Richmond', 'Roanoke', 'Sacramento', 'San_Diego', 'San_Francisco',
    'Seattle', 'Spokane', 'Syracuse', 'Tampa',
]


def _frames_2018(kind):
    """Return the <City>_<kind>_data18 frames for all cities, in list order."""
    return [globals()['{}_{}_data18'.format(city, kind)] for city in _combined_cities]


all2018_data = pd.concat(
    _frames_2018('org') + _frames_2018('conv'), axis=0
).reset_index(drop=True)

In [17]:
# Preview the combined 2018 data before exporting it to a file for import
# into our database.
# The index was already reset with reset_index(drop=True) when all2018_data
# was built, so the frame can be displayed as-is.

all2018_data

Unnamed: 0,date,average_price,total_volume,type_4046,type_4225,type_4770,total_bags,small_bags,large_bags,xlarge_bags,type,year,city,state,region,city_state,latitude,longitude,LinearRegression
0,2018-01-07,1.54,4816.90,43.51,412.17,0.00,4361.22,4357.89,3.33,0.00,organic,2018,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987,1.452374
1,2018-01-14,1.47,4140.95,7.30,301.87,0.00,3831.78,3831.78,0.00,0.00,organic,2018,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987,1.512131
2,2018-01-21,1.54,3346.54,14.67,253.01,0.00,3078.86,3078.86,0.00,0.00,organic,2018,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987,1.605408
3,2018-01-28,1.32,6987.56,433.66,374.96,0.00,6178.94,6178.94,0.00,0.00,organic,2018,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987,1.372756
4,2018-02-04,1.52,4124.96,118.38,420.36,0.00,3586.22,3586.22,0.00,0.00,organic,2018,Albany,NY,Northeast,"Albany, NY",42.6664,-73.7987,1.559849
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
979,2018-02-25,1.30,484876.62,308452.46,39379.53,1251.31,135793.32,96039.07,39654.25,100.00,conventional,2018,Tampa,FL,Southeast,"Tampa, FL",27.9942,-82.4451,1.077815
980,2018-03-04,1.14,597351.68,372631.01,48784.93,1465.95,174469.79,88569.48,85746.97,153.34,conventional,2018,Tampa,FL,Southeast,"Tampa, FL",27.9942,-82.4451,0.977224
981,2018-03-11,1.16,580771.43,372746.58,45277.75,1442.66,161304.44,92677.26,68493.85,133.33,conventional,2018,Tampa,FL,Southeast,"Tampa, FL",27.9942,-82.4451,0.997285
982,2018-03-18,1.13,574380.46,372785.73,43017.73,1301.33,157275.67,93201.11,63924.56,150.00,conventional,2018,Tampa,FL,Southeast,"Tampa, FL",27.9942,-82.4451,0.997791


In [18]:
# We can also combine our new 2018 data with the old data.
# NOTE(review): rows from other years will presumably have NaN in
# 'LinearRegression', since only the 2018 frames were given that column here
# -- confirm that is what the downstream consumer expects.

# Keep every row of the source data that is not from 2018
no2018 = avodatafile[avodatafile['year'].ne(2018)].reset_index(drop=True)

# Append the 2018 rows that carry predictions, renumbering the index 0..n-1
alldata = pd.concat([no2018, all2018_data], ignore_index=True)

In [19]:
# Write the combined data set to a CSV file.
# index=False leaves the row index out of the file.

output_csv = 'avo_data_withlr.csv'
alldata.to_csv(output_csv, index=False)