# Temperature Population Sea Level and Emissions
### Notebook to combine .csv datasets into one sqlite database for Project 2

In [30]:
# Dependencies and Setup
import pandas as pd
import numpy as np
pd.set_option('display.max_rows', 500)
pd.set_option('display.max_columns', 500)
pd.set_option('display.width', 1000)

# File to Load  
temperature_data_to_load = "data/temp_data.csv"
population_data_to_load = "data/population_data.csv"
sealevel_data_to_load = "data/sealevel_data.csv"
co2_data_to_load = "data/CO2_data.csv"

# Read Data  
temperature_data = pd.read_csv(temperature_data_to_load)
population_data = pd.read_csv(population_data_to_load)
sealevel_data = pd.read_csv(sealevel_data_to_load)
co2_data = pd.read_csv(co2_data_to_load)


In [31]:
temperature_data.head(5)

Unnamed: 0,Year,LandAndOceanAverageTemperature,LandAndOceanAverageTemperatureUncertainty
0,1993,15.466417,0.059167
1,1994,15.535,0.058583
2,1995,15.637833,0.060417
3,1996,15.524667,0.0595
4,1997,15.713833,0.059167


In [32]:
population_data.head(5)

Unnamed: 0.1,Unnamed: 0,year,population_millions
0,0,1993,5581597.598
1,1,1994,5663150.428
2,2,1995,5744212.93
3,3,1996,5824891.931
4,4,1997,5905045.647


In [33]:
sealevel_data.head(5)

Unnamed: 0,Year,GMSL
0,1993,90.471622
1,1994,89.516216
2,1995,87.334722
3,1996,85.473243
4,1997,99.442432


In [34]:
co2_data.head(5)

Unnamed: 0,Year,CO2_emissions_tons_per_capita
0,1993,869.636645
1,1994,863.100924
2,1995,858.225479
3,1996,859.062572
4,1997,867.379574


In [35]:
import matplotlib.pyplot as plt
from glob import glob


In [36]:
climate_files = sorted(glob('data/*_data.csv'))

In [37]:
climate_files

['data\\CO2_data.csv',
 'data\\population_data.csv',
 'data\\sealevel_data.csv',
 'data\\temp_data.csv']

In [38]:
climate_combined = pd.concat((pd.read_csv(file).assign(filename = file)
          for file in climate_files), sort= True, ignore_index = True) 

In [39]:
climate_combined

Unnamed: 0.1,CO2_emissions_tons_per_capita,GMSL,LandAndOceanAverageTemperature,LandAndOceanAverageTemperatureUncertainty,Unnamed: 0,Year,filename,population_millions,year
0,869.636645,,,,,1993.0,data\CO2_data.csv,,
1,863.100924,,,,,1994.0,data\CO2_data.csv,,
2,858.225479,,,,,1995.0,data\CO2_data.csv,,
3,859.062572,,,,,1996.0,data\CO2_data.csv,,
4,867.379574,,,,,1997.0,data\CO2_data.csv,,
5,866.162913,,,,,1998.0,data\CO2_data.csv,,
6,854.147358,,,,,1999.0,data\CO2_data.csv,,
7,878.764146,,,,,2000.0,data\CO2_data.csv,,
8,888.096012,,,,,2001.0,data\CO2_data.csv,,
9,884.272209,,,,,2002.0,data\CO2_data.csv,,


In [21]:
climate_combined.columns

Index(['CO2_emissions_tons_per_capita', 'GMSL', 'LandAndOceanAverageTemperature', 'LandAndOceanAverageTemperatureUncertainty', 'Unnamed: 0', 'Year', 'filename', 'population_millions', 'year'], dtype='object')

In [29]:
climate_data = climate_combined

climate_data.rename(columns={'Year':'year',  
                              'Avg Temp':'LandAndOceanAverageTemperature',
                             'Emissions':'CO2_emissions_tons_per_capita',
                             'GMSL':'Avg GMSL',
                             'Avg Population in mil':'population_millions'} )
climate_data

Unnamed: 0.1,CO2_emissions_tons_per_capita,GMSL,LandAndOceanAverageTemperature,LandAndOceanAverageTemperatureUncertainty,Unnamed: 0,Year,filename,population_millions,year
0,869.636645,,,,,1993.0,data\CO2_data.csv,,
1,863.100924,,,,,1994.0,data\CO2_data.csv,,
2,858.225479,,,,,1995.0,data\CO2_data.csv,,
3,859.062572,,,,,1996.0,data\CO2_data.csv,,
4,867.379574,,,,,1997.0,data\CO2_data.csv,,
5,866.162913,,,,,1998.0,data\CO2_data.csv,,
6,854.147358,,,,,1999.0,data\CO2_data.csv,,
7,878.764146,,,,,2000.0,data\CO2_data.csv,,
8,888.096012,,,,,2001.0,data\CO2_data.csv,,
9,884.272209,,,,,2002.0,data\CO2_data.csv,,


In [23]:

climate_data

Unnamed: 0.1,CO2_emissions_tons_per_capita,GMSL,LandAndOceanAverageTemperature,LandAndOceanAverageTemperatureUncertainty,Unnamed: 0,Year,filename,population_millions,year
0,869.636645,,,,,1993.0,data\CO2_data.csv,,
1,863.100924,,,,,1994.0,data\CO2_data.csv,,
2,858.225479,,,,,1995.0,data\CO2_data.csv,,
3,859.062572,,,,,1996.0,data\CO2_data.csv,,
4,867.379574,,,,,1997.0,data\CO2_data.csv,,
5,866.162913,,,,,1998.0,data\CO2_data.csv,,
6,854.147358,,,,,1999.0,data\CO2_data.csv,,
7,878.764146,,,,,2000.0,data\CO2_data.csv,,
8,888.096012,,,,,2001.0,data\CO2_data.csv,,
9,884.272209,,,,,2002.0,data\CO2_data.csv,,


In [None]:
climate_data .to_csv(r'data\combinedclimatedata.csv', index = False)
