In [1]:
import matplotlib.pyplot as plt
import pandas as pd
import scipy.stats as st
import numpy as np
from scipy.stats import linregress
import locale

In [4]:
# Location of the raw mountain elevation dataset (relative to the notebook)
mountain_elevation_data = "data/mountain_elevation.csv"

# Load the CSV into a DataFrame and display it as the cell output
mountain_elevation = pd.read_csv(filepath_or_buffer=mountain_elevation_data)
mountain_elevation


Unnamed: 0,State,Mountain_Name,Elevation,Latitude / Longitude
0,Alabama,Cheaha Mountain,726 m,33.486 / -85.809
1,Alabama,Talladega Mountain,715 m,33.458 / -85.812
2,Alabama,Odum Point,714 m,33.416 / -85.831
3,Alabama,Hernandez Peak,703 m,33.458 / -85.813
4,Alabama,Bald Rock,696 m,33.495 / -85.808
...,...,...,...,...
505,DC,Mount Hamilton,71 m,38.909 / -76.975
506,DC,Bunker Hill,71 m,38.935 / -76.988
507,DC,Soapstone Valley,65 m,38.948 / -77.065
508,DC,Lees Hill,63 m,38.913 / -77.066


In [5]:
# Strip the trailing unit ("m") from the Elevation column, e.g. "726 m" -> "726".
#
# The pattern is anchored to the end of the string, so only an actual unit
# suffix is removed. Compared with slicing off the last character, this:
#   * leaves no trailing space behind ("726 m" used to become "726 "),
#   * keeps missing values missing instead of turning them into the text "na",
#   * is safe to re-run: a second execution is a no-op rather than chopping a
#     digit off every value.
mountain_elevation['Elevation'] = (
    mountain_elevation['Elevation']
    .str.replace(r'\s*m\s*$', '', regex=True)
    .str.strip()
)
mountain_elevation

Unnamed: 0,State,Mountain_Name,Elevation,Latitude / Longitude
0,Alabama,Cheaha Mountain,726,33.486 / -85.809
1,Alabama,Talladega Mountain,715,33.458 / -85.812
2,Alabama,Odum Point,714,33.416 / -85.831
3,Alabama,Hernandez Peak,703,33.458 / -85.813
4,Alabama,Bald Rock,696,33.495 / -85.808
...,...,...,...,...
505,DC,Mount Hamilton,71,38.909 / -76.975
506,DC,Bunker Hill,71,38.935 / -76.988
507,DC,Soapstone Valley,65,38.948 / -77.065
508,DC,Lees Hill,63,38.913 / -77.066


In [8]:
# Split the combined "Latitude / Longitude" text at the first "/" (n=1);
# expand=True returns the two parts as columns 0 and 1 of a helper frame.
new = mountain_elevation["Latitude / Longitude"].str.split("/", n=1, expand=True)

# The source values look like "33.486 / -85.809", so each part still carries
# the space that surrounded the slash; strip it so the columns hold clean text.
mountain_elevation["Latitude"] = new[0].str.strip()
mountain_elevation["Longitude"] = new[1].str.strip()

# Drop the original combined column now that it has been split in two.
mountain_elevation.drop(columns=["Latitude / Longitude"], inplace=True)

# Display the updated DataFrame
mountain_elevation

Unnamed: 0,State,Mountain_Name,Elevation,Latitude,Longitude
0,Alabama,Cheaha Mountain,726,33.486,-85.809
1,Alabama,Talladega Mountain,715,33.458,-85.812
2,Alabama,Odum Point,714,33.416,-85.831
3,Alabama,Hernandez Peak,703,33.458,-85.813
4,Alabama,Bald Rock,696,33.495,-85.808
...,...,...,...,...,...
505,DC,Mount Hamilton,71,38.909,-76.975
506,DC,Bunker Hill,71,38.935,-76.988
507,DC,Soapstone Valley,65,38.948,-77.065
508,DC,Lees Hill,63,38.913,-77.066


In [9]:
# Inspect the dtype of each column in the DataFrame.
mountain_elevation.dtypes

State            object
Mountain_Name    object
Elevation        object
Latitude         object
Longitude        object
dtype: object

In [15]:
# Remove thousands separators (",") from the Elevation text so that every
# value is a plain run of digits.
elevation_text = mountain_elevation['Elevation']
mountain_elevation['Elevation'] = elevation_text.str.replace(',', '', regex=False)
mountain_elevation


Unnamed: 0,State,Mountain_Name,Elevation,Latitude,Longitude
0,Alabama,Cheaha Mountain,726,33.486,-85.809
1,Alabama,Talladega Mountain,715,33.458,-85.812
2,Alabama,Odum Point,714,33.416,-85.831
3,Alabama,Hernandez Peak,703,33.458,-85.813
4,Alabama,Bald Rock,696,33.495,-85.808
...,...,...,...,...,...
505,DC,Mount Hamilton,71,38.909,-76.975
506,DC,Bunker Hill,71,38.935,-76.988
507,DC,Soapstone Valley,65,38.948,-77.065
508,DC,Lees Hill,63,38.913,-77.066


In [16]:
# Preview up to the first 50 rows of the DataFrame.
mountain_elevation.head(50)

Unnamed: 0,State,Mountain_Name,Elevation,Latitude,Longitude
0,Alabama,Cheaha Mountain,726,33.486,-85.809
1,Alabama,Talladega Mountain,715,33.458,-85.812
2,Alabama,Odum Point,714,33.416,-85.831
3,Alabama,Hernandez Peak,703,33.458,-85.813
4,Alabama,Bald Rock,696,33.495,-85.808
5,Alabama,Parker High Point,667,33.416,-85.825
6,Alabama,Big Caney Head,648,33.413,-85.834
7,Alabama,McDill Point,648,33.454,-85.822
8,Alabama,Rock Garden,636,33.482,-85.815
9,Alabama,Morton Hill,628,33.693,-85.739


In [18]:

# Convert the three measurement columns from text to floating-point numbers,
# one column at a time, then display the frame.
for numeric_col in ("Elevation", "Latitude", "Longitude"):
    mountain_elevation[numeric_col] = mountain_elevation[numeric_col].astype(float)
mountain_elevation

Unnamed: 0,State,Mountain_Name,Elevation,Latitude,Longitude
0,Alabama,Cheaha Mountain,726.0,33.486,-85.809
1,Alabama,Talladega Mountain,715.0,33.458,-85.812
2,Alabama,Odum Point,714.0,33.416,-85.831
3,Alabama,Hernandez Peak,703.0,33.458,-85.813
4,Alabama,Bald Rock,696.0,33.495,-85.808
...,...,...,...,...,...
505,DC,Mount Hamilton,71.0,38.909,-76.975
506,DC,Bunker Hill,71.0,38.935,-76.988
507,DC,Soapstone Valley,65.0,38.948,-77.065
508,DC,Lees Hill,63.0,38.913,-77.066


In [19]:
# Re-check the dtype of each column after the float conversion in the previous cell.
mountain_elevation.dtypes

State             object
Mountain_Name     object
Elevation        float64
Latitude         float64
Longitude        float64
dtype: object

In [20]:
# Export the cleaned DataFrame to a CSV file.
# A forward-slash path is used so the file lands inside the data/ directory on
# every platform (Windows accepts "/" as well); with a backslash, non-Windows
# systems treat the whole string as a single file name in the working
# directory. The DataFrame index is still written as the first column, as
# before (to_csv default).
mountain_elevation.to_csv('data/mountain_elevation_final.csv')