# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [29]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress
import json

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

url = "http://api.openweathermap.org/data/2.5/weather?q="
appid = "&appid="
city_df = []

## Generate Cities List

In [30]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

642

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [31]:
# loop thru (cities) and print each name/id
counter = 1

country= []
cityn = []
lats = []
lngs = []
temps = []
max_temps = []
humidities = []
clouds = []
winds = []

for cityname in cities:
    if counter < 500:
        try:
            query_url = url + cityname + appid + weather_api_key
            city_request = requests.get(query_url).json()
            city_name = city_request['name']
            city_lat = city_request['coord']['lat']
            city_long = city_request['coord']['lon']
            city_temp = city_request['main']['temp']
            city_max = city_request['main']['temp_max']
            city_hum = city_request['main']['humidity']
            city_cloud = city_request['clouds']['all']
            city_wind = city_request['wind']['speed']
            # get country info
            country_info = city_request['sys']['country']
            # append city name
            cityn.append(city_name)
            # append country info
            country.append(country_info)
            lats.append(city_lat)
            lngs.append(city_long)
            temps.append(city_temp)
            max_temps.append(city_max)
            humidities.append(city_hum)
            clouds.append(city_cloud)
            winds.append(city_wind)
            print("city name is " + str(city_name) + " and the position is: " + str(counter))
            counter = counter + 1
        except:
            break

city name is Kiryat Gat and the position is: 1
city name is Vaini and the position is: 2
city name is Osorno and the position is: 3
city name is Albany and the position is: 4
city name is Nikolskoye and the position is: 5
city name is Mahébourg and the position is: 6
city name is Hermanus and the position is: 7
city name is Bambous Virieux and the position is: 8
city name is Port Alfred and the position is: 9
city name is Khatanga and the position is: 10
city name is Carnarvon and the position is: 11
city name is Esperance and the position is: 12
city name is New Norfolk and the position is: 13
city name is Hobart and the position is: 14
city name is Mumford and the position is: 15
city name is Bredasdorp and the position is: 16
city name is Shimoda and the position is: 17
city name is Campina Verde and the position is: 18
city name is Saint Paul Harbor and the position is: 19
city name is Oistins and the position is: 20
city name is Marzuq and the position is: 21
city name is Providen

In [32]:
lats

[31.61,
 -21.2,
 -40.5667,
 42.6001,
 59.7035,
 -20.4081,
 -34.4187,
 -20.3428,
 -33.5906,
 71.9667,
 -24.8667,
 -33.8667,
 -42.7826,
 -42.8794,
 5.2618,
 -34.5322,
 34.6667,
 -19.5356,
 57.79,
 13.0667,
 14.4,
 64.3833,
 -41.8697,
 66.8333,
 64.5667,
 44.1667,
 33.0833,
 -37.6167,
 -21.2078,
 -0.7393,
 -14.9003,
 39.2446,
 57.4167]

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [33]:
# api call template: api.openweathermap.org/data/2.5/weather?q={city name}&appid={API key}
#sample call for city yellowknife

#.append not adding
#no .append results in single float point

city_df = []

        

city_df = {
    'country' : country,
           'cityn' : cityn,
    'lats' : lats,
    'lngs' : lngs,
    "temps" : temps,
    'max_temps' : max_temps,
    'humidities' : humidities,
    'clouds' : clouds,
    'winds' : winds
               
} 
city_df





{'country': ['IL',
  'TO',
  'CL',
  'US',
  'RU',
  'MU',
  'ZA',
  'MU',
  'ZA',
  'RU',
  'AU',
  'AU',
  'AU',
  'AU',
  'GH',
  'ZA',
  'JP',
  'BR',
  'US',
  'BB',
  'YE',
  'RU',
  'CL',
  'RU',
  'RU',
  'KZ',
  'PT',
  'CL',
  'CK',
  'EC',
  'MG',
  'TM',
  'LV'],
 'cityn': ['Kiryat Gat',
  'Vaini',
  'Osorno',
  'Albany',
  'Nikolskoye',
  'Mahébourg',
  'Hermanus',
  'Bambous Virieux',
  'Port Alfred',
  'Khatanga',
  'Carnarvon',
  'Esperance',
  'New Norfolk',
  'Hobart',
  'Mumford',
  'Bredasdorp',
  'Shimoda',
  'Campina Verde',
  'Saint Paul Harbor',
  'Oistins',
  'Marzuq',
  'Provideniya',
  'Ancud',
  'Yar-Sale',
  'Ust-Nera',
  'Shīeli',
  'Camacha',
  'Lebu',
  'Avarua',
  'Puerto Ayora',
  'Antalaha',
  'Bereket',
  'Alūksne'],
 'lats': [31.61,
  -21.2,
  -40.5667,
  42.6001,
  59.7035,
  -20.4081,
  -34.4187,
  -20.3428,
  -33.5906,
  71.9667,
  -24.8667,
  -33.8667,
  -42.7826,
  -42.8794,
  5.2618,
  -34.5322,
  34.6667,
  -19.5356,
  57.79,
  13.0667,
  14.

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

AttributeError: 'dict' object has no attribute 'head'

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


In [36]:

#export to csv 
city_df.to_csv(output_data_file)


AttributeError: 'dict' object has no attribute 'to_csv'

## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

In [37]:
city_df["latn"] = np.where(city_df.OUTCOME > 0, city_df.OUTCOME, 0)
city_df["lats"] = np.where(city_df.OUTCOME < 0, - city_df.OUTCOME, 0) 


city_df.plot.scatter(x='lat', y='temp' )
AxesSubplot:xlabel='Latitude', ylabel='Temperature'


SyntaxError: invalid syntax (<ipython-input-37-b3b74c701d08>, line 6)

## Latitude vs. Humidity Plot

In [38]:
city_df.plot.scatter(x='lat', y='humidity' )
AxesSubplot:xlabel='Latitude', ylabel='Humidity'
    

SyntaxError: invalid syntax (<ipython-input-38-04b5109522d0>, line 2)

## Latitude vs. Cloudiness Plot

In [None]:
city_df.plot.scatter(x='lat', y='all' )
AxesSubplot:xlabel='Latitude', ylabel='Cloudiness'

## Latitude vs. Wind Speed Plot

In [None]:
city_df.plot.scatter(x='lat', y='speed' )
AxesSubplot:xlabel='Latitude', ylabel='Wind Speed'

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
x_value = city_df['temp_max']
y_value = city_df['latn'] 
                       
(slope, intercept, rvalue, pvalue, std)= linregress(x_value, y_value)
regress_value =  x_value * slope + intercept   
line_eq = "y= " + str(slope) + "x " + str(intercept)
plt.scatter(x_value, y_value)
plt.xlabel("Max Temp")
plt.ylabel("Latitude")
plt.plot(x_value, regress_value)
print("the correlation coefficient is " + str(rvalue))
print("the r squared value is " + str(rvalue**2))
plt.show()

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

In [None]:
x_value = city_df['temp_max']
y_value = city_df['lats'] 
                       
(slope, intercept, rvalue, pvalue, std)= linregress(x_value, y_value)
regress_value =  x_value * slope + intercept   
line_eq = "y= " + str(slope) + "x " + str(intercept)
plt.scatter(x_value, y_value)
plt.xlabel("Max Temp")
plt.ylabel("Latitude")
plt.plot(x_value, regress_value)
print("the correlation coefficient is " + str(rvalue))
print("the r squared value is " + str(rvalue**2))
plt.show()

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
x_value = city_df['humidity']
y_value = city_df['latn'] 
                       
(slope, intercept, rvalue, pvalue, std)= linregress(x_value, y_value)
regress_value =  x_value * slope + intercept   
line_eq = "y= " + str(slope) + "x " + str(intercept)
plt.scatter(x_value, y_value)
plt.xlabel("Humidity")
plt.ylabel("Latitude")
plt.plot(x_value, regress_value)
print("the correlation coefficient is " + str(rvalue))
print("the r squared value is " + str(rvalue**2))
plt.show()

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

In [None]:
x_value = city_df['humidity']
y_value = city_df['lats'] 
                       
(slope, intercept, rvalue, pvalue, std)= linregress(x_value, y_value)
regress_value =  x_value * slope + intercept   
line_eq = "y= " + str(slope) + "x " + str(intercept)
plt.scatter(x_value, y_value)
plt.xlabel("Humidity")
plt.ylabel("Latitude")
plt.plot(x_value, regress_value)
print("the correlation coefficient is " + str(rvalue))
print("the r squared value is " + str(rvalue**2))
plt.show()

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
x_value = city_df['all']
y_value = city_df['latn'] 
                       
(slope, intercept, rvalue, pvalue, std)= linregress(x_value, y_value)
regress_value =  x_value * slope + intercept   
line_eq = "y= " + str(slope) + "x " + str(intercept)
plt.scatter(x_value, y_value)
plt.xlabel("Cloudiness")
plt.ylabel("Latitude")
plt.plot(x_value, regress_value)
print("the correlation coefficient is " + str(rvalue))
print("the r squared value is " + str(rvalue**2))
plt.show()

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

In [None]:
x_value = city_df['all']
y_value = city_df['lats'] 
                       
(slope, intercept, rvalue, pvalue, std)= linregress(x_value, y_value)
regress_value =  x_value * slope + intercept   
line_eq = "y= " + str(slope) + "x " + str(intercept)
plt.scatter(x_value, y_value)
plt.xlabel("Cloudiness")
plt.ylabel("Latitude")
plt.plot(x_value, regress_value)
print("the correlation coefficient is " + str(rvalue))
print("the r squared value is " + str(rvalue**2))
plt.show()

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
x_value = city_df['speed']
y_value = city_df['latn'] 
                       
(slope, intercept, rvalue, pvalue, std)= linregress(x_value, y_value)
regress_value =  x_value * slope + intercept   
line_eq = "y= " + str(slope) + "x " + str(intercept)
plt.scatter(x_value, y_value)
plt.xlabel("Wind Speed")
plt.ylabel("Latitude")
plt.plot(x_value, regress_value)
print("the correlation coefficient is " + str(rvalue))
print("the r squared value is " + str(rvalue**2))
plt.show()

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

In [None]:
x_value = city_df['speed']
y_value = city_df['lats'] 
                       
(slope, intercept, rvalue, pvalue, std)= linregress(x_value, y_value)
regress_value =  x_value * slope + intercept   
line_eq = "y= " + str(slope) + "x " + str(intercept)
plt.scatter(x_value, y_value)
plt.xlabel("Wind Speed")
plt.ylabel("Latitude")
plt.plot(x_value, regress_value)
print("the correlation coefficient is " + str(rvalue))
print("the r squared value is " + str(rvalue**2))
plt.show()