# WeatherPy
----



In [1]:
# Dependencies and Setup
import json
import time
from pathlib import Path

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Where the collected city weather table is exported (CSV)
output_data_file = "../output_data/cities.csv"

# (min, max) bounds used when drawing random latitudes and longitudes
lat_range, lng_range = (-90, 90), (-180, 180)

## Generate Cities List

In [6]:
# Draw 1500 random latitudes, then 1500 random longitudes, within the configured bounds
lats = np.random.uniform(*lat_range, size=1500)
lngs = np.random.uniform(*lng_range, size=1500)
lat_lngs = zip(lats, lngs)

# Look up the nearest city for every coordinate pair. Feeding the names through
# dict keys drops repeats while keeping the order in which each city first appeared.
nearest_names = (
    citipy.nearest_city(latitude, longitude).city_name
    for latitude, longitude in lat_lngs
)
cities = list(dict.fromkeys(nearest_names))

# Show the number of unique cities to confirm the sample is large enough
len(cities)


591

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [8]:
# Save url information (HTTPS so the API key is not sent over the network in clear text)
url = "https://api.openweathermap.org/data/2.5/weather?"

# Build query URL
# NOTE(review): no "units" parameter is sent, so the API's default unit system
# applies (the recorded Max Temp values look like Kelvin) -- confirm this is
# what the later plots and "mph" headings expect.
query_url = url + "appid=" + weather_api_key + "&q="

# Seconds to wait for a single response before giving up on that city
request_timeout = 10

# Get weather data for all the random cities, generated in the list cities.

# Parallel lists: position i in every list describes the same city
city_name = []
lat = []
long = []
max_temp = []
humidity = []
cloudines = []
wind_speed = []
country = []
date = []


print("--------------------------")
print("Beginning Data Retrieval  ")
print("--------------------------")

# Creating counts
Record_count = 0
myset_count = 1

for city in cities:
    try:
        weather_json = requests.get(query_url + city, timeout=request_timeout).json()
        # Read every field BEFORE appending anything: if any key is missing the
        # whole city is skipped and the lists above stay the same length, which
        # the DataFrame construction later relies on.
        record = (
            weather_json["name"],
            weather_json["coord"]["lat"],
            weather_json["coord"]["lon"],
            weather_json["main"]["temp_max"],
            weather_json["main"]["humidity"],
            weather_json["clouds"]["all"],
            weather_json["wind"]["speed"],
            weather_json["sys"]["country"],
            weather_json["dt"],
        )
    except KeyError:
        # The response did not contain the expected weather fields
        print("City not found. Skipping...")
        continue
    except (requests.exceptions.RequestException, ValueError) as error:
        # Network failure, timeout, or a body that is not valid JSON. Only the
        # exception type is printed because the full message can include the
        # request URL, and with it the API key.
        print(f"Request failed for {city} ({type(error).__name__}). Skipping...")
        continue

    (name, city_lat, city_lng, temp_max, city_humidity,
     clouds, wind, country_code, timestamp) = record
    city_name.append(name)
    lat.append(city_lat)
    long.append(city_lng)
    max_temp.append(temp_max)
    humidity.append(city_humidity)
    cloudines.append(clouds)
    wind_speed.append(wind)
    country.append(country_code)
    date.append(timestamp)

    Record_count += 1
    print(f"Processing Record {Record_count} of Set {myset_count} | {city}")

    # After every 50 stored records, pause for 60 seconds so the run stays under
    # the 60 requests-per-minute limit. Skipped cities are not counted here, so
    # slightly more than 50 requests can be sent between pauses.
    if Record_count == 50:
        time.sleep(60)
        Record_count = 0
        myset_count += 1

print("--------------------------")
print("Data Retrieval Complete")
print("--------------------------")
              


--------------------------
Beginning Data Retrieval  
--------------------------
Processing Record 1 of Set 1 | batagay
Processing Record 2 of Set 1 | hithadhoo
Processing Record 3 of Set 1 | horizontina
Processing Record 4 of Set 1 | amga
Processing Record 5 of Set 1 | busselton
Processing Record 6 of Set 1 | esperance
City not found. Skipping...
Processing Record 7 of Set 1 | port elizabeth
Processing Record 8 of Set 1 | hermanus
Processing Record 9 of Set 1 | klyuchevskiy
Processing Record 10 of Set 1 | palatka
Processing Record 11 of Set 1 | saldanha
Processing Record 12 of Set 1 | vaini
Processing Record 13 of Set 1 | albany
Processing Record 14 of Set 1 | severo-kurilsk
Processing Record 15 of Set 1 | ushuaia
Processing Record 16 of Set 1 | punta arenas
Processing Record 17 of Set 1 | butaritari
Processing Record 18 of Set 1 | cockburn town
Processing Record 19 of Set 1 | rikitea
Processing Record 20 of Set 1 | kondinskoye
Processing Record 21 of Set 1 | anchorage
Processing Reco

Processing Record 37 of Set 4 | andrews
Processing Record 38 of Set 4 | dongsheng
Processing Record 39 of Set 4 | mikuni
Processing Record 40 of Set 4 | balkanabat
City not found. Skipping...
Processing Record 41 of Set 4 | college
Processing Record 42 of Set 4 | batemans bay
Processing Record 43 of Set 4 | auchi
Processing Record 44 of Set 4 | praia da vitoria
Processing Record 45 of Set 4 | lagoa
Processing Record 46 of Set 4 | fortuna
Processing Record 47 of Set 4 | sorland
Processing Record 48 of Set 4 | san pedro
Processing Record 49 of Set 4 | santa rosa
Processing Record 50 of Set 4 | portland
Processing Record 1 of Set 5 | upernavik
Processing Record 2 of Set 5 | saulkrasti
Processing Record 3 of Set 5 | severnyy
Processing Record 4 of Set 5 | sri aman
Processing Record 5 of Set 5 | los llanos de aridane
Processing Record 6 of Set 5 | guerrero negro
Processing Record 7 of Set 5 | banda aceh
Processing Record 8 of Set 5 | the valley
Processing Record 9 of Set 5 | terrace bay
Pro

Processing Record 28 of Set 8 | mehtar lam
Processing Record 29 of Set 8 | kahului
Processing Record 30 of Set 8 | mizdah
Processing Record 31 of Set 8 | tuy hoa
Processing Record 32 of Set 8 | talnakh
Processing Record 33 of Set 8 | ancud
Processing Record 34 of Set 8 | inuvik
Processing Record 35 of Set 8 | tahta
Processing Record 36 of Set 8 | husavik
Processing Record 37 of Set 8 | hadejia
City not found. Skipping...
Processing Record 38 of Set 8 | wattegama
Processing Record 39 of Set 8 | mukhtolovo
Processing Record 40 of Set 8 | retalhuleu
Processing Record 41 of Set 8 | kissidougou
Processing Record 42 of Set 8 | bilma
Processing Record 43 of Set 8 | hasaki
Processing Record 44 of Set 8 | kiama
Processing Record 45 of Set 8 | buraydah
Processing Record 46 of Set 8 | abalak
Processing Record 47 of Set 8 | spirit river
Processing Record 48 of Set 8 | kununurra
Processing Record 49 of Set 8 | kirchheim
Processing Record 50 of Set 8 | osorno
Processing Record 1 of Set 9 | gutierrez

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [9]:
# Pair each column label with the list collected for it during retrieval,
# then build the table in one go (column order follows the label order).
data_df = pd.DataFrame(
    dict(
        zip(
            ["City", "Lat", "Lng", "Max Temp", "Humidity",
             "Cloudiness", "Wind Speed", "Country", "Date"],
            [city_name, lat, long, max_temp, humidity,
             cloudines, wind_speed, country, date],
        )
    )
)
data_df

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Batagay,67.63,134.63,284.19,65,3,1.65,RU,1596913712
1,Hithadhoo,-0.60,73.08,301.36,81,21,5.28,MV,1596913740
2,Horizontina,-27.63,-54.31,297.00,62,0,2.62,BR,1596913740
3,Amga,60.90,131.96,284.93,64,18,0.20,RU,1596913740
4,Busselton,-33.65,115.33,289.26,68,100,3.58,AU,1596913740
...,...,...,...,...,...,...,...,...,...
545,Buala,-8.14,159.59,299.16,83,100,2.41,SB,1596914380
546,Port Keats,-14.25,129.55,292.12,34,40,4.35,AU,1596914380
547,Codrington,-38.27,141.97,283.43,84,18,7.14,AU,1596914380
548,Kortkeros,61.81,51.58,287.15,93,20,1.00,RU,1596914380


In [10]:
# Create the output folder if it is missing; to_csv does not create parent
# directories, so the export would otherwise fail on a fresh checkout.
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)

# Export the city data to CSV
data_df.to_csv(output_data_file)

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


In [None]:
# Extract relevant fields from the data frame


# Export the City_Data into a csv


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

In [None]:
# OPTIONAL: Create a function to create Linear Regression plots

In [None]:
# Create Northern and Southern Hemisphere DataFrames

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression