# WeatherPy
----


In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import API key
#I had a ModuleError here until I figure out they have to be on the same folder 
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [2]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

641

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [None]:
#Based on one query, I checked the key values 
# query = query_url + "London"
# response_json = requests.get(query).json()
    
# city = response_json["name"]
# lng = response_json["coord"]["lon"]
# lat = response_json["coord"]["lat"]
# max_temp = response_json["main"]["temp_max"]
# humidity = response_json["main"]["humidity"]
# cloudiness = response_json["clouds"]["all"]
# wind_speed = response_json["wind"]["speed"]
# country = response_json["sys"]["country"]
# date = response_json["dt"]

# print(f"Info on each city:{city}, {city},{lng},{lat},{max_temp},{humidity},{cloudiness},{wind_speed},{country}, {date} ")


In [3]:
#QUERY URL 

url = "http://api.openweathermap.org/data/2.5/weather?"
units = "imperial"

# Build partial query URL
query_url = f"{url}appid={weather_api_key}&units={units}&q="


In [4]:
#empty lists for all my city values 

city = []
lat = []
lng = []
max_temp = []
humidity = []
cloudiness = []
wind_speed = []
country = []
date = []

#Printing message values 
set_count = 1
city_count = 0 


print("Beginning Data Retrieval\n-------------------------")

#Loop through each city
for search in cities:
    
    # Create search query, make request and store in json
    query = query_url + search
    response = requests.get(query)
    response_json = response.json()
    
    # Getting all the data from the cities the API can find 
    try:
        city_count += 1
        city.append(response_json["name"])
        lat.append(response_json["coord"]["lat"])
        lng.append(response_json["coord"]["lon"])
        max_temp.append(response_json["main"]["temp_max"])
        humidity.append(response_json["main"]["humidity"])
        cloudiness.append(response_json["clouds"]["all"])
        wind_speed.append(response_json["wind"]["speed"])
        country.append(response_json["sys"]["country"])
        date.append(response_json["dt"])
        
        print(f"Processing Record {city_count} of Set {set_count}| {search} ")

        
    # Handle exceptions for cities not found 
    except KeyError: 
        print("City not found. Skipping...")
    
    #On the starter book, every set has 50 api calls. 
    #Indicating the set number and reseting the city count to 1. 
    #Because of the import time, setting sleep to pause between city sets. 
    if city_count > 50: 
        set_count +=1
        city_count = 0 
        time.sleep(5)   
    
print("--------------------------\nData Retrieval Complete\n-------------------------")

Beginning Data Retrieval
-------------------------
Processing Record 1 of Set 1| mataura 
Processing Record 2 of Set 1| roding 
Processing Record 3 of Set 1| jamestown 
Processing Record 4 of Set 1| mecca 
Processing Record 5 of Set 1| maceio 
Processing Record 6 of Set 1| rikitea 
Processing Record 7 of Set 1| alofi 
Processing Record 8 of Set 1| randazzo 
Processing Record 9 of Set 1| rio grande 
Processing Record 10 of Set 1| walvis bay 
Processing Record 11 of Set 1| khandyga 
City not found. Skipping...
Processing Record 13 of Set 1| provideniya 
Processing Record 14 of Set 1| dikson 
Processing Record 15 of Set 1| torbay 
Processing Record 16 of Set 1| iqaluit 
Processing Record 17 of Set 1| busselton 
Processing Record 18 of Set 1| bredasdorp 
Processing Record 19 of Set 1| norman wells 
Processing Record 20 of Set 1| liku 
Processing Record 21 of Set 1| nishihara 
Processing Record 22 of Set 1| coihaique 
Processing Record 23 of Set 1| iwanai 
Processing Record 24 of Set 1| upa

Processing Record 2 of Set 5| san carlos de bariloche 
City not found. Skipping...
Processing Record 4 of Set 5| sitka 
Processing Record 5 of Set 5| ufimskiy 
Processing Record 6 of Set 5| seddon 
Processing Record 7 of Set 5| bolshaya glushitsa 
Processing Record 8 of Set 5| vila velha 
City not found. Skipping...
Processing Record 10 of Set 5| oranjestad 
Processing Record 11 of Set 5| naryan-mar 
Processing Record 12 of Set 5| kutum 
Processing Record 13 of Set 5| berbera 
City not found. Skipping...
Processing Record 15 of Set 5| koslan 
Processing Record 16 of Set 5| bonavista 
Processing Record 17 of Set 5| tual 
Processing Record 18 of Set 5| antalaha 
Processing Record 19 of Set 5| dongying 
City not found. Skipping...
Processing Record 21 of Set 5| baoqing 
Processing Record 22 of Set 5| leningradskiy 
Processing Record 23 of Set 5| belle fourche 
Processing Record 24 of Set 5| cam ranh 
City not found. Skipping...
Processing Record 26 of Set 5| joshimath 
Processing Record 2

Processing Record 2 of Set 9| boyabat 
Processing Record 3 of Set 9| flinders 
Processing Record 4 of Set 9| dicabisagan 
Processing Record 5 of Set 9| liling 
City not found. Skipping...
City not found. Skipping...
Processing Record 8 of Set 9| general roca 
Processing Record 9 of Set 9| longyearbyen 
Processing Record 10 of Set 9| yumen 
Processing Record 11 of Set 9| pacific grove 
Processing Record 12 of Set 9| umea 
Processing Record 13 of Set 9| matagami 
Processing Record 14 of Set 9| labuhan 
Processing Record 15 of Set 9| csokmo 
Processing Record 16 of Set 9| awassa 
Processing Record 17 of Set 9| tecoanapa 
Processing Record 18 of Set 9| kungurtug 
Processing Record 19 of Set 9| cayenne 
Processing Record 20 of Set 9| varhaug 
Processing Record 21 of Set 9| mapastepec 
Processing Record 22 of Set 9| ayame 
City not found. Skipping...
Processing Record 24 of Set 9| betare oya 
Processing Record 25 of Set 9| mareeba 
Processing Record 26 of Set 9| evensk 
Processing Record 27 

Processing Record 51 of Set 12| nanakuli 
Processing Record 1 of Set 13| olonets 
Processing Record 2 of Set 13| barranca 
Processing Record 3 of Set 13| chicama 
Processing Record 4 of Set 13| jharsuguda 
Processing Record 5 of Set 13| dwarka 
Processing Record 6 of Set 13| laguna 
City not found. Skipping...
Processing Record 8 of Set 13| maxixe 
Processing Record 9 of Set 13| bundaberg 
Processing Record 10 of Set 13| christchurch 
Processing Record 11 of Set 13| oussouye 
Processing Record 12 of Set 13| hinche 
Processing Record 13 of Set 13| anito 
Processing Record 14 of Set 13| breyten 
Processing Record 15 of Set 13| halifax 
City not found. Skipping...
Processing Record 17 of Set 13| kusadak 
City not found. Skipping...
Processing Record 19 of Set 13| dingle 
Processing Record 20 of Set 13| akyab 
Processing Record 21 of Set 13| erenhot 
Processing Record 22 of Set 13| mairi 
Processing Record 23 of Set 13| sola 
Processing Record 24 of Set 13| half moon bay 
Processing Record

In [5]:
#Checking how many cities were found 
len(city)

582

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [9]:
#Create Data Frame 

cities_complete = pd.DataFrame({"City": city,
                                "Lat": lat,
                                "Lng": lng,
                                "Max Temp": max_temp,
                                "Humidity": humidity,
                                "Cloudiness": cloudiness,
                                "Wind Speed": wind_speed,
                                "Country": country, 
                                "Date": date, 
})

cities_complete

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Mataura,-46.1927,168.8643,44.01,82,72,10.00,NZ,1619379495
1,Roding,49.1964,12.5186,48.20,40,1,9.64,DE,1619379495
2,Jamestown,42.0970,-79.2353,46.00,81,90,11.50,US,1619379496
3,Makkah al Mukarramah,21.4267,39.8261,87.22,33,73,4.16,SA,1619379496
4,Maceió,-9.6658,-35.7353,84.20,65,20,9.22,BR,1619379497
...,...,...,...,...,...,...,...,...,...
577,Tanout,14.9709,8.8879,91.44,13,100,11.32,NE,1619379810
578,Tyrma,50.0833,132.1667,27.97,52,50,2.68,RU,1619379810
579,Port Pirie,-33.1833,138.0167,50.00,93,1,3.44,AU,1619379709
580,Atar,20.5169,-13.0499,86.05,14,0,8.93,MR,1619379612


In [17]:
#Save output to CSV 
cities_complete.to_csv("../output/citiesComplete.csv", index=False, header=True)

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#Use .loc function with conditional over humidity 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression