# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [2]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

634

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [3]:
city

'vaini'

In [4]:
units = "Imperial"
url = "http://api.openweathermap.org/data/2.5/weather?"
query_url = url + "appid=" + weather_api_key + "&units=" + units + "&q="
weather_response = requests.get(query_url)
weather_json = weather_response.json()
weather_json

{'cod': '400', 'message': 'Nothing to geocode'}

In [5]:
weather_json.keys()

dict_keys(['cod', 'message'])

In [6]:
# set up lists to hold reponse info
lat = []
lng = []
max_temp = []
humidity = []
cloudiness = []
wind_speed = []
country = []
date = []
name = []



# Loop through the list of cities and perform a request for data on each
print("Beginning Data Retrieval")     
print("-----------------------------")
      
for city in cities:
    try:
        response = requests.get(query_url + city).json()
        #print(city)
        name.append(response["name"])
        lat.append(response["coord"]["lat"])
        lng.append(response['coord']['lon'])
        max_temp.append(response['main']['temp_max'])
        humidity.append(response['main']['humidity'])
        cloudiness.append(response['clouds']['all'])
        wind_speed.append(response['wind']['speed'])
        country.append(response['sys']['country'])
        date.append(response['dt'])
    except:
        print("city not found")
        pass
for x in range(len(country)):
    print(name[x], lat[x], lng[x], max_temp[x], humidity[x], cloudiness[x], wind_speed[x], country[x], date[x])    


Beginning Data Retrieval
-----------------------------
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
Saint George 37.1041 -113.5841 97.95 16 1 5.01 US 1628225604
Sohag 26.557 31.6948 88.09 13 0 1.86 EG 1628

Hofn 64.2539 -15.2082 52.61 87 92 2.37 IS 1628225693
Coolum Beach -26.5333 153.1 72.34 64 67 6.78 AU 1628225693
Butterworth 5.3991 100.3638 89.65 62 20 3 MY 1628225694
Roald 62.5833 6.1333 61.32 88 0 8.05 NO 1628225694
Klaksvík 62.2266 -6.589 56.32 97 100 6.98 FO 1628225694
Kargopol' 61.5071 38.9456 59.41 61 100 4.61 RU 1628225695
Upernavik 72.7868 -56.1549 42.58 67 23 5.97 GL 1628225695
Puducherry 11.93 79.83 88.18 62 40 3.44 IN 1628225695
Tura 25.5198 90.2201 86.56 72 100 4.52 IN 1628225589
Esim 4.8699 -2.2405 75.2 88 27 6.82 GH 1628225696
Guerrero Negro 27.9769 -114.0611 71.65 82 2 9.19 MX 1628225696
Dingle 10.9995 122.6711 88.39 61 85 15.5 PH 1628225696
Saint-Pierre -21.3393 55.4781 70.29 59 20 5.75 RE 1628225697
Mandeville 18.0417 -77.5071 73.45 85 68 2.17 JM 1628225697
Belmonte -15.8631 -38.8828 72.1 87 97 13.11 BR 1628225533
Ntchisi -13.5278 33.9149 49.98 72 0 3.18 MW 1628225697
Atambua -9.1061 124.8925 84.33 44 68 2.68 ID 1628225698
Sola -13.8833 167.55 78.71 71 11 0.04 VU 1628

Bairiki Village 1.3292 172.9752 86 62 20 13.8 KI 1628225792
Podyuga 61.095 40.8647 56.84 68 100 3.56 RU 1628225792
Lichinga -13.3128 35.2406 55.49 82 20 5.75 MZ 1628225792
Visby 57.6409 18.296 64.94 82 0 4.61 SE 1628225631
Medvedka 61.1629 46.387 61.14 56 100 1.39 RU 1628225793
Maţāy 28.419 30.7792 88.72 27 0 8.03 EG 1628225793
Half Moon Bay 37.4636 -122.4286 65.19 86 1 8.05 US 1628225794
Salinópolis -0.6136 -47.3561 77.65 86 3 9.44 BR 1628225525
Kichera 55.9375 110.0997 63.18 79 96 3.47 RU 1628225794
Ovalle -30.5983 -71.2003 57.92 71 58 0.16 CL 1628225795
Landau 49.2075 8.1133 63.77 91 100 7.4 DE 1628225795
Ushtobe 45.2514 77.9838 86.56 22 10 15.97 KZ 1628225795
Baie-Comeau 49.2168 -68.1489 68 100 75 4.61 CA 1628225796
Boende -0.2167 20.8667 71.71 89 95 3.02 CD 1628225796
Nome 64.5011 -165.4064 58.15 86 99 10.25 US 1628225797
Oranjemund -28.55 16.4333 53.51 73 1 2.04 NA 1628225797
Thabazimbi -24.5917 27.4116 54.37 39 1 2.55 ZA 1628225651
São Sebastião -23.76 -45.4097 63.16 93 96 4.23 

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [7]:
weather_data = pd.DataFrame({"City": name, "Lat": lat, "Lng": lng, "Max Temp": max_temp, "Humidity": humidity, 
                             "Cloudiness": cloudiness, "Wind Speed": wind_speed, "Country": country, "Date": date})
weather_data.to_csv('../output_data/cities.csv')

weather_data


Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Saint George,37.1041,-113.5841,97.95,16,1,5.01,US,1628225604
1,Sohag,26.5570,31.6948,88.09,13,0,1.86,EG,1628225605
2,Rikitea,-23.1203,-134.9692,74.12,76,10,14.38,PF,1628225605
3,Punta Arenas,-53.1500,-70.9167,35.71,87,75,25.32,CL,1628225550
4,Kavieng,-2.5744,150.7967,84.24,70,46,14.16,PG,1628225605
...,...,...,...,...,...,...,...,...,...
573,Shingū,33.7333,135.9833,87.91,91,100,13.33,JP,1628225803
574,Dunedin,-45.8742,170.5036,51.80,64,2,3.00,NZ,1628225742
575,Knysna,-34.0363,23.0471,48.58,91,89,1.99,ZA,1628225804
576,Nador,35.1740,-2.9287,73.65,56,0,5.75,MA,1628225804


## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [38]:
weather_data[(weather_data["Humidity"] > 100)]

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date


In [31]:
weather_data.describe()

Unnamed: 0,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Date
count,578.0,578.0,578.0,578.0,578.0,578.0,578.0
mean,20.221821,16.138369,69.835311,69.693772,54.100346,7.641263,1628226000.0
std,33.832722,90.366391,13.586031,21.672079,38.537658,5.217602,81.22009
min,-54.8,-179.1667,32.16,11.0,0.0,0.0,1628225000.0
25%,-8.766175,-62.59335,59.5525,55.0,13.0,3.6275,1628226000.0
50%,24.13915,23.64325,71.42,74.5,60.0,6.44,1628226000.0
75%,49.214475,93.849975,79.78,88.0,93.0,10.8225,1628226000.0
max,78.2186,178.4167,107.04,100.0,100.0,32.21,1628226000.0


In [9]:
#  Get the indices of cities that have humidity over 100%.


In [10]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


In [35]:
clean_city_data = weather_data.copy()
clean_city_data


Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Saint George,37.1041,-113.5841,97.95,16,1,5.01,US,1628225604
1,Sohag,26.5570,31.6948,88.09,13,0,1.86,EG,1628225605
2,Rikitea,-23.1203,-134.9692,74.12,76,10,14.38,PF,1628225605
3,Punta Arenas,-53.1500,-70.9167,35.71,87,75,25.32,CL,1628225550
4,Kavieng,-2.5744,150.7967,84.24,70,46,14.16,PG,1628225605
...,...,...,...,...,...,...,...,...,...
573,Shingū,33.7333,135.9833,87.91,91,100,13.33,JP,1628225803
574,Dunedin,-45.8742,170.5036,51.80,64,2,3.00,NZ,1628225742
575,Knysna,-34.0363,23.0471,48.58,91,89,1.99,ZA,1628225804
576,Nador,35.1740,-2.9287,73.65,56,0,5.75,MA,1628225804


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression