# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## Generate Cities List

In [2]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

639

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [3]:
city

'leopold'

In [4]:
units = "Imperial"
url = "http://api.openweathermap.org/data/2.5/weather?"
query_url = url + "appid=" + weather_api_key + "&units=" + units + "&q="
weather_response = requests.get(query_url)
weather_json = weather_response.json()
weather_json

{'cod': '400', 'message': 'Nothing to geocode'}

In [5]:
weather_json.keys()

dict_keys(['cod', 'message'])

In [6]:
# set up lists to hold reponse info
lat = []
lng = []
max_temp = []
humidity = []
cloudiness = []
wind_speed = []
country = []
date = []
name = []



# Loop through the list of cities and perform a request for data on each
print("Beginning Data Retrieval")     
print("-----------------------------")
      
for city in cities:
    try:
        response = requests.get(query_url + city).json()
        #print(city)
        name.append(response["name"])
        lat.append(response["coord"]["lat"])
        lng.append(response['coord']['lon'])
        max_temp.append(response['main']['temp_max'])
        humidity.append(response['main']['humidity'])
        cloudiness.append(response['clouds']['all'])
        wind_speed.append(response['wind']['speed'])
        country.append(response['sys']['country'])
        date.append(response['dt'])
    except:
        print("city not found")
        pass
for x in range(len(country)):
    print(name[x], lat[x], lng[x], max_temp[x], humidity[x], cloudiness[x], wind_speed[x], country[x], date[x])    


Beginning Data Retrieval
-----------------------------
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
city not found
Saldanha -33.01

Hirara 24.8 125.2833 88.07 79 75 18.41 JP 1628218301
Grootfontein -19.5667 18.1167 51.37 46 0 4.61 NA 1628218301
Ust-Nera 64.5667 143.2 58.26 44 92 6.51 RU 1628218302
Sechura -5.5569 -80.8222 65.1 82 0 12.91 PE 1628218302
Guerrero Negro 27.9769 -114.0611 72.09 80 12 13.4 MX 1628218302
Djebeniana 35.035 10.9081 78.6 67 0 10.2 TN 1628218303
Terrell 32.736 -96.2753 82.13 75 1 5.75 US 1628218303
Khovu-Aksy 51.1333 93.6 59.58 75 100 8.28 RU 1628218303
Axum 14.1245 38.7244 56.25 84 71 1.97 ET 1628218304
Lékoni -1.5843 14.2591 72.9 79 61 10.36 GA 1628218304
Linden 6 -58.3 77.14 89 100 1.32 GY 1628218304
New Haven 41.4001 -72.9329 69.46 93 40 0 US 1628218047
Brazzaville -4.2658 15.2832 71.96 83 0 2.3 CG 1628218305
Murdochville 48.9583 -65.5006 65.28 92 100 4.61 CA 1628218305
San Cristobal 7.7669 -72.225 75.38 98 94 5.14 VE 1628218305
Florianópolis -27.6146 -48.5012 59.4 97 75 0 BR 1628218306
Kieta -6.2167 155.6333 82.4 79 100 7.65 PG 1628218306
Nantucket 41.2835 -70.0995 70.02 96 90 12.66 US 1

Launceston -41.45 147.1667 62.62 63 79 8.01 AU 1628218371
Jinchang 38.4953 102.1739 81.91 26 45 7.09 CN 1628218371
Vaitape -16.5167 -151.75 79.12 70 99 5.91 PF 1628218372
Gushikawa 26.3544 127.8686 85.62 83 40 11.5 JP 1628218373
Myanaung 18.2833 95.3167 76.93 95 100 4.21 MM 1628218373
Mackay -21.15 149.2 73.69 46 97 17.27 AU 1628218373
Camacha 33.0833 -16.3333 71.53 94 75 10.36 PT 1628218374
Peniche 39.3558 -9.3811 66.72 83 12 14.12 PT 1628218374
Kununurra -15.7667 128.7333 76.98 15 1 14.97 AU 1628218374
Mikhaylovka 50.06 43.2379 69.08 46 55 6.06 RU 1628218375
Khani 41.9563 42.9566 65.77 58 93 6.51 GE 1628218375
Uyuni -20.4597 -66.825 36.64 19 0 10.29 BO 1628218375
Gallup 35.5281 -108.7426 84.96 20 1 1.01 US 1628218376
Manggar -2.8833 108.2667 85.24 72 100 11.56 ID 1628218376
Binzhou 37.3667 118.0167 91.27 56 0 1.92 CN 1628218376
Semnan 35.5729 53.3971 78.24 29 37 5.66 IR 1628218377
Bodden Town 19.2833 -81.25 84.2 84 20 4.61 KY 1628218377
Pontianak -0.0333 109.3333 84.18 70 20 9.22 ID 

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [7]:
weather_data = pd.DataFrame({"City": name, "Lat": lat, "Lng": lng, "Max Temp": max_temp, "Humidity": humidity, 
                             "Cloudiness": cloudiness, "Wind Speed": wind_speed, "Country": country, "Date": date})
weather_data.to_csv('../output_data/cities.csv')

weather_data


Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Saldanha,-33.0117,17.9442,44.65,86,0,3.00,ZA,1628218140
1,Eureka,40.8021,-124.1637,65.19,81,73,4.00,US,1628218141
2,Vaini,-21.2000,-175.2000,77.16,73,40,12.66,TO,1628218141
3,Butaritari,3.0707,172.7902,83.28,64,28,11.77,KI,1628218141
4,Vultureşti,47.5167,26.4500,64.22,94,100,5.12,RO,1628218142
...,...,...,...,...,...,...,...,...,...
572,Lata,40.1629,-8.3327,64.06,97,46,2.51,PT,1628218400
573,Dhidhdhoo,6.8833,73.1000,81.97,76,100,13.11,MV,1628218400
574,Khorramshahr,30.4397,48.1664,94.95,33,40,4.61,IR,1628218400
575,Shaunavon,49.6501,-108.4181,76.78,35,15,10.78,CA,1628218282


## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [11]:
#weather_data["Lat"].count()
weather_data.describe()

Unnamed: 0,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Date
count,577.0,577.0,577.0,577.0,577.0,577.0,577.0
mean,21.943032,19.925039,69.546499,69.908146,54.403813,7.270069,1628218000.0
std,33.239329,92.708726,13.044947,21.642379,39.425847,5.077631,78.7282
min,-54.8,-179.1667,33.91,8.0,0.0,0.0,1628218000.0
25%,-4.8769,-65.0192,60.06,58.0,11.0,3.44,1628218000.0
50%,29.5581,23.7833,70.18,75.0,66.0,6.04,1628218000.0
75%,49.5,103.7519,79.59,87.0,94.0,10.33,1628218000.0
max,78.2186,179.3167,106.39,100.0,100.0,26.46,1628218000.0


In [9]:
#  Get the indices of cities that have humidity over 100%.


In [10]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression