# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [None]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress
from pprint import pprint

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "../output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

In [2]:
data = pd.read_csv(output_data_file)
data.head()

Unnamed: 0,City_ID,City,Cloudiness,Country,Date,Humidity,Lat,Lng,Max Temp,Wind Speed
0,0,ostrovnoy,2,RU,1558378754,72,68.05,39.51,37.5,7.16
1,1,mahebourg,75,MU,1558378503,74,-20.41,57.7,78.8,11.41
2,2,qaanaaq,25,GL,1558378755,73,77.48,-69.36,22.2,2.37
3,3,zhuhai,0,CN,1558378755,39,40.71,112.04,44.6,4.47
4,4,cape town,20,ZA,1558378755,76,-33.93,18.42,55.99,8.05


## Generate Cities List

In [3]:
# List for holding lat_lngs and cities
lat_lngs = []

cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

620

In [None]:
lat_lngs

In [5]:
cities

['asau',
 'bredasdorp',
 'kabanjahe',
 'port alfred',
 'hobart',
 'tabou',
 'hilo',
 'talnakh',
 'barrow',
 'punta arenas',
 'ribeira grande',
 'rawson',
 'vaini',
 'cherskiy',
 'chiredzi',
 'hasaki',
 'klaksvik',
 'bethel',
 'lao cai',
 'kannangad',
 'sentyabrskiy',
 'codrington',
 'ushuaia',
 'qaanaaq',
 'albany',
 'butaritari',
 'belushya guba',
 'palabuhanratu',
 'port elizabeth',
 'hermanus',
 'pevek',
 'vila velha',
 'tsihombe',
 'el alto',
 'zugdidi',
 'san isidro',
 'rikitea',
 'arlit',
 'zabaykalsk',
 'mataura',
 'ixtepec',
 'new waterford',
 'chokurdakh',
 'sorvag',
 'fortuna',
 'wanning',
 'fenton',
 'airai',
 'kaitangata',
 'torbay',
 'tumannyy',
 'bhimunipatnam',
 'nanortalik',
 'east london',
 'solovetskiy',
 'constitucion',
 'oshakati',
 'yellowknife',
 'flinders',
 'tuktoyaktuk',
 'mar del plata',
 'tsienyane',
 'lompoc',
 'taolanaro',
 'saint-augustin',
 'clyde river',
 'puri',
 'saskylakh',
 'ponta do sol',
 'salalah',
 'shangqiu',
 'new norfolk',
 'nieuwpoort',
 'hit

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).

> **HINT:** The OpenWeatherMap API only allows 60 calls per minute under their free plan. Try using `time.sleep(60)` after each set of 50 cities to avoid API errors due to large calls.

In [None]:
# API set up
cities_info = []
base_url = "https://openweathermap.org/api/&key=" + weather_api_key
# to help python count every row in the cities (one by one)
records = 1 
sets = 1 

#enumerate is for loop function  when we need to look for many 
# set is to plit down the 620 cities in cities into smaller group of 10 or 20
# we use two interables i, city , so we need to do enumerate function
for i, city in enumerate(cities):
    # if as soon as the interable we want is 20 rows per count and i>=20 that mean the next 20 rows we put 
    if (i % 20 == 0 and i >= 20):
        sets += 1
        records = 0
        print("End of set. Sleeping for 15 seconds.")
        time.sleep(15)
    # create url for each city 
    city_url = base_url + "&q=" + cities
    print(city_url)
    records += 1
    try:
        cities_collection = requests.get(city_url).json()
        lats = cities_colection["coord"]["lat"]
        longs = cities_colection["coord"]["lon"]
        temperature = cities_colection["main"]["temp"]
        humidity = cities_colection["main"]["humidity"]
        cloudiness = cities_colection["clouds"]["all"]
        wind_speed = cities_colection["wind"]["speed"]
        date = cities_colection["dt"]
        country = cities_collection['sys']['country']
        
        cities_info.append({"city": city,
                           "latitutes": lats,
                            "longtitudes": longs,
                            "temperature (F)": temperature,
                            "humidity": humidity,
                            "cloudiness": cloudiness,
                            "wind speed": wind_speed,
                            "date": date,
                            "country": country
                           })
        
    except:
        print('city error: not found, skipping')
        pass
print('information all collected')
        print(cities_collection)

In [None]:
base_url = "https://openweathermap.org/api/&key=" + weather_api_key
city_url = base_url + "&q=" + cities
cities_collection = requests.get(city_url).json()
pprint(cities_collection)

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [4]:
#  Get the indices of cities that have humidity over 100%.


In [5]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression