# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
import random
from scipy.stats import linregress
from pprint import pprint

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

In [2]:
weather_api_key

'd46a2e4e79bb1ea72c61604da1fc17dc'

## Generate Cities List

In [3]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

636

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


In [4]:
url = "https://api.openweathermap.org/data/2.5/weather?"
units = "imperial"
city = 'ushuaia'

query_url = f"{url}appid={weather_api_key}&units={units}&q={city}"
response = requests.get(query_url).json()
pprint(response)

{'base': 'stations',
 'clouds': {'all': 100},
 'cod': 200,
 'coord': {'lat': -54.8, 'lon': -68.3},
 'dt': 1667579767,
 'id': 3833367,
 'main': {'feels_like': 43.95,
          'humidity': 71,
          'pressure': 1006,
          'temp': 49.66,
          'temp_max': 49.66,
          'temp_min': 49.62},
 'name': 'Ushuaia',
 'sys': {'country': 'AR',
         'id': 8303,
         'sunrise': 1667551092,
         'sunset': 1667606117,
         'type': 1},
 'timezone': -10800,
 'visibility': 10000,
 'weather': [{'description': 'light intensity drizzle',
              'icon': '09d',
              'id': 300,
              'main': 'Drizzle'}],
 'wind': {'deg': 250, 'speed': 16.11}}


In [None]:
# set up list to hold reponse info
city_data = []

# set up counters
city_counter = 1
set_counter = 1

# Save config information.
url = "https://api.openweathermap.org/data/2.5/weather?"
units = "imperial"

# print beginning statement
print(f"Beginning Data Retrieval")     
print(f"-----------------------------")

# Loop through the list of cities and get latitude, longitude, max temperature, humidity, cloudiness, wind speed for cities
for i, city in enumerate(cities):
   
    # Build partial query URL
    query_url = f"{url}appid={weather_api_key}&units={units}&q={city}"
    
    # group the cities in sets of 50 for 13 sets
    if(i % 50 == 0 and i >=50):
        # reset the group or set 
        # add time to avoid blowing out API key 
        time.sleep(2)
        
        set_counter += 1
        city_counter = 1

    # print the city # and city along with its set number     
    print(f"Processing city #{city_counter} of Set #{set_counter} | {city}")
    city_counter += 1


# print(query_url)
    try:
        
        # jsonify response
        response = requests.get(query_url).json()

        # append data to respective lists"
        lat = response['coord']['lat']
        lng = response['coord']['lon']
        temp_max = response['main']['temp_max']
        humidity = response['main']['humidity']
        cloud = response['clouds']['all']
        wind = response['wind']['speed']
        date = response['dt']
        country = response['sys']['country']

        #append the city information to city_data list
        city_data.append({"City": city,
                          "Lat": lat,
                          "Lng": lng,
                          "Max Temp": temp_max,
                          "Humidity": humidity,
                          "Cloudiness": cloud,
                          "Wind Speed": wind,
                          "Country": country, 
                          "Date": date})

    except:
        print(f"{city} not found. Skipping...")
        pass

print(f"-----------------------------")
print(f"Data Retrieval Complete")      
print(f"-----------------------------")
        

Beginning Data Retrieval
-----------------------------
Processing city #1 of Set #1 | artyk
artyk not found. Skipping...
Processing city #2 of Set #1 | srednekolymsk
Processing city #3 of Set #1 | whitianga
Processing city #4 of Set #1 | port augusta
Processing city #5 of Set #1 | chimbote
Processing city #6 of Set #1 | vanimo
Processing city #7 of Set #1 | benjamin constant
Processing city #8 of Set #1 | talakan
Processing city #9 of Set #1 | broome
Processing city #10 of Set #1 | gazojak
Processing city #11 of Set #1 | provideniya
Processing city #12 of Set #1 | kikwit
Processing city #13 of Set #1 | ponta do sol
Processing city #14 of Set #1 | ahar
Processing city #15 of Set #1 | batagay
Processing city #16 of Set #1 | thompson
Processing city #17 of Set #1 | denpasar
Processing city #18 of Set #1 | rohru
Processing city #19 of Set #1 | severo-kurilsk
Processing city #20 of Set #1 | zyryanovsk
Processing city #21 of Set #1 | rikitea
Processing city #22 of Set #1 | ushuaia
Processing

Processing city #39 of Set #4 | wadi maliz
Processing city #40 of Set #4 | guerrero negro
Processing city #41 of Set #4 | bethel
Processing city #42 of Set #4 | miranorte


### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [None]:
# pd.DataFrame([{}, {}])

# pd.DataFrame({'col1': [], 'col2':[]})

In [None]:
weatherDF = pd.DataFrame(city_data)
weatherDF

In [None]:
weatherDF.describe()

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression