## WeatherPy Main Workfile

### Initial identification

In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress
from pprint import pprint

# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = "output_data/cities.csv"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

### Generate Cities List

In [2]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count

api_key = weather_api_key
#print(api_key)
len(cities)

610

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).

In [3]:
# parameters

url = 'http://api.openweathermap.org/data/2.5/weather?'
units = 'metric'
query_url = f'{url}appid={api_key}&units={units}&q='


In [4]:
# list names for dataframe
city_name = []
cloudiness = []
dates = []
humidity = []
lat = []
lon = []
max_temp = []
wind_speed = []

In [5]:
# counters to store record counts and sets of 50 counts
record_count = 0
set_count = 1

In [6]:
# loop through list of random cities

print(f'Beginning Data Retrieval')
print('-------------------------------')

for index, city in enumerate(cities):
    
    #time.sleep(1) # Add a one second interval between queries to stay within API query limits   

    try:
        response = requests.get(query_url + city).json()
        city_name.append(response['name'])
        cloudiness.append(response['clouds']['all'])
        dates.append(response['dt'])
        humidity.append(response['main']['humidity'])
        lat.append(response['coord']['lat'])
        lon.append(response['coord']['lon'])
        max_temp.append(response['main']['temp_max'])
        wind_speed.append(response['wind']['speed'])
        
        if record_count > 49:
            record_count = 0
            set_count += 1
        else:
            record_count += 1

        print(f"Processing Record {record_count} of Set {set_count} | {city}")
  
    except(KeyError, IndexError):
        
        print("City not found. Skipping...")
        
print('-------------------------------')
print('Data Retrieval Complete ')
print('-------------------------------')

Beginning Data Retrieval
-------------------------------
Processing Record 1 of Set 1 | ilhabela
Processing Record 2 of Set 1 | inhambane
Processing Record 3 of Set 1 | butaritari
Processing Record 4 of Set 1 | esperance
Processing Record 5 of Set 1 | ambilobe
Processing Record 6 of Set 1 | clyde river
Processing Record 7 of Set 1 | gori
Processing Record 8 of Set 1 | cherskiy
Processing Record 9 of Set 1 | verkh-usugli
Processing Record 10 of Set 1 | new norfolk
Processing Record 11 of Set 1 | ayagoz
City not found. Skipping...
Processing Record 12 of Set 1 | gandorhun
Processing Record 13 of Set 1 | bluff
Processing Record 14 of Set 1 | saskylakh
Processing Record 15 of Set 1 | grindavik
Processing Record 16 of Set 1 | punta arenas
Processing Record 17 of Set 1 | pevek
Processing Record 18 of Set 1 | albany
Processing Record 19 of Set 1 | pacific grove
Processing Record 20 of Set 1 | bengkulu
Processing Record 21 of Set 1 | altay
Processing Record 22 of Set 1 | beira
Processing Recor

Processing Record 34 of Set 4 | hami
Processing Record 35 of Set 4 | broken hill
Processing Record 36 of Set 4 | krasnaya zarya
Processing Record 37 of Set 4 | izacic
Processing Record 38 of Set 4 | faanui
Processing Record 39 of Set 4 | tazovskiy
Processing Record 40 of Set 4 | pochutla
Processing Record 41 of Set 4 | rapid valley
Processing Record 42 of Set 4 | kaitangata
Processing Record 43 of Set 4 | thompson
City not found. Skipping...
Processing Record 44 of Set 4 | gigmoto
Processing Record 45 of Set 4 | sorong
Processing Record 46 of Set 4 | kuytun
Processing Record 47 of Set 4 | hof
Processing Record 48 of Set 4 | tiksi
Processing Record 49 of Set 4 | mattru
Processing Record 50 of Set 4 | pisco
Processing Record 0 of Set 5 | bafut
Processing Record 1 of Set 5 | egvekinot
Processing Record 2 of Set 5 | imeni poliny osipenko
Processing Record 3 of Set 5 | nome
Processing Record 4 of Set 5 | svetlogorsk
Processing Record 5 of Set 5 | gemena
Processing Record 6 of Set 5 | marybo

Processing Record 22 of Set 8 | port augusta
Processing Record 23 of Set 8 | luorong
Processing Record 24 of Set 8 | omboue
Processing Record 25 of Set 8 | whitecourt
Processing Record 26 of Set 8 | rionero in vulture
Processing Record 27 of Set 8 | carutapera
Processing Record 28 of Set 8 | beawar
Processing Record 29 of Set 8 | severo-yeniseyskiy
Processing Record 30 of Set 8 | camacha
City not found. Skipping...
Processing Record 31 of Set 8 | along
Processing Record 32 of Set 8 | seoul
Processing Record 33 of Set 8 | sakakah
Processing Record 34 of Set 8 | birao
Processing Record 35 of Set 8 | cabo san lucas
Processing Record 36 of Set 8 | thinadhoo
Processing Record 37 of Set 8 | vanimo
Processing Record 38 of Set 8 | dayong
Processing Record 39 of Set 8 | mana
Processing Record 40 of Set 8 | naze
Processing Record 41 of Set 8 | mamlyutka
Processing Record 42 of Set 8 | plainview
Processing Record 43 of Set 8 | thoen
Processing Record 44 of Set 8 | muisne
Processing Record 45 of S

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [9]:
# first create the dataframe for the list of responses and display
city_weather_df = pd.DataFrame({'City': city_name, 
                                  'Lat': lat, 
                                  'Lng': lon, 
                                  'Max Temp': max_temp, 
                                  'Humidity': humidity, 
                                  'Cloudiness': cloudiness, 
                                  'Wind Speed': wind_speed, 
                                  'Date': dates})
city_weather_df.head()

#second save and export dataframe to final outputs folder

city_weather_df.to_csv("Final_Outputs/cities_final.csv", index = False)


### Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [13]:
# check for cities with humidity greater than 100
humidity_check = city_weather_df.loc[city_weather_df['Humidity'] >100,:]
humidity_check

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Date
