## WeatherPy

In [28]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import json
import requests
import time
from scipy.stats import linregress

# Import API key
from config import weather_api_key
units = 'imperial'

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = 'Output_files/cities_weather.csv'

query_url = f"http://api.openweathermap.org/data/2.5/weather?appid={weather_api_key}&units={units}&q="
units = "imperial"

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)

## General Cities List

In [10]:
# List for holding lat_lngs and cities
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(lat_range[0], lat_range[1], size=1500)
lngs = np.random.uniform(lng_range[0], lng_range[1], size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

619

## Perform API Calls

- Perform a weather check on each city using a series of successive API calls.
- Include a print log of each city as it's being processed

In [13]:
# set lists for the dataframe
city_count = []
lat = []
lng = []
max_temp = []
humidity = []
cloudiness = []
wind_speed = []
country = []
dates = []

# set initial count quantities for organization
counts = 0
sets = 1


print("Beginning Data Retrieval ")
print("-----------------------------")

# loops for creating dataframe columns
for index, city in enumerate(cities, start = 1):
    try:
        response = requests.get(query_url + city.replace(" ","&")).json()
        lat.append(response['coord']['lat'])
        lng.append(response['coord']['lon'])
        max_temp.append(response['main']['temp_max'])
        humidity.append(response['main']['humidity'])
        cloudiness.append(response['clouds']['all'])
        wind_speed.append(response['wind']['speed'])
        country.append(response['sys']['country'])
        dates.append(response['dt'])
        
        if counts > 48:
            counts = 1
            sets += 1
            city_count.append(city)
        else:
            counts += 1
            city_count.append(city)
            
        print(f"Processing Record {counts} of Set {sets} | {city}")
        
    except(KeyError, IndexError):
        print("City not found. Skipping...")
        
print('-----------------------------')
print('Data Retrieval Complete')
print('-----------------------------')

Beginning Data Retrieval 
-----------------------------
Processing Record 1 of Set 1 | busselton
Processing Record 2 of Set 1 | kamenka
Processing Record 3 of Set 1 | port alfred
Processing Record 4 of Set 1 | broome
Processing Record 5 of Set 1 | maragogi
Processing Record 6 of Set 1 | atuona
Processing Record 7 of Set 1 | sangar
Processing Record 8 of Set 1 | punta arenas
Processing Record 9 of Set 1 | kungurtug
Processing Record 10 of Set 1 | dikson
Processing Record 11 of Set 1 | jamestown
Processing Record 12 of Set 1 | rikitea
Processing Record 13 of Set 1 | mys shmidta
Processing Record 14 of Set 1 | bredasdorp
Processing Record 15 of Set 1 | lebu
City not found. Skipping...
City not found. Skipping...
Processing Record 16 of Set 1 | nhulunbuy
Processing Record 17 of Set 1 | tignere
Processing Record 18 of Set 1 | albany
Processing Record 19 of Set 1 | praia da vitoria
Processing Record 20 of Set 1 | ketchikan
Processing Record 21 of Set 1 | port elizabeth
City not found. Skippi

Processing Record 37 of Set 4 | diapaga
Processing Record 38 of Set 4 | lons
Processing Record 39 of Set 4 | muravlenko
Processing Record 40 of Set 4 | comodoro rivadavia
City not found. Skipping...
Processing Record 41 of Set 4 | superior
Processing Record 42 of Set 4 | grand river south east
Processing Record 43 of Set 4 | mongo
Processing Record 44 of Set 4 | bethel
Processing Record 45 of Set 4 | airai
Processing Record 46 of Set 4 | beringovskiy
City not found. Skipping...
Processing Record 47 of Set 4 | izhma
Processing Record 48 of Set 4 | hasaki
Processing Record 49 of Set 4 | tula
Processing Record 1 of Set 5 | baruun-urt
City not found. Skipping...
Processing Record 2 of Set 5 | klaksvik
City not found. Skipping...
Processing Record 3 of Set 5 | bandarbeyla
Processing Record 4 of Set 5 | sovetskaya gavan
Processing Record 5 of Set 5 | esperance
Processing Record 6 of Set 5 | hambantota
Processing Record 7 of Set 5 | kuliyapitiya
Processing Record 8 of Set 5 | helena
Processin

Processing Record 28 of Set 8 | teguldet
Processing Record 29 of Set 8 | namuac
Processing Record 30 of Set 8 | ambon
City not found. Skipping...
Processing Record 31 of Set 8 | sao gabriel da cachoeira
Processing Record 32 of Set 8 | sao simao
Processing Record 33 of Set 8 | port moresby
City not found. Skipping...
Processing Record 34 of Set 8 | landsberg
Processing Record 35 of Set 8 | alice springs
Processing Record 36 of Set 8 | pombia
Processing Record 37 of Set 8 | vila franca do campo
Processing Record 38 of Set 8 | kavieng
Processing Record 39 of Set 8 | samarai
Processing Record 40 of Set 8 | buraydah
Processing Record 41 of Set 8 | aykhal
Processing Record 42 of Set 8 | sembe
City not found. Skipping...
Processing Record 43 of Set 8 | ekhabi
Processing Record 44 of Set 8 | vanavara
Processing Record 45 of Set 8 | palora
Processing Record 46 of Set 8 | shimoda
Processing Record 47 of Set 8 | grand gaube
City not found. Skipping...
Processing Record 48 of Set 8 | kralendijk
Pr

Processing Record 18 of Set 12 | emerald
Processing Record 19 of Set 12 | neryungri
Processing Record 20 of Set 12 | sterling
-----------------------------
Data Retrieval Complete
-----------------------------


## Convert Raw Data to DataFrame
- Export the city data into a csv.
- Display the DataFrame

In [14]:
# Create a panda data frame using data retrieved
weather_df = pd.DataFrame({ 
                "City" : city_count,
                "Lat" : lat,
                "Lng" : lng,
                "Max Temp" : max_temp,
                "Humidity" : humidity,
                "Cloudiness" : cloudiness,
                "Wind Speed" : wind_speed,
                "Country" : country,
                "Date" : dates,
})
weather_df.head()

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,busselton,-33.65,115.3333,61.0,75,57,4.0,AU,1612916456
1,kamenka,51.3223,42.7678,12.0,90,100,10.45,RU,1612916148
2,port alfred,-7.0349,29.7638,73.94,73,100,4.0,CD,1612916114
3,broome,42.2506,-75.833,21.2,73,90,8.05,US,1612916297
4,maragogi,-9.0122,-35.2225,78.4,77,27,6.02,BR,1612916636


In [30]:
weather_df.to_csv('../Output_files/cities_weather.csv', index=False, header=True)

In [31]:
# this image was in the starter file but not explicitly stated...
weather_df.describe()

Unnamed: 0,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Date
count,559.0,559.0,559.0,559.0,559.0,559.0,559.0
mean,21.799469,24.360055,48.051574,74.765653,56.071556,7.47449,1612916000.0
std,31.972294,87.252085,31.606712,19.628827,38.47671,5.279656,179.8748
min,-54.8,-175.2,-36.4,15.0,0.0,0.43,1612916000.0
25%,-3.55835,-46.3336,25.215,68.0,19.5,3.44,1612916000.0
50%,25.7,29.635,59.0,81.0,75.0,6.15,1612917000.0
75%,48.64955,98.0788,75.055,88.0,92.5,10.36,1612917000.0
max,78.2186,179.3167,89.6,100.0,100.0,37.98,1612917000.0
