## Decompose the Ask

Add more data to the cities DataFrame so that customers know the weather in the cities when they click on a pop-up marker.

## Identify the Data Sources

OpenWeatherMap is the data source.

## Data Retrieval

In [1]:
# Import the dependencies (packages of code that are needed for this notebook).
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
from citipy import citipy
from datetime import datetime
from scipy.stats import linregress


In [2]:
# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

In [3]:
# Starting URL for Weather Map API Call.
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key
print(url)

http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=2b396ffd8037184849afd69cd267c0d1


In [4]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs 

<zip at 0x1a198b7af0>

In [5]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)
print(coordinates)

[(-67.56223011492317, -20.98283072128666), (-30.01116848910717, 167.61687398219976), (-66.43626462454354, 25.005409915742888), (8.402587289405716, -35.895745653282916), (-35.15540076315803, -96.31003120967021), (-41.18022829363429, 160.7620723837859), (78.89284538654593, -99.61408037716907), (-18.92143593988372, -105.01473513716905), (-40.5081212058012, -127.1498281197409), (35.42907565612789, -17.602671615754105), (14.835143012275125, 21.32481993246074), (6.438995586485106, -48.51683614425676), (-55.68428116325201, -146.17677217013642), (29.087511805908306, 132.55756101945553), (82.80998221435624, -142.00684186275433), (39.62817416228975, 162.88767944088733), (33.0377121693718, -25.846163472746554), (19.239954329011937, 133.09981644556518), (-60.38969930502782, 60.304177836148455), (70.7233404479129, 13.766368147208226), (12.632598483367204, -78.9678928663171), (-83.27274733618196, -121.73443636156651), (5.524828875356135, -1.5923171737769337), (21.58513267270422, 29.13712518899868), 

In [6]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name
    
    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

626

In [8]:
# test cities = ["Oklahoma City", "New York"]
# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1
    
    # Run an API request for each of the cities.
 # Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_description = city_weather["weather"][0]["description"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
    # Get rain and/or snow data if it is raining and/or snowing in the cities
        try:
            if city_weather["rain"]:
                city_rain = city_weather["rain"]["1h"]
                print(city_rain)
        except:
            city_rain = 0
            
        try: 
            if city_weather["snow"]:
                city_snow = city_weather["snow"]["3h"]
                print(city_snow)
        except:
            city_snow = 0
    
    # Append the city information into city_data dictionary.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Current Description": city_description,
                          "Rain inches (last 3 hrs)": city_rain,
                          "Snow inches (last 3 hrs)": city_snow,
                          "Country": city_country,
                          "Date": city_date})

# If an error is experienced, skip the city.
    except: #IndexError as e:
        print("City not found. Skipping...")
        pass



# Indicate that Data Loading is complete.
print("-----------------------------")
print("Initial Data Retrieval Complete      ")
print("-----------------------------")

    


Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | chuy
Processing Record 2 of Set 1 | vao
Processing Record 3 of Set 1 | bredasdorp
Processing Record 4 of Set 1 | itarema
Processing Record 5 of Set 1 | lebu
Processing Record 6 of Set 1 | te anau
Processing Record 7 of Set 1 | yellowknife
Processing Record 8 of Set 1 | puerto ayora
Processing Record 9 of Set 1 | rikitea
Processing Record 10 of Set 1 | camacha
Processing Record 11 of Set 1 | biltine
Processing Record 12 of Set 1 | cayenne
Processing Record 13 of Set 1 | mataura
Processing Record 14 of Set 1 | kushima
Processing Record 15 of Set 1 | tuktoyaktuk
Processing Record 16 of Set 1 | severo-kurilsk
3.06
Processing Record 17 of Set 1 | vila franca do campo
Processing Record 18 of Set 1 | nishihara
Processing Record 19 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 20 of Set 1 | stokmarknes
Processing Record 21 of Set 1 | san andres
Processing Record 22 of Set 1 | punta a

Processing Record 36 of Set 4 | maumere
Processing Record 37 of Set 4 | mackenzie
Processing Record 38 of Set 4 | olafsvik
Processing Record 39 of Set 4 | kodinar
Processing Record 40 of Set 4 | kununurra
Processing Record 41 of Set 4 | fortuna
Processing Record 42 of Set 4 | leningradskiy
Processing Record 43 of Set 4 | nizhneyansk
City not found. Skipping...
Processing Record 44 of Set 4 | dawlatabad
Processing Record 45 of Set 4 | soyo
Processing Record 46 of Set 4 | moose factory
Processing Record 47 of Set 4 | dmitriyevka
Processing Record 48 of Set 4 | talnakh
Processing Record 49 of Set 4 | andevoranto
City not found. Skipping...
Processing Record 50 of Set 4 | carnarvon
Processing Record 1 of Set 5 | isfana
Processing Record 2 of Set 5 | imbituba
Processing Record 3 of Set 5 | jieznas
Processing Record 4 of Set 5 | campana
Processing Record 5 of Set 5 | harnosand
Processing Record 6 of Set 5 | viedma
Processing Record 7 of Set 5 | college
Processing Record 8 of Set 5 | comodoro

Processing Record 22 of Set 8 | alice springs
Processing Record 23 of Set 8 | honiara
Processing Record 24 of Set 8 | hamilton
Processing Record 25 of Set 8 | aklavik
Processing Record 26 of Set 8 | raudeberg
0.51
Processing Record 27 of Set 8 | mendeleyevsk
Processing Record 28 of Set 8 | hami
Processing Record 29 of Set 8 | pindwara
Processing Record 30 of Set 8 | mbanza-ngungu
Processing Record 31 of Set 8 | samdrup jongkhar
Processing Record 32 of Set 8 | margate
Processing Record 33 of Set 8 | lewisporte
Processing Record 34 of Set 8 | crab hill
City not found. Skipping...
Processing Record 35 of Set 8 | beloha
Processing Record 36 of Set 8 | kloulklubed
Processing Record 37 of Set 8 | illertissen
Processing Record 38 of Set 8 | beaufort
Processing Record 39 of Set 8 | puerto princesa
Processing Record 40 of Set 8 | pradera
Processing Record 41 of Set 8 | cairns
0.89
Processing Record 42 of Set 8 | port lincoln
Processing Record 43 of Set 8 | redlands
Processing Record 44 of Set 8

Processing Record 10 of Set 12 | talcahuano
Processing Record 11 of Set 12 | mackay
Processing Record 12 of Set 12 | karamay
City not found. Skipping...
Processing Record 13 of Set 12 | jutai
Processing Record 14 of Set 12 | baghdad
Processing Record 15 of Set 12 | ryotsu
Processing Record 16 of Set 12 | jurado
Processing Record 17 of Set 12 | lata
Processing Record 18 of Set 12 | santa vitoria do palmar
Processing Record 19 of Set 12 | candido mendes
Processing Record 20 of Set 12 | balikpapan
Processing Record 21 of Set 12 | nichinan
Processing Record 22 of Set 12 | peterhead
Processing Record 23 of Set 12 | abha
Processing Record 24 of Set 12 | goderich
Processing Record 25 of Set 12 | boguchany
Processing Record 26 of Set 12 | sirur
Processing Record 27 of Set 12 | vestnes
Processing Record 28 of Set 12 | codrington
Processing Record 29 of Set 12 | naryan-mar
Processing Record 30 of Set 12 | anloga
Processing Record 31 of Set 12 | umba
1.5
Processing Record 32 of Set 12 | port hedl

## Assemble and Clean

In [9]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(5)
#city_data_df.sort_values("Current Status", ascending=False)
# pd.DataFrame.Rain.sort_values(ascending=False)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Current Description,Rain inches (last 3 hrs),Snow inches (last 3 hrs),Country,Date
0,Chuy,-33.7,-53.46,71.78,59,66,4.61,broken clouds,0.0,0.0,UY,2020-02-23 18:32:50
1,Vao,-22.67,167.48,77.65,76,83,14.32,broken clouds,0.0,0.0,NC,2020-02-23 18:28:52
2,Bredasdorp,-34.53,20.04,66.2,59,0,12.75,clear sky,0.0,0.0,ZA,2020-02-23 18:32:51
3,Itarema,-2.92,-39.92,85.75,69,85,4.65,light rain,0.0,0.0,BR,2020-02-23 18:32:51
4,Lebu,-37.62,-73.65,69.19,57,2,9.35,clear sky,0.0,0.0,CL,2020-02-23 18:32:02


In [10]:
# Reordering the columns
new_column_order = ["City", "Country", "Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed", "Current Description", "Rain inches (last 3 hrs)", "Snow inches (last 3 hrs)"]
city_data_df = city_data_df[new_column_order]
city_data_df.head(10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Current Description,Rain inches (last 3 hrs),Snow inches (last 3 hrs)
0,Chuy,UY,2020-02-23 18:32:50,-33.7,-53.46,71.78,59,66,4.61,broken clouds,0.0,0.0
1,Vao,NC,2020-02-23 18:28:52,-22.67,167.48,77.65,76,83,14.32,broken clouds,0.0,0.0
2,Bredasdorp,ZA,2020-02-23 18:32:51,-34.53,20.04,66.2,59,0,12.75,clear sky,0.0,0.0
3,Itarema,BR,2020-02-23 18:32:51,-2.92,-39.92,85.75,69,85,4.65,light rain,0.0,0.0
4,Lebu,CL,2020-02-23 18:32:02,-37.62,-73.65,69.19,57,2,9.35,clear sky,0.0,0.0
5,Te Anau,NZ,2020-02-23 18:33:35,-45.42,167.72,47.43,83,38,4.32,scattered clouds,0.0,0.0
6,Yellowknife,CA,2020-02-23 18:31:38,62.46,-114.35,-8.0,69,40,8.05,scattered clouds,0.0,0.0
7,Puerto Ayora,EC,2020-02-23 18:33:35,-0.74,-90.35,84.2,74,20,12.75,few clouds,0.0,0.0
8,Rikitea,PF,2020-02-23 18:33:35,-23.12,-134.97,78.37,74,2,8.25,light rain,0.0,0.0
9,Camacha,PT,2020-02-23 18:32:20,33.08,-16.33,68.0,72,20,19.46,few clouds,0.0,0.0


In [11]:
# Create the output file (CSV).
output_data_file = "weather_data/WeatherPy_challenge.csv"
# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")

## Analyze for Trends

In [21]:
# Find cities that had rain or snow
city_precip_df = city_data_df[(city_data_df['Rain inches (last 3 hrs)'] > 0) | (city_data_df['Snow inches (last 3 hrs)'] > 0)] 
city_precip_df.head(5)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Current Description,Rain inches (last 3 hrs),Snow inches (last 3 hrs)
15,Severo-Kurilsk,RU,2020-02-23 18:28:15,50.68,156.12,23.5,96,100,37.63,snow,0.0,3.06
46,Mezen,RU,2020-02-23 18:33:52,65.85,44.24,32.18,91,100,22.84,light snow,0.0,0.13
78,Stykkisholmur,IS,2020-02-23 18:34:10,65.08,-22.73,27.95,91,90,8.34,light snow,0.0,0.56
105,Pacific Grove,US,2020-02-23 18:34:22,36.62,-121.92,57.99,76,90,8.05,light rain,0.25,0.0
108,Nanortalik,GL,2020-02-23 18:33:47,60.14,-45.24,26.92,89,100,6.69,light snow,0.0,0.81


In [23]:
len(city_precip_df.index)

35