In [1]:
import pandas as pd 
import numpy as np 
import matplotlib.pyplot as plt
from citipy import citipy

In [2]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs 

<zip at 0x1b9e4ee3508>

In [3]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)

In [4]:
coordinates

[(-49.23520606842587, 57.23626153484378),
 (65.31968317519735, 45.70584862146353),
 (67.95540117197959, -32.81093716565525),
 (20.82578209966752, 0.5226981628573526),
 (-32.88976471432518, -4.247311680835537),
 (78.9974738807621, 11.538471043706295),
 (26.122167549790035, 10.292477246354423),
 (-23.98173103244001, -171.9601154779947),
 (-7.080396560166761, -133.53775927521139),
 (41.42155366977974, 10.92528126060165),
 (-85.46332438799315, -116.91536231002844),
 (-46.06882507563362, 163.2969935731826),
 (-63.40205602450379, -148.1265627184845),
 (-84.84337549390962, -96.39878099848347),
 (6.315447987127001, 79.58791306248548),
 (19.008846023786177, 54.59003238093899),
 (-7.801446439952258, 75.25059948799202),
 (13.723166945272567, -161.79395627981455),
 (2.7175581872742214, 152.52871705889606),
 (40.20357069076297, 148.0198431075695),
 (-5.574593342418865, 51.134706823866054),
 (20.590217336802212, 108.00479895563541),
 (-12.797925340746204, 153.7401073565432),
 (27.36836560622355, -11

In [5]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name
    
    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

626

In [6]:
# Import the datetime module from the datetime library.
from datetime import datetime
# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

In [7]:
# Starting URL for Weather Map API Call.
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [8]:
# Create an empty list to hold the weather data.
weather_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1
    
# Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        city_description = city_weather["weather"][0]["description"]
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        try:
            city_rainfall = city_weather["rain"]["1h"]
        except KeyError:
            city_rainfall = 0
        try:
            city_snowfall = city_weather["snow"]["1h"]
        except:
            city_snowfall = 0
         # Append the city information into city_data list.
        weather_data.append({"City": city.title(),
                            "Lat": city_lat,
                            "Lng": city_lng,
                            "Max Temp": city_max_temp,
                            "Humidity": city_humidity,
                            "Cloudiness": city_clouds,
                            "Wind Speed": city_wind,
                            "Country": city_country,
                            "Current Description": city_description,
                            "Date": city_date,
                            "Rainfall": city_rainfall,
                            "Snowfall":city_snowfall})

# If an error is experienced, skip the city.
    except:
        print("City not found. Skipping...")
        pass

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 2 of Set 1 | leshukonskoye
Processing Record 3 of Set 1 | tasiilaq
Processing Record 4 of Set 1 | tessalit
Processing Record 5 of Set 1 | jamestown
Processing Record 6 of Set 1 | barentsburg
City not found. Skipping...
Processing Record 7 of Set 1 | gat
Processing Record 8 of Set 1 | vaini
Processing Record 9 of Set 1 | atuona
Processing Record 10 of Set 1 | orbetello
Processing Record 11 of Set 1 | punta arenas
Processing Record 12 of Set 1 | tuatapere
Processing Record 13 of Set 1 | mataura
Processing Record 14 of Set 1 | beruwala
Processing Record 15 of Set 1 | salalah
Processing Record 16 of Set 1 | hithadhoo
Processing Record 17 of Set 1 | makakilo city
Processing Record 18 of Set 1 | kavieng
Processing Record 19 of Set 1 | nemuro
Processing Record 20 of Set 1 | victoria
Processing Record 21 of Set 1 | cam pha
City not found. Skipping..

Processing Record 36 of Set 4 | yunyang
Processing Record 37 of Set 4 | west bay
Processing Record 38 of Set 4 | diu
Processing Record 39 of Set 4 | shebunino
Processing Record 40 of Set 4 | tatui
Processing Record 41 of Set 4 | fort nelson
Processing Record 42 of Set 4 | kilindoni
Processing Record 43 of Set 4 | port keats
Processing Record 44 of Set 4 | ahipara
Processing Record 45 of Set 4 | jiddah
City not found. Skipping...
Processing Record 46 of Set 4 | rincon
Processing Record 47 of Set 4 | kysyl-syr
Processing Record 48 of Set 4 | albanel
Processing Record 49 of Set 4 | hambantota
Processing Record 50 of Set 4 | krasnoselkup
Processing Record 1 of Set 5 | namibe
Processing Record 2 of Set 5 | vaitupu
City not found. Skipping...
Processing Record 3 of Set 5 | bokspits
City not found. Skipping...
Processing Record 4 of Set 5 | tateyama
Processing Record 5 of Set 5 | santa cruz cabralia
Processing Record 6 of Set 5 | dharmanagar
Processing Record 7 of Set 5 | zvishavane
Processin

Processing Record 22 of Set 8 | nushki
Processing Record 23 of Set 8 | sentyabrskiy
City not found. Skipping...
Processing Record 24 of Set 8 | faanui
Processing Record 25 of Set 8 | sola
Processing Record 26 of Set 8 | kaeo
Processing Record 27 of Set 8 | camacha
Processing Record 28 of Set 8 | bibiani
Processing Record 29 of Set 8 | nuuk
Processing Record 30 of Set 8 | suao
City not found. Skipping...
Processing Record 31 of Set 8 | naze
Processing Record 32 of Set 8 | tsihombe
City not found. Skipping...
Processing Record 33 of Set 8 | portland
Processing Record 34 of Set 8 | kirakira
Processing Record 35 of Set 8 | kahului
Processing Record 36 of Set 8 | bluefields
Processing Record 37 of Set 8 | shelburne
Processing Record 38 of Set 8 | gizo
Processing Record 39 of Set 8 | santa rita
Processing Record 40 of Set 8 | isla vista
Processing Record 41 of Set 8 | tamandare
Processing Record 42 of Set 8 | chazuta
Processing Record 43 of Set 8 | pangkalanbuun
Processing Record 44 of Set 8

City not found. Skipping...
Processing Record 14 of Set 12 | alice
Processing Record 15 of Set 12 | wahran
City not found. Skipping...
Processing Record 16 of Set 12 | port moresby
Processing Record 17 of Set 12 | port blair
Processing Record 18 of Set 12 | rio grande
Processing Record 19 of Set 12 | rockland
Processing Record 20 of Set 12 | lata
Processing Record 21 of Set 12 | codajas
Processing Record 22 of Set 12 | bilibino
Processing Record 23 of Set 12 | muhldorf
Processing Record 24 of Set 12 | sairang
Processing Record 25 of Set 12 | atambua
Processing Record 26 of Set 12 | bose
Processing Record 27 of Set 12 | sulangan
Processing Record 28 of Set 12 | tevaitoa
Processing Record 29 of Set 12 | fengzhen
Processing Record 30 of Set 12 | koungheul
Processing Record 31 of Set 12 | villazon
Processing Record 32 of Set 12 | olafsvik
Processing Record 33 of Set 12 | hami
Processing Record 34 of Set 12 | skagastrond
City not found. Skipping...
Processing Record 35 of Set 12 | payson
Pr

In [9]:
len(weather_data)

574

In [10]:
# Convert the array of dictionaries to a Pandas DataFrame.
weather_data_df = pd.DataFrame(weather_data)
weather_data_df

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Current Description,Date,Rainfall,Snowfall
0,Leshukonskoye,64.90,45.76,57.06,46,96,9.10,RU,overcast clouds,2020-06-22 05:17:51,0.0,0
1,Tasiilaq,65.61,-37.64,48.20,70,90,2.24,GL,overcast clouds,2020-06-22 05:17:51,0.0,0
2,Tessalit,20.20,1.01,87.64,12,16,6.78,ML,few clouds,2020-06-22 05:17:51,0.0,0
3,Jamestown,42.10,-79.24,68.00,88,20,4.70,US,few clouds,2020-06-22 05:13:42,0.0,0
4,Gat,31.61,34.76,78.01,80,0,5.97,IL,clear sky,2020-06-22 05:17:02,0.0,0
...,...,...,...,...,...,...,...,...,...,...,...,...
569,Ucluelet,48.93,-125.55,55.99,82,69,6.24,CA,broken clouds,2020-06-22 05:20:06,0.0,0
570,Blackwater,-23.58,148.88,70.61,36,0,9.64,AU,clear sky,2020-06-22 05:20:13,0.0,0
571,Vila Velha,-20.33,-40.29,66.00,93,0,7.05,BR,clear sky,2020-06-22 05:20:13,0.0,0
572,Corner Brook,48.97,-57.95,53.60,81,75,11.41,CA,broken clouds,2020-06-22 05:20:14,0.0,0


In [11]:
#obtaining current order of columns 
weather_data_df.columns

Index(['City', 'Lat', 'Lng', 'Max Temp', 'Humidity', 'Cloudiness',
       'Wind Speed', 'Country', 'Current Description', 'Date', 'Rainfall',
       'Snowfall'],
      dtype='object')

In [12]:
#obtaining new column order 
new_column_order=sorted(weather_data_df.columns.tolist())
weather_data_df= weather_data_df[new_column_order]
weather_data_df

Unnamed: 0,City,Cloudiness,Country,Current Description,Date,Humidity,Lat,Lng,Max Temp,Rainfall,Snowfall,Wind Speed
0,Leshukonskoye,96,RU,overcast clouds,2020-06-22 05:17:51,46,64.90,45.76,57.06,0.0,0,9.10
1,Tasiilaq,90,GL,overcast clouds,2020-06-22 05:17:51,70,65.61,-37.64,48.20,0.0,0,2.24
2,Tessalit,16,ML,few clouds,2020-06-22 05:17:51,12,20.20,1.01,87.64,0.0,0,6.78
3,Jamestown,20,US,few clouds,2020-06-22 05:13:42,88,42.10,-79.24,68.00,0.0,0,4.70
4,Gat,0,IL,clear sky,2020-06-22 05:17:02,80,31.61,34.76,78.01,0.0,0,5.97
...,...,...,...,...,...,...,...,...,...,...,...,...
569,Ucluelet,69,CA,broken clouds,2020-06-22 05:20:06,82,48.93,-125.55,55.99,0.0,0,6.24
570,Blackwater,0,AU,clear sky,2020-06-22 05:20:13,36,-23.58,148.88,70.61,0.0,0,9.64
571,Vila Velha,0,BR,clear sky,2020-06-22 05:20:13,93,-20.33,-40.29,66.00,0.0,0,7.05
572,Corner Brook,75,CA,broken clouds,2020-06-22 05:20:14,81,48.97,-57.95,53.60,0.0,0,11.41


In [13]:
#check for rainfall data
rainfall_cities=weather_data_df.loc[weather_data_df["Rainfall"] > 0]
rainfall_cities

Unnamed: 0,City,Cloudiness,Country,Current Description,Date,Humidity,Lat,Lng,Max Temp,Rainfall,Snowfall,Wind Speed
15,Kavieng,12,PG,light rain,2020-06-22 05:17:55,71,-2.57,150.80,84.72,0.41,0,5.79
22,Busselton,98,AU,moderate rain,2020-06-22 05:17:56,34,-33.65,115.33,66.00,1.04,0,23.98
63,Ganzhou,100,CN,light rain,2020-06-22 05:18:06,65,28.82,115.43,91.58,0.17,0,9.37
67,Dali,59,CN,light rain,2020-06-22 05:18:07,54,25.70,100.18,77.94,0.14,0,7.23
69,New Norfolk,100,AU,moderate rain,2020-06-22 05:16:12,92,-42.78,147.06,54.00,1.27,0,1.01
...,...,...,...,...,...,...,...,...,...,...,...,...
541,Dongsheng,100,CN,light rain,2020-06-22 05:20:06,72,39.82,109.98,62.47,0.12,0,10.18
542,Lokosovo,74,RU,light rain,2020-06-22 05:20:06,72,61.13,74.82,51.96,0.35,0,18.12
551,Fairbanks,90,US,light rain,2020-06-22 05:16:56,93,64.84,-147.72,53.60,0.76,0,12.75
559,Vestmanna,78,FO,light rain,2020-06-22 05:15:55,100,62.16,-7.17,50.00,0.16,0,14.99


In [14]:
#check for snowfall data
snowfall_cities=weather_data_df.loc[weather_data_df["Snowfall"] > 0]
snowfall_cities

Unnamed: 0,City,Cloudiness,Country,Current Description,Date,Humidity,Lat,Lng,Max Temp,Rainfall,Snowfall,Wind Speed


In [15]:
#making an output file in the form of csv file
weather_data_file="data/WeatherPy_Database.csv"
weather_data_df.to_csv(weather_data_file, index_label="City_ID")