In [9]:
# Import the standard-library dependencies.
import time
from datetime import datetime
from pathlib import Path

# Import the third-party dependencies.
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests

# Import the API key.
from config import weather_api_key

In [10]:
# Starting URL for Weather Map API calls.
# Only the API key is baked in here; the city query is added per request.
# The previous literal "lat={lat}&lon={lon}" placeholders were never filled
# in and were sent to the API verbatim, so they are dropped.
base_url = "https://api.openweathermap.org/data/2.5/weather"
url = base_url + "?appid=" + weather_api_key
# Show the endpoint without the key so the secret never lands in the saved
# notebook output.
print(base_url + "?appid=<hidden>")

https://api.openweathermap.org/data/2.5/weather?lat={lat}&lon={lon}&appid=<REDACTED>


In [11]:
# Draw 1,500 latitudes and 1,500 longitudes independently and uniformly at
# random, then pair them up position by position.
lats = np.random.uniform(-90.000, 90.000, 1500)
lngs = np.random.uniform(-180.000, 180.000, 1500)
# zip() is lazy: no pairs are produced until something iterates over it.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7fd053d08690>

In [12]:
# Materialise the lazy zip into a list of (latitude, longitude) tuples.
# A zip can only be consumed once, so re-running this cell on its own
# (without re-creating lat_lngs) yields an empty list.
coordinates = [*lat_lngs]

In [13]:
# Display every latitude/longitude combination, one pair per line.
for coordinate in coordinates:
    # Unpacking the 2-tuple prints "<lat> <lng>" separated by a space.
    print(*coordinate)

32.15311058352049 -81.72579383163745
-22.924609320787326 -91.45672530208557
49.42419706466828 -122.22734023378231
-53.85518958133153 151.35819103424893
-14.66563816873878 -48.5517364130055
41.07638239173363 -95.00753420352608
-47.01059035051881 -46.52092945834329
-3.7622946293465276 154.6338258259637
-73.61415138590084 51.99238844062202
20.880160888784047 -158.55704195408475
65.61655919612389 -12.608829095144728
-26.571621573695026 -150.76482537245747
-85.25250550104421 -86.05639804771009
85.60961069653806 -73.07462612051043
-14.119008939358622 15.124368908347236
25.146878908413 -30.757055230774682
29.81370064668222 10.141559424543289
-42.60180571409376 116.4831785671845
-84.45152009148704 -11.359982780520113
-54.97747013976365 -46.10264236036741
29.824674065232713 -175.19296281550297
-66.45051587646141 -179.28671296837194
52.13609657605812 -156.90646974993902
14.31845836698976 -71.15440717144628
64.31454166229778 -44.68324732621019
-15.779618347596127 -1.414665986408778
49.12756475080

-87.65647534129293 99.76583580613953
-43.464570851741065 -64.17865025916721
-61.32460959518616 -44.019425601636584
52.95657225887922 -131.76812220976421
39.26646353029747 127.9263731732189
84.84652928239109 -118.75778196331493
67.52323808118535 60.255076617516465
-81.36546614483373 21.692954179986003
-6.572440987217007 -175.21553315404566
74.32746530084768 -105.00299185961947
26.729415756548377 176.01728620177943
11.634224119350492 -167.7734249695452
-11.692419242601574 81.72724641184658
-61.99745416053288 119.92595058699652
49.37394413854568 -158.47366216641723
71.31172434236001 -132.5500303563031
44.76912874110991 -108.5067080142424
-34.94610291289171 -3.837399874257102
12.449355587616012 -156.0167201833168
-82.90095389722677 -81.24564258110333
55.60270371027258 94.30327817842772
46.082323747596604 146.13121426120034
71.43692889644527 -69.13963064733986
-59.353452481169356 98.56453036528359
83.08107585435374 149.78231605392875
-85.7898807932114 -165.81754248287248
-12.177944917993074

In [14]:
from citipy import citipy

In [15]:
# Create a list for holding the cities, in order of first appearance.
cities = []
# Companion set used only for duplicate checks: membership in a set is a
# constant-time lookup, whereas `city not in cities` rescans the whole list
# for every coordinate.
seen_cities = set()
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)
# Display the city count to confirm sufficient count.
len(cities)

581

In [17]:
# Retrieve the current weather for every city in `cities` and collect one
# record (dict) per successfully retrieved city in `city_data`.
# No `units` parameter is sent, so temperature and wind speed come back in
# the API's default units.

# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Cities are logged in sets of SET_SIZE, with a pause between sets
# (presumably to stay within the API's rate limit -- confirm against the
# quota of the key in use).
SET_SIZE = 50
PAUSE_SECONDS = 60
# Upper bound, in seconds, on how long a single request may block; without a
# timeout one stalled connection would hang the whole run.
REQUEST_TIMEOUT = 10

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Start a new set (and pause) every SET_SIZE cities, except at the start.
    if i % SET_SIZE == 0 and i >= SET_SIZE:
        set_count += 1
        record_count = 1
        time.sleep(PAUSE_SECONDS)

    # Log the record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Let requests build and encode the query string; spaces and any
        # special characters in the city name are escaped correctly.
        response = requests.get(url, params={"q": city}, timeout=REQUEST_TIMEOUT)
        # Parse the JSON and retrieve data.
        city_weather = response.json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the Unix timestamp to a UTC date string. time.gmtime is
        # used instead of the deprecated datetime.utcfromtimestamp; the
        # formatted result is the same.
        city_date = time.strftime('%Y-%m-%d %H:%M:%S', time.gmtime(city_weather["dt"]))
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # Network-level failure (timeout, connection error, ...): skip the city.
    # Only the exception type is printed because the exception text can
    # contain the request URL, which includes the API key.
    except requests.RequestException as err:
        print(f"Request failed ({type(err).__name__}). Skipping...")
    # The response did not have the expected fields (e.g. the API returned an
    # error payload for an unknown city): skip the city. Catching specific
    # exceptions keeps Ctrl-C / kernel interrupt working, unlike a bare except.
    except (KeyError, TypeError, ValueError):
        print("City not found. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | statesboro
Processing Record 2 of Set 1 | pisco
Processing Record 3 of Set 1 | chilliwack
Processing Record 4 of Set 1 | hobart
Processing Record 5 of Set 1 | niquelandia
Processing Record 6 of Set 1 | maryville
Processing Record 7 of Set 1 | mar del plata
Processing Record 8 of Set 1 | namatanai
Processing Record 9 of Set 1 | east london
Processing Record 10 of Set 1 | nanakuli
Processing Record 11 of Set 1 | hofn
Processing Record 12 of Set 1 | mataura
Processing Record 13 of Set 1 | ushuaia
Processing Record 14 of Set 1 | qaanaaq
Processing Record 15 of Set 1 | caconda
Processing Record 16 of Set 1 | ponta do sol
Processing Record 17 of Set 1 | nalut
Processing Record 18 of Set 1 | albany
Processing Record 19 of Set 1 | hermanus
Processing Record 20 of Set 1 | kapaa
Processing Record 21 of Set 1 | vaini
Processing Record 22 of Set 1 | kodiak
Processing Record 23 of Set 1 | oranjestad
Processin

Processing Record 35 of Set 4 | sapao
City not found. Skipping...
Processing Record 36 of Set 4 | puerto ayora
Processing Record 37 of Set 4 | chabahar
Processing Record 38 of Set 4 | novikovo
Processing Record 39 of Set 4 | salekhard
Processing Record 40 of Set 4 | wulanhaote
City not found. Skipping...
Processing Record 41 of Set 4 | saint-joseph
Processing Record 42 of Set 4 | itaqui
Processing Record 43 of Set 4 | san joaquin
Processing Record 44 of Set 4 | norman wells
Processing Record 45 of Set 4 | quatre cocos
Processing Record 46 of Set 4 | beloha
Processing Record 47 of Set 4 | souillac
Processing Record 48 of Set 4 | shache
Processing Record 49 of Set 4 | yar-sale
Processing Record 50 of Set 4 | kasur
Processing Record 1 of Set 5 | haibowan
City not found. Skipping...
Processing Record 2 of Set 5 | barentsburg
City not found. Skipping...
Processing Record 3 of Set 5 | vao
Processing Record 4 of Set 5 | kaitangata
Processing Record 5 of Set 5 | tuatapere
Processing Record 6 o

Processing Record 25 of Set 8 | komsomolskiy
Processing Record 26 of Set 8 | solnechnyy
Processing Record 27 of Set 8 | valparaiso
Processing Record 28 of Set 8 | karaul
City not found. Skipping...
Processing Record 29 of Set 8 | maniitsoq
Processing Record 30 of Set 8 | nizhneyansk
City not found. Skipping...
Processing Record 31 of Set 8 | centralia
Processing Record 32 of Set 8 | kaseda
Processing Record 33 of Set 8 | senneterre
Processing Record 34 of Set 8 | samalaeulu
City not found. Skipping...
Processing Record 35 of Set 8 | alta floresta
Processing Record 36 of Set 8 | enzan
Processing Record 37 of Set 8 | srednekolymsk
Processing Record 38 of Set 8 | cheuskiny
City not found. Skipping...
Processing Record 39 of Set 8 | samusu
City not found. Skipping...
Processing Record 40 of Set 8 | pangody
Processing Record 41 of Set 8 | fria
Processing Record 42 of Set 8 | tarko-sale
Processing Record 43 of Set 8 | avera
Processing Record 44 of Set 8 | dzhebariki-khaya
Processing Record 4

Processing Record 11 of Set 12 | kisangani
Processing Record 12 of Set 12 | aranos
Processing Record 13 of Set 12 | port-gentil
Processing Record 14 of Set 12 | ocampo
Processing Record 15 of Set 12 | ardistan
City not found. Skipping...
Processing Record 16 of Set 12 | gulshat
City not found. Skipping...
Processing Record 17 of Set 12 | sao joao da barra
Processing Record 18 of Set 12 | abomsa
Processing Record 19 of Set 12 | palana
Processing Record 20 of Set 12 | toulepleu
City not found. Skipping...
Processing Record 21 of Set 12 | nelson bay
Processing Record 22 of Set 12 | havelock
Processing Record 23 of Set 12 | yerbogachen
Processing Record 24 of Set 12 | turkistan
Processing Record 25 of Set 12 | leh
Processing Record 26 of Set 12 | coahuayana
Processing Record 27 of Set 12 | dunedin
Processing Record 28 of Set 12 | aripuana
Processing Record 29 of Set 12 | woodward
Processing Record 30 of Set 12 | sungairaya
Processing Record 31 of Set 12 | hay river
------------------------

In [18]:
# Build a DataFrame from the list of per-city dictionaries: one row per
# city, one column per dictionary key.
city_data_df = pd.DataFrame(data=city_data)
# Preview the first ten rows.
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Statesboro,32.4488,-81.7832,299.89,78,75,0.0,US,2022-05-25 15:33:21
1,Pisco,-13.7,-76.2167,291.49,77,2,3.6,PE,2022-05-25 15:34:04
2,Chilliwack,49.1747,-121.9443,285.81,93,100,0.51,CA,2022-05-25 15:34:05
3,Hobart,-42.8794,147.3294,282.19,92,4,2.57,AU,2022-05-25 15:34:05
4,Niquelandia,-14.4739,-48.4597,303.39,24,6,4.14,BR,2022-05-25 15:34:06
5,Maryville,35.7565,-83.9705,300.53,74,100,2.06,US,2022-05-25 15:34:06
6,Mar Del Plata,-38.0023,-57.5575,284.87,76,100,2.24,AR,2022-05-25 15:34:07
7,Namatanai,-3.6667,152.4333,299.0,80,82,2.25,PG,2022-05-25 15:34:08
8,East London,-33.0153,27.9116,291.67,82,0,3.09,ZA,2022-05-25 15:34:09
9,Nanakuli,21.3906,-158.1547,296.54,78,0,2.06,US,2022-05-25 15:34:09


In [20]:
# Reorder the columns so the identifying fields (city, country, date) come
# first, followed by the coordinates and then the measurements.
new_column_order = [
    'City', 'Country', 'Date',
    'Lat', 'Lng',
    'Max Temp', 'Humidity', 'Cloudiness', 'Wind Speed',
]
# Select every row and the columns in the new order.
city_data_df = city_data_df.loc[:, new_column_order]
city_data_df

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Statesboro,US,2022-05-25 15:33:21,32.4488,-81.7832,299.89,78,75,0.00
1,Pisco,PE,2022-05-25 15:34:04,-13.7000,-76.2167,291.49,77,2,3.60
2,Chilliwack,CA,2022-05-25 15:34:05,49.1747,-121.9443,285.81,93,100,0.51
3,Hobart,AU,2022-05-25 15:34:05,-42.8794,147.3294,282.19,92,4,2.57
4,Niquelandia,BR,2022-05-25 15:34:06,-14.4739,-48.4597,303.39,24,6,4.14
...,...,...,...,...,...,...,...,...,...
521,Dunedin,NZ,2022-05-25 16:19:53,-45.8742,170.5036,279.71,65,62,3.13
522,Aripuana,BR,2022-05-25 16:19:54,-9.1667,-60.6333,305.85,42,0,2.15
523,Woodward,US,2022-05-25 16:19:55,36.4337,-99.3904,283.72,96,100,8.23
524,Sungairaya,ID,2022-05-25 16:19:56,0.7000,108.9000,300.27,81,100,1.91


In [21]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Make sure the target directory exists first; to_csv does not create
# missing directories and would otherwise fail after the long retrieval run.
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)
# Export the City_Data into a CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")