In [1]:
# Import the dependencies.
import os

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests

from config import weather_api_key

In [2]:
# Import the time module and the datetime class from the datetime module.
import time
from datetime import datetime

In [3]:
# Build the base URL for the OpenWeatherMap current-weather endpoint,
# requesting imperial units and authenticating with the configured API key.
# HTTPS is used so the API key in the query string is not sent in cleartext.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [4]:
# Draw 1500 uniformly distributed latitudes and 1500 longitudes, then pair
# them up element-wise. zip() is lazy, so the pairs can be consumed only once.
lats = np.random.uniform(-90.000, 90.000, size=1500)
lngs = np.random.uniform(-180.000, 180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7fe8fd2bd080>

In [5]:
# Materialize the zipped latitude/longitude pairs into a list so they can be
# iterated more than once.
coordinates = [*lat_lngs]

In [6]:
# Show every sampled coordinate pair: latitude first, then longitude.
for lat, lng in coordinates:
    print(lat, lng)

-11.953049088655064 -112.75627148651382
25.614948528956972 127.34835497067445
-80.70361274880725 -104.75566928131127
51.43167409069022 -28.91644132718602
-1.0113503650469369 -94.31338652644101
28.14323174167727 171.995866765931
-48.63083298381498 -150.4344322202515
81.33115305659246 -39.390742413194374
-34.03418669358555 -30.398291467882018
-89.29222703402606 -177.55046179515233
-69.10266959957804 140.93457917904158
37.86922828507015 -169.49365001462934
11.826538575252272 59.4126013097692
-34.91370765193991 25.38134816249064
55.087080968012145 -36.51227024083511
-34.0267389297195 39.261418397833154
-52.90241485360787 170.0664888040027
-70.96338768458968 8.92330605447566
38.29845204033123 -138.55423168379212
-13.04319565978139 -117.96190055006464
71.79127286674861 93.57893837922165
83.12549837920108 -119.40381914620345
33.236185549357785 -125.49398416138592
50.67331277018798 109.3298542398635
65.97694623396174 49.20114019350072
78.84474541491875 171.13817162665532
-44.06058600330867 -0.

72.46419502444667 145.60399120230772
51.79227987334227 33.24273107172715
86.62055179411726 141.78812568274162
21.936786219166933 78.87103077004537
-25.38136901308468 -177.92539784286677
79.04905608521682 -101.09788325437304
10.017469879646242 -133.79888731670576
-85.80705991282197 98.12082092216588
81.86443673155574 -44.71277355436149
-23.68936974340407 -143.2150831377437
72.25822970117747 -47.495855955343046
38.217589251712866 26.392703580182285
77.56378657795835 -130.405137839021
-21.66692145483107 -41.42774321758506
-33.672033815579745 175.57114184094524
-34.331562977178464 124.88261130821672
11.93997322840724 92.00070890909348
-50.56279388154389 10.903169489194283
48.791568473928436 -4.7295293653216675
-57.96286325705612 99.9197528011083
39.22878403352948 -167.9442230457629
-37.73026281763361 -10.981888491313526
75.08316365333397 -35.50675412570604
-6.8393570249289155 -93.11150733551423
-7.901954479213188 -135.79073934112122
-61.00238039078654 5.4578361606724
-43.121672487480204 36

In [7]:
from citipy import citipy

In [8]:
# Create a list for holding the cities, kept in first-seen order.
cities = []
# Track the names already added. Set membership is O(1), whereas scanning the
# list for every coordinate makes the loop quadratic in the number of cities.
seen_cities = set()
# Identify the nearest city for each latitude and longitude combination.
for lat, lng in coordinates:
    city = citipy.nearest_city(lat, lng).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

610

In [9]:
# Create an empty list to hold the weather data (one dict per city found).
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes, pausing 60 seconds
    # before each new set (presumably to stay under the API's rate limit).
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        time.sleep(60)

    # Log the record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Pass the city as a query parameter so requests URL-encodes it
        # (spaces and any other special characters), and set a timeout so a
        # stalled connection cannot hang the whole loop.
        city_weather = requests.get(url, params={"q": city}, timeout=10).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the Unix timestamp to a UTC date string.
        # NOTE: datetime.utcfromtimestamp is deprecated since Python 3.12.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # If the request fails or the payload lacks the expected fields, skip the
    # city. Only request/parsing errors are caught, so KeyboardInterrupt and
    # SystemExit still stop the loop.
    except (requests.exceptions.RequestException, KeyError, ValueError, TypeError):
        print("City not found. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | rikitea
Processing Record 2 of Set 1 | itoman
Processing Record 3 of Set 1 | punta arenas
Processing Record 4 of Set 1 | lagoa
Processing Record 5 of Set 1 | puerto ayora
Processing Record 6 of Set 1 | butaritari
Processing Record 7 of Set 1 | mataura
Processing Record 8 of Set 1 | tasiilaq
Processing Record 9 of Set 1 | arraial do cabo
Processing Record 10 of Set 1 | vaini
Processing Record 11 of Set 1 | hobart
Processing Record 12 of Set 1 | kapaa
Processing Record 13 of Set 1 | salalah
Processing Record 14 of Set 1 | port elizabeth
Processing Record 15 of Set 1 | nanortalik
Processing Record 16 of Set 1 | richards bay
Processing Record 17 of Set 1 | bluff
Processing Record 18 of Set 1 | hermanus
Processing Record 19 of Set 1 | fortuna
Processing Record 20 of Set 1 | talnakh
Processing Record 21 of Set 1 | tuktoyaktuk
Processing Record 22 of Set 1 | pacific grove
Processing Record 23 of Set 1 |

Processing Record 39 of Set 4 | honningsvag
Processing Record 40 of Set 4 | kuznechnoye
Processing Record 41 of Set 4 | kahului
Processing Record 42 of Set 4 | kautokeino
Processing Record 43 of Set 4 | kralendijk
Processing Record 44 of Set 4 | aswan
Processing Record 45 of Set 4 | siuri
Processing Record 46 of Set 4 | mangaratiba
Processing Record 47 of Set 4 | erzin
Processing Record 48 of Set 4 | nichinan
Processing Record 49 of Set 4 | whitehorse
Processing Record 50 of Set 4 | saryshagan
City not found. Skipping...
Processing Record 1 of Set 5 | salou
Processing Record 2 of Set 5 | lavrentiya
Processing Record 3 of Set 5 | auki
Processing Record 4 of Set 5 | dudinka
Processing Record 5 of Set 5 | lebu
Processing Record 6 of Set 5 | bosaso
Processing Record 7 of Set 5 | yanam
Processing Record 8 of Set 5 | tatarskaya kargala
Processing Record 9 of Set 5 | prijepolje
Processing Record 10 of Set 5 | kuche
City not found. Skipping...
Processing Record 11 of Set 5 | lujan
Processing R

Processing Record 30 of Set 8 | karmala
Processing Record 31 of Set 8 | chengde
Processing Record 32 of Set 8 | vardo
Processing Record 33 of Set 8 | coquimbo
Processing Record 34 of Set 8 | umm kaddadah
Processing Record 35 of Set 8 | nieuw nickerie
Processing Record 36 of Set 8 | chara
Processing Record 37 of Set 8 | tezu
Processing Record 38 of Set 8 | aquiraz
Processing Record 39 of Set 8 | hirado
Processing Record 40 of Set 8 | malwan
City not found. Skipping...
Processing Record 41 of Set 8 | gargzdai
Processing Record 42 of Set 8 | zyryanovsk
Processing Record 43 of Set 8 | tomball
Processing Record 44 of Set 8 | santa cruz cabralia
Processing Record 45 of Set 8 | san policarpo
Processing Record 46 of Set 8 | bonthe
Processing Record 47 of Set 8 | pontes e lacerda
Processing Record 48 of Set 8 | umzimvubu
City not found. Skipping...
Processing Record 49 of Set 8 | ketchikan
Processing Record 50 of Set 8 | elko
Processing Record 1 of Set 9 | buraydah
Processing Record 2 of Set 9 

Processing Record 18 of Set 12 | vermillion
Processing Record 19 of Set 12 | saint anthony
Processing Record 20 of Set 12 | teguldet
Processing Record 21 of Set 12 | kargopol
Processing Record 22 of Set 12 | amapa
Processing Record 23 of Set 12 | sigli
Processing Record 24 of Set 12 | naryan-mar
Processing Record 25 of Set 12 | monzon
Processing Record 26 of Set 12 | kvitok
Processing Record 27 of Set 12 | jinchang
Processing Record 28 of Set 12 | jumla
Processing Record 29 of Set 12 | aberystwyth
Processing Record 30 of Set 12 | riyadh
Processing Record 31 of Set 12 | atar
Processing Record 32 of Set 12 | bayji
Processing Record 33 of Set 12 | beira
Processing Record 34 of Set 12 | amahai
Processing Record 35 of Set 12 | karakendzha
City not found. Skipping...
Processing Record 36 of Set 12 | sinop
Processing Record 37 of Set 12 | pueblo
Processing Record 38 of Set 12 | caravelas
Processing Record 39 of Set 12 | oyama
Processing Record 40 of Set 12 | sorland
Processing Record 41 of Se

In [10]:
# Build a Pandas DataFrame from the list of per-city dictionaries.
city_data_df = pd.DataFrame(data=city_data)
# Preview the first ten rows.
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Rikitea,-23.1203,-134.9692,73.72,77,99,18.99,PF,2022-08-09 01:43:52
1,Itoman,26.1247,127.6694,90.37,74,40,10.36,JP,2022-08-09 01:36:39
2,Punta Arenas,-53.15,-70.9167,37.51,81,100,9.22,CL,2022-08-09 01:43:53
3,Lagoa,39.05,-27.9833,73.02,79,3,13.53,PT,2022-08-09 01:33:57
4,Puerto Ayora,-0.7393,-90.3518,69.55,86,92,3.0,EC,2022-08-09 01:43:53
5,Butaritari,3.0707,172.7902,81.84,77,27,15.21,KI,2022-08-09 01:43:54
6,Mataura,-46.1927,168.8643,45.03,57,5,7.72,NZ,2022-08-09 01:43:54
7,Tasiilaq,65.6145,-37.6368,39.36,96,100,0.67,GL,2022-08-09 01:43:55
8,Arraial Do Cabo,-22.9661,-42.0278,70.57,86,100,7.67,BR,2022-08-09 01:43:55
9,Vaini,-21.2,-175.2,78.96,94,75,10.36,TO,2022-08-09 01:43:55


In [14]:
# Put the identifying columns (city, country, date) ahead of the measurements.
city_data_order = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]
city_data_df = city_data_df.loc[:, city_data_order]
# Preview the first ten rows in the new column order.
city_data_df.head(n=10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Rikitea,PF,2022-08-09 01:43:52,-23.1203,-134.9692,73.72,77,99,18.99
1,Itoman,JP,2022-08-09 01:36:39,26.1247,127.6694,90.37,74,40,10.36
2,Punta Arenas,CL,2022-08-09 01:43:53,-53.15,-70.9167,37.51,81,100,9.22
3,Lagoa,PT,2022-08-09 01:33:57,39.05,-27.9833,73.02,79,3,13.53
4,Puerto Ayora,EC,2022-08-09 01:43:53,-0.7393,-90.3518,69.55,86,92,3.0
5,Butaritari,KI,2022-08-09 01:43:54,3.0707,172.7902,81.84,77,27,15.21
6,Mataura,NZ,2022-08-09 01:43:54,-46.1927,168.8643,45.03,57,5,7.72
7,Tasiilaq,GL,2022-08-09 01:43:55,65.6145,-37.6368,39.36,96,100,0.67
8,Arraial Do Cabo,BR,2022-08-09 01:43:55,-22.9661,-42.0278,70.57,86,100,7.67
9,Vaini,TO,2022-08-09 01:43:55,-21.2,-175.2,78.96,94,75,10.36


In [15]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Make sure the target directory exists first: to_csv does not create missing
# parent directories and would otherwise fail with an OSError.
os.makedirs(os.path.dirname(output_data_file), exist_ok=True)
# Export the City_Data into a CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")