In [1]:
# import dependencies
from pathlib import Path

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [2]:
# Draw 1,500 random latitudes and then 1,500 random longitudes, each sampled
# uniformly over its full valid range.
lats = np.random.uniform(-90.000, 90.000, 1500)
lngs = np.random.uniform(-180.000, 180.000, 1500)

# Pair the two arrays element-wise. zip() is lazy: it yields each
# (lat, lng) tuple exactly once.
lat_lngs = zip(lats, lngs)

# Show the zip object as the cell output
lat_lngs

<zip at 0x2998393b9c8>

In [3]:
# Add the latitudes and longitudes to a list.
# The list is built straight from the `lats`/`lngs` arrays rather than from
# the `lat_lngs` zip object: a zip iterator is exhausted after one pass, so
# re-running this cell would otherwise silently produce an empty list.
coordinates = list(zip(lats, lngs))

In [4]:
# Print every latitude/longitude pair, one pair per line.
for lat, lng in coordinates:
    print(lat, lng)

-69.35210919679561 -90.34390865671999
-25.702574872415667 -64.50086512100476
82.89211097771462 -72.57847650879899
-89.21301034973025 -57.51611431703385
-33.485354778282876 79.73712030757952
1.9030828769834756 141.33630966016256
-10.503905891944697 131.9683827568694
-14.957511438089725 -108.25950618785487
-8.645729695189516 25.167925556965287
-85.13079002263076 153.97662448849508
15.267461320030037 178.66804645126382
15.23003927881281 11.276640191934888
-9.418932870918127 129.6169272826724
63.36399020103161 3.3177545109378457
-36.02847702234088 -53.20979411242293
-85.50924961229457 -50.64444163107791
-23.140349958457136 161.64503429066895
67.39640187802428 -128.06630998942205
34.38501810522159 125.52437366771562
-67.66155446041469 -101.07425887215656
68.15690913063548 -157.93622448872472
-32.2015830509537 -178.1756263146234
10.593146476632342 104.95137846604854
-59.680898641837516 72.48549441272158
-67.57285453626807 -147.86991737750492
-49.29867735597769 149.0619567497816
-85.286185456

69.22028826228757 -6.2266147849873335
42.8037341576605 -113.81739811949801
35.31740893442415 158.93984015612534
-41.13592833303368 50.21988515829241
-47.297823205223246 -26.47501682862071
43.856594828433856 -159.99387720821966
-65.22750107857021 74.86518409475113
-60.54549238723307 170.68504414542747
13.647196605975239 81.51675663534337
-10.118633584637834 6.174665195877338
-2.996509668033241 150.817205633583
85.52193141569248 -121.51009013602535
84.39704333992813 172.21658195866212
-25.09594776831173 -148.23077989612432
-36.148562305607356 166.58220026459406
-30.545340895881267 145.59198030240373
21.355829048494954 -165.13332939588145
-28.168786185262974 122.01156265077066
-17.262236044173164 -145.54612625260177
47.6050344583775 145.84071508816987
2.3405234887607946 90.40721936291072
39.920427215566576 -163.66346855729793
-47.74699035703914 -84.0298262800936
12.49752676097394 -131.66202352962765
-48.37893670701254 -161.67653874287126
69.05426252518879 69.23958913067787
-45.24068105493

In [5]:
# Use the citipy module to determine city based on latitude and longitude
from citipy import citipy

# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

# Starting URL for the OpenWeatherMap current-weather API call.
# HTTPS is used so the API key carried in the query string is not sent
# over the network in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [6]:
# Identify the nearest city for each lat/long combo and keep each city name
# once, in first-seen order. dict.fromkeys() de-duplicates with constant-time
# lookups while preserving insertion order, which avoids the quadratic cost
# of repeated `in` checks against a growing list.
# NOTE(review): cities are keyed by name only, so identically named cities
# are collapsed into one entry.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in coordinates
))

# Print the city count to confirm sufficient count
len(cities)

609

In [7]:
# Import the time library and the datetime module from the datetime library
import time

from datetime import datetime

In [8]:
# Accumulator that receives one weather record (a dict) per city
city_data = list()

# Announce the start of the retrieval log
print("Beginning Data Retrieval     ", "-----------------------------", sep="\n")

# Both logging counters (record within a set, and set number) start at 1
record_count = set_count = 1

Beginning Data Retrieval     
-----------------------------


In [9]:
# Loop through all the cities in the list, request the current weather for
# each one, and append a record to city_data for every successful lookup.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes. The one-second pause
    # between sets is presumably there to stay under the API rate limit.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        time.sleep(1)

    # Log the record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Pass the city via `params` so requests URL-encodes the whole name
        # (spaces, accents, '&', '#', ...) instead of only replacing spaces.
        # The 10-second timeout keeps one stalled connection from hanging
        # the entire loop.
        response = requests.get(url, params={"q": city}, timeout=10)
        # Parse the JSON and retrieve data.
        city_weather = response.json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the Unix timestamp to a "YYYY-MM-DD HH:MM:SS" UTC string.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # Network-level failures (timeout, connection error, undecodable body)
    # are reported separately from missing cities. Only the exception type
    # is printed: the exception message can contain the request URL, which
    # includes the API key.
    except requests.exceptions.RequestException as err:
        print(f"Request failed ({type(err).__name__}). Skipping...")
    # A response without the expected fields means there is no usable data
    # for this city; skip it. Unlike a bare `except:`, this lets
    # KeyboardInterrupt and SystemExit propagate, so the loop can be stopped.
    except (KeyError, TypeError, ValueError):
        print("City not found. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Processing Record 1 of Set 1 | punta arenas
Processing Record 2 of Set 1 | salta
Processing Record 3 of Set 1 | qaanaaq
Processing Record 4 of Set 1 | ushuaia
Processing Record 5 of Set 1 | bambous virieux
Processing Record 6 of Set 1 | vanimo
Processing Record 7 of Set 1 | nguiu
City not found. Skipping...
Processing Record 8 of Set 1 | puerto ayora
Processing Record 9 of Set 1 | kamina
Processing Record 10 of Set 1 | bluff
Processing Record 11 of Set 1 | butaritari
Processing Record 12 of Set 1 | goure
Processing Record 13 of Set 1 | raudeberg
Processing Record 14 of Set 1 | rocha
Processing Record 15 of Set 1 | koumac
Processing Record 16 of Set 1 | norman wells
Processing Record 17 of Set 1 | seoul
Processing Record 18 of Set 1 | barrow
Processing Record 19 of Set 1 | vaini
Processing Record 20 of Set 1 | chau doc
Processing Record 21 of Set 1 | saint-philippe
Processing Record 22 of Set 1 | mataura
Processing Record 23 of Set 1 | hobart
Processing Record 24 of Set 1 | hermanus
Pro

Processing Record 39 of Set 4 | vila velha
Processing Record 40 of Set 4 | port macquarie
Processing Record 41 of Set 4 | hilo
Processing Record 42 of Set 4 | kenai
Processing Record 43 of Set 4 | tabiauea
City not found. Skipping...
Processing Record 44 of Set 4 | longlac
City not found. Skipping...
Processing Record 45 of Set 4 | ciechanow
Processing Record 46 of Set 4 | porterville
Processing Record 47 of Set 4 | geraldton
Processing Record 48 of Set 4 | algiers
Processing Record 49 of Set 4 | constitucion
Processing Record 50 of Set 4 | yanliang
Processing Record 1 of Set 5 | tumannyy
City not found. Skipping...
Processing Record 2 of Set 5 | erzin
Processing Record 3 of Set 5 | sidi ali
Processing Record 4 of Set 5 | tuy hoa
Processing Record 5 of Set 5 | nizwa
Processing Record 6 of Set 5 | usvyaty
Processing Record 7 of Set 5 | yellowknife
Processing Record 8 of Set 5 | madimba
Processing Record 9 of Set 5 | illoqqortoormiut
City not found. Skipping...
Processing Record 10 of Se

Processing Record 29 of Set 8 | oxapampa
Processing Record 30 of Set 8 | channel-port aux basques
Processing Record 31 of Set 8 | castro
Processing Record 32 of Set 8 | bilma
Processing Record 33 of Set 8 | rimos
City not found. Skipping...
Processing Record 34 of Set 8 | caledon
Processing Record 35 of Set 8 | aras
Processing Record 36 of Set 8 | vestmanna
Processing Record 37 of Set 8 | rincon de la victoria
Processing Record 38 of Set 8 | laguna
Processing Record 39 of Set 8 | saleaula
City not found. Skipping...
Processing Record 40 of Set 8 | ostersund
Processing Record 41 of Set 8 | devils lake
Processing Record 42 of Set 8 | mabaruma
Processing Record 43 of Set 8 | sabha
Processing Record 44 of Set 8 | rovaniemi
Processing Record 45 of Set 8 | rio verde de mato grosso
Processing Record 46 of Set 8 | cabedelo
Processing Record 47 of Set 8 | longyearbyen
Processing Record 48 of Set 8 | champoton
Processing Record 49 of Set 8 | xinqing
Processing Record 50 of Set 8 | canberra
Proce

Processing Record 17 of Set 12 | zeya
Processing Record 18 of Set 12 | buala
Processing Record 19 of Set 12 | katherine
Processing Record 20 of Set 12 | samarai
Processing Record 21 of Set 12 | krasnyy profintern
Processing Record 22 of Set 12 | auki
Processing Record 23 of Set 12 | salinas
Processing Record 24 of Set 12 | mingaora
Processing Record 25 of Set 12 | acajutla
Processing Record 26 of Set 12 | preobrazheniye
Processing Record 27 of Set 12 | maniitsoq
Processing Record 28 of Set 12 | yumen
Processing Record 29 of Set 12 | pizarro
Processing Record 30 of Set 12 | karratha
Processing Record 31 of Set 12 | jacareacanga
Processing Record 32 of Set 12 | bonthe
Processing Record 33 of Set 12 | bargal
City not found. Skipping...
Processing Record 34 of Set 12 | catamarca
Processing Record 35 of Set 12 | bayangol
Processing Record 36 of Set 12 | oriximina
Processing Record 37 of Set 12 | adrar
Processing Record 38 of Set 12 | kastamonu
Processing Record 39 of Set 12 | douglas
Proces

In [10]:
# Build a DataFrame from the list of per-city records (one dict per row).
city_data_df = pd.DataFrame(data=city_data)

# Preview the first ten rows
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Punta Arenas,-53.15,-70.9167,37.11,69,100,12.75,CL,2022-06-28 00:02:34
1,Salta,-24.7859,-65.4117,48.58,83,44,3.0,AR,2022-06-28 00:02:52
2,Qaanaaq,77.484,-69.3632,47.59,57,13,4.27,GL,2022-06-28 00:02:52
3,Ushuaia,-54.8,-68.3,42.46,56,40,11.5,AR,2022-06-28 00:02:53
4,Bambous Virieux,-20.3428,57.7575,66.22,66,77,18.43,MU,2022-06-28 00:02:53
5,Vanimo,-2.6741,141.3028,83.03,68,84,5.55,PG,2022-06-28 00:02:53
6,Puerto Ayora,-0.7393,-90.3518,67.55,97,68,5.01,EC,2022-06-28 00:02:54
7,Kamina,-8.7386,24.9906,56.79,56,8,5.28,CD,2022-06-28 00:02:54
8,Bluff,-46.6,168.3333,38.8,68,7,4.03,NZ,2022-06-28 00:01:13
9,Butaritari,3.0707,172.7902,81.63,80,67,11.97,KI,2022-06-28 00:02:55


In [11]:
# Desired left-to-right column layout
new_column_order = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]

# Keep every row, with the columns selected in the new order
city_data_df = city_data_df.loc[:, new_column_order]

city_data_df

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Punta Arenas,CL,2022-06-28 00:02:34,-53.1500,-70.9167,37.11,69,100,12.75
1,Salta,AR,2022-06-28 00:02:52,-24.7859,-65.4117,48.58,83,44,3.00
2,Qaanaaq,GL,2022-06-28 00:02:52,77.4840,-69.3632,47.59,57,13,4.27
3,Ushuaia,AR,2022-06-28 00:02:53,-54.8000,-68.3000,42.46,56,40,11.50
4,Bambous Virieux,MU,2022-06-28 00:02:53,-20.3428,57.7575,66.22,66,77,18.43
...,...,...,...,...,...,...,...,...,...
556,Livingstone,ZM,2022-06-28 00:06:21,-17.8419,25.8543,56.52,57,62,10.69
557,Tocopilla,CL,2022-06-28 00:06:22,-22.0920,-70.1979,65.86,63,100,13.73
558,Nizhneudinsk,RU,2022-06-28 00:06:22,54.9076,99.0276,71.47,71,45,3.36
559,Port Lincoln,AU,2022-06-28 00:06:22,-34.7333,135.8667,52.95,62,40,14.09


In [12]:
# Create the output file (CSV)
output_data_file="weather_data/cities.csv"

# Make sure the target folder exists: to_csv() does not create missing
# directories and would otherwise fail with an OSError.
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)

# Export the city_data into a CSV, labelling the index column "City_ID"
city_data_df.to_csv(output_data_file, index_label="City_ID")