In [1]:
import pandas as pd
import matplotlib as plt
import numpy as np
from citipy import citipy
from datetime import datetime
from config import api
import requests

In [2]:
#create set of random lat and long combinations
lats = np.random.uniform(-90, 90, size=1500)
lngs = np.random.uniform(-180, 180, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x188bf150888>

In [3]:
#add lats and lngs to a list
coordinates = list(lat_lngs)

In [4]:
coordinates

[(-11.472795897570549, -83.67314574147149),
 (-13.98648179962801, -158.66789299260478),
 (-17.631995065568418, 52.62182212398977),
 (3.958310343918839, 179.62762878070362),
 (66.9212420733713, 135.74575236230936),
 (-46.99766224410159, -83.00222264941131),
 (84.21811549463621, 134.00806703035857),
 (-81.23881975342302, -60.893639254267285),
 (-24.691705831574097, -48.64106354661271),
 (-86.91296990467029, 66.27032571743587),
 (-71.6423166413939, 157.65635968493024),
 (40.272973734523475, -99.08486426944194),
 (57.93189732049737, 114.67381046185119),
 (-81.04490002819394, -64.90481765341687),
 (-1.3854808081852212, 49.69941003457649),
 (-38.04300265426279, 68.56913357198465),
 (-70.41165382861067, 65.61719416320108),
 (-33.63377339885841, 60.80857453549609),
 (-78.28084174981886, -152.03303691714095),
 (71.62920100507512, -45.495229033360516),
 (66.42682807639812, -131.34683584010625),
 (-69.86016517652257, 96.67679960047388),
 (-25.276582538070116, 65.59867659306676),
 (24.699899100982

In [5]:
#create a list for holding cities
cities = []
#id the nearest city for each lat and long comb
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name
    
    #if the city is unique, then we will add it to the cities list
    if city not in cities:
        cities.append(city)

#print the city count to confirm sufficient count
len(cities)

609

In [6]:
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + api

In [7]:
#create empty list to hold weather data
city_data = []
#print the beginning fo the logging
print("Beginning Data Retrieval    ")
print("----------------------------")

#create counters
record_count = 1
set_count = 1


# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1
    
# Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

# If an error is experienced, skip the city.
    except:
        print("City not found. Skipping...")
        pass

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval    
----------------------------
Processing Record 1 of Set 1 | chimbote
Processing Record 2 of Set 1 | avarua
Processing Record 3 of Set 1 | ambodifototra
City not found. Skipping...
Processing Record 4 of Set 1 | rungata
City not found. Skipping...
Processing Record 5 of Set 1 | batagay
Processing Record 6 of Set 1 | castro
Processing Record 7 of Set 1 | nizhneyansk
City not found. Skipping...
Processing Record 8 of Set 1 | ushuaia
Processing Record 9 of Set 1 | apiai
Processing Record 10 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 11 of Set 1 | bluff
Processing Record 12 of Set 1 | kearney
Processing Record 13 of Set 1 | balakhninskiy
Processing Record 14 of Set 1 | mogadishu
Processing Record 15 of Set 1 | mahebourg
Processing Record 16 of Set 1 | saint-philippe
Processing Record 17 of Set 1 | mataura
Processing Record 18 of Set 1 | ilulissat
Processing Record 19 of Set 1 | inuvik
Processing Record 20 of Set 1 | busselton
Processing R

Processing Record 39 of Set 4 | yeehaw junction
City not found. Skipping...
Processing Record 40 of Set 4 | aflu
City not found. Skipping...
Processing Record 41 of Set 4 | sefophe
Processing Record 42 of Set 4 | bonthe
Processing Record 43 of Set 4 | rognan
Processing Record 44 of Set 4 | saint george
Processing Record 45 of Set 4 | sao filipe
Processing Record 46 of Set 4 | felanitx
Processing Record 47 of Set 4 | naze
Processing Record 48 of Set 4 | lata
Processing Record 49 of Set 4 | amderma
City not found. Skipping...
Processing Record 50 of Set 4 | hasaki
Processing Record 1 of Set 5 | kapaa
Processing Record 2 of Set 5 | selizharovo
Processing Record 3 of Set 5 | le port
Processing Record 4 of Set 5 | hovd
Processing Record 5 of Set 5 | margate
Processing Record 6 of Set 5 | tomatlan
Processing Record 7 of Set 5 | fairbanks
Processing Record 8 of Set 5 | novyy svit
Processing Record 9 of Set 5 | sataua
City not found. Skipping...
Processing Record 10 of Set 5 | atbasar
Processi

City not found. Skipping...
Processing Record 31 of Set 8 | cidreira
Processing Record 32 of Set 8 | labuan
Processing Record 33 of Set 8 | loding
Processing Record 34 of Set 8 | umzimvubu
City not found. Skipping...
Processing Record 35 of Set 8 | ossora
Processing Record 36 of Set 8 | tahta
Processing Record 37 of Set 8 | bosaso
Processing Record 38 of Set 8 | korla
Processing Record 39 of Set 8 | encheng
Processing Record 40 of Set 8 | buala
Processing Record 41 of Set 8 | idanre
Processing Record 42 of Set 8 | sorvag
City not found. Skipping...
Processing Record 43 of Set 8 | kyabe
Processing Record 44 of Set 8 | bac lieu
Processing Record 45 of Set 8 | la ronge
Processing Record 46 of Set 8 | quelimane
Processing Record 47 of Set 8 | khash
Processing Record 48 of Set 8 | clarksdale
Processing Record 49 of Set 8 | fort nelson
Processing Record 50 of Set 8 | inhambane
Processing Record 1 of Set 9 | pihani
Processing Record 2 of Set 9 | sohag
Processing Record 3 of Set 9 | tumpat
Pro

Processing Record 14 of Set 12 | usogorsk
Processing Record 15 of Set 12 | olafsvik
Processing Record 16 of Set 12 | olinda
Processing Record 17 of Set 12 | alcantara
Processing Record 18 of Set 12 | mocambique
City not found. Skipping...
Processing Record 19 of Set 12 | bambanglipuro
Processing Record 20 of Set 12 | tyukhtet
Processing Record 21 of Set 12 | mala bilozerka
Processing Record 22 of Set 12 | tarakan
Processing Record 23 of Set 12 | mangrol
Processing Record 24 of Set 12 | bud
Processing Record 25 of Set 12 | hofn
Processing Record 26 of Set 12 | toda raisingh
Processing Record 27 of Set 12 | waingapu
Processing Record 28 of Set 12 | flinders
Processing Record 29 of Set 12 | abu kamal
Processing Record 30 of Set 12 | uribia
Processing Record 31 of Set 12 | mahon
Processing Record 32 of Set 12 | marsh harbour
Processing Record 33 of Set 12 | roebourne
Processing Record 34 of Set 12 | kisangani
Processing Record 35 of Set 12 | olga
Processing Record 36 of Set 12 | yerbogache

In [8]:
#convert the array of dicts to a pd df
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Chimbote,-9.0853,-78.5783,62.24,88,43,9.24,PE,2021-10-24 03:01:53
1,Avarua,-21.2078,-159.775,75.25,53,75,5.75,CK,2021-10-24 02:58:24
2,Batagay,67.6333,134.6333,7.3,92,100,3.8,RU,2021-10-24 03:01:54
3,Castro,-24.7911,-50.0119,58.55,97,100,5.7,BR,2021-10-24 03:01:12
4,Ushuaia,-54.8,-68.3,30.63,94,90,4.52,AR,2021-10-24 03:01:55
5,Apiai,-24.5094,-48.8425,58.33,100,100,1.81,BR,2021-10-24 03:01:55
6,Bluff,-46.6,168.3333,52.32,94,100,5.99,NZ,2021-10-24 03:01:56
7,Kearney,40.6995,-99.0815,54.0,77,100,3.0,US,2021-10-24 03:01:56
8,Balakhninskiy,58.0106,114.2769,35.17,79,82,3.91,RU,2021-10-24 03:01:56
9,Mogadishu,2.0371,45.3438,79.14,81,11,10.58,SO,2021-10-24 02:57:53


In [10]:
new_column_order = ["City", "Country", "Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]
re_city_data_df = city_data_df[new_column_order]
re_city_data_df.head(10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Chimbote,PE,2021-10-24 03:01:53,-9.0853,-78.5783,62.24,88,43,9.24
1,Avarua,CK,2021-10-24 02:58:24,-21.2078,-159.775,75.25,53,75,5.75
2,Batagay,RU,2021-10-24 03:01:54,67.6333,134.6333,7.3,92,100,3.8
3,Castro,BR,2021-10-24 03:01:12,-24.7911,-50.0119,58.55,97,100,5.7
4,Ushuaia,AR,2021-10-24 03:01:55,-54.8,-68.3,30.63,94,90,4.52
5,Apiai,BR,2021-10-24 03:01:55,-24.5094,-48.8425,58.33,100,100,1.81
6,Bluff,NZ,2021-10-24 03:01:56,-46.6,168.3333,52.32,94,100,5.99
7,Kearney,US,2021-10-24 03:01:56,40.6995,-99.0815,54.0,77,100,3.0
8,Balakhninskiy,RU,2021-10-24 03:01:56,58.0106,114.2769,35.17,79,82,3.91
9,Mogadishu,SO,2021-10-24 02:57:53,2.0371,45.3438,79.14,81,11,10.58


In [11]:
#create output csv file
output_data_file = "weather_data/cities.csv"
#export the City_Data into a csv
re_city_data_df.to_csv(output_data_file, index_label="City_ID")