In [1]:
# Import the dependencies
import os

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [2]:
# Draw 1,500 latitudes and 1,500 longitudes uniformly at random from the
# valid geographic ranges (latitude: -90..90, longitude: -180..180).
lats = np.random.uniform(-90.000, 90.000, 1500)
lngs = np.random.uniform(-180.000, 180.000, 1500)

# Pair them up lazily. zip() returns a one-shot iterator, so it can only be
# consumed once; displaying it here does not consume it.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x24ffc0d3088>

In [3]:
# Small, hand-written practice set of coordinates: `x` plays the role of the
# latitudes and `y` the matching longitudes.
x = [
    25.12903645,
    25.92017388,
    26.62509167,
    -59.98969384,
    37.30571269,
]
y = [
    -67.59741259,
    11.09532135,
    74.84233102,
    -76.89176677,
    -61.13376282,
]

# Pair each x with the y at the same position (one-shot iterator).
coordinates = zip(x, y)

In [4]:
# Print every practice latitude/longitude pair, one pair per line.
# Iterating consumes the zip iterator stored in `coordinates`.
for lat, lng in coordinates:
    print(lat, lng)

25.12903645 -67.59741259
25.92017388 11.09532135
26.62509167 74.84233102
-59.98969384 -76.89176677
37.30571269 -61.13376282


In [5]:
# Materialize the lazy zip of random latitudes/longitudes into a list so the
# pairs can be iterated more than once by the following cells.
coordinates = [*lat_lngs]

In [6]:
# Use the citipy module to determine city based on latitude and longitude
from citipy import citipy

In [7]:
# Print the name and country code of the city nearest to each coordinate pair.
for lat, lng in coordinates:
    # Look the city up once and reuse the result for both printed fields
    # instead of repeating the nearest-city search for the same point.
    nearest = citipy.nearest_city(lat, lng)
    print(nearest.city_name, nearest.country_code)

east london za
port alfred za
thanh hoa vn
kieta pg
jamestown sh
sur om
mataura pf
golden us
umtata za
albany au
bambous virieux mu
ushuaia ar
chara ru
cape town za
chapais ca
maragogi br
ancud cl
ormara pk
sao filipe cv
ushuaia ar
salalah om
sampit id
albany au
albany au
mataura pf
bowen au
tanout ne
lata sb
hermanus za
qaanaaq gl
klaksvik fo
paamiut gl
vaini to
tres arroyos ar
coihaique cl
amderma ru
saint george bm
cherskiy ru
qasigiannguit gl
maniitsoq gl
winneba gh
saint-philippe re
bredasdorp za
hilo us
sao filipe cv
taunggyi mm
dossor kz
ushuaia ar
cape town za
anyang cn
rikitea pf
guastatoya gt
udachnyy ru
rikitea pf
hihifo to
atuona pf
palmer us
dikson ru
grindavik is
ikom ng
ambovombe mg
carnarvon au
uyuni bo
hamilton bm
rungata ki
east london za
stanger za
hermanus za
carnarvon au
vaitupu wf
thompson ca
cidreira br
mataura pf
east london za
grindavik is
darhan mn
vaitupu wf
nanortalik gl
zachagansk kz
belushya guba ru
bluff nz
hilo us
kaitangata nz
port elizabeth za
porto be

barrow us
barrow us
guerrero negro mx
jamestown sh
mount isa au
saskylakh ru
quelimane mz
nikolskoye ru
bandarbeyla so
gannan cn
puertollano es
bredasdorp za
faanui pf
pisco pe
cherskiy ru
morant bay jm
dikson ru
marawi sd
busselton au
kruisfontein za
sayyan ye
khatanga ru
padang id
saint-philippe re
hilo us
adrar dz
reggio di calabria it
tautira pf
vanimo pg
tiksi ru
cockburn town tc
ushuaia ar
kamaishi jp
puerto ayora ec
tasiilaq gl
bethel us
bredasdorp za
hofn is
fortuna us
mount gambier au
busselton au
hilo us
elliot za
lebu cl
thompson ca
luganville vu
saskylakh ru
castro cl
blois fr
kavieng pg
rikitea pf
portland au
vadso no
rikitea pf
roma au
atuona pf
punta arenas cl
rikitea pf
atuona pf
cabo san lucas mx
ghanzi bw
bluff nz
kungurtug ru
waingapu id
hithadhoo mv
sukumo jp
kaitangata nz
tiksi ru
westerly us
ilulissat gl
vaini to
cape town za
acapulco mx
taolanaro mg
avarua ck
ushuaia ar
provideniya ru
rikitea pf
vaini to
esperance au
belushya guba ru
tuktoyaktuk ca
port alfred za

In [8]:
# Create a list for holding the cities (unique names, in first-seen order)
cities = []
# Names already added to `cities`; a set gives constant-time membership
# checks instead of re-scanning the list for every coordinate.
seen_cities = set()

# Identify the nearest city for each latitude and longitude combination
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    # NOTE: uniqueness is by name only, so same-named cities in different
    # countries are kept once.
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)

633

In [9]:
# Import the requests library
import requests

# Import the API key
from config import weather_api_key

In [10]:
# Build the basic URL for the OpenWeatherMap current-weather endpoint with
# imperial units and your weather_api_key added to the URL.
# HTTPS is used so the API key in the query string is not sent in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [11]:
# Import the datetime module from the datetime library
from datetime import datetime

In [12]:
# Create an empty list to hold the weather data (one dict per city).
city_data = []

# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters used only for the progress log.
record_count = 1
set_count = 1

# Loop through all the cities in the list
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1

    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data. The timeout keeps one stalled
        # connection from hanging the whole retrieval loop.
        city_weather = requests.get(city_url, timeout=10).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the timestamp to a "YYYY-MM-DD HH:MM:SS" string in UTC.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # If an error is experienced, skip the city.
    # Only the expected failures are caught (network/HTTP problems, a body
    # that is not JSON, or a response missing the expected keys), so that
    # KeyboardInterrupt and genuine programming errors are not swallowed.
    except (requests.exceptions.RequestException, KeyError, TypeError, ValueError):
        print("City not found. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | east london
Processing Record 2 of Set 1 | port alfred
Processing Record 3 of Set 1 | thanh hoa
Processing Record 4 of Set 1 | kieta
Processing Record 5 of Set 1 | jamestown
Processing Record 6 of Set 1 | sur
Processing Record 7 of Set 1 | mataura
Processing Record 8 of Set 1 | golden
Processing Record 9 of Set 1 | umtata
Processing Record 10 of Set 1 | albany
Processing Record 11 of Set 1 | bambous virieux
Processing Record 12 of Set 1 | ushuaia
Processing Record 13 of Set 1 | chara
Processing Record 14 of Set 1 | cape town
Processing Record 15 of Set 1 | chapais
Processing Record 16 of Set 1 | maragogi
Processing Record 17 of Set 1 | ancud
Processing Record 18 of Set 1 | ormara
Processing Record 19 of Set 1 | sao filipe
Processing Record 20 of Set 1 | salalah
Processing Record 21 of Set 1 | sampit
Processing Record 22 of Set 1 | bowen
Processing Record 23 of Set 1 | tanout
Processing Record 24 

Processing Record 37 of Set 4 | urdzhar
City not found. Skipping...
Processing Record 38 of Set 4 | leh
Processing Record 39 of Set 4 | hanstholm
Processing Record 40 of Set 4 | shahrud
Processing Record 41 of Set 4 | kharp
Processing Record 42 of Set 4 | pahrump
Processing Record 43 of Set 4 | omboue
Processing Record 44 of Set 4 | kununurra
Processing Record 45 of Set 4 | emerald
Processing Record 46 of Set 4 | makung
City not found. Skipping...
Processing Record 47 of Set 4 | laguna
Processing Record 48 of Set 4 | tandil
Processing Record 49 of Set 4 | mogadishu
Processing Record 50 of Set 4 | paragominas
Processing Record 1 of Set 5 | viesca
Processing Record 2 of Set 5 | salinas
Processing Record 3 of Set 5 | cartagena del chaira
Processing Record 4 of Set 5 | tonantins
Processing Record 5 of Set 5 | amzya
Processing Record 6 of Set 5 | siniscola
Processing Record 7 of Set 5 | yaan
Processing Record 8 of Set 5 | puerto del rosario
Processing Record 9 of Set 5 | bridlington
Process

Processing Record 27 of Set 8 | sakakah
Processing Record 28 of Set 8 | viligili
City not found. Skipping...
Processing Record 29 of Set 8 | kulhudhuffushi
Processing Record 30 of Set 8 | frankfort
Processing Record 31 of Set 8 | puerto baquerizo moreno
Processing Record 32 of Set 8 | tuktoyaktuk
Processing Record 33 of Set 8 | palanga
Processing Record 34 of Set 8 | fomboni
Processing Record 35 of Set 8 | sainte-marie
Processing Record 36 of Set 8 | palembang
Processing Record 37 of Set 8 | acapulco
Processing Record 38 of Set 8 | smithers
Processing Record 39 of Set 8 | guerrero negro
Processing Record 40 of Set 8 | mount isa
Processing Record 41 of Set 8 | quelimane
Processing Record 42 of Set 8 | gannan
Processing Record 43 of Set 8 | puertollano
Processing Record 44 of Set 8 | sayyan
Processing Record 45 of Set 8 | padang
Processing Record 46 of Set 8 | adrar
Processing Record 47 of Set 8 | reggio di calabria
Processing Record 48 of Set 8 | tautira
Processing Record 49 of Set 8 | 

Processing Record 20 of Set 12 | wanganui
Processing Record 21 of Set 12 | mantua
Processing Record 22 of Set 12 | lovington
Processing Record 23 of Set 12 | arkhara
Processing Record 24 of Set 12 | huicungo
Processing Record 25 of Set 12 | tsihombe
City not found. Skipping...
Processing Record 26 of Set 12 | greytown
Processing Record 27 of Set 12 | shache
Processing Record 28 of Set 12 | oranjemund
Processing Record 29 of Set 12 | vestmanna
Processing Record 30 of Set 12 | aksu
Processing Record 31 of Set 12 | tacuarembo
Processing Record 32 of Set 12 | alugan
Processing Record 33 of Set 12 | newport
Processing Record 34 of Set 12 | tazovskiy
Processing Record 35 of Set 12 | altamira
Processing Record 36 of Set 12 | coquimbo
Processing Record 37 of Set 12 | neuquen
Processing Record 38 of Set 12 | zharkent
Processing Record 39 of Set 12 | barbosa ferraz
Processing Record 40 of Set 12 | wufeng
Processing Record 41 of Set 12 | helmstedt
Processing Record 42 of Set 12 | udalguri
Process

In [13]:
# Number of cities for which weather data was successfully retrieved
# (cities skipped by the retrieval loop are not in city_data).
len(city_data)

587

In [15]:
# Build a Pandas DataFrame from the list of per-city weather dictionaries,
# then preview its first ten rows.
city_data_df = pd.DataFrame(data=city_data)
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,East London,-33.02,27.91,78.71,32,100,13.29,ZA,2020-07-09 15:30:45
1,Port Alfred,-33.59,26.89,74.23,37,89,14.34,ZA,2020-07-09 15:30:45
2,Thanh Hoa,19.8,105.77,88.77,59,100,10.56,VN,2020-07-09 15:30:45
3,Kieta,-6.22,155.63,79.97,78,100,7.76,PG,2020-07-09 15:30:45
4,Jamestown,42.1,-79.24,82.4,61,20,3.36,US,2020-07-09 15:25:48
5,Sur,22.57,59.53,90.63,50,100,14.65,OM,2020-07-09 15:30:46
6,Mataura,-46.19,168.86,42.87,92,94,5.61,NZ,2020-07-09 15:30:46
7,Golden,39.76,-105.22,79.0,17,20,5.82,US,2020-07-09 15:28:46
8,Umtata,-31.59,28.78,73.4,23,93,1.12,ZA,2020-07-09 15:30:46
9,Albany,42.6,-73.97,84.0,82,4,2.84,US,2020-07-09 15:30:01


In [18]:
# Desired column layout: identifying fields first, then position,
# then the weather measurements.
new_column_order = [
    "City",
    "Country",
    "Date",
    "Lat",
    "Lng",
    "Max Temp",
    "Humidity",
    "Cloudiness",
    "Wind Speed",
]

In [20]:
# Rearrange the DataFrame's columns into the order given by
# new_column_order (all rows kept), then display the result.
city_data_df = city_data_df.loc[:, new_column_order]
city_data_df

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,East London,ZA,2020-07-09 15:30:45,-33.02,27.91,78.71,32,100,13.29
1,Port Alfred,ZA,2020-07-09 15:30:45,-33.59,26.89,74.23,37,89,14.34
2,Thanh Hoa,VN,2020-07-09 15:30:45,19.80,105.77,88.77,59,100,10.56
3,Kieta,PG,2020-07-09 15:30:45,-6.22,155.63,79.97,78,100,7.76
4,Jamestown,US,2020-07-09 15:25:48,42.10,-79.24,82.40,61,20,3.36
...,...,...,...,...,...,...,...,...,...
582,Boone,US,2020-07-09 15:34:01,39.03,-92.33,86.00,70,61,1.01
583,Drawsko Pomorskie,PL,2020-07-09 15:34:01,53.53,15.81,59.00,87,100,5.66
584,Varde,DK,2020-07-09 15:34:02,55.62,8.48,63.00,59,61,9.17
585,Taltal,CL,2020-07-09 15:34:02,-25.40,-70.48,69.13,34,0,3.69


In [22]:
# Create the output file (CSV)
output_data_file = "weather_data/cities.csv"

# Make sure the target folder exists; to_csv does not create missing
# directories and would otherwise fail on a fresh checkout.
output_dir = os.path.dirname(output_data_file)
if output_dir:
    os.makedirs(output_dir, exist_ok=True)

# Export the City_Data into a CSV, labelling the index column "City_ID"
city_data_df.to_csv(output_data_file, index_label="City_ID")