In [21]:
# Import dependencies
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np

In [22]:
from citipy import citipy

In [23]:
# Import the requests library
import requests
# requests.__version__

# Import the API Key
from config import weather_api_key

In [24]:
# Import the datetime module from the datetime library
from datetime import datetime

In [25]:
# Create a set of random latitude and longitude combinations
lats = np.random.uniform(low=-90.000,high=90.000,size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats,lngs)
lat_lngs

<zip at 0x7fd8a80b2f40>

In [26]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)

In [27]:
coordinates

[(12.05669298531916, -46.509193181130996),
 (-60.74495789500114, -74.0842323817295),
 (-5.969506958385011, 24.18442768434494),
 (16.447956144211645, -39.13537659387896),
 (48.829741320704414, -48.07493007717491),
 (47.14159724213735, -157.6055138926154),
 (-12.257517170727212, -160.50092638197904),
 (59.0208324033444, -4.716747474951745),
 (-37.97655015168286, -149.81590047345233),
 (41.4023419910485, -25.79771653789237),
 (-4.505997420246686, -146.4482112419697),
 (-42.20252448521915, -130.17266385046867),
 (-69.38999844741517, -6.663736534309152),
 (10.958542040072174, 43.52083922360592),
 (-77.79268425059341, -134.51592527221655),
 (55.78713687059346, -93.49752127423467),
 (-33.27665918644216, -18.839072886767497),
 (71.91913813280823, -146.6552809198125),
 (28.663362987457077, 90.41409574058315),
 (-89.71073356967952, -57.66184835729375),
 (-46.54234286038523, -127.17980956738253),
 (-89.98537305019391, -96.93873514327734),
 (3.217783371269107, 134.85167437610636),
 (14.50539018696

In [29]:
# Create a list for holding the cities
cities = []
# Identify the nearest city for each latitude and longitude combination
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0],coordinate[1]).city_name
    # If the city is unique, then we will add it to the cities list
    if city not in cities:
        cities.append(city)
    
# Print the city count to confirm sufficient count
len(cities)

588

In [31]:
cities

['cayenne',
 'punta arenas',
 'kabinda',
 'ponta do sol',
 'torbay',
 'kodiak',
 'avarua',
 'ullapool',
 'mataura',
 'praia da vitoria',
 'atuona',
 'rikitea',
 'cape town',
 'jibuti',
 'thompson',
 'jamestown',
 'college',
 'gasa',
 'ushuaia',
 'kloulklubed',
 'bara',
 'port macquarie',
 'belushya guba',
 'albany',
 'upernavik',
 'ribeira grande',
 'hithadhoo',
 'port lincoln',
 'dali',
 'goderich',
 'usinsk',
 'barrow',
 'sandwick',
 'kaitangata',
 'dikson',
 'beira',
 'busselton',
 'smolenka',
 'okandja',
 'geraldton',
 'longyearbyen',
 'russell',
 'bambous virieux',
 'bredasdorp',
 'mayya',
 'vaini',
 'tsihombe',
 'rungata',
 'oum hadjer',
 'diamantina',
 'alice springs',
 'puerto ayora',
 'gimli',
 'maragogi',
 'port alfred',
 'attawapiskat',
 'monte alegre',
 'folldal',
 'ornskoldsvik',
 'vestmannaeyjar',
 'tasiilaq',
 'soyo',
 'hermanus',
 'forlev',
 'halalo',
 'severo-kurilsk',
 'namibe',
 'new norfolk',
 'tabiauea',
 'selizharovo',
 'volgodonsk',
 'kapaa',
 'saskylakh',
 'tuma

In [35]:
# Starting URL for Weather Map API Call
url="http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

# Create an empty list to hold the weather data
city_data = []
# Print the beginning of the logging
print("Beginning Data Retrival  ")
print("-------------------------")

# Create counters
record_count= 1
set_count = 1

# Loop through all the cities in our list
for i, city in enumerate(cities):
    # Group cities in sets of 50 for logging purposes
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    
    # Create endpoint URL with each city
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count
    record_count += 1

    # Run an API request for each of the cities
    try: 
        # Parse the JSON and retrieve data
        city_weather = requests.get(city_url).json()
        # Parse out the needed data
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list
        city_data.append({"City": city.title(),
                         "Lat": city_lat,
                         "Lng": city_lng,
                         "Max Temp": city_max_temp,
                         "Humidity": city_humidity,
                         "Cloudiness": city_clouds,
                         "Wind Speed": city_wind,
                         "Country": city_country,
                         "Date": city_date})

    # If an error is experienced, skip the city
    except: 
        print("City not found, Skipping...")
        pass

# Indicate that Data Loading is complete.
print("-------------------------")
print("Data Retrieval Complete. ")
print("-------------------------")

Beginning Data Retrival  
-------------------------
Processing Record 1 of Set 1 | cayenne
Processing Record 2 of Set 1 | punta arenas
Processing Record 3 of Set 1 | kabinda
Processing Record 4 of Set 1 | ponta do sol
Processing Record 5 of Set 1 | torbay
Processing Record 6 of Set 1 | kodiak
Processing Record 7 of Set 1 | avarua
Processing Record 8 of Set 1 | ullapool
Processing Record 9 of Set 1 | mataura
Processing Record 10 of Set 1 | praia da vitoria
Processing Record 11 of Set 1 | atuona
Processing Record 12 of Set 1 | rikitea
Processing Record 13 of Set 1 | cape town
Processing Record 14 of Set 1 | jibuti
Processing Record 15 of Set 1 | thompson
Processing Record 16 of Set 1 | jamestown
Processing Record 17 of Set 1 | college
Processing Record 18 of Set 1 | gasa
Processing Record 19 of Set 1 | ushuaia
Processing Record 20 of Set 1 | kloulklubed
Processing Record 21 of Set 1 | bara
Processing Record 22 of Set 1 | port macquarie
Processing Record 23 of Set 1 | belushya guba
City n

Processing Record 37 of Set 4 | muravlenko
Processing Record 38 of Set 4 | darhan
Processing Record 39 of Set 4 | qabis
City not found, Skipping...
Processing Record 40 of Set 4 | akhmeta
Processing Record 41 of Set 4 | westport
Processing Record 42 of Set 4 | gboko
Processing Record 43 of Set 4 | igarka
Processing Record 44 of Set 4 | la ronge
Processing Record 45 of Set 4 | batsfjord
Processing Record 46 of Set 4 | hasaki
Processing Record 47 of Set 4 | zhezkazgan
Processing Record 48 of Set 4 | jacareacanga
Processing Record 49 of Set 4 | suyapa de lean
City not found, Skipping...
Processing Record 50 of Set 4 | grand river south east
City not found, Skipping...
Processing Record 1 of Set 5 | faanui
Processing Record 2 of Set 5 | korla
Processing Record 3 of Set 5 | srbobran
Processing Record 4 of Set 5 | trabzon
Processing Record 5 of Set 5 | tuktoyaktuk
Processing Record 6 of Set 5 | buala
Processing Record 7 of Set 5 | omboue
Processing Record 8 of Set 5 | charters towers
Process

Processing Record 25 of Set 8 | lamar
Processing Record 26 of Set 8 | masterton
Processing Record 27 of Set 8 | zhigalovo
Processing Record 28 of Set 8 | belmonte
Processing Record 29 of Set 8 | waingapu
Processing Record 30 of Set 8 | kahului
Processing Record 31 of Set 8 | darlawn
Processing Record 32 of Set 8 | ossora
Processing Record 33 of Set 8 | rudbar
Processing Record 34 of Set 8 | hambantota
Processing Record 35 of Set 8 | pangnirtung
Processing Record 36 of Set 8 | guerrero negro
Processing Record 37 of Set 8 | belaya gora
Processing Record 38 of Set 8 | never
Processing Record 39 of Set 8 | touros
Processing Record 40 of Set 8 | baghdad
Processing Record 41 of Set 8 | hobyo
Processing Record 42 of Set 8 | arlit
Processing Record 43 of Set 8 | strezhevoy
Processing Record 44 of Set 8 | srednyaya akhtuba
Processing Record 45 of Set 8 | salta
Processing Record 46 of Set 8 | pontes e lacerda
Processing Record 47 of Set 8 | port hardy
Processing Record 48 of Set 8 | birao
Proces

Processing Record 17 of Set 12 | kandrian
Processing Record 18 of Set 12 | grand gaube
Processing Record 19 of Set 12 | poum
Processing Record 20 of Set 12 | egvekinot
Processing Record 21 of Set 12 | sitka
Processing Record 22 of Set 12 | palana
Processing Record 23 of Set 12 | yakeshi
Processing Record 24 of Set 12 | batticaloa
Processing Record 25 of Set 12 | la asuncion
Processing Record 26 of Set 12 | hondo
Processing Record 27 of Set 12 | gondanglegi
Processing Record 28 of Set 12 | neryungri
Processing Record 29 of Set 12 | jaswantnagar
Processing Record 30 of Set 12 | silale
Processing Record 31 of Set 12 | plouzane
Processing Record 32 of Set 12 | avera
Processing Record 33 of Set 12 | muana
Processing Record 34 of Set 12 | manmad
Processing Record 35 of Set 12 | tarakan
Processing Record 36 of Set 12 | aztec
Processing Record 37 of Set 12 | tuggurt
City not found, Skipping...
Processing Record 38 of Set 12 | northam
-------------------------
Data Retrieval Complete. 
--------

In [39]:
# Convert the array of dictionaries to a Pandas DataFrame
city_data_df= pd.DataFrame(city_data)
city_data_df.tail()

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
541,Muana,-1.5283,-49.2167,79.21,78,87,4.81,BR,2021-05-26 23:10:12
542,Manmad,20.25,74.45,75.18,78,100,23.24,IN,2021-05-26 23:10:12
543,Tarakan,3.3,117.6333,79.61,84,72,4.94,ID,2021-05-26 23:06:55
544,Aztec,36.8222,-107.9929,78.21,13,100,15.86,US,2021-05-26 23:10:13
545,Northam,51.0333,-4.2167,50.31,94,11,2.59,GB,2021-05-26 23:10:13


In [44]:
new_column_order = ["City", "Country","Date","Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]

city_data_df = city_data_df[new_column_order]
city_data_df.head()

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Cayenne,GF,2021-05-26 23:05:36,4.9333,-52.3333,78.84,89,90,3.0
1,Punta Arenas,CL,2021-05-26 23:03:19,-53.15,-70.9167,33.12,74,20,13.85
2,Kabinda,CD,2021-05-26 23:07:31,-6.1333,24.4833,65.35,57,10,3.24
3,Ponta Do Sol,PT,2021-05-26 23:07:32,32.6667,-17.1,66.0,74,96,6.02
4,Torbay,CA,2021-05-26 23:07:32,47.6666,-52.7314,49.75,93,90,8.05


In [45]:
# Create the output file (CSV)
output_data_file = "weather_data/cities.csv"
# Export the city_data into CSV
city_data_df.to_csv(output_data_file, index_label= "City_ID")