In [1]:
#import dependencies

import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
from citipy import citipy

In [2]:
#draw 1500 uniformly distributed latitudes and longitudes and pair them up
lats = np.random.uniform(-90.0, 90.0, 1500)
lngs = np.random.uniform(-180.0, 180.0, 1500)
#zip returns a lazy, single-use iterator of (lat, lng) pairs
lat_lngs = zip(lats, lngs)
lat_lngs


<zip at 0x198c9d14bc8>

In [3]:
#add the latitudes and longitudes into a list
#pair the arrays again here instead of consuming lat_lngs: a zip object can
#only be iterated once, so re-running this cell would otherwise silently
#produce an empty list
coordinates = list(zip(lats, lngs))

In [4]:
#import citipy
from citipy import citipy


In [5]:
#identify the nearest city for each latitude and longitude combination and
#keep each city name only once
#dict.fromkeys keeps the first occurrence of every key in insertion order, so
#the result matches an "append if not already in the list" loop without
#re-scanning the list for every coordinate
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in coordinates
))

#print the city count to confirm sufficient count
len(cities)

632

In [6]:
#import requests library
import requests

#import weather_api_key
from config import weather_api_key

#import datetime module from datetime library
from datetime import datetime

#build basic URL for OpenWeatherMap
#use HTTPS so the API key carried in the query string is not sent in clear text
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [7]:
#start with an empty container for the per-city weather records
city_data = []

#announce the start of the retrieval log (header line plus separator)
print("Beginning Data Retrieval     ", "-----------------------------", sep="\n")

#initialize the record and set counters used in the log messages
record_count, set_count = 1, 1

Beginning Data Retrieval     
-----------------------------


In [8]:
#loop through all cities in the list
for i, city in enumerate(cities):

    #group cities in sets of 50 for logging purposes
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1

    #create endpoint URL with each city
    city_url = url + "&q=" + city.replace(" ","+")

    #log the URL, record, and set numbers and the city
    print(f'Processing record {record_count} of set {set_count} | {city}')

    #add 1 to the record count
    record_count += 1

    #run API request for each of the cities
    try:
        #parse the JSON and retrieve data
        #the timeout keeps one stalled connection from hanging the whole run
        city_weather = requests.get(city_url, timeout=10).json()
        #parse out the needed data
        city_lat = city_weather['coord']['lat']
        city_lng = city_weather['coord']['lon']
        city_max_temp = city_weather['main']['temp_max']
        city_humidity = city_weather['main']['humidity']
        city_clouds = city_weather['clouds']['all']
        city_wind = city_weather['wind']['speed']
        city_country = city_weather['sys']['country']
        #convert the date to ISO standard
        city_date = datetime.utcfromtimestamp(city_weather['dt']).strftime('%Y-%m-%d %H:%M:%S')
        #append the city information into the city_data list
        city_data.append({"City": city.title(),
                         "Lat": city_lat,
                         "Lng": city_lng,
                         "Max Temp": city_max_temp,
                         "Humidity": city_humidity,
                         "Cloudiness": city_clouds,
                         "Wind Speed": city_wind,
                         "Country": city_country,
                         "Date": city_date})
    #skip the city when the request fails or the payload lacks the expected
    #fields; only these errors are caught so that KeyboardInterrupt and
    #SystemExit still stop the loop
    except (KeyError, TypeError, ValueError, requests.exceptions.RequestException):
        print('City not found.  Skipping...')

#indicate that the data loading is complete
print("-------------------------")
print("Data retrieval complete  ")
print("-------------------------")


    
            

Processing record 1 of set 1 | talnakh
Processing record 2 of set 1 | carnarvon
Processing record 3 of set 1 | ushuaia
Processing record 4 of set 1 | pacific grove
Processing record 5 of set 1 | jhajjar
Processing record 6 of set 1 | ayios nikolaos
Processing record 7 of set 1 | bredasdorp
Processing record 8 of set 1 | mataura
Processing record 9 of set 1 | bluff
Processing record 10 of set 1 | kaitangata
Processing record 11 of set 1 | mahebourg
Processing record 12 of set 1 | ancud
Processing record 13 of set 1 | colares
Processing record 14 of set 1 | hasaki
Processing record 15 of set 1 | yellowknife
Processing record 16 of set 1 | carutapera
Processing record 17 of set 1 | san cristobal
Processing record 18 of set 1 | victoria
Processing record 19 of set 1 | nerchinskiy zavod
Processing record 20 of set 1 | mount isa
Processing record 21 of set 1 | dankov
Processing record 22 of set 1 | hithadhoo
Processing record 23 of set 1 | taolanaro
City not found.  Skipping...
Processing re

Processing record 39 of set 4 | attawapiskat
City not found.  Skipping...
Processing record 40 of set 4 | namibe
Processing record 41 of set 4 | san patricio
Processing record 42 of set 4 | iqaluit
Processing record 43 of set 4 | salalah
Processing record 44 of set 4 | omaruru
Processing record 45 of set 4 | isangel
Processing record 46 of set 4 | santa cruz
Processing record 47 of set 4 | alenquer
Processing record 48 of set 4 | ngunguru
Processing record 49 of set 4 | viedma
Processing record 50 of set 4 | yumen
Processing record 1 of set 5 | wamba
Processing record 2 of set 5 | bethel
Processing record 3 of set 5 | oban
Processing record 4 of set 5 | tual
Processing record 5 of set 5 | mitu
Processing record 6 of set 5 | amahai
Processing record 7 of set 5 | oranjemund
Processing record 8 of set 5 | kijang
Processing record 9 of set 5 | luderitz
Processing record 10 of set 5 | yanam
Processing record 11 of set 5 | makakilo city
Processing record 12 of set 5 | arman
Processing record

Processing record 33 of set 8 | pangody
Processing record 34 of set 8 | gizo
Processing record 35 of set 8 | chateau-thierry
Processing record 36 of set 8 | selty
Processing record 37 of set 8 | dawei
Processing record 38 of set 8 | catuday
Processing record 39 of set 8 | ilulissat
Processing record 40 of set 8 | sai buri
Processing record 41 of set 8 | alofi
Processing record 42 of set 8 | palu
Processing record 43 of set 8 | palmer
Processing record 44 of set 8 | belyy yar
Processing record 45 of set 8 | guerrero negro
Processing record 46 of set 8 | mehran
Processing record 47 of set 8 | sangar
Processing record 48 of set 8 | camana
Processing record 49 of set 8 | saint-augustin
Processing record 50 of set 8 | nalut
Processing record 1 of set 9 | tynda
Processing record 2 of set 9 | sur
Processing record 3 of set 9 | new glasgow
Processing record 4 of set 9 | khonuu
City not found.  Skipping...
Processing record 5 of set 9 | pocsaj
Processing record 6 of set 9 | roscommon
Processing

Processing record 19 of set 12 | cabimas
Processing record 20 of set 12 | oranjestad
Processing record 21 of set 12 | port-de-paix
City not found.  Skipping...
Processing record 22 of set 12 | urumqi
Processing record 23 of set 12 | west lafayette
Processing record 24 of set 12 | road town
Processing record 25 of set 12 | jalu
Processing record 26 of set 12 | maraa
Processing record 27 of set 12 | betioky
Processing record 28 of set 12 | kostomuksha
Processing record 29 of set 12 | karagaylinskiy
Processing record 30 of set 12 | waingapu
Processing record 31 of set 12 | lander
Processing record 32 of set 12 | seoul
Processing record 33 of set 12 | pontianak
Processing record 34 of set 12 | wadsworth
Processing record 35 of set 12 | juba
Processing record 36 of set 12 | villa carlos paz
Processing record 37 of set 12 | novaya igirma
Processing record 38 of set 12 | villamontes
Processing record 39 of set 12 | filadelfia
Processing record 40 of set 12 | cheremisinovo
Processing record 41

In [9]:
#count the weather records that were collected in city_data
len(city_data)

586

In [10]:
#convert list into dataframe
city_df = pd.DataFrame(city_data)
city_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Talnakh,69.4865,88.3972,66.07,86,79,6.98,RU,2021-07-27 19:43:53
1,Carnarvon,-24.8667,113.6333,59.07,54,90,4.61,AU,2021-07-27 19:43:53
2,Ushuaia,-54.8,-68.3,37.06,87,90,0.0,AR,2021-07-27 19:43:53
3,Pacific Grove,36.6177,-121.9166,93.61,77,1,7.0,US,2021-07-27 19:43:54
4,Jhajjar,28.6063,76.6565,86.32,76,100,5.3,IN,2021-07-27 19:43:54
5,Ayios Nikolaos,38.4167,23.65,88.75,33,0,0.0,GR,2021-07-27 19:43:54
6,Bredasdorp,-34.5322,20.0403,56.52,72,100,17.27,ZA,2021-07-27 19:43:55
7,Mataura,-46.1927,168.8643,48.47,97,25,1.25,NZ,2021-07-27 19:43:55
8,Bluff,-46.6,168.3333,48.79,70,15,16.73,NZ,2021-07-27 19:43:55
9,Kaitangata,-46.2817,169.8464,48.92,63,59,4.45,NZ,2021-07-27 19:43:56


In [12]:
#put the identifying columns first, followed by position and measurements
new_column_order = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]
#select every row with the columns in the new order
city_df = city_df.loc[:, new_column_order]

city_df.head(n=10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Talnakh,RU,2021-07-27 19:43:53,69.4865,88.3972,66.07,86,79,6.98
1,Carnarvon,AU,2021-07-27 19:43:53,-24.8667,113.6333,59.07,54,90,4.61
2,Ushuaia,AR,2021-07-27 19:43:53,-54.8,-68.3,37.06,87,90,0.0
3,Pacific Grove,US,2021-07-27 19:43:54,36.6177,-121.9166,93.61,77,1,7.0
4,Jhajjar,IN,2021-07-27 19:43:54,28.6063,76.6565,86.32,76,100,5.3
5,Ayios Nikolaos,GR,2021-07-27 19:43:54,38.4167,23.65,88.75,33,0,0.0
6,Bredasdorp,ZA,2021-07-27 19:43:55,-34.5322,20.0403,56.52,72,100,17.27
7,Mataura,NZ,2021-07-27 19:43:55,-46.1927,168.8643,48.47,97,25,1.25
8,Bluff,NZ,2021-07-27 19:43:55,-46.6,168.3333,48.79,70,15,16.73
9,Kaitangata,NZ,2021-07-27 19:43:56,-46.2817,169.8464,48.92,63,59,4.45


In [13]:
#create output CSV file
output_data_file = "weather_data/cities.csv"
#export the city_data into CSV
city_df.to_csv(output_data_file, index_label="City_ID")
