In [1]:
# Import dependencies
from pathlib import Path

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

In [2]:
# Draw 1,500 random latitudes (-90..90) and 1,500 random longitudes (-180..180)
# and pair them up lazily; the trailing expression shows the zip object.
lats = np.random.uniform(-90.000, 90.000, 1500)
lngs = np.random.uniform(-180.000, 180.000, 1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x2c4ba727800>

In [3]:
# Materialize the (latitude, longitude) pairs into a list.
# NOTE: lat_lngs is a zip object, i.e. a one-shot iterator. Re-running this cell
# without first re-running the cell that builds lat_lngs yields an empty list.
coordinates = [*lat_lngs]

In [4]:
# import citipy 
from citipy import citipy

In [5]:
# Identify the nearest city for each latitude and longitude combination and
# keep each city name once, in first-seen order.
# dict.fromkeys() de-duplicates with constant-time lookups while preserving
# insertion order, replacing the quadratic `city not in cities` list scan.
cities = list(
    dict.fromkeys(
        citipy.nearest_city(lat, lng).city_name for lat, lng in coordinates
    )
)
# Print the city count to confirm sufficient count
len(cities)

619

In [6]:
# Import requests library
import requests 

# Import weather_api_key
from config import weather_api_key 

# Starting URL for OpenWeatherMap API calls: imperial units are requested and
# the API key is appended as the APPID query parameter.
url = (
    "https://api.openweathermap.org/data/2.5/weather"
    "?units=Imperial&APPID="
    + weather_api_key
)

# Import the time library and the datetime module from the datetime library 
import time
from datetime import datetime

In [7]:
# Counters used for the "Record N of Set M" log lines; both start at 1
record_count, set_count = 1, 1

# Accumulator for one dictionary of weather fields per retrieved city
city_data = list()

# Announce the start of the retrieval log
print("Beginning Data Retrieval     ", "-----------------------------", sep="\n")

Beginning Data Retrieval     
-----------------------------


In [8]:
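# NOTE: superseded draft of the retrieval loop, kept commented out for reference;
# the enumerate()-based loop in the following cell is the version that runs.
# Loop through all the cities in the list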
#for i in range(len(cities)):
    
    # Group cities in sets of 50 for logging purposes.
    #if (i % 50 == 0 and i >= 50):
       # set_count +=1
       # record_count =1
       # time.sleep(60)
        
    # Create endpoint URL with each city
    #city_url = url + "&q=" + cities[i]

In [9]:
# Seconds to wait on a single API call before giving up. Without a timeout,
# requests.get() can block indefinitely on a stalled connection.
REQUEST_TIMEOUT_SECONDS = 10

# Loop through all the cities in the list, request the current weather for each
# one and append a record to city_data for every successful lookup.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes; at every set boundary
    # bump the set number, restart the record number and pause for 60 seconds.
    # NOTE(review): the pause is presumably there to stay under an API rate
    # limit — confirm against the account's plan.
    if i % 50 == 0 and i >= 50:
        set_count += 1
        record_count = 1
        time.sleep(60)

    # Create endpoint URL with each city (spaces in the name become "+")
    city_url = url + "&q=" + city.replace(" ", "+")

    # Log the record and set numbers and the city
    print(f"Processing Record {record_count} of Set {set_count}| {city}")
    # Add 1 to the record count
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data
        city_weather = requests.get(city_url, timeout=REQUEST_TIMEOUT_SECONDS).json()
        # Parse out the needed data
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the Unix timestamp to a UTC "YYYY-MM-DD HH:MM:SS" string
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime("%Y-%m-%d %H:%M:%S")
        # Append the city information into the city_data list
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})
    except KeyError:
        # The response JSON lacks the expected fields (e.g. an error payload
        # returned for an unknown city), so skip this city.
        print("City not found. Skipping...")
    except (requests.exceptions.RequestException, ValueError) as exc:
        # Network failure, timeout or an unparsable response body. Only the
        # exception type is printed: the full message can contain the request
        # URL, which includes the API key.
        print(f"Request failed ({type(exc).__name__}). Skipping...")

# Indicate that data loading is complete
print("------------------------------")
print("Data Retrieval Complete       ")
print("------------------------------")

Processing Record 1 of Set 1| faridpur
Processing Record 2 of Set 1| ushuaia
Processing Record 3 of Set 1| mehamn
Processing Record 4 of Set 1| iqaluit
Processing Record 5 of Set 1| jamestown
Processing Record 6 of Set 1| grand river south east
City not found. Skipping...
Processing Record 7 of Set 1| yellowknife
Processing Record 8 of Set 1| hobart
Processing Record 9 of Set 1| upernavik
Processing Record 10 of Set 1| punta arenas
Processing Record 11 of Set 1| leningradskiy
Processing Record 12 of Set 1| deputatskiy
Processing Record 13 of Set 1| rikitea
Processing Record 14 of Set 1| kidal
Processing Record 15 of Set 1| pevek
Processing Record 16 of Set 1| cidreira
Processing Record 17 of Set 1| sukumo
Processing Record 18 of Set 1| lokoja
Processing Record 19 of Set 1| kisanga
Processing Record 20 of Set 1| uribia
Processing Record 21 of Set 1| altamira
Processing Record 22 of Set 1| bakel
Processing Record 23 of Set 1| warqla
City not found. Skipping...
Processing Record 24 of Set

Processing Record 45 of Set 4| mollendo
Processing Record 46 of Set 4| orizona
Processing Record 47 of Set 4| samusu
City not found. Skipping...
Processing Record 48 of Set 4| nyurba
Processing Record 49 of Set 4| torbay
Processing Record 50 of Set 4| sidney
Processing Record 1 of Set 5| salinopolis
Processing Record 2 of Set 5| moree
Processing Record 3 of Set 5| mantua
Processing Record 4 of Set 5| khatanga
Processing Record 5 of Set 5| armidale
Processing Record 6 of Set 5| provideniya
Processing Record 7 of Set 5| airai
Processing Record 8 of Set 5| jaciara
Processing Record 9 of Set 5| asyut
Processing Record 10 of Set 5| mount gambier
Processing Record 11 of Set 5| egvekinot
Processing Record 12 of Set 5| anadyr
Processing Record 13 of Set 5| isangel
Processing Record 14 of Set 5| ust-nera
Processing Record 15 of Set 5| nizhneyansk
City not found. Skipping...
Processing Record 16 of Set 5| pochutla
Processing Record 17 of Set 5| nanhai
Processing Record 18 of Set 5| nurota
Proces

City not found. Skipping...
Processing Record 37 of Set 8| asfi
Processing Record 38 of Set 8| ishigaki
Processing Record 39 of Set 8| melong
Processing Record 40 of Set 8| takoradi
Processing Record 41 of Set 8| mocuba
Processing Record 42 of Set 8| husavik
Processing Record 43 of Set 8| santa rosa
Processing Record 44 of Set 8| tiznit
Processing Record 45 of Set 8| labutta
City not found. Skipping...
Processing Record 46 of Set 8| port elizabeth
Processing Record 47 of Set 8| panjab
Processing Record 48 of Set 8| lavrentiya
Processing Record 49 of Set 8| ixtapa
Processing Record 50 of Set 8| acapulco
Processing Record 1 of Set 9| lazaro cardenas
Processing Record 2 of Set 9| haines junction
Processing Record 3 of Set 9| channel-port aux basques
Processing Record 4 of Set 9| taksimo
Processing Record 5 of Set 9| naftah
City not found. Skipping...
Processing Record 6 of Set 9| bastia
Processing Record 7 of Set 9| dicabisagan
Processing Record 8 of Set 9| jiuquan
Processing Record 9 of 

Processing Record 27 of Set 12| aflu
City not found. Skipping...
Processing Record 28 of Set 12| agaro
Processing Record 29 of Set 12| ijaki
City not found. Skipping...
Processing Record 30 of Set 12| kohat
Processing Record 31 of Set 12| wajima
Processing Record 32 of Set 12| aswan
Processing Record 33 of Set 12| edson
Processing Record 34 of Set 12| viedma
Processing Record 35 of Set 12| kalabo
Processing Record 36 of Set 12| saurimo
Processing Record 37 of Set 12| omboue
Processing Record 38 of Set 12| birao
Processing Record 39 of Set 12| alugan
Processing Record 40 of Set 12| opuwo
Processing Record 41 of Set 12| mbinga
Processing Record 42 of Set 12| puerto narino
Processing Record 43 of Set 12| apastovo
Processing Record 44 of Set 12| hargeysa
Processing Record 45 of Set 12| samarai
Processing Record 46 of Set 12| ekhabi
Processing Record 47 of Set 12| okha
Processing Record 48 of Set 12| tucumcari
Processing Record 49 of Set 12| mirnyy
Processing Record 50 of Set 12| tyssedal
P

In [12]:
# Number of cities for which a weather record was appended to city_data
len(city_data)

568

In [13]:
# Build a pandas DataFrame from the list of per-city dictionaries
# and preview its first ten rows
city_data_df = pd.DataFrame(data=city_data)
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Faridpur,23.6,89.8333,75.2,55,13,2.17,BD,2021-11-21 02:50:06
1,Ushuaia,-54.8,-68.3,33.46,93,90,24.16,AR,2021-11-21 02:46:06
2,Mehamn,71.0357,27.8492,27.68,66,100,22.68,NO,2021-11-21 02:50:08
3,Iqaluit,63.7506,-68.5145,10.13,78,90,5.99,CA,2021-11-21 02:50:09
4,Jamestown,42.097,-79.2353,42.39,59,75,5.01,US,2021-11-21 02:46:57
5,Yellowknife,62.456,-114.3525,-2.7,88,20,5.75,CA,2021-11-21 02:46:32
6,Hobart,-42.8794,147.3294,71.02,50,40,1.99,AU,2021-11-21 02:47:21
7,Upernavik,72.7868,-56.1549,8.82,73,100,6.98,GL,2021-11-21 02:50:11
8,Punta Arenas,-53.15,-70.9167,41.11,60,40,24.16,CL,2021-11-21 02:50:12
9,Leningradskiy,69.3833,178.4167,-12.69,88,5,3.2,RU,2021-11-21 02:50:12


In [16]:
# Reorder the columns: identifying fields first, then the coordinates,
# then the weather measurements
new_column = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]
city_data_df = city_data_df.loc[:, new_column]
city_data_df.head(n=10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Faridpur,BD,2021-11-21 02:50:06,23.6,89.8333,75.2,55,13,2.17
1,Ushuaia,AR,2021-11-21 02:46:06,-54.8,-68.3,33.46,93,90,24.16
2,Mehamn,NO,2021-11-21 02:50:08,71.0357,27.8492,27.68,66,100,22.68
3,Iqaluit,CA,2021-11-21 02:50:09,63.7506,-68.5145,10.13,78,90,5.99
4,Jamestown,US,2021-11-21 02:46:57,42.097,-79.2353,42.39,59,75,5.01
5,Yellowknife,CA,2021-11-21 02:46:32,62.456,-114.3525,-2.7,88,20,5.75
6,Hobart,AU,2021-11-21 02:47:21,-42.8794,147.3294,71.02,50,40,1.99
7,Upernavik,GL,2021-11-21 02:50:11,72.7868,-56.1549,8.82,73,100,6.98
8,Punta Arenas,CL,2021-11-21 02:50:12,-53.15,-70.9167,41.11,60,40,24.16
9,Leningradskiy,RU,2021-11-21 02:50:12,69.3833,178.4167,-12.69,88,5,3.2


In [17]:
# Create the output file (CSV)
output_data_file = "weather_data/cities.csv"
# Make sure the target directory exists: to_csv() does not create missing
# directories and raises OSError when the folder is absent (e.g. fresh checkout).
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)
# Export the city data into a CSV, labelling the index column "City_ID"
city_data_df.to_csv(output_data_file, index_label="City_ID")