In [7]:
# Import dependencies
import time
from datetime import datetime
from pathlib import Path

import citipy
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests

from config import weather_api_key

In [8]:
# Draw 1500 random latitudes and 1500 random longitudes, then pair them up
# element-wise into a list of (latitude, longitude) tuples.
lats = np.random.uniform(low=-90, high=90, size=1500)
lngs = np.random.uniform(low=-180, high=180, size=1500)
coordinates = list(zip(lats, lngs))


In [9]:
from citipy import citipy


In [10]:
# Ordered list of unique city names, in the order they are first encountered
cities = []
# Companion set used only for membership checks: testing `city in set` is O(1),
# whereas scanning the growing list on every iteration is O(n) per lookup.
seen_cities = set()
# Identify the nearest city for each latitude and longitude combination.
for lat, lng in coordinates:
    city = citipy.nearest_city(lat, lng).city_name

    # Only the first occurrence of each city name is kept
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)
# Display the city count to confirm it is large enough for the analysis
len(cities)

636

In [5]:
# Timing helpers used by the retrieval loop further down
from datetime import datetime
import time
# The OpenWeatherMap API key lives in the local `config` module
from config import weather_api_key

# Base endpoint for the current-weather API, requesting imperial units and
# carrying the API key. A city query is added by appending "&q=<city>",
# e.g. url + "&q=Boston".
url = f"https://api.openweathermap.org/data/2.5/weather?units=imperial&appid={weather_api_key}"

In [6]:
# Create an empty list to hold one weather record (a dict) per city retrieved
city_data = []
# Print the beginning of the logging
print("Beginning Data Retrieval    ")
print("----------------------------")

# Create counters: record_count is the position inside the current set,
# set_count is the number of the current group of 50 cities
record_count = 1
set_count = 1

# Loop through all the cities in our list
for i, city in enumerate(cities):
    # Group cities in sets of 50 for logging purposes, pausing 60 seconds
    # between sets (presumably to stay under the API rate limit -- confirm
    # against the plan tied to the API key)
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        time.sleep(60)
    # Log the record and set numbers and the city
    print(f'Processing Record {record_count} of Set {set_count} | {city}')
    # Add 1 to the record count
    record_count += 1
    # Run the API request for each of the cities
    try:
        # Pass the city via `params` so requests URL-encodes it (spaces and any
        # other reserved characters) instead of hand-replacing spaces with "+".
        # The timeout prevents one stalled connection from hanging the whole run.
        response = requests.get(url, params={"q": city}, timeout=10)
        # Turn HTTP error statuses (e.g. 404 for an unknown city) into exceptions
        response.raise_for_status()
        # Parse the json and retrieve data
        city_weather = response.json()
        # Parse out the needed data
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the Unix timestamp to a UTC date string. time.gmtime() yields
        # the same UTC fields as datetime.utcfromtimestamp(), which is
        # deprecated since Python 3.12.
        city_date = time.strftime('%Y-%m-%d %H:%M:%S', time.gmtime(city_weather['dt']))
        # Append the city information into city_data list
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})
    # Skip the city on a network/HTTP failure, an undecodable body, or a
    # response missing an expected field. Unlike a bare `except:`, this lets
    # KeyboardInterrupt and genuine programming errors propagate.
    except (requests.exceptions.RequestException, KeyError, ValueError):
        print("City not found. Skipping...")
# Indicate that Data Loading is complete
print("----------------------------")
print("Data Retrieval Complete")
print("----------------------------")

Beginning Data Retrieval    
----------------------------
Processing Record 1 of Set 1 | castro
Processing Record 2 of Set 1 | ushuaia
Processing Record 3 of Set 1 | wittingen
Processing Record 4 of Set 1 | papara
Processing Record 5 of Set 1 | vaini
Processing Record 6 of Set 1 | busselton
Processing Record 7 of Set 1 | mys shmidta
City not found. Skipping...
Processing Record 8 of Set 1 | mzimba
Processing Record 9 of Set 1 | maridi
Processing Record 10 of Set 1 | airai
Processing Record 11 of Set 1 | banjar
Processing Record 12 of Set 1 | hermanus
Processing Record 13 of Set 1 | marsa matruh
Processing Record 14 of Set 1 | khandbari
Processing Record 15 of Set 1 | leningradskiy
Processing Record 16 of Set 1 | belushya guba
City not found. Skipping...
Processing Record 17 of Set 1 | mehamn
Processing Record 18 of Set 1 | price
Processing Record 19 of Set 1 | sawakin
Processing Record 20 of Set 1 | bluff
Processing Record 21 of Set 1 | tomatlan
Processing Record 22 of Set 1 | ngukurr


Processing Record 35 of Set 4 | wichita falls
Processing Record 36 of Set 4 | aykhal
Processing Record 37 of Set 4 | kasongo-lunda
Processing Record 38 of Set 4 | angra
City not found. Skipping...
Processing Record 39 of Set 4 | victoria
Processing Record 40 of Set 4 | muscat
Processing Record 41 of Set 4 | muisne
Processing Record 42 of Set 4 | tiksi
Processing Record 43 of Set 4 | hammerfest
Processing Record 44 of Set 4 | cabo san lucas
Processing Record 45 of Set 4 | saint-augustin
Processing Record 46 of Set 4 | chuy
Processing Record 47 of Set 4 | port elizabeth
Processing Record 48 of Set 4 | rio gallegos
Processing Record 49 of Set 4 | hasaki
Processing Record 50 of Set 4 | fonte boa
Processing Record 1 of Set 5 | uige
Processing Record 2 of Set 5 | port alfred
Processing Record 3 of Set 5 | mollendo
Processing Record 4 of Set 5 | iracoubo
Processing Record 5 of Set 5 | khandyga
Processing Record 6 of Set 5 | mindelo
Processing Record 7 of Set 5 | jaipur hat
City not found. Ski

Processing Record 23 of Set 8 | bandundu
Processing Record 24 of Set 8 | gagra
Processing Record 25 of Set 8 | inderborskiy
City not found. Skipping...
Processing Record 26 of Set 8 | pangnirtung
Processing Record 27 of Set 8 | diapaga
Processing Record 28 of Set 8 | zhigansk
Processing Record 29 of Set 8 | takhatpur
Processing Record 30 of Set 8 | leander
Processing Record 31 of Set 8 | vigrestad
Processing Record 32 of Set 8 | saint george
Processing Record 33 of Set 8 | bograd
Processing Record 34 of Set 8 | saldanha
Processing Record 35 of Set 8 | nelson bay
Processing Record 36 of Set 8 | broumov
Processing Record 37 of Set 8 | lompoc
Processing Record 38 of Set 8 | skelleftea
Processing Record 39 of Set 8 | kamenka
Processing Record 40 of Set 8 | mamallapuram
Processing Record 41 of Set 8 | rhyl
Processing Record 42 of Set 8 | vardo
Processing Record 43 of Set 8 | tapaua
City not found. Skipping...
Processing Record 44 of Set 8 | vao
Processing Record 45 of Set 8 | poltavka
Proce

Processing Record 8 of Set 12 | goderich
Processing Record 9 of Set 12 | bubaque
Processing Record 10 of Set 12 | bellevue
Processing Record 11 of Set 12 | caohai
Processing Record 12 of Set 12 | prince rupert
Processing Record 13 of Set 12 | sicuani
Processing Record 14 of Set 12 | qandahar
City not found. Skipping...
Processing Record 15 of Set 12 | bardiyah
Processing Record 16 of Set 12 | minot
Processing Record 17 of Set 12 | sarankhola
Processing Record 18 of Set 12 | nautla
Processing Record 19 of Set 12 | santiago del estero
Processing Record 20 of Set 12 | mirnyy
Processing Record 21 of Set 12 | malpe
Processing Record 22 of Set 12 | nagorsk
Processing Record 23 of Set 12 | almunecar
Processing Record 24 of Set 12 | kalmunai
Processing Record 25 of Set 12 | kattivakkam
Processing Record 26 of Set 12 | buraydah
Processing Record 27 of Set 12 | goedereede
Processing Record 28 of Set 12 | camocim
Processing Record 29 of Set 12 | shenjiamen
Processing Record 30 of Set 12 | bodden 

In [11]:
# Count the cities for which a weather record was appended to city_data
len(city_data)

573

In [13]:
# Build a pandas DataFrame from the list of per-city weather dictionaries
city_data_df = pd.DataFrame(data=city_data)
# Preview the first ten rows
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Castro,-24.7911,-50.0119,70.5,61,0,3.22,BR,2022-10-04 19:57:42
1,Ushuaia,-54.8,-68.3,56.86,44,20,8.05,AR,2022-10-04 19:57:43
2,Wittingen,52.7269,10.7361,55.4,72,100,8.52,DE,2022-10-04 19:57:43
3,Papara,-3.9839,-38.7273,81.0,51,70,7.63,BR,2022-10-04 19:57:44
4,Vaini,-21.2,-175.2,77.16,88,40,3.44,TO,2022-10-04 19:57:44
5,Busselton,-33.65,115.3333,56.66,78,97,16.49,AU,2022-10-04 19:57:45
6,Mzimba,-11.9,33.6,66.43,41,18,10.89,MW,2022-10-04 19:57:45
7,Maridi,4.9158,29.4742,66.99,95,100,1.39,SS,2022-10-04 19:57:46
8,Airai,-8.9266,125.4092,61.41,87,99,1.54,TL,2022-10-04 19:57:47
9,Banjar,-8.19,114.9675,76.39,91,63,6.26,ID,2022-10-04 19:57:48


In [15]:
# Reorder the columns so the identifying fields (City, Country, Date) come
# first, followed by the coordinates and the weather measurements
new_column_order = [
    "City",
    "Country",
    "Date",
    "Lat",
    "Lng",
    "Max Temp",
    "Humidity",
    "Cloudiness",
    "Wind Speed",
]
city_data_df = city_data_df.loc[:, new_column_order]
# Preview the first ten rows in the new column order
city_data_df.head(n=10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Castro,BR,2022-10-04 19:57:42,-24.7911,-50.0119,70.5,61,0,3.22
1,Ushuaia,AR,2022-10-04 19:57:43,-54.8,-68.3,56.86,44,20,8.05
2,Wittingen,DE,2022-10-04 19:57:43,52.7269,10.7361,55.4,72,100,8.52
3,Papara,BR,2022-10-04 19:57:44,-3.9839,-38.7273,81.0,51,70,7.63
4,Vaini,TO,2022-10-04 19:57:44,-21.2,-175.2,77.16,88,40,3.44
5,Busselton,AU,2022-10-04 19:57:45,-33.65,115.3333,56.66,78,97,16.49
6,Mzimba,MW,2022-10-04 19:57:45,-11.9,33.6,66.43,41,18,10.89
7,Maridi,SS,2022-10-04 19:57:46,4.9158,29.4742,66.99,95,100,1.39
8,Airai,TL,2022-10-04 19:57:47,-8.9266,125.4092,61.41,87,99,1.54
9,Banjar,ID,2022-10-04 19:57:48,-8.19,114.9675,76.39,91,63,6.26


In [16]:
# Path of the output CSV file
output_data_file = "weather_data/cities.csv"
# DataFrame.to_csv does not create missing directories, so make sure the
# target folder exists before writing (no-op when it is already there)
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)
# Export the city data to CSV, labelling the index column "City_ID"
city_data_df.to_csv(output_data_file, index_label="City_ID")