In [7]:
#import the dependencies
import time
from datetime import datetime
from pathlib import Path

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import requests
from citipy import citipy

from config import weather_api_key

In [8]:
# Draw 1500 random latitudes and 1500 random longitudes (uniformly distributed
# over the full valid range of each), then pair them up position by position.
lats = np.random.uniform(-90.000, 90.000, 1500)
lngs = np.random.uniform(-180.000, 180.000, 1500)
lat_lngs = zip(lats, lngs)
# Materialise the pairs right away: a zip object can only be iterated once.
coordinates = [*lat_lngs]

In [9]:
# Identify the nearest city for each latitude and longitude combination and
# keep each city name only once, in order of first appearance.
# dict.fromkeys drops repeated keys while preserving insertion order, so the
# resulting list matches an "append if not already present" loop without
# rescanning the whole list for every coordinate.
# NOTE(review): only the city name is kept, so same-named cities in different
# countries collapse into a single entry.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name
    for lat, lng in coordinates
))
# Print the city count to confirm sufficient count.
len(cities)

636

In [10]:
# Base URL for the OpenWeatherMap current-weather endpoint, carrying only the
# API key. The city to look up is added per request as the `q` query parameter.
# No lat/lon placeholders here: a plain string with "{lat}"/"{lon}" that is
# never formatted would send that literal text to the API on every call.
# NOTE(review): no `units` parameter is set, so temperatures come back in the
# API's default unit (the sample output looks like Kelvin) - confirm intended.
url = "https://api.openweathermap.org/data/2.5/weather?appid=" + weather_api_key

In [11]:
# Create an empty list to hold the weather data (one dict per city found).
city_data = []

# Settings for the retrieval loop.
SET_SIZE = 50          # cities per logging set
PAUSE_SECONDS = 60     # pause between sets (presumably to respect the API rate limit)
REQUEST_TIMEOUT = 10   # seconds; keeps a stalled connection from hanging the cell

# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of SET_SIZE for logging purposes, pausing before
    # every set except the first.
    if i % SET_SIZE == 0 and i >= SET_SIZE:
        set_count += 1
        record_count = 1
        time.sleep(PAUSE_SECONDS)

    # Log the record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    try:
        # Pass the city through `params` so requests URL-encodes it (spaces,
        # accents, apostrophes, ...) instead of patching the string by hand.
        response = requests.get(url, params={"q": city}, timeout=REQUEST_TIMEOUT)

        # An unknown city is an expected outcome, not an error.
        if response.status_code == 404:
            print("City not found. Skipping...")
            continue

        # Any other HTTP error (bad key, rate limit, server error) is raised
        # here so it is not misreported as a missing city.
        response.raise_for_status()
        city_weather = response.json()

        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]

        # Convert the Unix timestamp to a UTC "YYYY-MM-DD HH:MM:SS" string.
        # time.gmtime is used because datetime.utcfromtimestamp is deprecated
        # in recent Python versions; the formatted result is the same.
        city_date = time.strftime('%Y-%m-%d %H:%M:%S', time.gmtime(city_weather["dt"]))

        # Append the data into the city_data list.
        city_data.append({
            "City": city.title(),
            "Lat": city_lat,
            "Lng": city_lng,
            "Max Temp": city_max_temp,
            "Humidity": city_humidity,
            "Cloudiness": city_clouds,
            "Wind Speed": city_wind,
            "Country": city_country,
            "Date": city_date,
        })
    except requests.exceptions.RequestException as err:
        # Log only the exception type: the message can embed the request URL,
        # which contains the API key.
        print(f"Request failed ({type(err).__name__}). Skipping...")
    except (KeyError, ValueError):
        # The response was not valid JSON or lacked an expected field.
        print("Incomplete weather data. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | port alfred
Processing Record 2 of Set 1 | rikitea
Processing Record 3 of Set 1 | padang
Processing Record 4 of Set 1 | butaritari
Processing Record 5 of Set 1 | havoysund
Processing Record 6 of Set 1 | shahreza
Processing Record 7 of Set 1 | lorengau
Processing Record 8 of Set 1 | shingu
Processing Record 9 of Set 1 | cabo san lucas
Processing Record 10 of Set 1 | vaitupu
City not found. Skipping...
Processing Record 11 of Set 1 | tasiilaq
Processing Record 12 of Set 1 | coihaique
Processing Record 13 of Set 1 | mar del plata
Processing Record 14 of Set 1 | punta arenas
Processing Record 15 of Set 1 | srivardhan
Processing Record 16 of Set 1 | san cristobal
Processing Record 17 of Set 1 | vila velha
Processing Record 18 of Set 1 | bumba
Processing Record 19 of Set 1 | khatanga
Processing Record 20 of Set 1 | castro
Processing Record 21 of Set 1 | barrow
Processing Record 22 of Set 1 | mataura
Pr

Processing Record 44 of Set 4 | zunyi
Processing Record 45 of Set 4 | aykhal
Processing Record 46 of Set 4 | hashtrud
Processing Record 47 of Set 4 | cockburn harbour
City not found. Skipping...
Processing Record 48 of Set 4 | ha tinh
Processing Record 49 of Set 4 | kavieng
Processing Record 50 of Set 4 | vestmannaeyjar
Processing Record 1 of Set 5 | vardo
Processing Record 2 of Set 5 | srednekolymsk
Processing Record 3 of Set 5 | palo del colle
Processing Record 4 of Set 5 | ponta do sol
Processing Record 5 of Set 5 | attawapiskat
City not found. Skipping...
Processing Record 6 of Set 5 | saint george
Processing Record 7 of Set 5 | lagoa
Processing Record 8 of Set 5 | moron
Processing Record 9 of Set 5 | georgetown
Processing Record 10 of Set 5 | suleja
Processing Record 11 of Set 5 | porto santo
Processing Record 12 of Set 5 | ndjole
Processing Record 13 of Set 5 | halvad
Processing Record 14 of Set 5 | uribia
Processing Record 15 of Set 5 | belmonte
Processing Record 16 of Set 5 | b

Processing Record 33 of Set 8 | enid
Processing Record 34 of Set 8 | mys shmidta
City not found. Skipping...
Processing Record 35 of Set 8 | atherton
Processing Record 36 of Set 8 | saint joseph
Processing Record 37 of Set 8 | kotka
Processing Record 38 of Set 8 | tarudant
City not found. Skipping...
Processing Record 39 of Set 8 | kenitra
Processing Record 40 of Set 8 | piste
Processing Record 41 of Set 8 | jadu
Processing Record 42 of Set 8 | saldanha
Processing Record 43 of Set 8 | raudeberg
Processing Record 44 of Set 8 | santa rosa
Processing Record 45 of Set 8 | halifax
Processing Record 46 of Set 8 | awbari
Processing Record 47 of Set 8 | nola
Processing Record 48 of Set 8 | bonga
Processing Record 49 of Set 8 | ustka
Processing Record 50 of Set 8 | jalu
Processing Record 1 of Set 9 | adrar
Processing Record 2 of Set 9 | new ross
Processing Record 3 of Set 9 | kodiak
Processing Record 4 of Set 9 | west plains
Processing Record 5 of Set 9 | katherine
Processing Record 6 of Set 9 

Processing Record 20 of Set 12 | ningxiang
Processing Record 21 of Set 12 | hobyo
Processing Record 22 of Set 12 | youkounkoun
Processing Record 23 of Set 12 | daoukro
Processing Record 24 of Set 12 | gizo
Processing Record 25 of Set 12 | kudat
Processing Record 26 of Set 12 | skiros
City not found. Skipping...
Processing Record 27 of Set 12 | bani
Processing Record 28 of Set 12 | laguna
Processing Record 29 of Set 12 | dom pedrito
Processing Record 30 of Set 12 | marzuq
Processing Record 31 of Set 12 | xining
Processing Record 32 of Set 12 | saint-pierre
Processing Record 33 of Set 12 | samusu
City not found. Skipping...
Processing Record 34 of Set 12 | luganville
Processing Record 35 of Set 12 | brae
Processing Record 36 of Set 12 | lesosibirsk
Processing Record 37 of Set 12 | san carlos de bariloche
Processing Record 38 of Set 12 | bathsheba
Processing Record 39 of Set 12 | karaton
Processing Record 40 of Set 12 | belchatow
Processing Record 41 of Set 12 | marshall
Processing Record

In [12]:
# Turn the list of per-city dicts into a DataFrame and preview the first ten rows.
city_data_df = pd.DataFrame(data=city_data)
city_data_df.iloc[:10]

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Port Alfred,-33.5906,26.891,290.33,66,0,4.3,ZA,2022-06-10 21:47:01
1,Rikitea,-23.1203,-134.9692,297.51,63,99,7.57,PF,2022-06-10 21:45:26
2,Padang,-0.9492,100.3543,297.29,91,96,0.92,ID,2022-06-10 21:47:02
3,Butaritari,3.0707,172.7902,301.26,72,92,6.08,KI,2022-06-10 21:47:03
4,Havoysund,70.9963,24.6622,279.28,75,92,6.49,NO,2022-06-10 21:47:04
5,Shahreza,32.0339,51.8794,293.77,9,0,0.5,IR,2022-06-10 21:47:04
6,Lorengau,-2.0226,147.2712,301.19,68,13,2.81,PG,2022-06-10 21:47:05
7,Shingu,33.7333,135.9833,293.55,89,100,2.51,JP,2022-06-10 21:47:05
8,Cabo San Lucas,22.8909,-109.9124,306.27,63,11,5.91,MX,2022-06-10 21:47:06
9,Tasiilaq,65.6145,-37.6368,279.24,69,32,1.91,GL,2022-06-10 21:47:07


In [13]:
# Reorder the columns so the identifying fields (city, country, date) come
# first, followed by the position and then the weather measurements.
new_column_order = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]
city_data_df = city_data_df.loc[:, new_column_order]

In [17]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Make sure the target folder exists first: to_csv does not create missing
# directories and would fail on a fresh checkout without this.
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)
# Export the city data into a CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")