In [1]:
# Import the dependencies
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np

In [2]:
# Draw 1500 uniformly distributed latitudes and longitudes and pair them up.
# Latitudes are sampled from [-90, 90) and longitudes from [-180, 180).
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
# zip() is lazy: the pairs can only be iterated once.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x1e78560aa88>

In [3]:
# Materialise the (lat, lng) pairs into a list so they can be iterated more than once
coordinates = [*lat_lngs]

In [4]:
# Import citipy
from citipy import citipy

In [5]:
# Create a list for holding the cities (unique names, in first-seen order)
cities = []
# Companion set: membership tests are O(1), whereas `city not in cities`
# re-scans the whole list for every coordinate.
seen_cities = set()
# Identify the nearest city for each latitude and longitude combo
for lat, lng in coordinates:
    city = citipy.nearest_city(lat, lng).city_name

    # If the city is unique, then add it to the cities list
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)
# Print the city count to confirm sufficient count
len(cities)

642

In [6]:
# import requests library
import requests

# import API key
from config import weather_api_key

# import datetime
from datetime import datetime

In [7]:
# Base URL of the weather endpoint; the city name is appended after "q=".
# HTTPS is used because the API key is sent as a query parameter and must
# not travel over the network in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?q="

In [8]:
# Request the weather for every name in `cities` from the endpoint in `url`
# and collect one dict per successfully parsed response in `city_data`.
# Cities whose request or response cannot be processed are logged and skipped.

# Create empty list for data
city_data = []
# Print beginning of the logging
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters (used only for the progress log)
record_count = 1
set_count = 1

# Loop through all the cities in our list
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes
    if i % 50 == 0 and i >= 50:
        set_count += 1
        record_count = 1
    # Create endpoint URL w/ city
    city_url = url + city.replace(" ", "+") + "&units=imperial" + "&appid=" + weather_api_key

    # Log the record and set numbers and the city.
    # The URL itself is not printed because it embeds the API key.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count
    record_count += 1

    # Run an API request for each city
    try:
        # Parse the JSON and retrieve data; the timeout keeps a single
        # stalled connection from hanging the whole run.
        city_weather = requests.get(city_url, timeout=10).json()
        # Parse out needed data
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the Unix timestamp to a UTC date string
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city info
        city_data.append({
            "City": city.title(),
            "Lat": city_lat,
            "Lng": city_lng,
            "Max Temp": city_max_temp,
            "Humidity": city_humidity,
            "Cloudiness": city_clouds,
            "Wind Speed": city_wind,
            "Country": city_country,
            "Date": city_date})

    # The response JSON did not contain the expected fields: treat the city
    # as unknown and skip it.
    except (KeyError, TypeError):
        print("City not found. Skipping...")
    # Network failure or a body that is not valid JSON: skip the city, but say
    # what went wrong. Only the exception type is printed because the message
    # may contain the request URL (and therefore the API key).
    # KeyboardInterrupt is intentionally NOT caught so the loop can be stopped.
    except (requests.exceptions.RequestException, ValueError) as err:
        print(f"Request failed ({type(err).__name__}). Skipping...")

# Indicate that data loading is complete
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | arica
Processing Record 2 of Set 1 | bluff
Processing Record 3 of Set 1 | derzhavinsk
Processing Record 4 of Set 1 | thompson
Processing Record 5 of Set 1 | mukhen
Processing Record 6 of Set 1 | yellowknife
Processing Record 7 of Set 1 | mataura
Processing Record 8 of Set 1 | hermanus
Processing Record 9 of Set 1 | kapaa
Processing Record 10 of Set 1 | sao felix do xingu
Processing Record 11 of Set 1 | new norfolk
Processing Record 12 of Set 1 | tasiilaq
Processing Record 13 of Set 1 | barrow
Processing Record 14 of Set 1 | cherskiy
Processing Record 15 of Set 1 | nikolskoye
Processing Record 16 of Set 1 | castro
Processing Record 17 of Set 1 | albany
Processing Record 18 of Set 1 | shirokiy
Processing Record 19 of Set 1 | saint george
Processing Record 20 of Set 1 | busselton
Processing Record 21 of Set 1 | avarua
Processing Record 22 of Set 1 | asau
Processing Record 23 of Set 1 | dikson
Proces

Processing Record 42 of Set 4 | belushya guba
City not foud. Skipping...
Processing Record 43 of Set 4 | wanning
Processing Record 44 of Set 4 | atar
Processing Record 45 of Set 4 | tautira
Processing Record 46 of Set 4 | ampanihy
Processing Record 47 of Set 4 | faanui
Processing Record 48 of Set 4 | tigil
Processing Record 49 of Set 4 | mocambique
City not foud. Skipping...
Processing Record 50 of Set 4 | bar harbor
Processing Record 1 of Set 5 | tula
Processing Record 2 of Set 5 | fare
Processing Record 3 of Set 5 | gandorhun
Processing Record 4 of Set 5 | pevek
Processing Record 5 of Set 5 | mayo
Processing Record 6 of Set 5 | koungou
Processing Record 7 of Set 5 | san andres
Processing Record 8 of Set 5 | geraldton
Processing Record 9 of Set 5 | sobolevo
Processing Record 10 of Set 5 | martapura
Processing Record 11 of Set 5 | yumen
Processing Record 12 of Set 5 | malibu
Processing Record 13 of Set 5 | nguru
Processing Record 14 of Set 5 | umm lajj
Processing Record 15 of Set 5 | m

Processing Record 31 of Set 8 | ornskoldsvik
Processing Record 32 of Set 8 | faranah
Processing Record 33 of Set 8 | hami
Processing Record 34 of Set 8 | karamea
City not foud. Skipping...
Processing Record 35 of Set 8 | nardaran
Processing Record 36 of Set 8 | paragominas
Processing Record 37 of Set 8 | sioux lookout
Processing Record 38 of Set 8 | matay
Processing Record 39 of Set 8 | rengo
Processing Record 40 of Set 8 | mount gambier
Processing Record 41 of Set 8 | matagami
Processing Record 42 of Set 8 | laramie
Processing Record 43 of Set 8 | churachandpur
Processing Record 44 of Set 8 | karlskoga
Processing Record 45 of Set 8 | flin flon
Processing Record 46 of Set 8 | otane
Processing Record 47 of Set 8 | taltal
Processing Record 48 of Set 8 | san vicente
Processing Record 49 of Set 8 | reo
Processing Record 50 of Set 8 | koslan
Processing Record 1 of Set 9 | senneterre
Processing Record 2 of Set 9 | khajuraho
Processing Record 3 of Set 9 | mana
Processing Record 4 of Set 9 | k

Processing Record 16 of Set 12 | vila franca do campo
Processing Record 17 of Set 12 | ayan
Processing Record 18 of Set 12 | lagoa
Processing Record 19 of Set 12 | yabrud
Processing Record 20 of Set 12 | mundo nuevo
Processing Record 21 of Set 12 | adre
Processing Record 22 of Set 12 | la paz
Processing Record 23 of Set 12 | killybegs
Processing Record 24 of Set 12 | muzhi
Processing Record 25 of Set 12 | guaruja
Processing Record 26 of Set 12 | chapais
Processing Record 27 of Set 12 | wajima
Processing Record 28 of Set 12 | ilulissat
Processing Record 29 of Set 12 | diamantino
Processing Record 30 of Set 12 | togur
Processing Record 31 of Set 12 | aksu
Processing Record 32 of Set 12 | port macquarie
Processing Record 33 of Set 12 | viedma
Processing Record 34 of Set 12 | yanan
City not foud. Skipping...
Processing Record 35 of Set 12 | luanda
Processing Record 36 of Set 12 | sharjah
Processing Record 37 of Set 12 | sistranda
Processing Record 38 of Set 12 | huarmey
Processing Record 3

In [10]:
# Convert the list of per-city dictionaries to a pandas DataFrame.
new_column_order = ["City", "Country", "Date", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed"]
# Passing columns= to the constructor selects and orders the columns in one
# step, and still yields an (empty) frame with these columns when city_data
# holds no records, where indexing afterwards would raise a KeyError.
city_data_df = pd.DataFrame(city_data, columns=new_column_order)
city_data_df.head(10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Arica,CL,2021-04-23 00:20:18,-18.475,-70.3042,68.0,68,90,5.75
1,Bluff,NZ,2021-04-23 00:22:29,-46.6,168.3333,57.0,74,100,8.01
2,Derzhavinsk,KZ,2021-04-23 00:20:35,51.1,66.3167,37.56,55,99,11.01
3,Thompson,CA,2021-04-23 00:22:12,55.7435,-97.8558,21.2,63,75,17.27
4,Mukhen,RU,2021-04-23 00:22:29,48.1,136.1,61.93,30,100,9.95
5,Yellowknife,CA,2021-04-23 00:22:29,62.456,-114.3525,16.0,53,90,16.11
6,Mataura,NZ,2021-04-23 00:22:30,-46.1927,168.8643,57.0,74,98,8.01
7,Hermanus,ZA,2021-04-23 00:22:30,-34.4187,19.2345,59.0,85,0,1.99
8,Kapaa,US,2021-04-23 00:19:49,22.0752,-159.319,80.6,65,1,11.5
9,Sao Felix Do Xingu,BR,2021-04-23 00:22:30,-6.6447,-51.995,72.28,97,84,0.22


In [12]:
# Write the collected city weather data to a CSV file.
import os

# Path of the output file (CSV)
output_data_file = "weather_data/cities.csv"
# Make sure the target folder exists: to_csv does not create missing directories
os.makedirs(os.path.dirname(output_data_file), exist_ok=True)
# Export the City_Data into a CSV, labelling the index column "City_ID"
city_data_df.to_csv(output_data_file, index_label="City_ID")