In [1]:
import json
import time
from datetime import datetime
from pathlib import Path

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
from citipy import citipy

from config import weather_api_key


In [2]:
# Draw 2000 random latitude/longitude pairs spanning the whole globe.
# NOTE(review): no random seed is set in this cell, so each run samples a
# different set of coordinates.
lats = np.random.uniform(low=-90.000, high=90.000, size=2000)
lngs = np.random.uniform(low=-180.000, high=180.000, size=2000)
# Pair each latitude with its longitude. The pairs are materialised as a list
# because a bare zip() is a one-shot iterator: any cell that reads lat_lngs a
# second time (e.g. when re-run) would otherwise silently see it empty.
lat_lngs = list(zip(lats, lngs))

In [3]:
# Collect every (latitude, longitude) pair into a list so the pairs can be
# indexed and iterated as often as needed.
coordinates = [pair for pair in lat_lngs]

In [4]:
# Resolve every coordinate pair to its nearest city and keep each city name
# once, in first-seen order. dict.fromkeys() de-duplicates in a single pass,
# which avoids the quadratic cost of testing "city not in cities" against a
# growing list.
cities = list(
    dict.fromkeys(
        citipy.nearest_city(lat, lng).city_name
        for lat, lng in coordinates
    )
)

# Number of unique cities found.
len(cities)

755

In [5]:
# List that will collect the weather data.
city_data = []

# Announce the start of the retrieval log.
print("Beginning Data Retrieval     ", "-----------------------------", sep="\n")

# Logging counters: both the record number and the set number start at 1.
record_count = set_count = 1

Beginning Data Retrieval     
-----------------------------


In [6]:
# Base URL for OpenWeatherMap current-weather calls, requesting imperial units.
# HTTPS is used because the API key travels in the query string and would
# otherwise be sent in clear text.
base_url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID="
url = base_url + weather_api_key
# Display the endpoint with the key masked so the secret is never stored in
# the notebook's saved output.
print(base_url + "<redacted>")

http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=<redacted>


In [7]:
# Fetch the current weather for every city in `cities` and collect one record
# (a dict) per successful lookup in `city_data`, logging progress in sets of 50.

# Start from a clean slate so that re-running this cell does not append
# duplicate records or continue the counters from a previous run.
city_data = []
record_count = 1
set_count = 1

# Upper bound (seconds) on how long a single API call may block.
REQUEST_TIMEOUT_S = 10

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if i % 50 == 0 and i >= 50:
        set_count += 1
        record_count = 1

    # Log the record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Pass the city as a query parameter so requests URL-encodes it
        # (spaces, accents, ...) instead of patching the string by hand.
        response = requests.get(url, params={"q": city}, timeout=REQUEST_TIMEOUT_S)
        # Parse the JSON and retrieve data.
        city_weather = response.json()

        # Parse out the needed data. A missing key here means the API did not
        # return a weather payload for this city.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_cond = city_weather["weather"][0]["description"]
        city_country = city_weather["sys"]["country"]

        # Append the city information into city_data list.
        city_data.append({
            "City": city.title(),
            "Country": city_country,
            "Lat": city_lat,
            "Lng": city_lng,
            "Max Temp": city_max_temp,
            "Humidity": city_humidity,
            "Cloudiness": city_clouds,
            "Wind Speed": city_wind,
            "Current Conditions": city_cond,
        })

    # Network-level failure (timeout, connection error, undecodable body).
    # Only the exception type is printed: the full message can embed the
    # request URL, which contains the API key.
    except requests.RequestException as exc:
        print(f"Request failed ({type(exc).__name__}). Skipping...")
    # The response lacked the expected fields: skip the city. Catching only
    # these errors lets KeyboardInterrupt and genuine bugs surface.
    except (KeyError, IndexError, TypeError, ValueError):
        print("City not found. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Processing Record 1 of Set 1 | albany
Processing Record 2 of Set 1 | ust-kamchatsk
City not found. Skipping...
Processing Record 3 of Set 1 | semenivka
Processing Record 4 of Set 1 | palmer
Processing Record 5 of Set 1 | rikitea
Processing Record 6 of Set 1 | ushuaia
Processing Record 7 of Set 1 | kapaa
Processing Record 8 of Set 1 | palabuhanratu
City not found. Skipping...
Processing Record 9 of Set 1 | itanhandu
Processing Record 10 of Set 1 | punta arenas
Processing Record 11 of Set 1 | paka
Processing Record 12 of Set 1 | sur
Processing Record 13 of Set 1 | vaini
Processing Record 14 of Set 1 | hermanus
Processing Record 15 of Set 1 | mount gambier
Processing Record 16 of Set 1 | jamestown
Processing Record 17 of Set 1 | avarua
Processing Record 18 of Set 1 | barentsburg
City not found. Skipping...
Processing Record 19 of Set 1 | bengkulu
Processing Record 20 of Set 1 | thompson
Processing Record 21 of Set 1 | nara
Processing Record 22 of Set 1 | virginia beach
Processing Record 2

Processing Record 41 of Set 4 | constitucion
Processing Record 42 of Set 4 | tevaitoa
Processing Record 43 of Set 4 | taiyuan
Processing Record 44 of Set 4 | beringovskiy
Processing Record 45 of Set 4 | wewak
Processing Record 46 of Set 4 | lebu
Processing Record 47 of Set 4 | ardahan
Processing Record 48 of Set 4 | peace river
Processing Record 49 of Set 4 | vila velha
Processing Record 50 of Set 4 | isangel
Processing Record 1 of Set 5 | voyinka
Processing Record 2 of Set 5 | puerto penasco
Processing Record 3 of Set 5 | kysyl-syr
Processing Record 4 of Set 5 | juarez
Processing Record 5 of Set 5 | falealupo
City not found. Skipping...
Processing Record 6 of Set 5 | araouane
Processing Record 7 of Set 5 | etne
Processing Record 8 of Set 5 | hithadhoo
Processing Record 9 of Set 5 | moranbah
Processing Record 10 of Set 5 | katha
City not found. Skipping...
Processing Record 11 of Set 5 | haines junction
Processing Record 12 of Set 5 | norman wells
Processing Record 13 of Set 5 | mahano

Processing Record 30 of Set 8 | san juan nepomuceno
Processing Record 31 of Set 8 | bandarbeyla
Processing Record 32 of Set 8 | kodinsk
Processing Record 33 of Set 8 | cabimas
Processing Record 34 of Set 8 | privokzalnyy
City not found. Skipping...
Processing Record 35 of Set 8 | hobyo
Processing Record 36 of Set 8 | kabalo
Processing Record 37 of Set 8 | kaseda
Processing Record 38 of Set 8 | biltine
Processing Record 39 of Set 8 | tagusao
Processing Record 40 of Set 8 | takoradi
Processing Record 41 of Set 8 | rio casca
Processing Record 42 of Set 8 | bindi
Processing Record 43 of Set 8 | beisfjord
Processing Record 44 of Set 8 | urengoy
Processing Record 45 of Set 8 | nagareyama
Processing Record 46 of Set 8 | kakching
Processing Record 47 of Set 8 | tual
Processing Record 48 of Set 8 | danilovka
Processing Record 49 of Set 8 | ternate
Processing Record 50 of Set 8 | victoria
Processing Record 1 of Set 9 | nadym
Processing Record 2 of Set 9 | krasnoselkup
Processing Record 3 of Set 

Processing Record 17 of Set 12 | san matias
Processing Record 18 of Set 12 | wana
Processing Record 19 of Set 12 | saint-felix-de-valois
Processing Record 20 of Set 12 | turukhansk
Processing Record 21 of Set 12 | ngukurr
City not found. Skipping...
Processing Record 22 of Set 12 | rokytne
Processing Record 23 of Set 12 | kismayo
Processing Record 24 of Set 12 | ozark
Processing Record 25 of Set 12 | druzhba
Processing Record 26 of Set 12 | labutta
City not found. Skipping...
Processing Record 27 of Set 12 | luba
Processing Record 28 of Set 12 | along
Processing Record 29 of Set 12 | zacualpan
Processing Record 30 of Set 12 | parthenay
Processing Record 31 of Set 12 | cuiluan
Processing Record 32 of Set 12 | leca da palmeira
Processing Record 33 of Set 12 | port lincoln
Processing Record 34 of Set 12 | riyadh
Processing Record 35 of Set 12 | starotimoshkino
Processing Record 36 of Set 12 | tambopata
Processing Record 37 of Set 12 | waraseoni
Processing Record 38 of Set 12 | jalu
Proces

Processing Record 2 of Set 16 | rawson
Processing Record 3 of Set 16 | lamar
Processing Record 4 of Set 16 | mirganj
Processing Record 5 of Set 16 | iquitos
-----------------------------
Data Retrieval Complete      
-----------------------------


In [8]:
# Number of weather records collected in city_data.
len(city_data)

695

In [9]:
# Turn the collected records into a DataFrame (one row per record).
city_data_df = pd.DataFrame(data=city_data)
# Preview the first ten rows.
city_data_df.iloc[:10]

Unnamed: 0,City,Country,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Current Conditions
0,Albany,US,42.6001,-73.9662,9.0,59,17,3.36,few clouds
1,Semenivka,UA,52.1783,32.5818,24.84,97,93,13.13,overcast clouds
2,Palmer,US,42.1584,-72.3287,6.8,66,1,4.61,clear sky
3,Rikitea,PF,-23.1203,-134.9692,78.55,77,44,10.4,light rain
4,Ushuaia,AR,-54.8,-68.3,48.2,61,75,9.22,broken clouds
5,Kapaa,US,22.0752,-159.319,72.0,88,75,17.27,light rain
6,Itanhandu,BR,-22.2958,-44.9347,64.51,87,58,1.01,broken clouds
7,Punta Arenas,CL,-53.15,-70.9167,46.4,81,0,12.66,clear sky
8,Paka,MY,4.6374,103.4368,80.6,83,40,9.22,scattered clouds
9,Sur,OM,22.5667,59.5289,77.07,40,0,6.4,clear sky


In [11]:
# Path of the output file (CSV).
output_data_file = "Weather_Database/cities.csv"
# Make sure the target folder exists first: to_csv() does not create missing
# directories and would fail on a fresh checkout.
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)
# Export the city data, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")