In [1]:
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
from citipy import citipy
import requests
from config import weather_api_key
from datetime import datetime

In [2]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-190.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x2572d63b048>

In [3]:
# Add the latitudes and longitudes to a list
coordinates = list(lat_lngs)
    

In [4]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name
    # # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.       
len(cities)

605

In [5]:
#Starting URL for weather map API call
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key



In [10]:
#Create an empty list to hold the weather data
city_data = []
#Print the beginning of the logging.
print("Beginning Data Retrieval       ")
print("-------------------------------")

#Create counters
record_count = 1
set_count = 1

# Loop through all the cities in our list.
for i in range(len(cities)):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + "i"
# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1
   
 #Run an API request for each of the cities
    try:
    #Parse the JSON and retrieve data
        city_weather = requests.get(city_url).json()
        # Parse out the needed data
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        #Convert the date to ISO standard
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        #Append the city information into city_data list
        city_data.append({"City": city.title(), "Lat": city_lng, "Lng": city_lng, "Max Temp": city_max_temp,
                              "Humidity": city_humidity,
                              "Cloudiness": city_clouds,
                              "Wind Speed": city_wind,
                              "Country": city_country,
                              "Date": city_date})
    #If an error is experienced, skip the city
    except:
            print("City not found. Skipping...")
            continue
#Indicate the Data Loading is complete.
print("---------------------------")
print("Data Retrieval Complete    ")
print("---------------------------")

Beginning Data Retrieval       
-------------------------------
Processing Record 1 of Set 13 | ushuaia
Processing Record 2 of Set 13 | mahebourg
Processing Record 3 of Set 13 | bunia
Processing Record 4 of Set 13 | banda aceh
Processing Record 5 of Set 13 | katobu
Processing Record 6 of Set 13 | lebu
Processing Record 7 of Set 13 | yellowknife
Processing Record 8 of Set 13 | rikitea
Processing Record 9 of Set 13 | mataura
Processing Record 10 of Set 13 | shimanovsk
Processing Record 11 of Set 13 | arraial do cabo
Processing Record 12 of Set 13 | innisfail
Processing Record 13 of Set 13 | gogrial
Processing Record 14 of Set 13 | port lincoln
Processing Record 15 of Set 13 | saint-joseph
Processing Record 16 of Set 13 | geraldton
Processing Record 17 of Set 13 | bonavista
Processing Record 18 of Set 13 | pyaozerskiy
Processing Record 19 of Set 13 | barrow
Processing Record 20 of Set 13 | yumen
Processing Record 21 of Set 13 | pisco
Processing Record 22 of Set 13 | hobart
Processing Reco

Processing Record 35 of Set 16 | codrington
Processing Record 36 of Set 16 | tubruq
City not found. Skipping...
Processing Record 37 of Set 16 | half moon bay
Processing Record 38 of Set 16 | pryazha
Processing Record 39 of Set 16 | derzhavinsk
Processing Record 40 of Set 16 | upernavik
Processing Record 41 of Set 16 | mys shmidta
City not found. Skipping...
Processing Record 42 of Set 16 | juegang
Processing Record 43 of Set 16 | san cristobal
Processing Record 44 of Set 16 | ilulissat
Processing Record 45 of Set 16 | cortona
Processing Record 46 of Set 16 | nuuk
Processing Record 47 of Set 16 | banmo
City not found. Skipping...
Processing Record 48 of Set 16 | rosedale
Processing Record 49 of Set 16 | shache
Processing Record 50 of Set 16 | alamogordo
Processing Record 1 of Set 17 | santa fe
Processing Record 2 of Set 17 | baruun-urt
Processing Record 3 of Set 17 | atyashevo
Processing Record 4 of Set 17 | sankheda
Processing Record 5 of Set 17 | makakilo city
Processing Record 6 of 

Processing Record 21 of Set 20 | lisakovsk
Processing Record 22 of Set 20 | oussouye
Processing Record 23 of Set 20 | porbandar
Processing Record 24 of Set 20 | kholm
Processing Record 25 of Set 20 | port-gentil
Processing Record 26 of Set 20 | florida
Processing Record 27 of Set 20 | hermitage
Processing Record 28 of Set 20 | poum
Processing Record 29 of Set 20 | rondonopolis
Processing Record 30 of Set 20 | rio gallegos
Processing Record 31 of Set 20 | kavieng
Processing Record 32 of Set 20 | husavik
Processing Record 33 of Set 20 | emerald
Processing Record 34 of Set 20 | kiunga
Processing Record 35 of Set 20 | spirovo
Processing Record 36 of Set 20 | amarpur
Processing Record 37 of Set 20 | orzu
Processing Record 38 of Set 20 | chokurdakh
Processing Record 39 of Set 20 | port elizabeth
Processing Record 40 of Set 20 | san carlos de bariloche
Processing Record 41 of Set 20 | sovetskiy
Processing Record 42 of Set 20 | natal
Processing Record 43 of Set 20 | berlevag
Processing Record 

Processing Record 8 of Set 24 | dunmore town
Processing Record 9 of Set 24 | kulhudhuffushi
Processing Record 10 of Set 24 | ust-maya
Processing Record 11 of Set 24 | jiwani
Processing Record 12 of Set 24 | nyurba
Processing Record 13 of Set 24 | wewak
Processing Record 14 of Set 24 | fort saint john
City not found. Skipping...
Processing Record 15 of Set 24 | urusha
Processing Record 16 of Set 24 | moranbah
Processing Record 17 of Set 24 | tavda
Processing Record 18 of Set 24 | iralaya
Processing Record 19 of Set 24 | belgrade
Processing Record 20 of Set 24 | olafsvik
Processing Record 21 of Set 24 | nairobi
Processing Record 22 of Set 24 | maltahohe
Processing Record 23 of Set 24 | sao joao da barra
Processing Record 24 of Set 24 | byron bay
Processing Record 25 of Set 24 | westport
Processing Record 26 of Set 24 | ulfborg
Processing Record 27 of Set 24 | toungoo
City not found. Skipping...
Processing Record 28 of Set 24 | seminole
Processing Record 29 of Set 24 | concepcion
Processi

In [11]:
len(city_data)

560

In [13]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Ushuaia,-68.3,-68.3,32.0,95,90,23.04,AR,2020-07-27 00:57:31
1,Mahebourg,57.7,57.7,70.0,70,96,8.99,MU,2020-07-27 00:55:04
2,Bunia,30.25,30.25,62.29,89,37,2.21,CD,2020-07-27 00:48:47
3,Banda Aceh,95.32,95.32,80.28,75,99,5.3,ID,2020-07-27 00:54:02
4,Katobu,122.53,122.53,81.39,72,100,7.2,ID,2020-07-27 00:48:47
5,Lebu,-73.65,-73.65,49.05,82,62,8.23,CL,2020-07-27 00:53:49
6,Yellowknife,-114.35,-114.35,75.99,52,40,11.41,CA,2020-07-27 00:54:08
7,Rikitea,-134.97,-134.97,70.32,79,0,19.89,PF,2020-07-27 00:57:32
8,Mataura,168.86,168.86,49.89,61,0,2.48,NZ,2020-07-27 00:57:32
9,Shimanovsk,127.7,127.7,70.97,89,100,4.21,RU,2020-07-27 00:48:48


In [14]:
city_data_order =["City", "Cloudiness", "Country", "Date", "Humidity", "Lat", "Lng", "Max Temp", "Wind Speed"]
city_data_df = city_data_df[city_data_order]
city_data_df.head()

Unnamed: 0,City,Cloudiness,Country,Date,Humidity,Lat,Lng,Max Temp,Wind Speed
0,Ushuaia,90,AR,2020-07-27 00:57:31,95,-68.3,-68.3,32.0,23.04
1,Mahebourg,96,MU,2020-07-27 00:55:04,70,57.7,57.7,70.0,8.99
2,Bunia,37,CD,2020-07-27 00:48:47,89,30.25,30.25,62.29,2.21
3,Banda Aceh,99,ID,2020-07-27 00:54:02,75,95.32,95.32,80.28,5.3
4,Katobu,100,ID,2020-07-27 00:48:47,72,122.53,122.53,81.39,7.2


In [15]:
#Create the output file (CSV)
output_data_file = "weather_data/cities.csv"
#Export the City_data into a CSV
city_data_df.to_csv(output_data_file, index_label="City_ID")
