In [1]:
# Import the dependencies.
import json
import os
import time
from datetime import datetime

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
from citipy import citipy

from config import weather_api_key

In [2]:
# Create a reproducible set of random latitude and longitude combinations.
# A seeded generator makes "Restart Kernel -> Run All" draw the same
# coordinates (and therefore the same candidate cities) on every run.
RANDOM_SEED = 42
NUM_COORDINATES = 1500
rng = np.random.default_rng(RANDOM_SEED)

lats = rng.uniform(-90, 90, size=NUM_COORDINATES)
lngs = rng.uniform(-180, 180, size=NUM_COORDINATES)

# Pair each latitude (lats) with its longitude (lngs) using zip().
# zip() returns a one-shot iterator, so lats_lngs can only be consumed once.
lats_lngs = zip(lats, lngs)
lats_lngs

<zip at 0x2634dc6a508>

In [3]:
# Add the latitude/longitude pairs to a list.
# Zipping lats and lngs again here (instead of consuming the one-shot
# lats_lngs iterator) keeps this cell idempotent: re-running it no longer
# silently produces an empty list.
coordinates = list(zip(lats, lngs))


In [4]:
# Use the citipy module to look up the nearest city for every coordinate pair
# and keep each city name once, in order of first appearance.
# dict.fromkeys() de-duplicates while preserving insertion order, which avoids
# the quadratic cost of testing membership in a growing list.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in coordinates
))

# Report how many unique city names were found.
print(len(cities))

619


In [5]:
# Base URL for the OpenWeatherMap current-weather API call (imperial units).
# HTTPS is used so the API key in the query string is not sent in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [6]:
# Create an empty list to hold the weather data (one dictionary per city).
city_data = []

# Seconds to wait for the API before giving up on a single city, so that a
# stalled connection cannot hang the whole retrieval loop.
REQUEST_TIMEOUT_SECONDS = 10

# Print the beginning of the logging.
print("Beginning Data Retrieval")
print("------------------------")

# Create counters for the log output.
record_count = 1
set_Count = 1

# Loop through all the cities in our list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes and pause for 60 seconds
    # between sets.
    # NOTE(review): the pause presumably keeps the notebook under the API's
    # per-minute rate limit - confirm against the plan in use.
    if (i % 50 == 0 and i >= 50):
        set_Count += 1
        record_count = 1
        time.sleep(60)

    # Log the record and set numbers and the city. The request URL is
    # deliberately not logged because it contains the API key.
    print(f"Processing Record {record_count} of Set {set_Count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    try:
        # Let requests build the query string so every character of the city
        # name is URL-encoded, not just the spaces.
        response = requests.get(url, params={"q": city}, timeout=REQUEST_TIMEOUT_SECONDS)
        city_weather = response.json()

        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]

        # Convert the Unix timestamp to a "YYYY-MM-DD HH:MM:SS" UTC string.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime("%Y-%m-%d %H:%M:%S")

        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Latitude": city_lat,
                          "Longitude": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Clouds": city_clouds,
                          "Wind": city_wind,
                          "Country": city_country,
                          "Date": city_date})
    except KeyError:
        # The response carried none of the expected weather fields, which is
        # what happens when the API does not recognise the city name.
        print("City not found. Skipping...")
    except (requests.exceptions.RequestException, ValueError) as error:
        # Network failure, timeout, or a body that is not valid JSON.
        # Only the exception type is printed: the full message can include
        # the request URL and therefore the API key.
        print(f"Request failed ({type(error).__name__}). Skipping...")


# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")
       

Beginning Data Retrieval
------------------------
Processing Record 1 of Set 1 | bondo
Processing Record 2 of Set 1 | dali
Processing Record 3 of Set 1 | bull savanna
Processing Record 4 of Set 1 | lebu
Processing Record 5 of Set 1 | fortuna
Processing Record 6 of Set 1 | butaritari
Processing Record 7 of Set 1 | grand river south east
City not found. Skipping...
Processing Record 8 of Set 1 | azul
Processing Record 9 of Set 1 | illela
Processing Record 10 of Set 1 | atasu
Processing Record 11 of Set 1 | qaanaaq
Processing Record 12 of Set 1 | provideniya
Processing Record 13 of Set 1 | saleaula
City not found. Skipping...
Processing Record 14 of Set 1 | rikitea
Processing Record 15 of Set 1 | thompson
Processing Record 16 of Set 1 | saldanha
Processing Record 17 of Set 1 | mahebourg
Processing Record 18 of Set 1 | cidreira
Processing Record 19 of Set 1 | amapa
Processing Record 20 of Set 1 | port elizabeth
Processing Record 21 of Set 1 | kendari
Processing Record 22 of Set 1 | vardo
P

Processing Record 42 of Set 4 | geraldton
Processing Record 43 of Set 4 | porto velho
Processing Record 44 of Set 4 | verkhnyaya inta
Processing Record 45 of Set 4 | kerchevskiy
Processing Record 46 of Set 4 | lagoa
Processing Record 47 of Set 4 | inhambane
Processing Record 48 of Set 4 | teguldet
Processing Record 49 of Set 4 | kattivakkam
Processing Record 50 of Set 4 | seoul
Processing Record 1 of Set 5 | upernavik
Processing Record 2 of Set 5 | iqaluit
Processing Record 3 of Set 5 | daru
Processing Record 4 of Set 5 | novoagansk
Processing Record 5 of Set 5 | havelock
Processing Record 6 of Set 5 | kathmandu
Processing Record 7 of Set 5 | tumannyy
City not found. Skipping...
Processing Record 8 of Set 5 | kokopo
Processing Record 9 of Set 5 | murdochville
Processing Record 10 of Set 5 | bredasdorp
Processing Record 11 of Set 5 | nizhneyansk
City not found. Skipping...
Processing Record 12 of Set 5 | montgomery
Processing Record 13 of Set 5 | saryozek
Processing Record 14 of Set 5 |

Processing Record 33 of Set 8 | oga
Processing Record 34 of Set 8 | gold coast
Processing Record 35 of Set 8 | sola
Processing Record 36 of Set 8 | ghanzi
Processing Record 37 of Set 8 | juli
Processing Record 38 of Set 8 | dakar
Processing Record 39 of Set 8 | sandhaven
City not found. Skipping...
Processing Record 40 of Set 8 | marang
Processing Record 41 of Set 8 | yoichi
Processing Record 42 of Set 8 | boz
Processing Record 43 of Set 8 | baruun-urt
Processing Record 44 of Set 8 | ulaangom
Processing Record 45 of Set 8 | teknaf
Processing Record 46 of Set 8 | swindon
Processing Record 47 of Set 8 | nuuk
Processing Record 48 of Set 8 | bolshaya murta
City not found. Skipping...
Processing Record 49 of Set 8 | bonthe
Processing Record 50 of Set 8 | kaniama
Processing Record 1 of Set 9 | kyra
Processing Record 2 of Set 9 | loandjili
Processing Record 3 of Set 9 | faanui
Processing Record 4 of Set 9 | kango
Processing Record 5 of Set 9 | alihe
Processing Record 6 of Set 9 | leh
Processi

Processing Record 20 of Set 12 | saint-denis
Processing Record 21 of Set 12 | hervey bay
Processing Record 22 of Set 12 | kenora
Processing Record 23 of Set 12 | saint-pierre
Processing Record 24 of Set 12 | santa ines
Processing Record 25 of Set 12 | caceres
Processing Record 26 of Set 12 | palmer
Processing Record 27 of Set 12 | ambilobe
Processing Record 28 of Set 12 | mitu
Processing Record 29 of Set 12 | bur gabo
City not found. Skipping...
Processing Record 30 of Set 12 | murgud
Processing Record 31 of Set 12 | sturgis
Processing Record 32 of Set 12 | airai
Processing Record 33 of Set 12 | pevek
Processing Record 34 of Set 12 | voyvozh
Processing Record 35 of Set 12 | sioux lookout
Processing Record 36 of Set 12 | mullaitivu
City not found. Skipping...
Processing Record 37 of Set 12 | beryslav
Processing Record 38 of Set 12 | cukai
Processing Record 39 of Set 12 | sayansk
Processing Record 40 of Set 12 | muros
Processing Record 41 of Set 12 | farafangana
Processing Record 42 of S

In [7]:
# Count the weather records collected in city_data. Cities that raised an
# error during retrieval were skipped, so this can be lower than len(cities).
len(city_data)

569

In [8]:
# Convert the array of dictionaries into a DataFrame
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Latitude,Longitude,Max Temp,Humidity,Clouds,Wind,Country,Date
0,Bondo,3.8146,23.6866,69.19,99,100,1.03,CD,2022-09-14 04:39:21
1,Dali,25.7,100.1833,71.89,66,98,3.69,CN,2022-09-14 04:39:22
2,Bull Savanna,17.8868,-77.5902,77.4,85,94,7.4,JM,2022-09-14 04:39:22
3,Lebu,-37.6167,-73.65,46.87,86,43,3.87,CL,2022-09-14 04:39:22
4,Fortuna,40.5982,-124.1573,57.92,90,64,3.69,US,2022-09-14 04:37:11
5,Butaritari,3.0707,172.7902,80.85,76,7,9.17,KI,2022-09-14 04:37:30
6,Azul,-36.777,-59.8585,48.34,93,1,6.8,AR,2022-09-14 04:39:23
7,Illela,13.7292,5.2975,78.03,80,43,9.17,NG,2022-09-14 04:39:23
8,Atasu,48.6814,71.6433,56.95,27,0,10.69,KZ,2022-09-14 04:39:24
9,Qaanaaq,77.484,-69.3632,33.13,76,92,5.3,GL,2022-09-14 04:35:28


In [9]:
# Reorder the columns so the identifying fields (City, Country, Date) come
# first, followed by Latitude, Longitude, Max Temp, Humidity, Clouds and Wind.
new_columns_list = [
    "City", "Country", "Date",
    "Latitude", "Longitude",
    "Max Temp", "Humidity", "Clouds", "Wind",
]

city_data_df = city_data_df.loc[:, new_columns_list]
city_data_df.columns

Index(['City', 'Country', 'Date', 'Latitude', 'Longitude', 'Max Temp',
       'Humidity', 'Clouds', 'Wind'],
      dtype='object')

In [10]:
# Preview the first ten rows of the DataFrame.
city_data_df.head(n=10)

Unnamed: 0,City,Country,Date,Latitude,Longitude,Max Temp,Humidity,Clouds,Wind
0,Bondo,CD,2022-09-14 04:39:21,3.8146,23.6866,69.19,99,100,1.03
1,Dali,CN,2022-09-14 04:39:22,25.7,100.1833,71.89,66,98,3.69
2,Bull Savanna,JM,2022-09-14 04:39:22,17.8868,-77.5902,77.4,85,94,7.4
3,Lebu,CL,2022-09-14 04:39:22,-37.6167,-73.65,46.87,86,43,3.87
4,Fortuna,US,2022-09-14 04:37:11,40.5982,-124.1573,57.92,90,64,3.69
5,Butaritari,KI,2022-09-14 04:37:30,3.0707,172.7902,80.85,76,7,9.17
6,Azul,AR,2022-09-14 04:39:23,-36.777,-59.8585,48.34,93,1,6.8
7,Illela,NG,2022-09-14 04:39:23,13.7292,5.2975,78.03,80,43,9.17
8,Atasu,KZ,2022-09-14 04:39:24,48.6814,71.6433,56.95,27,0,10.69
9,Qaanaaq,GL,2022-09-14 04:35:28,77.484,-69.3632,33.13,76,92,5.3


In [11]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"

# Make sure the target folder exists: to_csv() does not create missing
# directories and would otherwise raise an OSError on a fresh checkout.
output_dir = os.path.dirname(output_data_file)
if output_dir:
    os.makedirs(output_dir, exist_ok=True)

# Write the DataFrame, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")