In [14]:
%matplotlib inline
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import random

In [15]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7fcbf0aced80>

In [16]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)

In [17]:
# Use the citipy module to determine city based on latitude and longitude.
from citipy import citipy

In [18]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

614

In [19]:
print (cities)

['port alfred', 'bluff', 'bilma', 'tezu', 'hami', 'dicabisagan', 'mahebourg', 'longyearbyen', 'mar del plata', 'chandler', 'kalabo', 'barroso', 'lagoa', 'bredasdorp', 'hermanus', 'port hardy', 'tuktoyaktuk', 'punta arenas', 'nikolskoye', 'nome', 'nizhneyansk', 'ushuaia', 'shache', 'poya', 'kamenka', 'dikson', 'puerto ayora', 'halalo', 'castro', 'vaini', 'puerto guzman', 'troyes', 'juba', 'mehamn', 'atuona', 'ocos', 'wageningen', 'port elizabeth', 'camana', 'uribia', 'busselton', 'unnao', 'thunder bay', 'kruisfontein', 'albany', 'lebu', 'matara', 'arraial do cabo', 'yellowknife', 'sitka', 'qaanaaq', 'airai', 'fortuna', 'belushya guba', 'saint-philippe', 'erzin', 'rikitea', 'saint-francois', 'barentsburg', 'geraldton', 'westport', 'vestbygda', 'provideniya', 'mataura', 'hilo', 'illoqqortoormiut', 'saint george', 'myitkyina', 'bushehr', 'nicoya', 'xiamen', 'souillac', 'beringovskiy', 'severo-kurilsk', 'nishihara', 'hit', 'miyako', 'saskylakh', 'muscle shoals', 'rupert', 'vila franca do ca

In [31]:
# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

In [32]:
# Starting URL for Weather Map API Call.
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key
print(url)

http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=8350e450ac309ef50939874ef9b64035


In [33]:
# Import the datetime module from the datetime library.
from datetime import datetime

In [34]:
# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1
# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1
# Run an API request for each of the cities.
try:
    # Parse the JSON and retrieve data.
    city_weather = requests.get(city_url).json()
    # Parse out the needed data.
    city_lat = city_weather["coord"]["lat"]
    city_lng = city_weather["coord"]["lon"]
    city_max_temp = city_weather["main"]["temp_max"]
    city_humidity = city_weather["main"]["humidity"]
    city_clouds = city_weather["clouds"]["all"]
    city_wind = city_weather["wind"]["speed"]
    city_country = city_weather["sys"]["country"]
    # Convert the date to ISO standard.
    city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
    # Append the city information into city_data list.
    city_data.append({"City": city.title(),
                      "Lat": city_lat,
                      "Lng": city_lng,
                      "Max Temp": city_max_temp,
                      "Humidity": city_humidity,
                      "Cloudiness": city_clouds,
                      "Wind Speed": city_wind,
                      "Country": city_country,
                      "Date": city_date})
# If an error is experienced, skip the city.
except:
    print("City not found. Skipping...")
    pass    
# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | port alfred
Processing Record 2 of Set 1 | bluff
Processing Record 3 of Set 1 | bilma
Processing Record 4 of Set 1 | tezu
Processing Record 5 of Set 1 | hami
Processing Record 6 of Set 1 | dicabisagan
Processing Record 7 of Set 1 | mahebourg
Processing Record 8 of Set 1 | longyearbyen
Processing Record 9 of Set 1 | mar del plata
Processing Record 10 of Set 1 | chandler
Processing Record 11 of Set 1 | kalabo
Processing Record 12 of Set 1 | barroso
Processing Record 13 of Set 1 | lagoa
Processing Record 14 of Set 1 | bredasdorp
Processing Record 15 of Set 1 | hermanus
Processing Record 16 of Set 1 | port hardy
Processing Record 17 of Set 1 | tuktoyaktuk
Processing Record 18 of Set 1 | punta arenas
Processing Record 19 of Set 1 | nikolskoye
Processing Record 20 of Set 1 | nome
Processing Record 21 of Set 1 | nizhneyansk
Processing Record 22 of Set 1 | ushuaia
Processing Record 23 of Set 1 | shache
P

In [35]:
len(city_data)

1

In [36]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head()

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Alexandria,31.2156,29.9553,55.4,62,40,12.66,EG,2021-01-29 05:12:17


In [37]:
city_data_df.tail()

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Alexandria,31.2156,29.9553,55.4,62,40,12.66,EG,2021-01-29 05:12:17


In [38]:
# Reorder the columns in the order you want them to appear.
new_column_order = ["City", "Country", "Date", "Lat","Lng","Max Temp","Humidity","Cloudiness","Wind Speed"]
# Assign the new column order.
city_data_df = city_data_df[new_column_order]

In [39]:
city_data_df.head()

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Alexandria,EG,2021-01-29 05:12:17,31.2156,29.9553,55.4,62,40,12.66


In [40]:
# Create the output file (CSV). 

## instruction was "output_data_file = "weather_data/cities.csv"
# but it was giving me an error even when I changed to Module6 and when I removed all before cities, it saved it
output_data_file = "cities.csv"
# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")