In [1]:
# Import the dependencies.
from pathlib import Path

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [2]:
# Draw 1,500 uniformly distributed latitudes (-90..90) and longitudes
# (-180..180), then pair them element-wise.
lats = np.random.uniform(-90.000, 90.000, size=1500)
lngs = np.random.uniform(-180.000, 180.000, size=1500)
# zip() is lazy: it yields each (lat, lng) pair only once when consumed.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7fc8aff5c800>

In [3]:
# Small hand-written sample of latitudes (x) and longitudes (y) used to
# practice pairing coordinates with zip().
x = [
    25.12903645,
    25.92017388,
    26.62509167,
    -59.98969384,
    37.30571269,
]
y = [
    -67.59741259,
    11.09532135,
    74.84233102,
    -76.89176677,
    -61.13376282,
]
# Lazily pair each latitude with the longitude at the same position.
coordinates = zip(x, y)



In [4]:
# Add the latitudes and longitudes to a list.
# Build the pairs directly from the source arrays rather than from the
# `lat_lngs` zip object: a zip iterator can be consumed only once, so
# re-running this cell against it would silently produce an empty list.
coordinates = list(zip(lats, lngs))

In [5]:
# Use the citipy module to determine city based on latitude and longitude.
from citipy import citipy

In [6]:
# Create a list for holding the cities (in first-seen order), plus a set
# mirroring its contents so the uniqueness check is a constant-time lookup
# instead of a linear scan of the list on every iteration.
cities = []
seen_cities = set()
# Identify the nearest city for each latitude and longitude combination.
for lat, lng in coordinates:
    city = citipy.nearest_city(lat, lng).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)


615

In [7]:
# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

In [8]:
# Starting URL for Weather Map API Call.
# Use HTTPS so the API key in the query string is not sent in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key


In [9]:
# Import the datetime module from the datetime library.
from datetime import datetime

In [10]:
# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1

    # Log the record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Pass the city through `params` so requests URL-encodes it and
        # appends it to the query string already present in `url`.
        # The timeout (seconds) keeps a single stalled connection from
        # hanging the whole retrieval run.
        city_weather = requests.get(url, params={"q": city}, timeout=10).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
            "Lat": city_lat,
            "Lng": city_lng,
            "Max Temp": city_max_temp,
            "Humidity": city_humidity,
            "Cloudiness": city_clouds,
            "Wind Speed": city_wind,
            "Country": city_country,
            "Date": city_date})

    # Skip the city on the failures this lookup is expected to produce:
    # network/HTTP errors, a body that is not valid JSON (ValueError), or a
    # response lacking the weather fields (KeyError), e.g. an unknown city.
    # A bare `except:` would also swallow KeyboardInterrupt, making the loop
    # impossible to interrupt, and would hide unrelated programming errors.
    except (requests.RequestException, KeyError, ValueError):
        print("City not found. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | hermanus
Processing Record 2 of Set 1 | punta arenas
Processing Record 3 of Set 1 | butaritari
Processing Record 4 of Set 1 | vaini
Processing Record 5 of Set 1 | seoul
Processing Record 6 of Set 1 | kitaibaraki
Processing Record 7 of Set 1 | hithadhoo
Processing Record 8 of Set 1 | ushuaia
Processing Record 9 of Set 1 | sentyabrskiy
City not found. Skipping...
Processing Record 10 of Set 1 | bagdarin
Processing Record 11 of Set 1 | zubtsov
Processing Record 12 of Set 1 | albany
Processing Record 13 of Set 1 | ewa beach
Processing Record 14 of Set 1 | bambous virieux
Processing Record 15 of Set 1 | atar
Processing Record 16 of Set 1 | sibi
Processing Record 17 of Set 1 | east london
Processing Record 18 of Set 1 | samusu
City not found. Skipping...
Processing Record 19 of Set 1 | cayenne
Processing Record 20 of Set 1 | cape town
Processing Record 21 of Set 1 | la rochelle
Processing Record 22 of 

Processing Record 39 of Set 4 | emporia
Processing Record 40 of Set 4 | onega
Processing Record 41 of Set 4 | whitehorse
Processing Record 42 of Set 4 | kieta
Processing Record 43 of Set 4 | itarema
Processing Record 44 of Set 4 | valdivia
Processing Record 45 of Set 4 | fortuna
Processing Record 46 of Set 4 | srednekolymsk
Processing Record 47 of Set 4 | carballo
Processing Record 48 of Set 4 | nouadhibou
Processing Record 49 of Set 4 | vilyuysk
Processing Record 50 of Set 4 | grand centre
City not found. Skipping...
Processing Record 1 of Set 5 | chokurdakh
Processing Record 2 of Set 5 | ketchikan
Processing Record 3 of Set 5 | oranjemund
Processing Record 4 of Set 5 | mahebourg
Processing Record 5 of Set 5 | xushan
Processing Record 6 of Set 5 | innisfail
Processing Record 7 of Set 5 | west plains
Processing Record 8 of Set 5 | murgab
Processing Record 9 of Set 5 | plymouth
Processing Record 10 of Set 5 | puerto madero
Processing Record 11 of Set 5 | dzilam gonzalez
Processing Recor

Processing Record 30 of Set 8 | turukhansk
Processing Record 31 of Set 8 | omsukchan
Processing Record 32 of Set 8 | balikpapan
Processing Record 33 of Set 8 | grand river south east
City not found. Skipping...
Processing Record 34 of Set 8 | laurel
Processing Record 35 of Set 8 | ciudad bolivar
Processing Record 36 of Set 8 | townsville
Processing Record 37 of Set 8 | bubaque
Processing Record 38 of Set 8 | powell river
Processing Record 39 of Set 8 | salalah
Processing Record 40 of Set 8 | kostomuksha
Processing Record 41 of Set 8 | piney green
Processing Record 42 of Set 8 | lasa
Processing Record 43 of Set 8 | coihaique
Processing Record 44 of Set 8 | aklavik
Processing Record 45 of Set 8 | marathon
Processing Record 46 of Set 8 | saleaula
City not found. Skipping...
Processing Record 47 of Set 8 | luanda
Processing Record 48 of Set 8 | da lat
Processing Record 49 of Set 8 | dunedin
Processing Record 50 of Set 8 | wloclawek
Processing Record 1 of Set 9 | ayni
Processing Record 2 of

Processing Record 20 of Set 12 | terney
Processing Record 21 of Set 12 | shahreza
Processing Record 22 of Set 12 | chajul
Processing Record 23 of Set 12 | fort-shevchenko
Processing Record 24 of Set 12 | iracoubo
Processing Record 25 of Set 12 | ipora
Processing Record 26 of Set 12 | waipawa
Processing Record 27 of Set 12 | kulhudhuffushi
Processing Record 28 of Set 12 | punta gorda
Processing Record 29 of Set 12 | kiruna
Processing Record 30 of Set 12 | tabou
Processing Record 31 of Set 12 | platanos
Processing Record 32 of Set 12 | mountain home
Processing Record 33 of Set 12 | haibowan
City not found. Skipping...
Processing Record 34 of Set 12 | ibra
Processing Record 35 of Set 12 | ocampo
Processing Record 36 of Set 12 | tarkwa
Processing Record 37 of Set 12 | mentok
City not found. Skipping...
Processing Record 38 of Set 12 | sinjar
Processing Record 39 of Set 12 | huainan
Processing Record 40 of Set 12 | harper
Processing Record 41 of Set 12 | oranjestad
Processing Record 42 of S

In [11]:
# # Import the dependencies.
# import pandas as pd
# import matplotlib.pyplot as plt
# import numpy as np

# # Create a set of random latitude and longitude combinations.
# lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
# lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
# lat_lngs = zip(lats, lngs)
# lat_lngs

# # Create a practice set of random latitude and longitude combinations.
# x = [25.12903645, 25.92017388, 26.62509167, -59.98969384, 37.30571269]
# y = [-67.59741259, 11.09532135, 74.84233102, -76.89176677, -61.13376282]
# coordinates = zip(x, y)



# # Add the latitudes and longitudes to a list.
# coordinates = list(lat_lngs)

# # Use the citipy module to determine city based on latitude and longitude.
# from citipy import citipy

# # Create a list for holding the cities.
# cities = []
# # Identify the nearest city for each latitude and longitude combination.
# for coordinate in coordinates:
#     city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

#     # If the city is unique, then we will add it to the cities list.
#     if city not in cities:
#         cities.append(city)
# # Print the city count to confirm sufficient count.
# len(cities)


# # Import the requests library.
# import requests

# # Import the API key.
# from config import weather_api_key

# # Starting URL for Weather Map API Call.
# url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key


# # Import the datetime module from the datetime library.
# from datetime import datetime

# # Create an empty list to hold the weather data.
# city_data = []
# # Print the beginning of the logging.
# print("Beginning Data Retrieval     ")
# print("-----------------------------")

# # Create counters.
# record_count = 1
# set_count = 1

# # Loop through all the cities in the list.
# for i, city in enumerate(cities):

#     # Group cities in sets of 50 for logging purposes.
#     if (i % 50 == 0 and i >= 50):
#         set_count += 1
#         record_count = 1
#     # Create endpoint URL with each city.
#     city_url = url + "&q=" + city.replace(" ","+")

#     # Log the URL, record, and set numbers and the city.
#     print(f"Processing Record {record_count} of Set {set_count} | {city}")
#     # Add 1 to the record count.
#     record_count += 1

#     # Run an API request for each of the cities.
#     try:
#     # Parse the JSON and retrieve data.
#         city_weather = requests.get(city_url).json()
#         # Parse out the needed data.
#         city_lat = city_weather["coord"]["lat"]
#         city_lng = city_weather["coord"]["lon"]
#         city_max_temp = city_weather["main"]["temp_max"]
#         city_humidity = city_weather["main"]["humidity"]
#         city_clouds = city_weather["clouds"]["all"]
#         city_wind = city_weather["wind"]["speed"]
#         city_country = city_weather["sys"]["country"]
#         # Convert the date to ISO standard.
#         city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
#         # Append the city information into city_data list.
#         city_data.append({"City": city.title(),
#             "Lat": city_lat,
#             "Lng": city_lng,
#             "Max Temp": city_max_temp,
#             "Humidity": city_humidity,
#             "Cloudiness": city_clouds,
#             "Wind Speed": city_wind,
#             "Country": city_country,
#             "Date": city_date})

#     # If an error is experienced, skip the city.
#     except:
#         print("City not found. Skipping...")
#         pass

# # Indicate that Data Loading is complete.
# print("-----------------------------")
# print("Data Retrieval Complete      ")
# print("-----------------------------")




In [12]:
# Count the weather records collected; a city is only appended to
# city_data when its API response was parsed without an error.
len(city_data)

576

In [13]:
# Build a DataFrame from the list of per-city weather dictionaries
# (one row per city, one column per dictionary key) and preview the
# first ten rows.
city_data_df = pd.DataFrame(data=city_data)
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Hermanus,-34.4187,19.2345,54.81,90,57,8.9,ZA,2021-08-01 02:45:34
1,Punta Arenas,-53.15,-70.9167,42.91,70,0,20.71,CL,2021-08-01 02:45:23
2,Butaritari,3.0707,172.7902,82.15,73,13,8.99,KI,2021-08-01 02:48:54
3,Vaini,-21.2,-175.2,77.16,73,20,27.63,TO,2021-08-01 02:45:42
4,Seoul,37.5683,126.9778,90.01,78,90,5.75,KR,2021-08-01 02:51:54
5,Kitaibaraki,36.7833,140.75,91.35,63,7,13.47,JP,2021-08-01 02:54:58
6,Hithadhoo,-0.6,73.0833,81.25,72,75,5.64,MV,2021-08-01 02:45:30
7,Ushuaia,-54.8,-68.3,42.46,65,75,8.05,AR,2021-08-01 02:48:54
8,Bagdarin,54.4333,113.6,59.14,71,94,3.2,RU,2021-08-01 02:54:59
9,Zubtsov,56.1753,34.5894,59.07,78,100,5.26,RU,2021-08-01 02:54:59


In [14]:
# Desired left-to-right column layout for the exported table:
# identifying fields first, then position, then the weather measurements.
new_column_order = [
    "City",
    "Country",
    "Date",
    "Lat",
    "Lng",
    "Max Temp",
    "Humidity",
    "Cloudiness",
    "Wind Speed",
]


In [19]:
# Select every row with the columns arranged as listed in new_column_order,
# producing a new DataFrame and leaving city_data_df untouched.
city_data_new_df = city_data_df.loc[:, new_column_order]
city_data_new_df

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Hermanus,ZA,2021-08-01 02:45:34,-34.4187,19.2345,54.81,90,57,8.90
1,Punta Arenas,CL,2021-08-01 02:45:23,-53.1500,-70.9167,42.91,70,0,20.71
2,Butaritari,KI,2021-08-01 02:48:54,3.0707,172.7902,82.15,73,13,8.99
3,Vaini,TO,2021-08-01 02:45:42,-21.2000,-175.2000,77.16,73,20,27.63
4,Seoul,KR,2021-08-01 02:51:54,37.5683,126.9778,90.01,78,90,5.75
...,...,...,...,...,...,...,...,...,...
571,Lulea,SE,2021-08-01 02:51:19,65.5842,22.1547,59.07,94,90,6.91
572,Tommot,RU,2021-08-01 02:53:19,58.9564,126.2925,69.62,43,100,11.79
573,Wukari,NG,2021-08-01 02:57:24,7.8500,9.7833,72.81,82,100,4.32
574,Kaa-Khem,RU,2021-08-01 02:57:25,51.6833,94.7333,62.83,70,100,6.31


In [21]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# to_csv does not create missing parent directories, so make sure the
# target folder exists; exist_ok keeps re-running this cell harmless.
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)
# Export the City_Data into a CSV, labelling the index column "City_ID".
city_data_new_df.to_csv(output_data_file, index_label="City_ID")