In [34]:
# Import the dependencies.
from pathlib import Path

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [35]:
# Draw uniformly distributed random latitudes and longitudes and pair them up.
# `lat_lngs` is a lazy zip iterator: it can be consumed only once.
sample_size = 1500
lats = np.random.uniform(low=-90.000, high=90.000, size=sample_size)
lngs = np.random.uniform(low=-180.000, high=180.000, size=sample_size)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7f8bb0171690>

In [36]:
# Materialise the (latitude, longitude) pairs so they can be iterated more than once.
coordinates = [*lat_lngs]

In [37]:
# Display every latitude and longitude combination, one pair per line.
for lat, lng in coordinates:
    print(lat, lng)

13.95476665488782 160.0116596078683
-48.464387884807884 122.02404237145277
56.5678058183681 -58.532572601849296
35.91845205307459 -174.08816942085298
65.46591962356973 164.6840619171473
-82.7068303000391 -18.404511710986327
60.65674704244958 126.93410755285976
1.832504153238304 -63.260052270157644
-33.874702063780404 64.3318906456569
27.274639722911658 48.33859655578706
22.59601031912645 167.05489289796878
78.75471491613351 47.76287511038461
2.5353750234782666 -176.9699958932017
35.61744491097035 -3.6743021868128665
-7.272349085674421 67.08163647489661
-38.0468925682179 -10.460284727034775
-0.41384315162808605 -111.34393347571702
44.96201332877982 179.67481159224286
-25.148570520614555 -90.50794244073158
86.24781160218305 49.04233607683926
14.503948064034688 -70.39525070494807
54.68479596089884 100.97325379500353
-87.92225080922594 46.954898530139985
-87.84783605979666 32.71611556695743
-3.2798646828844085 133.24599648275665
-75.01881242665593 -90.12310205358212
-36.05820489423503 55.3

50.38600688418305 146.5778180589624
82.12597219196314 -12.554852171996686
16.564501015407416 9.886518275817167
77.56442719832143 -108.79564599551958
50.07002672641937 -137.97755974989352
44.36672540721014 -154.1718052630178
48.44215167621286 -161.36128280578657
-46.40628084522879 172.24574602224527
29.5155431220104 139.07357784444713
-14.459795572363006 -34.7416191330544
-77.28086306915988 50.691672796213254
0.3931605416677115 164.1238853347088
-37.23320955908258 -148.34944956211015
-67.21786003025525 -35.70488068026512
-71.04958927694233 162.7489198318716
14.31444523103471 156.524343852171
62.11167614990518 106.53893453263794
-52.92989216099241 -149.14204545758906
13.577370021936233 177.86125770940635
49.86631097458661 -2.3441051289924815
-82.36873038694554 66.79261590138645
-45.358479648588236 178.73934609000656
-12.733386113816238 64.22485745778621
33.963553586154035 119.13312567290728
10.524197121364693 120.81601930086435
23.649756840112573 60.38363579090327
-78.88929770435325 -23.

In [38]:
from citipy import citipy

In [39]:
# Create a list for holding the cities, in order of first appearance.
cities = []
# Companion set used only for membership tests: checking `in` against the list
# rescans it on every iteration, whereas a set lookup is constant time.
seen_cities = set()

# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)

# Print the city count to confirm sufficient count.
len(cities)

591

In [40]:
# Map out, at a high level, how we will get the weather data for 
# each city for the website.

#1 Import our dependencies and initialize counters and an empty list that will hold the weather data.
#2 Loop through the cities list.
#3 Group the cities in sets of 50 to log the process as we find the weather data for each city.
    # Two counters will be needed here: one to log the city count from 1 to 50, and another for the sets.
#4 Build the city_url or endpoint for each city.
#5 Log the URL and the record and set numbers.
#6 Make an API request for each city.
#7 Parse the JSON weather data for the following:
    # City, country, and date
    # Latitude and longitude
    # Maximum temperature
    # Humidity
    # Cloudiness
    # Wind speed
#8 Add the data to a list in a dictionary format and then convert the list to a DataFrame.

In [41]:
# Import the time module and the datetime class from the datetime module.
import time
from datetime import datetime

In [42]:
# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

In [43]:
# Starting URL for Weather Map API Call.
# Use HTTPS so the API key carried in the query string is not sent in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key
# NOTE: do not print `url` here; it embeds the API key and would leak it into the saved notebook output.

In [44]:
# Accumulator for the per-city weather records.
city_data = list()

# Logging counters: position within the current set, and the set number.
record_count, set_count = 1, 1

# Announce the start of the retrieval run.
print("Beginning Data Retrieval     ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------


In [45]:
# # Loop through all the cities in our list.
# for i in range(len(cities)):

#     # Group cities in sets of 50 for logging purposes.
#     if (i % 50 == 0 and i >= 50):
#         set_count += 1
#         record_count = 1
#         time.sleep(60)

#     # Create endpoint URL with each city.
#     city_url = url + "&q=" + cities[i]

In [46]:
# Loop through all the cities in the list and collect one weather record per city.
#
# The accumulator and counters are (re)initialised here so that re-running this
# cell on its own starts from a clean slate instead of appending duplicate rows
# and continuing from stale counter values.
city_data = []
record_count = 1
set_count = 1

for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        # Pause for a minute between sets (presumably to stay under the API rate limit).
        time.sleep(60)

    # Log the record and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Pass the city through `params` so requests URL-encodes the whole value
        # (not just spaces) and appends it to the existing query string.
        # The timeout keeps one stalled connection from hanging the entire run.
        response = requests.get(url, params={"q": city}, timeout=10)
        # Parse the JSON and retrieve data.
        city_weather = response.json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        # NOTE(review): utcfromtimestamp is deprecated in recent Python versions; consider a timezone-aware call.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # If an error is experienced, skip the city.
    # Only expected failures are caught: a payload missing the weather fields
    # (KeyError/TypeError), a non-JSON body or bad timestamp (ValueError), and
    # network or timeout problems (RequestException). KeyboardInterrupt and
    # other unexpected errors are no longer silently swallowed.
    except (KeyError, TypeError, ValueError, requests.exceptions.RequestException):
        print("City not found. Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Processing Record 1 of Set 1 | butaritari
Processing Record 2 of Set 1 | albany
Processing Record 3 of Set 1 | saint-augustin
Processing Record 4 of Set 1 | kapaa
Processing Record 5 of Set 1 | bilibino
Processing Record 6 of Set 1 | ushuaia
Processing Record 7 of Set 1 | berdigestyakh
Processing Record 8 of Set 1 | boa vista
Processing Record 9 of Set 1 | souillac
Processing Record 10 of Set 1 | safwah
City not found. Skipping...
Processing Record 11 of Set 1 | belushya guba
City not found. Skipping...
Processing Record 12 of Set 1 | vaitupu
City not found. Skipping...
Processing Record 13 of Set 1 | melilla
Processing Record 14 of Set 1 | hithadhoo
Processing Record 15 of Set 1 | jamestown
Processing Record 16 of Set 1 | ixtapa
Processing Record 17 of Set 1 | nikolskoye
Processing Record 18 of Set 1 | pisco
Processing Record 19 of Set 1 | oranjestad
Processing Record 20 of Set 1 | tulun
Processing Record 21 of Set 1 | port alfred
Processing Record 22 of Set 1 | port elizabeth
Process

Processing Record 40 of Set 4 | tiksi
Processing Record 41 of Set 4 | esperance
Processing Record 42 of Set 4 | chuy
Processing Record 43 of Set 4 | trapani
Processing Record 44 of Set 4 | wamba
Processing Record 45 of Set 4 | cabo san lucas
Processing Record 46 of Set 4 | tigil
Processing Record 47 of Set 4 | nyurba
Processing Record 48 of Set 4 | iguape
Processing Record 49 of Set 4 | chokurdakh
Processing Record 50 of Set 4 | jibuti
Processing Record 1 of Set 5 | fairbanks
Processing Record 2 of Set 5 | christchurch
Processing Record 3 of Set 5 | paciran
Processing Record 4 of Set 5 | carbonia
Processing Record 5 of Set 5 | batticaloa
Processing Record 6 of Set 5 | bonavista
Processing Record 7 of Set 5 | saint helens
Processing Record 8 of Set 5 | airai
Processing Record 9 of Set 5 | iqaluit
Processing Record 10 of Set 5 | romilly-sur-seine
Processing Record 11 of Set 5 | peniche
Processing Record 12 of Set 5 | barentsburg
City not found. Skipping...
Processing Record 13 of Set 5 |

Processing Record 29 of Set 8 | haicheng
Processing Record 30 of Set 8 | medea
Processing Record 31 of Set 8 | buraydah
Processing Record 32 of Set 8 | barentu
Processing Record 33 of Set 8 | port macquarie
Processing Record 34 of Set 8 | aripuana
Processing Record 35 of Set 8 | vila franca do campo
Processing Record 36 of Set 8 | balikpapan
Processing Record 37 of Set 8 | kinshasa
Processing Record 38 of Set 8 | nizhniy kuranakh
Processing Record 39 of Set 8 | kismayo
Processing Record 40 of Set 8 | sinnamary
Processing Record 41 of Set 8 | znamensk
Processing Record 42 of Set 8 | lata
Processing Record 43 of Set 8 | mount isa
Processing Record 44 of Set 8 | linxia
Processing Record 45 of Set 8 | san patricio
Processing Record 46 of Set 8 | lagoa
Processing Record 47 of Set 8 | sokolo
Processing Record 48 of Set 8 | saint combs
City not found. Skipping...
Processing Record 49 of Set 8 | zhigalovo
Processing Record 50 of Set 8 | khandyga
Processing Record 1 of Set 9 | lanzhou
Processin

Processing Record 15 of Set 12 | conde
Processing Record 16 of Set 12 | bairiki
Processing Record 17 of Set 12 | yerbogachen
Processing Record 18 of Set 12 | octeville
Processing Record 19 of Set 12 | waipawa
Processing Record 20 of Set 12 | gaogou
Processing Record 21 of Set 12 | suba
Processing Record 22 of Set 12 | baturite
Processing Record 23 of Set 12 | kirovskiy
Processing Record 24 of Set 12 | hakkari
Processing Record 25 of Set 12 | ahuimanu
Processing Record 26 of Set 12 | novopokrovka
Processing Record 27 of Set 12 | kailua
Processing Record 28 of Set 12 | yumen
Processing Record 29 of Set 12 | long xuyen
Processing Record 30 of Set 12 | mehamn
Processing Record 31 of Set 12 | eureka
Processing Record 32 of Set 12 | zarand
Processing Record 33 of Set 12 | mounana
Processing Record 34 of Set 12 | garmsar
Processing Record 35 of Set 12 | formoso do araguaia
City not found. Skipping...
Processing Record 36 of Set 12 | quatre cocos
Processing Record 37 of Set 12 | maarianhamina


In [47]:
# Build a DataFrame with one row per dictionary collected in city_data,
# then preview the first ten rows.
city_data_df = pd.DataFrame(data=city_data)
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Butaritari,3.0707,172.7902,81.88,77,50,14.05,KI,2022-08-12 22:35:58
1,Albany,42.6001,-73.9662,75.85,40,3,8.43,US,2022-08-12 22:35:58
2,Saint-Augustin,51.226,-58.6502,64.65,91,77,12.39,CA,2022-08-12 22:35:59
3,Kapaa,22.0752,-159.319,83.19,75,20,12.66,US,2022-08-12 22:32:59
4,Bilibino,68.0546,166.4372,48.36,79,99,2.82,RU,2022-08-12 22:31:23
5,Ushuaia,-54.8,-68.3,35.26,75,75,5.75,AR,2022-08-12 22:31:47
6,Berdigestyakh,62.0989,126.6992,60.48,93,100,5.64,RU,2022-08-12 22:33:12
7,Boa Vista,2.8197,-60.6733,80.58,69,75,17.27,BR,2022-08-12 22:34:03
8,Souillac,-20.5167,57.5167,66.58,77,40,11.5,MU,2022-08-12 22:36:00
9,Melilla,35.2937,-2.9383,82.78,83,0,5.75,ES,2022-08-12 22:36:01


In [53]:
# Reorder the columns: identifying fields first, then position, then measurements.
new_column_order = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]
city_data_df = city_data_df.loc[:, new_column_order]
city_data_df.head(n=10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Butaritari,KI,2022-08-12 22:35:58,3.0707,172.7902,81.88,77,50,14.05
1,Albany,US,2022-08-12 22:35:58,42.6001,-73.9662,75.85,40,3,8.43
2,Saint-Augustin,CA,2022-08-12 22:35:59,51.226,-58.6502,64.65,91,77,12.39
3,Kapaa,US,2022-08-12 22:32:59,22.0752,-159.319,83.19,75,20,12.66
4,Bilibino,RU,2022-08-12 22:31:23,68.0546,166.4372,48.36,79,99,2.82
5,Ushuaia,AR,2022-08-12 22:31:47,-54.8,-68.3,35.26,75,75,5.75
6,Berdigestyakh,RU,2022-08-12 22:33:12,62.0989,126.6992,60.48,93,100,5.64
7,Boa Vista,BR,2022-08-12 22:34:03,2.8197,-60.6733,80.58,69,75,17.27
8,Souillac,MU,2022-08-12 22:36:00,-20.5167,57.5167,66.58,77,40,11.5
9,Melilla,ES,2022-08-12 22:36:01,35.2937,-2.9383,82.78,83,0,5.75


Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Butaritari,KI,2022-08-12 22:35:58,3.0707,172.7902,81.88,77,50,14.05
1,Albany,US,2022-08-12 22:35:58,42.6001,-73.9662,75.85,40,3,8.43
2,Saint-Augustin,CA,2022-08-12 22:35:59,51.226,-58.6502,64.65,91,77,12.39
3,Kapaa,US,2022-08-12 22:32:59,22.0752,-159.319,83.19,75,20,12.66
4,Bilibino,RU,2022-08-12 22:31:23,68.0546,166.4372,48.36,79,99,2.82
5,Ushuaia,AR,2022-08-12 22:31:47,-54.8,-68.3,35.26,75,75,5.75
6,Berdigestyakh,RU,2022-08-12 22:33:12,62.0989,126.6992,60.48,93,100,5.64
7,Boa Vista,BR,2022-08-12 22:34:03,2.8197,-60.6733,80.58,69,75,17.27
8,Souillac,MU,2022-08-12 22:36:00,-20.5167,57.5167,66.58,77,40,11.5
9,Melilla,ES,2022-08-12 22:36:01,35.2937,-2.9383,82.78,83,0,5.75


In [54]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# to_csv() does not create missing directories, so make sure the target
# folder exists before writing (a no-op when it is already there).
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)
# Export the City_Data into a CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")