In [1]:
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
from citipy import citipy


In [2]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000,high=90.000, size =1500)
lngs = np.random.uniform(low=-180.000,high=180.00, size =1500)
lat_lngs = zip(lats,lngs)
lat_lngs

<zip at 0x153b54ee2c8>

The zip object packs each pair of lats and lngs having the same index in their respective array into a tuple. If there are 1,500 latitudes and longitudes, there will be 1,500 tuples of paired latitudes and longitudes, where each latitude and longitude in a tuple can be accessed by the index of 0 and 1, respectively

In [3]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)
coordinates

[(-66.01992294947748, -7.065011517829504),
 (-4.299084284709551, -132.29796399422636),
 (-60.80244643754202, 116.10214372628542),
 (-70.49969709252662, -35.70708961945084),
 (-72.59399555008233, -143.0861630991301),
 (68.17398360763733, -143.23008081145045),
 (61.2410659424028, 23.168271949616724),
 (-74.01436974304251, -176.78347393656338),
 (78.22686291025758, 67.10063530392054),
 (-81.07424529738792, 106.36475973735895),
 (15.558531946154673, -158.4722465403466),
 (42.29867232806356, 146.7805960911811),
 (-8.64719792153464, 71.78532385001651),
 (63.38401388542414, -75.11283473223811),
 (51.9385560040505, 72.49783811760807),
 (-46.83398115467477, 166.87359055709055),
 (49.40509362532339, 70.04400425457578),
 (-62.58549260226745, -60.332381568734405),
 (24.337947553797008, 13.678789535715794),
 (-7.192783630264174, -83.21503355063706),
 (-86.79956197902965, -63.42408057948629),
 (-23.2233459476183, -60.309374140811826),
 (-75.64909823538258, 171.0499098020469),
 (-78.19513023963344, 8

You can only unzip a zipped tuple once before it is removed from the computer's memory. Make sure you unzip the latitudes and longitudes into the coordinates list before moving on.

In [4]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.
print(cities)
len(cities)

['cape town', 'atuona', 'albany', 'ushuaia', 'mataura', 'fairbanks', 'vammala', 'vaini', 'amderma', 'hilo', 'nemuro', 'hithadhoo', 'iqaluit', 'ereymentau', 'tuatapere', 'atasu', 'marzuq', 'sechura', 'filadelfia', 'bluff', 'busselton', 'guadalupe y calvo', 'saint-philippe', 'sao sepe', 'lebu', 'kavieng', 'kapaa', 'zeya', 'deder', 'rikitea', 'porto walter', 'henties bay', 'husavik', 'saint george', 'luderitz', 'katsuura', 'pevek', 'whitehorse', 'dingle', 'raga', 'leh', 'puerto ayora', 'hermanus', 'north mankato', 'clyde river', 'hobart', 'yellowknife', 'cayenne', 'suraabad', 'mahebourg', 'jamestown', 'carnarvon', 'saleaula', 'paveh', 'chapais', 'rio claro', 'sorong', 'nabire', 'chuy', 'sao joao da barra', 'mount gambier', 'margate', 'sindand', 'khatanga', 'barrow', 'swan river', 'illoqqortoormiut', 'polyarnyy', 'yunguyo', 'arraial do cabo', 'punta arenas', 'cabo san lucas', 'korla', 'nikolskoye', 'tuktoyaktuk', 'chipinge', 'kurilsk', 'upernavik', 'hamilton', 'talakan', 'los llanos de ari

616

# Get the City Weather Data


## Import Dependencies, and Initialize an Empty List and Counters

In [5]:
import requests
# Import the API key.
from config import weather_api_key

In [6]:
# Starting URL for Weather Map API Call.
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [7]:
# Import the datetime module from the datetime library.
from datetime import datetime

In [8]:
# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in our list.
# use the enumerate() method to get the index of the city for logging purposes and the city for creating an endpoint URL
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1
# Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

# If an error is experienced, skip the city.
    except:
        print("City not found. Skipping...")
        pass

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | cape town
Processing Record 2 of Set 1 | atuona
Processing Record 3 of Set 1 | albany
Processing Record 4 of Set 1 | ushuaia
Processing Record 5 of Set 1 | mataura
Processing Record 6 of Set 1 | fairbanks
Processing Record 7 of Set 1 | vammala
Processing Record 8 of Set 1 | vaini
Processing Record 9 of Set 1 | amderma
City not found. Skipping...
Processing Record 10 of Set 1 | hilo
Processing Record 11 of Set 1 | nemuro
Processing Record 12 of Set 1 | hithadhoo
Processing Record 13 of Set 1 | iqaluit
Processing Record 14 of Set 1 | ereymentau
Processing Record 15 of Set 1 | tuatapere
Processing Record 16 of Set 1 | atasu
Processing Record 17 of Set 1 | marzuq
Processing Record 18 of Set 1 | sechura
Processing Record 19 of Set 1 | filadelfia
Processing Record 20 of Set 1 | bluff
Processing Record 21 of Set 1 | busselton
Processing Record 22 of Set 1 | guadalupe y calvo
Processing Record 23 of Set 

Processing Record 34 of Set 4 | vardo
Processing Record 35 of Set 4 | attawapiskat
City not found. Skipping...
Processing Record 36 of Set 4 | bambanglipuro
Processing Record 37 of Set 4 | berlevag
Processing Record 38 of Set 4 | broken hill
Processing Record 39 of Set 4 | kirundo
Processing Record 40 of Set 4 | urdzhar
City not found. Skipping...
Processing Record 41 of Set 4 | tessalit
Processing Record 42 of Set 4 | castro
Processing Record 43 of Set 4 | longyearbyen
Processing Record 44 of Set 4 | luan
Processing Record 45 of Set 4 | gannan
Processing Record 46 of Set 4 | kabalo
Processing Record 47 of Set 4 | sindor
Processing Record 48 of Set 4 | roald
Processing Record 49 of Set 4 | oum hadjer
Processing Record 50 of Set 4 | saldanha
Processing Record 1 of Set 5 | kupang
Processing Record 2 of Set 5 | methoni
Processing Record 3 of Set 5 | rincon
Processing Record 4 of Set 5 | bredasdorp
Processing Record 5 of Set 5 | cassilandia
Processing Record 6 of Set 5 | warwick
Processing

Processing Record 22 of Set 8 | antigonish
Processing Record 23 of Set 8 | pandan
Processing Record 24 of Set 8 | novikovo
Processing Record 25 of Set 8 | ende
Processing Record 26 of Set 8 | arica
Processing Record 27 of Set 8 | praia
Processing Record 28 of Set 8 | kharp
Processing Record 29 of Set 8 | cartagena del chaira
Processing Record 30 of Set 8 | portland
Processing Record 31 of Set 8 | coahuayana
Processing Record 32 of Set 8 | mokshan
Processing Record 33 of Set 8 | bargal
City not found. Skipping...
Processing Record 34 of Set 8 | ortona
Processing Record 35 of Set 8 | ondorhaan
City not found. Skipping...
Processing Record 36 of Set 8 | rocha
Processing Record 37 of Set 8 | buala
Processing Record 38 of Set 8 | bur gabo
City not found. Skipping...
Processing Record 39 of Set 8 | vallenar
Processing Record 40 of Set 8 | ambulu
Processing Record 41 of Set 8 | bathsheba
Processing Record 42 of Set 8 | buluang
Processing Record 43 of Set 8 | ahipara
Processing Record 44 of Se

Processing Record 12 of Set 12 | half moon bay
Processing Record 13 of Set 12 | namibe
Processing Record 14 of Set 12 | viedma
Processing Record 15 of Set 12 | assis
Processing Record 16 of Set 12 | walvis bay
Processing Record 17 of Set 12 | sumbawa
City not found. Skipping...
Processing Record 18 of Set 12 | dianopolis
City not found. Skipping...
Processing Record 19 of Set 12 | solsvik
City not found. Skipping...
Processing Record 20 of Set 12 | taitung
Processing Record 21 of Set 12 | moerai
Processing Record 22 of Set 12 | yertarskiy
Processing Record 23 of Set 12 | zaraza
Processing Record 24 of Set 12 | tias
Processing Record 25 of Set 12 | kragujevac
Processing Record 26 of Set 12 | oxford
Processing Record 27 of Set 12 | shahr-e kord
Processing Record 28 of Set 12 | benghazi
Processing Record 29 of Set 12 | pyaozerskiy
Processing Record 30 of Set 12 | touros
Processing Record 31 of Set 12 | sand springs
Processing Record 32 of Set 12 | sabha
Processing Record 33 of Set 12 | so

# Create a DataFrame of the City Weather Data from the API get request

In [9]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Cape Town,-33.93,18.42,62.01,62,20,16.11,ZA,2020-11-26 23:16:03
1,Atuona,-9.8,-139.03,77.5,74,99,16.78,PF,2020-11-26 23:17:51
2,Albany,42.6,-73.97,53.01,99,67,5.03,US,2020-11-26 23:17:51
3,Ushuaia,-54.8,-68.3,51.8,57,75,14.99,AR,2020-11-26 23:14:36
4,Mataura,-46.19,168.86,55.0,71,82,18.01,NZ,2020-11-26 23:17:51
5,Fairbanks,64.84,-147.72,23.0,95,99,4.88,US,2020-11-26 23:17:41
6,Vammala,61.33,22.9,32.0,94,90,10.29,FI,2020-11-26 23:17:51
7,Vaini,-21.2,-175.2,82.4,78,40,14.99,TO,2020-11-26 23:17:51
8,Hilo,19.73,-155.09,75.99,84,56,1.99,US,2020-11-26 23:13:30
9,Nemuro,43.32,145.57,33.12,87,9,8.72,JP,2020-11-26 23:17:51


## Reorder columns in a DataFrame 

In [10]:
# change column order as City, Country, Date, Lat, Lng, Max Temp, Humidity, Cloudiness, and Wind Speed
new_column_order = ["City","Country","Date","Lat","Lng","Max Temp","Humidity", "Cloudiness", "Wind Speed"]
city_data_df_reorder = city_data_df[new_column_order]

In [11]:
city_data_df_reorder

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Cape Town,ZA,2020-11-26 23:16:03,-33.93,18.42,62.01,62,20,16.11
1,Atuona,PF,2020-11-26 23:17:51,-9.80,-139.03,77.50,74,99,16.78
2,Albany,US,2020-11-26 23:17:51,42.60,-73.97,53.01,99,67,5.03
3,Ushuaia,AR,2020-11-26 23:14:36,-54.80,-68.30,51.80,57,75,14.99
4,Mataura,NZ,2020-11-26 23:17:51,-46.19,168.86,55.00,71,82,18.01
...,...,...,...,...,...,...,...,...,...
556,Cherskiy,RU,2020-11-26 23:18:46,68.75,161.30,24.04,93,100,20.69
557,Tilichiki,RU,2020-11-26 23:18:46,60.47,166.10,-0.58,95,96,7.31
558,Tabou,CI,2020-11-26 23:18:46,4.42,-7.35,77.76,89,100,8.52
559,Huancabamba,PE,2020-11-26 23:18:46,-5.24,-79.45,62.28,72,93,3.42


In [12]:
# reorder looks good, change the original dataframe
city_data_df= city_data_df_reorder

## Output Dataframe to CSV

In [14]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")
# The last line in the code block will export the DataFrame to a CSV file, with the index label (or column A) header as "City_ID." 
# If we ever need to export the CSV file to a DataFrame, that header will be present in the DataFrame
