In [4]:
#Importing dependencies

import pandas as pd 
import matplotlib.pyplot as plt 
import numpy as np 

In [5]:
# Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x2c4729fe708>

In [6]:
#Adding the latitudes and longitudes to a list. 

coordinates = list(lat_lngs)

In [7]:
#Use the citypy module to determine city based on latitude and longitude.

from citipy import citipy

In [8]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name

    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

622

In [9]:
#Importing the requests library. 
import requests

#Importing the API key. 
from config import weather_api_key

#Importing the datetime module form the datetime library
from datetime import datetime

In [10]:
# Starting URL for Weather Map API Call.
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [11]:
#Create an empty list to hold the weather data. 

city_data = []

#Print the beginning of the logging. 
print('Beginning Data Retrieval     ')
print('-----------------------------')

#Create counters. 
record_count = 1 
set_count = 1

#Looping through all the cities in our list. 

for i,city in enumerate(cities):

    #Group cities in sets of 50 for logging purposes. 
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city. 
    city_url = url + '&q=' + city.replace(' ','+')

    #Log the URL, record, and set numbers and the city. 
    print(f'Processing Record {record_count} of Set {set_count} | {city}')

    #Add 1 to the record count. 
    record_count += 1

    #Run an API 

    try:
        #Parse the JSON and retrieve data. 
        city_weather = requests.get(city_url).json()
        #Parse out the needed data. 
        city_lat = city_weather['coord']['lat']
        city_lng = city_weather['coord']['lon']
        city_max_temp = city_weather['main']['temp_max']
        city_humidity = city_weather['main']['humidity']
        city_clouds = city_weather ['clouds']['all']
        city_wind = city_weather['wind']['speed']
        city_country = city_weather['sys']['country']
        #Convert the date to ISO standard. 
        city_date = datetime.utcfromtimestamp(city_weather['dt']).strftime('%Y-%m-%d %H:%M:%S')
        #Append the city information into the city_data list. 
        city_data.append({"City": city.title(),
                        "Lat": city_lat, 
                        "Lng": city_lng, 
                        "Max Temp": city_max_temp, 
                        "Humidity": city_humidity, 
                        "Cloudiness": city_clouds, 
                        "Wind Speed": city_wind,
                        "Country": city_country, 
                        "Date": city_date})
        #If an error is experienced, skip the city
    except:
        print('City not found. Skipping...')
        pass

#Indicate the Data loading is complete
print('---------------------------')
print('Data Retrieval Complete    ')
print('---------------------------')

Record 12 of Set 4 | tinlot
Processing Record 13 of Set 4 | northam
Processing Record 14 of Set 4 | vestmannaeyjar
Processing Record 15 of Set 4 | batagay-alyta
Processing Record 16 of Set 4 | dingle
Processing Record 17 of Set 4 | ewa beach
Processing Record 18 of Set 4 | muroto
Processing Record 19 of Set 4 | arcachon
Processing Record 20 of Set 4 | ndioum
Processing Record 21 of Set 4 | hounde
Processing Record 22 of Set 4 | linares
Processing Record 23 of Set 4 | karaul
City not found. Skipping...
Processing Record 24 of Set 4 | maymyo
Processing Record 25 of Set 4 | mindif
Processing Record 26 of Set 4 | mount gambier
Processing Record 27 of Set 4 | praia da vitoria
Processing Record 28 of Set 4 | muros
Processing Record 29 of Set 4 | richards bay
Processing Record 30 of Set 4 | beringovskiy
Processing Record 31 of Set 4 | samusu
City not found. Skipping...
Processing Record 32 of Set 4 | upington
Processing Record 33 of Set 4 | bani
Processing Record 34 of Set 4 | kitimat
Process

In [13]:
#Converting the array of dictionaries into a Pandas DataFrame.

city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Isla Vista,34.4133,-119.861,81.34,53,1,6.91,US,2021-05-23 21:48:31
1,Lebu,-37.6167,-73.65,53.15,78,100,2.26,CL,2021-05-23 21:44:47
2,Saskylakh,71.9167,114.0833,36.82,94,100,15.21,RU,2021-05-23 21:44:56
3,Aklavik,68.2191,-135.0107,36.43,72,89,22.37,CA,2021-05-23 21:48:32
4,Port Hardy,50.6996,-127.4199,55.58,76,75,11.5,CA,2021-05-23 21:48:32
5,San Patricio,28.017,-97.5169,88.21,67,96,10.31,US,2021-05-23 21:39:45
6,Butaritari,3.0707,172.7902,82.89,78,71,17.87,KI,2021-05-23 21:44:41
7,Santa Isabel,-23.3156,-46.2214,72.97,92,100,7.94,BR,2021-05-23 21:48:33
8,Kapaa,22.0752,-159.319,81.48,69,40,3.0,US,2021-05-23 21:44:18
9,Punta Arenas,-53.15,-70.9167,39.31,83,40,7.67,CL,2021-05-23 21:44:03


In [14]:
#Reordering the columns

new_column_order = ['City','Country','Date','Lat','Lng','Max Temp','Humidity','Cloudiness','Wind Speed']

city_data_df = city_data_df[new_column_order]

city_data_df.head(10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Isla Vista,US,2021-05-23 21:48:31,34.4133,-119.861,81.34,53,1,6.91
1,Lebu,CL,2021-05-23 21:44:47,-37.6167,-73.65,53.15,78,100,2.26
2,Saskylakh,RU,2021-05-23 21:44:56,71.9167,114.0833,36.82,94,100,15.21
3,Aklavik,CA,2021-05-23 21:48:32,68.2191,-135.0107,36.43,72,89,22.37
4,Port Hardy,CA,2021-05-23 21:48:32,50.6996,-127.4199,55.58,76,75,11.5
5,San Patricio,US,2021-05-23 21:39:45,28.017,-97.5169,88.21,67,96,10.31
6,Butaritari,KI,2021-05-23 21:44:41,3.0707,172.7902,82.89,78,71,17.87
7,Santa Isabel,BR,2021-05-23 21:48:33,-23.3156,-46.2214,72.97,92,100,7.94
8,Kapaa,US,2021-05-23 21:44:18,22.0752,-159.319,81.48,69,40,3.0
9,Punta Arenas,CL,2021-05-23 21:44:03,-53.15,-70.9167,39.31,83,40,7.67


In [16]:
#Creating the output file
output_data_file = 'weather_data/cities.csv'

#Exporint the City_Data into a CSV. 

city_data_df.to_csv(output_data_file, index_label='City_ID')