In [1]:
# Import dependencies
import os

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [2]:
# Draw 1,500 random latitudes and 1,500 random longitudes, then pair them up.
# Latitudes are sampled first and longitudes second.
lats = np.random.uniform(-90.000, 90.000, 1500)
lngs = np.random.uniform(-180.000, 180.000, 1500)

# zip() is lazy: the pairs are only produced once something iterates over it,
# and it can be iterated a single time.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x7fe278d3f190>

In [3]:
# Add the latitudes and longitudes to a list.
# The pairs are rebuilt directly from `lats` and `lngs` rather than by draining
# the one-shot `lat_lngs` zip iterator, so re-running this cell always yields
# the full list instead of an empty one on the second run.
coordinates = list(zip(lats, lngs))

In [4]:
# Use the citipy module to determine city based on latitude and longitude.
from citipy import citipy

In [5]:
# Create a list for holding the cities, plus a set of the names already
# collected so the uniqueness check is a constant-time lookup instead of a
# scan over the whole list on every iteration.
cities = []
seen_cities = set()

# Identify the nearest city for each latitude and longitude combination.
for lat, lng in coordinates:
    city = citipy.nearest_city(lat, lng).city_name

    # Keep only the first occurrence of each city name, in encounter order.
    if city not in seen_cities:
        seen_cities.add(city)
        cities.append(city)

# Print the city count to confirm sufficient count.
len(cities)

579

In [6]:
# Display the list of unique city names collected above.
cities

['belushya guba',
 'caluquembe',
 'new plymouth',
 'mataura',
 'lufkin',
 'suifenhe',
 'kahului',
 'wanning',
 'vaini',
 'tshela',
 'klaksvik',
 'deputatskiy',
 'east london',
 'tongren',
 'rock sound',
 'lebu',
 'arraial do cabo',
 'benguela',
 'killybegs',
 'marevo',
 'rikitea',
 'bredasdorp',
 'yellowknife',
 'port alfred',
 'fallon',
 'ushuaia',
 'butaritari',
 'nyurba',
 'jamestown',
 'touros',
 'tuktoyaktuk',
 'maroantsetra',
 'bethel',
 'hobart',
 'bambous virieux',
 'hermanus',
 'chuy',
 'kenora',
 'manta',
 'hit',
 'karaul',
 'san miguel',
 'torbay',
 'berea',
 'kapaa',
 'cabo san lucas',
 'karratha',
 'esperance',
 'nemuro',
 'busselton',
 'portage',
 'hilo',
 'atuona',
 'bluff',
 'mookane',
 'haines junction',
 'basti',
 'bengkulu',
 'finschhafen',
 'port lincoln',
 'kalmunai',
 'punta arenas',
 'nanlong',
 'gat',
 'keta',
 'half moon bay',
 'salalah',
 'benjamin hill',
 'albany',
 'ayagoz',
 'olinda',
 'port elizabeth',
 'mayskiy',
 'northam',
 'novodugino',
 'barentsburg',

In [7]:
# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

In [8]:
# Import the datetime module from the datetime library.
from datetime import datetime

In [9]:
# Starting URL for Weather Map API Call.
# HTTPS is used so the API key carried in the query string is not sent over
# the network in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [10]:
# Create an empty list to hold the weather data.
city_data = []

# Seconds to wait on a single API call before giving up on that city, so one
# stalled connection cannot hang the whole retrieval loop.
REQUEST_TIMEOUT = 10

# Print the beginning of the logging.
print('Beginning Data Retrieval       ')
print('-------------------------------')

# Create counters.
record_count = 1
set_count = 1

# Loop through all the cities in our list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1

    # Create endpoint URL with each city.
    city_url = url + '&q=' + city.replace(' ','+')

    # Log the record and set numbers and the city.
    print(f'Processing Record {record_count} of Set {set_count} | {city}')

    # Add 1 to the record count
    record_count += 1

    # Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve the data.
        city_weather = requests.get(city_url, timeout=REQUEST_TIMEOUT).json()
        # Parse out the needed data.
        city_lat = city_weather['coord']['lat']
        city_lng = city_weather['coord']['lon']
        city_max_temp = city_weather['main']['temp_max']
        city_humidity = city_weather['main']['humidity']
        city_clouds = city_weather['clouds']['all']
        city_wind = city_weather['wind']['speed']
        city_country = city_weather['sys']['country']
        # Convert the date to ISO standard.
        # NOTE(review): datetime.utcfromtimestamp is deprecated as of Python 3.12;
        # consider datetime.fromtimestamp(ts, tz=timezone.utc) when upgrading.
        city_date = datetime.utcfromtimestamp(city_weather['dt']).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({'City': city.title(),
                          'Lat': city_lat,
                          'Lng': city_lng,
                          'Max Temp': city_max_temp,
                          'Humidity': city_humidity,
                          'Cloudiness': city_clouds,
                          'Wind Speed': city_wind,
                          'Country': city_country,
                          'Date': city_date})

    # Network-level failure (connection error, timeout, ...): skip the city.
    # Only the exception type is logged because the exception text may include
    # the request URL, which carries the API key.
    except requests.exceptions.RequestException as err:
        print(f'Request failed ({type(err).__name__}). Skipping...')

    # The response was not valid JSON or lacked the expected fields: skip the
    # city. Anything else (e.g. KeyboardInterrupt) is deliberately not caught.
    except (KeyError, TypeError, ValueError):
        print('City not found. Skipping...')

# Indicate that Data Loading is complete.
print('-------------------------------')
print('Data Retrieval Complete        ')
print('-------------------------------')

Beginning Data Retrieval       
-------------------------------
Processing Record 1 of Set 1 | belushya guba
City not found. Skipping...
Processing Record 2 of Set 1 | caluquembe
Processing Record 3 of Set 1 | new plymouth
Processing Record 4 of Set 1 | mataura
Processing Record 5 of Set 1 | lufkin
Processing Record 6 of Set 1 | suifenhe
Processing Record 7 of Set 1 | kahului
Processing Record 8 of Set 1 | wanning
Processing Record 9 of Set 1 | vaini
Processing Record 10 of Set 1 | tshela
Processing Record 11 of Set 1 | klaksvik
Processing Record 12 of Set 1 | deputatskiy
Processing Record 13 of Set 1 | east london
Processing Record 14 of Set 1 | tongren
Processing Record 15 of Set 1 | rock sound
Processing Record 16 of Set 1 | lebu
Processing Record 17 of Set 1 | arraial do cabo
Processing Record 18 of Set 1 | benguela
Processing Record 19 of Set 1 | killybegs
Processing Record 20 of Set 1 | marevo
Processing Record 21 of Set 1 | rikitea
Processing Record 22 of Set 1 | bredasdorp
Proc

Processing Record 40 of Set 4 | saint george
Processing Record 41 of Set 4 | lima
Processing Record 42 of Set 4 | moron
Processing Record 43 of Set 4 | ozgon
City not found. Skipping...
Processing Record 44 of Set 4 | taolanaro
City not found. Skipping...
Processing Record 45 of Set 4 | jardim
Processing Record 46 of Set 4 | puerto ayora
Processing Record 47 of Set 4 | puerto narino
Processing Record 48 of Set 4 | kota kinabalu
Processing Record 49 of Set 4 | santa isabel do rio negro
Processing Record 50 of Set 4 | alta floresta
Processing Record 1 of Set 5 | barrow
Processing Record 2 of Set 5 | bathsheba
Processing Record 3 of Set 5 | palmeira das missoes
Processing Record 4 of Set 5 | aklavik
Processing Record 5 of Set 5 | sandy bay
Processing Record 6 of Set 5 | eydhafushi
Processing Record 7 of Set 5 | anchorage
Processing Record 8 of Set 5 | aswan
Processing Record 9 of Set 5 | avarua
Processing Record 10 of Set 5 | takoradi
Processing Record 11 of Set 5 | la ronge
Processing Re

Processing Record 29 of Set 8 | tumannyy
City not found. Skipping...
Processing Record 30 of Set 8 | minab
Processing Record 31 of Set 8 | tuatapere
Processing Record 32 of Set 8 | bridgetown
Processing Record 33 of Set 8 | taraz
Processing Record 34 of Set 8 | san javier
Processing Record 35 of Set 8 | vao
Processing Record 36 of Set 8 | ivanivka
Processing Record 37 of Set 8 | heihe
Processing Record 38 of Set 8 | x-can
City not found. Skipping...
Processing Record 39 of Set 8 | hobyo
Processing Record 40 of Set 8 | poum
Processing Record 41 of Set 8 | nouadhibou
Processing Record 42 of Set 8 | veraval
Processing Record 43 of Set 8 | praia
Processing Record 44 of Set 8 | sturgeon bay
Processing Record 45 of Set 8 | north bend
Processing Record 46 of Set 8 | zhenjiang
Processing Record 47 of Set 8 | malkangiri
Processing Record 48 of Set 8 | nanortalik
Processing Record 49 of Set 8 | ust-nera
Processing Record 50 of Set 8 | guerrero negro
Processing Record 1 of Set 9 | sola
Processing

Processing Record 15 of Set 12 | san juan
Processing Record 16 of Set 12 | saint-augustin
Processing Record 17 of Set 12 | matagami
Processing Record 18 of Set 12 | calabozo
Processing Record 19 of Set 12 | acarau
Processing Record 20 of Set 12 | chato
Processing Record 21 of Set 12 | waitara
Processing Record 22 of Set 12 | ruidoso
Processing Record 23 of Set 12 | gagnoa
Processing Record 24 of Set 12 | davila
Processing Record 25 of Set 12 | jurmala
Processing Record 26 of Set 12 | tezu
Processing Record 27 of Set 12 | martapura
Processing Record 28 of Set 12 | taybad
Processing Record 29 of Set 12 | pacific grove
-------------------------------
Data Retrieval Complete        
-------------------------------


In [11]:
# Count how many cities were appended to city_data by the retrieval loop.
len(city_data)

531

In [12]:
# Build a Pandas DataFrame from the list of per-city dictionaries
# (one row per dictionary), then preview the first ten rows.
city_data_df = pd.DataFrame(data=city_data)
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Caluquembe,-13.78,14.68,61.79,60,13,7.09,AO,2020-08-24 20:28:27
1,New Plymouth,-39.07,174.08,48.0,95,100,1.99,NZ,2020-08-24 20:24:15
2,Mataura,-46.19,168.86,45.0,85,99,15.01,NZ,2020-08-24 20:28:28
3,Lufkin,31.34,-94.73,95.0,36,40,11.41,US,2020-08-24 20:28:28
4,Suifenhe,44.4,131.17,64.6,100,100,5.06,CN,2020-08-24 20:28:28
5,Kahului,20.89,-156.47,87.8,52,40,17.22,US,2020-08-24 20:27:46
6,Wanning,18.8,110.4,81.0,82,6,9.8,CN,2020-08-24 20:28:28
7,Vaini,-21.2,-175.2,77.0,83,20,9.17,TO,2020-08-24 20:28:28
8,Tshela,-4.98,12.93,72.97,84,100,3.87,CD,2020-08-24 20:28:28
9,Klaksvik,62.23,-6.59,46.4,75,5,10.29,FO,2020-08-24 20:28:28


In [14]:
# Put the identifying columns (city, country, date) first, followed by the
# coordinates and then the weather measurements.
new_column_order = [
    'City', 'Country', 'Date',
    'Lat', 'Lng',
    'Max Temp', 'Humidity', 'Cloudiness', 'Wind Speed',
]
city_data_df = city_data_df.loc[:, new_column_order]

In [16]:
# Preview the first ten rows of city_data_df.
city_data_df.head(10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Caluquembe,AO,2020-08-24 20:28:27,-13.78,14.68,61.79,60,13,7.09
1,New Plymouth,NZ,2020-08-24 20:24:15,-39.07,174.08,48.0,95,100,1.99
2,Mataura,NZ,2020-08-24 20:28:28,-46.19,168.86,45.0,85,99,15.01
3,Lufkin,US,2020-08-24 20:28:28,31.34,-94.73,95.0,36,40,11.41
4,Suifenhe,CN,2020-08-24 20:28:28,44.4,131.17,64.6,100,100,5.06
5,Kahului,US,2020-08-24 20:27:46,20.89,-156.47,87.8,52,40,17.22
6,Wanning,CN,2020-08-24 20:28:28,18.8,110.4,81.0,82,6,9.8
7,Vaini,TO,2020-08-24 20:28:28,-21.2,-175.2,77.0,83,20,9.17
8,Tshela,CD,2020-08-24 20:28:28,-4.98,12.93,72.97,84,100,3.87
9,Klaksvik,FO,2020-08-24 20:28:28,62.23,-6.59,46.4,75,5,10.29


In [17]:
# Create the output file (CSV).
output_data_file = 'weather_data/cities.csv'

# Make sure the destination folder exists before writing: to_csv does not
# create missing directories, so a fresh checkout would otherwise fail here.
output_dir = os.path.dirname(output_data_file)
if output_dir:
    os.makedirs(output_dir, exist_ok=True)

# Export the City_Data into a csv.
city_data_df.to_csv(output_data_file, index_label='City_ID')