In [1]:
# import dependencies
import pandas as pd
import numpy as np
import timeit
import matplotlib.pyplot as plt
# Import the requests library.
import requests
# Import the API key.
from config import weather_api_key
# Import the datetime module from the datetime library.
from datetime import datetime
# Use the citipy module to determine city based on latitude and longitude.
from citipy import citipy
# Import the time module.
import time
# Import linear regression from the SciPy stats module.
from scipy.stats import linregress

In [2]:
# create a list of latitudes and Longitudes and zip them
lat=np.random.uniform(low=-90.000,high=90.000, size=1500)
lngs=np.random.uniform(low=-180.000,high=180.000,size=1500)
lat_lngs=zip(lat,lngs)
lat_lngs

<zip at 0x7fc1a24d1300>

In [3]:
# Add the latitudes and longitudes to a list.
coordinates = list(lat_lngs)

In [4]:
coordinates

[(34.51018828027024, 111.49768583747226),
 (60.830748475825175, -94.23248683369246),
 (-28.878026221123733, 160.022186628587),
 (-16.462268136681033, -170.19480499648887),
 (5.619529761798972, 142.2104427972642),
 (68.36667822973712, -87.31005372998186),
 (-74.75752615042987, -66.42671610632631),
 (-11.11090318260301, 36.60565529243499),
 (-75.57053200118325, -60.42624440035301),
 (-37.6548080123073, -11.386246616196473),
 (66.02053211980518, -103.11392698570181),
 (3.0262972990605164, 28.85294963241938),
 (36.493682674139464, 52.763462615303695),
 (17.574006887957694, 15.876878929759357),
 (41.045279395701215, 163.68276695007478),
 (10.560127819807434, -158.08164106495326),
 (7.582199616077503, 62.862416545211346),
 (49.67474971674096, -33.10349696342129),
 (-13.053690106048364, 135.40881511670364),
 (-86.02486387880806, -53.58494186041446),
 (49.88653643362207, 64.74427124170691),
 (-83.35723440997913, 121.95450954754455),
 (67.57691514880503, -3.9843586696598834),
 (69.9140872684021

In [5]:
# Create a list for holding the cities.
cities = []
# Identify the nearest city for each latitude and longitude combination.
for coordinate in coordinates:
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name
    
    # If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
# Print the city count to confirm sufficient count.
len(cities)

591

In [6]:
cities

['sanmenxia',
 'thompson',
 'byron bay',
 'alofi',
 'airai',
 'attawapiskat',
 'ushuaia',
 'tunduru',
 'jamestown',
 'la ronge',
 'watsa',
 'babol',
 'bilma',
 'severo-kurilsk',
 'hilo',
 'kavaratti',
 'lagoa',
 'galiwinku',
 'derzhavinsk',
 'new norfolk',
 'klaksvik',
 'illoqqortoormiut',
 'zaysan',
 'butaritari',
 'tsihombe',
 'husavik',
 'vaini',
 'rikitea',
 'chokurdakh',
 'jiddah',
 'riachao',
 'luderitz',
 'roald',
 'la tuque',
 'bargal',
 'avarua',
 'westport',
 'santander',
 'fortuna',
 'nador',
 'mys shmidta',
 'balao',
 'bluff',
 'flinders',
 'georgetown',
 'mataura',
 'kalachinsk',
 'bolungarvik',
 'sao joao da barra',
 'salinopolis',
 'faanui',
 'hermanus',
 'atuona',
 'albany',
 'torbay',
 'kavieng',
 'santa eulalia del rio',
 'bredasdorp',
 'dolbeau',
 'maningrida',
 'barentsburg',
 'sola',
 'ponta delgada',
 'hovd',
 'moranbah',
 'kapaa',
 'zykovo',
 'tasiilaq',
 'dunedin',
 'upernavik',
 'dolores',
 'punta arenas',
 'ler',
 'amderma',
 'kaniv',
 'riyadh',
 'kushima',
 '

In [7]:
# Starting URL for Weather Map API Call.
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key
print(url)# Starting URL for Weather Map API Call.

http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=70871b6d4ef4b088296e3a8e6c1a4e1e


In [8]:
# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

Beginning Data Retrieval     
-----------------------------


In [9]:
# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1
    # Run an API request for each of the cities.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

# #If an error is experienced, skip the city.
    except:
        print("City not found. Skipping...")
        pass

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Processing Record 1 of Set 1 | sanmenxia
Processing Record 2 of Set 1 | thompson
Processing Record 3 of Set 1 | byron bay
Processing Record 4 of Set 1 | alofi
Processing Record 5 of Set 1 | airai
Processing Record 6 of Set 1 | attawapiskat
City not found. Skipping...
Processing Record 7 of Set 1 | ushuaia
Processing Record 8 of Set 1 | tunduru
City not found. Skipping...
Processing Record 9 of Set 1 | jamestown
Processing Record 10 of Set 1 | la ronge
Processing Record 11 of Set 1 | watsa
Processing Record 12 of Set 1 | babol
Processing Record 13 of Set 1 | bilma
Processing Record 14 of Set 1 | severo-kurilsk
Processing Record 15 of Set 1 | hilo
Processing Record 16 of Set 1 | kavaratti
Processing Record 17 of Set 1 | lagoa
Processing Record 18 of Set 1 | galiwinku
City not found. Skipping...
Processing Record 19 of Set 1 | derzhavinsk
Processing Record 20 of Set 1 | new norfolk
Processing Record 21 of Set 1 | klaksvik
Processing Record 22 of Set 1 | illoqqortoormiut
City not found. Sk

Processing Record 34 of Set 4 | lima
Processing Record 35 of Set 4 | saldanha
Processing Record 36 of Set 4 | geraldton
Processing Record 37 of Set 4 | gorontalo
Processing Record 38 of Set 4 | kirakira
Processing Record 39 of Set 4 | khatanga
Processing Record 40 of Set 4 | poso
Processing Record 41 of Set 4 | saleaula
City not found. Skipping...
Processing Record 42 of Set 4 | broken hill
Processing Record 43 of Set 4 | akdepe
Processing Record 44 of Set 4 | koroni
Processing Record 45 of Set 4 | ussuriysk
Processing Record 46 of Set 4 | belaya gora
Processing Record 47 of Set 4 | dana point
Processing Record 48 of Set 4 | onguday
Processing Record 49 of Set 4 | tiksi
Processing Record 50 of Set 4 | kodiak
Processing Record 1 of Set 5 | kulhudhuffushi
Processing Record 2 of Set 5 | bhakkar
Processing Record 3 of Set 5 | kaihua
Processing Record 4 of Set 5 | manado
Processing Record 5 of Set 5 | bograd
Processing Record 6 of Set 5 | san ramon
Processing Record 7 of Set 5 | cabedelo
Pr

Processing Record 24 of Set 8 | mullaitivu
City not found. Skipping...
Processing Record 25 of Set 8 | tuktoyaktuk
Processing Record 26 of Set 8 | hammerfest
Processing Record 27 of Set 8 | ushtobe
Processing Record 28 of Set 8 | sisophon
Processing Record 29 of Set 8 | peace river
Processing Record 30 of Set 8 | whitehorse
Processing Record 31 of Set 8 | niagara falls
Processing Record 32 of Set 8 | porto empedocle
Processing Record 33 of Set 8 | buta
Processing Record 34 of Set 8 | novyy urengoy
Processing Record 35 of Set 8 | beidao
Processing Record 36 of Set 8 | port elizabeth
Processing Record 37 of Set 8 | rolim de moura
City not found. Skipping...
Processing Record 38 of Set 8 | koutsouras
Processing Record 39 of Set 8 | ranong
Processing Record 40 of Set 8 | san jeronimo
Processing Record 41 of Set 8 | marion
Processing Record 42 of Set 8 | sao filipe
Processing Record 43 of Set 8 | brandon
Processing Record 44 of Set 8 | doha
Processing Record 45 of Set 8 | coquimbo
Processin

Processing Record 14 of Set 12 | zharkent
Processing Record 15 of Set 12 | gilgit
Processing Record 16 of Set 12 | takefu
Processing Record 17 of Set 12 | kampot
Processing Record 18 of Set 12 | borogontsy
Processing Record 19 of Set 12 | labutta
City not found. Skipping...
Processing Record 20 of Set 12 | crestview
Processing Record 21 of Set 12 | shemursha
Processing Record 22 of Set 12 | nemuro
Processing Record 23 of Set 12 | okhotsk
Processing Record 24 of Set 12 | bom jesus da lapa
Processing Record 25 of Set 12 | jesup
Processing Record 26 of Set 12 | olafsvik
Processing Record 27 of Set 12 | kenora
Processing Record 28 of Set 12 | dokka
Processing Record 29 of Set 12 | ozgon
City not found. Skipping...
Processing Record 30 of Set 12 | nimbahera
Processing Record 31 of Set 12 | henties bay
Processing Record 32 of Set 12 | phillaur
Processing Record 33 of Set 12 | sonder bjert
Processing Record 34 of Set 12 | alyangula
Processing Record 35 of Set 12 | estelle
Processing Record 36

In [10]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head()

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Sanmenxia,34.7747,111.1814,76.41,92,100,5.03,CN,2021-06-13 21:33:14
1,Thompson,55.7435,-97.8558,53.76,76,75,10.36,CA,2021-06-13 21:30:15
2,Byron Bay,-28.65,153.6167,51.06,71,11,5.55,AU,2021-06-13 21:33:15
3,Alofi,-19.0595,-169.9187,80.49,74,53,13.8,NU,2021-06-13 21:29:57
4,Airai,-8.9266,125.4092,57.02,87,57,2.01,TL,2021-06-13 21:33:15


In [12]:
city_data_df=city_data_df[['City', 'Country', 'Date', 'Lat', 'Lng', 'Max Temp', 'Humidity', 'Cloudiness', 'Wind Speed']]
city_data_df.head()

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Sanmenxia,CN,2021-06-13 21:33:14,34.7747,111.1814,76.41,92,100,5.03
1,Thompson,CA,2021-06-13 21:30:15,55.7435,-97.8558,53.76,76,75,10.36
2,Byron Bay,AU,2021-06-13 21:33:15,-28.65,153.6167,51.06,71,11,5.55
3,Alofi,NU,2021-06-13 21:29:57,-19.0595,-169.9187,80.49,74,53,13.8
4,Airai,TL,2021-06-13 21:33:15,-8.9266,125.4092,57.02,87,57,2.01


In [13]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Export the City_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")