In [1]:
#Import the dependencies
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
#Use citipy module to determine city based on latitude and longitude
from citipy import citipy

In [2]:
#Create a set of random latitude and longitude combinations.
lats = np.random.uniform(low=-90.000, high=90.000, size = 1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size = 1500)
lats_lngs = zip(lats, lngs)
lats_lngs

<zip at 0x11f91cf50>

In [3]:
coordinates=list(lats_lngs)

In [4]:
#Create a list to hold the cities
cities=[]
#Identify the nearest city for each latitude and longitude combination
for coordinate in coordinates:
    city=(citipy.nearest_city(coordinate[0],coordinate[1]).city_name)
    
    #If the city is unique, then we will add it to the cities list.
    if city not in cities:
        cities.append(city)
#Print the city count to confirm sufficient count.
len(cities)

621

In [5]:
print(lats,lngs)

[ 25.78038947 -56.75776963 -62.86847935 ... -10.45867501  70.95684784
 -82.64967756] [-137.75730366  -95.67721846  -99.05606484 ...  135.06652988  179.77925344
   36.24237138]


In [6]:
import requests
from config import weather_api_key
from datetime import datetime

In [7]:

city_url = url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [8]:
# Create an empty list to hold the weather data
city_data = []
#print the beginning of the logging.
print("Beginning Data Retrieval   ")
print("---------------------------")

#Create counters.
record_count = 1
set_count = 1
# Loop through all the cities in the list.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")
    # Run an API request for each of the cities.
    try:

        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})
            # Log the URL, record, and set numbers and the city.
        print(f"Processing Record {record_count} of Set {set_count} | {city}")

    
# If an error is experienced, skip the city.
    except:
        print("City not found. Skipping...")
        pass
# Add 1 to the record count.
record_count += 1
# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")




Beginning Data Retrieval   
---------------------------
Processing Record 1 of Set 1 | hilo
Processing Record 1 of Set 1 | punta arenas
Processing Record 1 of Set 1 | hobart
Processing Record 1 of Set 1 | trapani
Processing Record 1 of Set 1 | mataura
Processing Record 1 of Set 1 | bubaque
Processing Record 1 of Set 1 | castro
Processing Record 1 of Set 1 | columbus
Processing Record 1 of Set 1 | cumra
Processing Record 1 of Set 1 | port hardy
Processing Record 1 of Set 1 | pochutla
Processing Record 1 of Set 1 | patitirion
Processing Record 1 of Set 1 | albany
Processing Record 1 of Set 1 | kushmurun
Processing Record 1 of Set 1 | puerto ayora
Processing Record 1 of Set 1 | sitka
Processing Record 1 of Set 1 | grand gaube
Processing Record 1 of Set 1 | busselton
Processing Record 1 of Set 1 | jamestown
Processing Record 1 of Set 1 | roma
Processing Record 1 of Set 1 | jiexiu
Processing Record 1 of Set 1 | vila franca do campo
Processing Record 1 of Set 1 | carnarvon
Processing Record 

Processing Record 1 of Set 5 | raga
Processing Record 1 of Set 5 | inhambane
Processing Record 1 of Set 5 | almeirim
Processing Record 1 of Set 5 | lasa
Processing Record 1 of Set 5 | trzcianka
Processing Record 1 of Set 5 | bethel
City not found. Skipping...
Processing Record 1 of Set 5 | yenagoa
Processing Record 1 of Set 5 | deqing
Processing Record 1 of Set 5 | sao cristovao
Processing Record 1 of Set 5 | ilulissat
Processing Record 1 of Set 5 | cheyenne
Processing Record 1 of Set 5 | namibe
Processing Record 1 of Set 5 | phan thiet
Processing Record 1 of Set 5 | tazovskiy
Processing Record 1 of Set 5 | torbay
Processing Record 1 of Set 5 | aquiraz
Processing Record 1 of Set 5 | omboue
Processing Record 1 of Set 5 | souillac
Processing Record 1 of Set 5 | coahuayana
Processing Record 1 of Set 5 | kurchum
Processing Record 1 of Set 5 | vestmanna
Processing Record 1 of Set 5 | banyliv
Processing Record 1 of Set 5 | esperance
Processing Record 1 of Set 5 | gambo
Processing Record 1 of

Processing Record 1 of Set 9 | ozernovskiy
Processing Record 1 of Set 9 | les cayes
Processing Record 1 of Set 9 | wanlaweyn
Processing Record 1 of Set 9 | srem
Processing Record 1 of Set 9 | ternate
Processing Record 1 of Set 9 | rio gallegos
Processing Record 1 of Set 9 | margate
Processing Record 1 of Set 9 | petropavlovsk-kamchatskiy
Processing Record 1 of Set 9 | buarcos
Processing Record 1 of Set 9 | kununurra
Processing Record 1 of Set 9 | mecca
Processing Record 1 of Set 9 | saint-joseph
Processing Record 1 of Set 9 | tallahassee
Processing Record 1 of Set 9 | price
Processing Record 1 of Set 9 | ahipara
Processing Record 1 of Set 9 | oussouye
Processing Record 1 of Set 9 | portland
Processing Record 1 of Set 9 | boone
Processing Record 1 of Set 9 | ayagoz
Processing Record 1 of Set 9 | karratha
Processing Record 1 of Set 9 | ocampo
Processing Record 1 of Set 9 | akdepe
Processing Record 1 of Set 9 | kailua
Processing Record 1 of Set 9 | san policarpo
Processing Record 1 of Set

In [12]:
city_data[-1]

{'City': 'Shache',
 'Lat': 38.4167,
 'Lng': 77.2406,
 'Max Temp': 44.76,
 'Humidity': 54,
 'Cloudiness': 6,
 'Wind Speed': 2.68,
 'Country': 'CN',
 'Date': '2021-04-03 03:23:31'}

In [31]:
#Convert the list of dictionaries to a Pandas DataFrame
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Hilo,19.7297,-155.09,75.2,64,1,9.22,US,2021-04-03 03:15:38
1,Punta Arenas,-53.15,-70.9167,44.6,93,90,12.66,CL,2021-04-03 03:12:20
2,Hobart,-42.8794,147.3294,87.8,12,0,23.02,AU,2021-04-03 03:15:18
3,Trapani,37.8333,12.6667,64.0,82,0,4.61,IT,2021-04-03 03:17:09
4,Mataura,-46.1927,168.8643,62.01,57,98,10.0,NZ,2021-04-03 03:15:07
5,Bubaque,11.2833,-15.8333,75.38,81,43,13.62,GW,2021-04-03 03:15:40
6,Castro,-24.7911,-50.0119,53.67,96,0,4.5,BR,2021-04-03 03:15:22
7,Columbus,39.9612,-82.9988,35.6,55,1,1.74,US,2021-04-03 03:21:16
8,Cumra,37.5732,32.7745,33.8,86,5,6.91,TR,2021-04-03 03:21:38
9,Port Hardy,50.6996,-127.4199,46.4,65,75,8.05,CA,2021-04-03 03:15:17


In [38]:
new_city_data = ["City","Country","Date","Lat","Lng","Max Temp","Humidity","Cloudiness","Wind Speed"]
city_data_df[new_city_data].head(20)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Hilo,US,2021-04-03 03:15:38,19.7297,-155.09,75.2,64,1,9.22
1,Punta Arenas,CL,2021-04-03 03:12:20,-53.15,-70.9167,44.6,93,90,12.66
2,Hobart,AU,2021-04-03 03:15:18,-42.8794,147.3294,87.8,12,0,23.02
3,Trapani,IT,2021-04-03 03:17:09,37.8333,12.6667,64.0,82,0,4.61
4,Mataura,NZ,2021-04-03 03:15:07,-46.1927,168.8643,62.01,57,98,10.0
5,Bubaque,GW,2021-04-03 03:15:40,11.2833,-15.8333,75.38,81,43,13.62
6,Castro,BR,2021-04-03 03:15:22,-24.7911,-50.0119,53.67,96,0,4.5
7,Columbus,US,2021-04-03 03:21:16,39.9612,-82.9988,35.6,55,1,1.74
8,Cumra,TR,2021-04-03 03:21:38,37.5732,32.7745,33.8,86,5,6.91
9,Port Hardy,CA,2021-04-03 03:15:17,50.6996,-127.4199,46.4,65,75,8.05


In [40]:
#Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
#Export the city_Data into a CSV.
city_data_df.to_csv(output_data_file, index_label="City_ID")