In [1]:
# Dependencies 
import pandas as pd 
import matplotlib.pyplot as plt
import numpy as np
import random
from citipy import citipy
from datetime import datetime 
from config import weather_api_key
import requests
import time
from scipy.stats import linregress

In [2]:
# Create list for weather data
city_data = []

# Print the beginning of the logging
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters
record_count = 1
set_count = 1

Beginning Data Retrieval     
-----------------------------


In [3]:
# Create basic url for API
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [4]:
# Create 1500 random latitude and longitude coordinates 
latitudes = np.random.uniform(-90, 90, size = 1500)
longitudes = np.random.uniform(-180, 180, size = 1500)
coordinates = zip(latitudes, longitudes)
coordinates

<zip at 0x21762568f00>

In [5]:
# Add coordinates to a list 
coordinates_lst = list(coordinates)

In [6]:
# Create list for cities 
cities = []

# Use citipy to find nearest cities using coordinate list
for coordinate in coordinates_lst:
    city = citipy.nearest_city(coordinate[0],coordinate[1])
    city_name = city.city_name
    country_name = city.country_code
    
    # Find unique cities to add to cities list
    if city_name not in cities:
        cities.append(city_name)
    
    # See cities and contries
    # print(f'{city_name}, {country_name}')

# Count amount of unique cities
len(cities)

633

In [7]:
# Loop through city Lists 
for i, city in enumerate(cities):
    
    # Group cities in sets of 50 
    if (i % 50 == 0 and i >= 50):
        set_count += 1 
        record_count = 1 
    
    # Create URL for each city
    city_url = url + "&q=" + city.replace(" ","+")
    
    # Log URL, set, and record numbers for each city
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    record_count += 1

# Make an API request for each city 
    try:
       
        # Parse the JSON data
        city_weather = requests.get(city_url).json()

        # Compile needed data
        city_city = city.title()
        city_country = city_weather['sys']['country']
        city_date = datetime.utcfromtimestamp(city_weather['dt']).strftime('%Y-%m-%d %H:%M:%S')
        city_lat = city_weather['coord']['lat']
        city_lng = city_weather['coord']['lon']
        city_max_temp = city_weather['main']['temp_max']
        city_hum = city_weather['main']['humidity']
        city_cloud = city_weather['clouds']['all']
        city_wind = city_weather['wind']['speed']

        # Fill City Data list 
        city_data.append({"City": city_city,
                         "Country": city_country,
                         "Date": city_date,
                         "Lat": city_lat,
                         "Lng": city_lng,
                         "Max Temp": city_max_temp,
                         "Humidity": city_hum,
                         "Cloudiness": city_cloud,
                         "Wind Speed": city_wind,
                         })
    #If an error occurs
    except: 
        print("City not found. Skipping")
        pass

    # Complete Data Retrieval    
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Processing Record 1 of Set 1 | jamestown
Processing Record 2 of Set 1 | illoqqortoormiut
City not found. Skipping
Processing Record 3 of Set 1 | avera
Processing Record 4 of Set 1 | punta arenas
Processing Record 5 of Set 1 | dingras
Processing Record 6 of Set 1 | pisco
Processing Record 7 of Set 1 | georgetown
Processing Record 8 of Set 1 | saldanha
Processing Record 9 of Set 1 | lebu
Processing Record 10 of Set 1 | saint-philippe
Processing Record 11 of Set 1 | codrington
Processing Record 12 of Set 1 | waiuku
Processing Record 13 of Set 1 | arona
Processing Record 14 of Set 1 | port hardy
Processing Record 15 of Set 1 | alamor
Processing Record 16 of Set 1 | rikitea
Processing Record 17 of Set 1 | tabuk
Processing Record 18 of Set 1 | roald
Processing Record 19 of Set 1 | ushuaia
Processing Record 20 of Set 1 | airai
Processing Record 21 of Set 1 | roanoke rapids
Processing Record 22 of Set 1 | bredasdorp
Processing Record 23 of Set 1 | mar del plata
Processing Record 24 of Set 1 | 

Processing Record 40 of Set 4 | kavieng
Processing Record 41 of Set 4 | zhigansk
Processing Record 42 of Set 4 | hobart
Processing Record 43 of Set 4 | opobo
City not found. Skipping
Processing Record 44 of Set 4 | chachapoyas
Processing Record 45 of Set 4 | katsuura
Processing Record 46 of Set 4 | laguna
Processing Record 47 of Set 4 | sompeta
Processing Record 48 of Set 4 | ponta do sol
Processing Record 49 of Set 4 | juneau
Processing Record 50 of Set 4 | grand river south east
City not found. Skipping
Processing Record 1 of Set 5 | bathsheba
Processing Record 2 of Set 5 | hermanus
Processing Record 3 of Set 5 | kondoa
Processing Record 4 of Set 5 | fairbanks
Processing Record 5 of Set 5 | ashington
Processing Record 6 of Set 5 | vastervik
City not found. Skipping
Processing Record 7 of Set 5 | dingle
Processing Record 8 of Set 5 | amderma
City not found. Skipping
Processing Record 9 of Set 5 | bonavista
Processing Record 10 of Set 5 | atuona
Processing Record 11 of Set 5 | chuy
Pro

Processing Record 30 of Set 8 | santa rosalia
Processing Record 31 of Set 8 | tigil
Processing Record 32 of Set 8 | sokoni
Processing Record 33 of Set 8 | nicoya
Processing Record 34 of Set 8 | ucluelet
Processing Record 35 of Set 8 | bay roberts
Processing Record 36 of Set 8 | ekhabi
Processing Record 37 of Set 8 | talnakh
Processing Record 38 of Set 8 | olinda
Processing Record 39 of Set 8 | along
Processing Record 40 of Set 8 | sonari
Processing Record 41 of Set 8 | kiama
Processing Record 42 of Set 8 | tuggurt
City not found. Skipping
Processing Record 43 of Set 8 | cabedelo
Processing Record 44 of Set 8 | oranjestad
Processing Record 45 of Set 8 | kamskiye polyany
Processing Record 46 of Set 8 | camopi
Processing Record 47 of Set 8 | bam
Processing Record 48 of Set 8 | cururupu
Processing Record 49 of Set 8 | jalostotitlan
Processing Record 50 of Set 8 | honningsvag
Processing Record 1 of Set 9 | kodiak
Processing Record 2 of Set 9 | bandarbeyla
Processing Record 3 of Set 9 | gouy

Processing Record 19 of Set 12 | hue
Processing Record 20 of Set 12 | springbok
Processing Record 21 of Set 12 | bubaque
Processing Record 22 of Set 12 | haibowan
City not found. Skipping
Processing Record 23 of Set 12 | kargopol
Processing Record 24 of Set 12 | bahia blanca
Processing Record 25 of Set 12 | yumen
Processing Record 26 of Set 12 | sept-iles
Processing Record 27 of Set 12 | sangar
Processing Record 28 of Set 12 | maloshuyka
City not found. Skipping
Processing Record 29 of Set 12 | pipri
Processing Record 30 of Set 12 | ngukurr
City not found. Skipping
Processing Record 31 of Set 12 | itupiranga
Processing Record 32 of Set 12 | goderich
Processing Record 33 of Set 12 | mezen
Processing Record 34 of Set 12 | chifeng
Processing Record 35 of Set 12 | mayor pablo lagerenza
Processing Record 36 of Set 12 | umm lajj
Processing Record 37 of Set 12 | half moon bay
Processing Record 38 of Set 12 | marzuq
Processing Record 39 of Set 12 | vao
Processing Record 40 of Set 12 | ouidah
P

In [8]:
# Convert the array of dictionaries to a Pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Jamestown,US,2022-04-18 18:39:07,42.097,-79.2353,36.52,65,100,17.27
1,Avera,US,2022-04-18 18:41:38,33.194,-82.5271,67.51,71,63,9.37
2,Punta Arenas,CL,2022-04-18 18:41:39,-53.15,-70.9167,51.91,62,75,10.36
3,Dingras,PH,2022-04-18 18:41:39,18.1032,120.6967,76.75,83,20,3.44
4,Pisco,PE,2022-04-18 18:41:40,-13.7,-76.2167,68.05,73,0,9.22
5,Georgetown,MY,2022-04-18 18:37:25,5.4112,100.3354,80.53,93,20,3.44
6,Saldanha,ZA,2022-04-18 18:37:01,-33.0117,17.9442,64.45,78,0,9.82
7,Lebu,CL,2022-04-18 18:41:41,-37.6167,-73.65,58.08,85,100,6.22
8,Saint-Philippe,RE,2022-04-18 18:41:41,-21.3585,55.7679,77.22,88,22,11.18
9,Codrington,AU,2022-04-18 18:41:42,-38.2667,141.9667,55.74,82,100,9.66
