In [None]:
# Dependencies
# Standard library
import os
import random
import time
from datetime import datetime

# Third-party
import gmaps
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import requests
from citipy import citipy
from scipy.stats import linregress

# Local configuration (API keys)
from config import g_key
from config import weather_api_key

In [2]:
# Accumulator for the per-city weather records (one dictionary per city)
city_data = []

# Print the beginning of the logging
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Counters used to label each logged request as "Record N of Set M"
record_count = 1
set_count = 1

# Base URL for the OpenWeatherMap current-weather endpoint (imperial units).
# HTTPS is used so the API key carried in the query string is not sent in
# clear text over the network.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

Beginning Data Retrieval     
-----------------------------


In [3]:
# Draw 2000 random latitudes and 2000 random longitudes
latitudes = np.random.uniform(low=-90, high=90, size=2000)
longitudes = np.random.uniform(low=-180, high=180, size=2000)

# Pair them element-wise and materialize the (lat, lng) pairs as a list
coordinates = zip(latitudes, longitudes)
coordinates_lst = list(coordinates)

In [4]:
# Use citipy to find the nearest city for every coordinate pair and keep each
# city name only once.  dict.fromkeys de-duplicates with constant-time lookups
# while preserving first-seen order, so `cities` has the same contents and
# order as an "append if not already in the list" loop.
# Note: names are compared without the country code, so same-named cities in
# different countries collapse into a single entry.
cities = list(
    dict.fromkeys(
        citipy.nearest_city(lat, lng).city_name
        for lat, lng in coordinates_lst
    )
)

# Count amount of unique cities
len(cities)

730

In [5]:
# Per-request timeout (seconds) so a stalled connection cannot hang the run
REQUEST_TIMEOUT = 10

# Start from a clean slate so that re-running this cell does not append
# duplicate records or continue the numbering of a previous run
city_data = []
record_count = 1
set_count = 1

# Loop through the list of cities
for i, city in enumerate(cities):

    # Group cities in sets of 50
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1

    # Log set and record numbers for each city
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    record_count += 1

    # Make an API request for each city
    try:
        # Pass the city through `params` so requests URL-encodes it (spaces and
        # any other reserved characters) and appends it to the base URL's
        # existing query string, then parse the JSON body
        city_weather = requests.get(
            url, params={"q": city}, timeout=REQUEST_TIMEOUT
        ).json()

        # Compile needed data; a missing key here means the response was not a
        # regular weather payload and the city is skipped below
        city_city = city.title()
        city_country = city_weather['sys']['country']
        # 'dt' is converted from a Unix timestamp to a UTC date-time string
        city_date = datetime.utcfromtimestamp(city_weather['dt']).strftime('%Y-%m-%d %H:%M:%S')
        city_lat = city_weather['coord']['lat']
        city_lng = city_weather['coord']['lon']
        city_max_temp = city_weather['main']['temp_max']
        city_hum = city_weather['main']['humidity']
        city_cloud = city_weather['clouds']['all']
        city_wind = city_weather['wind']['speed']
        city_desc = city_weather['weather'][0]['description']

        # Fill City Data list
        city_data.append({"City": city_city,
                          "Country": city_country,
                          "Date": city_date,
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_hum,
                          "Cloudiness": city_cloud,
                          "Wind Speed": city_wind,
                          "Current Description": city_desc,
                          })

    # Skip the city on network failures, non-JSON bodies, or payloads missing
    # the expected fields.  Only these expected failures are caught so that
    # Ctrl-C (KeyboardInterrupt) and genuine programming errors still surface.
    except (requests.exceptions.RequestException,
            KeyError, IndexError, TypeError, ValueError):
        print("City not found. Skipping")

# Complete Data Retrieval
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Processing Record 1 of Set 1 | aklavik
Processing Record 2 of Set 1 | rikitea
Processing Record 3 of Set 1 | presque isle
Processing Record 4 of Set 1 | jamestown
Processing Record 5 of Set 1 | manaus
Processing Record 6 of Set 1 | vaini
Processing Record 7 of Set 1 | bluff
Processing Record 8 of Set 1 | carnarvon
Processing Record 9 of Set 1 | lolua
City not found. Skipping
Processing Record 10 of Set 1 | kashin
Processing Record 11 of Set 1 | kruisfontein
Processing Record 12 of Set 1 | lebu
Processing Record 13 of Set 1 | qui nhon
Processing Record 14 of Set 1 | chokurdakh
Processing Record 15 of Set 1 | margate
Processing Record 16 of Set 1 | mys shmidta
City not found. Skipping
Processing Record 17 of Set 1 | hermanus
Processing Record 18 of Set 1 | codrington
Processing Record 19 of Set 1 | bambous virieux
Processing Record 20 of Set 1 | albany
Processing Record 21 of Set 1 | amderma
City not found. Skipping
Processing Record 22 of Set 1 | longyearbyen
Processing Record 23 of Set

Processing Record 40 of Set 4 | monteagudo
Processing Record 41 of Set 4 | talcahuano
Processing Record 42 of Set 4 | kupang
Processing Record 43 of Set 4 | saint-philippe
Processing Record 44 of Set 4 | buraydah
Processing Record 45 of Set 4 | viedma
Processing Record 46 of Set 4 | hammerfest
Processing Record 47 of Set 4 | elesbao veloso
Processing Record 48 of Set 4 | bogorodskoye
Processing Record 49 of Set 4 | nizhneyansk
City not found. Skipping
Processing Record 50 of Set 4 | conde
Processing Record 1 of Set 5 | farah
Processing Record 2 of Set 5 | ca mau
Processing Record 3 of Set 5 | beira
Processing Record 4 of Set 5 | riaba
City not found. Skipping
Processing Record 5 of Set 5 | hofn
Processing Record 6 of Set 5 | kaoma
Processing Record 7 of Set 5 | pokhara
Processing Record 8 of Set 5 | urengoy
Processing Record 9 of Set 5 | palabuhanratu
City not found. Skipping
Processing Record 10 of Set 5 | pevek
Processing Record 11 of Set 5 | deputatskiy
Processing Record 12 of Set 5

Processing Record 31 of Set 8 | matamoros
Processing Record 32 of Set 8 | mayo
Processing Record 33 of Set 8 | toguchin
Processing Record 34 of Set 8 | chicama
Processing Record 35 of Set 8 | mitu
Processing Record 36 of Set 8 | nakhon phanom
Processing Record 37 of Set 8 | antofagasta
Processing Record 38 of Set 8 | marrakesh
Processing Record 39 of Set 8 | haines junction
Processing Record 40 of Set 8 | esperance
Processing Record 41 of Set 8 | charleston
Processing Record 42 of Set 8 | turukhansk
Processing Record 43 of Set 8 | ha giang
Processing Record 44 of Set 8 | mapiripan
Processing Record 45 of Set 8 | chimbote
Processing Record 46 of Set 8 | panguna
Processing Record 47 of Set 8 | itoman
Processing Record 48 of Set 8 | honningsvag
Processing Record 49 of Set 8 | faanui
Processing Record 50 of Set 8 | bathsheba
Processing Record 1 of Set 9 | panaba
Processing Record 2 of Set 9 | mount holly
Processing Record 3 of Set 9 | chirongui
Processing Record 4 of Set 9 | fuyu
Processin

Processing Record 21 of Set 12 | dubno
Processing Record 22 of Set 12 | weinan
Processing Record 23 of Set 12 | gao
Processing Record 24 of Set 12 | meulaboh
Processing Record 25 of Set 12 | dinar
Processing Record 26 of Set 12 | acarau
Processing Record 27 of Set 12 | angoche
Processing Record 28 of Set 12 | lac du bonnet
Processing Record 29 of Set 12 | sao gabriel da cachoeira
Processing Record 30 of Set 12 | pachino
Processing Record 31 of Set 12 | imuris
Processing Record 32 of Set 12 | lakefield
Processing Record 33 of Set 12 | bac lieu
Processing Record 34 of Set 12 | puerto vallarta
Processing Record 35 of Set 12 | new castle
Processing Record 36 of Set 12 | bismil
Processing Record 37 of Set 12 | ystad
Processing Record 38 of Set 12 | yanchukan
City not found. Skipping
Processing Record 39 of Set 12 | ayan
Processing Record 40 of Set 12 | nishihara
Processing Record 41 of Set 12 | hay river
Processing Record 42 of Set 12 | khartoum
Processing Record 43 of Set 12 | soe
Processi

In [6]:
# Tally the number of cities whose weather data was collected
# (city_data is a list holding one dictionary per city)
len(city_data)

674

In [7]:
# Turn the list of per-city dictionaries into a DataFrame
city_data_df = pd.DataFrame(data=city_data)

# Preview the first 10 rows
city_data_df.head(n=10)

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Current Description
0,Aklavik,CA,2022-04-10 13:43:47,68.2191,-135.0107,-17.12,98,85,2.33,overcast clouds
1,Rikitea,PF,2022-04-10 13:39:28,-23.1203,-134.9692,78.62,73,1,15.68,clear sky
2,Presque Isle,US,2022-04-10 13:43:47,46.6811,-68.0159,41.18,100,100,0.0,mist
3,Jamestown,US,2022-04-10 13:43:47,42.097,-79.2353,35.19,52,100,14.97,overcast clouds
4,Manaus,BR,2022-04-10 13:43:48,-3.1019,-60.025,82.89,78,40,2.3,scattered clouds
5,Vaini,TO,2022-04-10 13:41:10,-21.2,-175.2,77.16,94,40,5.75,scattered clouds
6,Bluff,NZ,2022-04-10 13:40:59,-46.6,168.3333,49.21,88,31,8.12,scattered clouds
7,Carnarvon,AU,2022-04-10 13:43:48,-24.8667,113.6333,71.67,68,0,17.27,clear sky
8,Kashin,RU,2022-04-10 13:43:49,57.3592,37.6081,49.93,58,100,6.42,overcast clouds
9,Kruisfontein,ZA,2022-04-10 13:43:49,-34.0033,24.7314,67.89,74,95,17.83,light rain


In [9]:
# Destination of the exported weather data
csv_weather_file = "weather_database/weather_database.csv"

# Make sure the output folder exists first: to_csv does not create missing
# parent directories and would fail on a fresh checkout
os.makedirs(os.path.dirname(csv_weather_file), exist_ok=True)

# Export the DataFrame to CSV, labelling the index column "City_ID"
city_data_df.to_csv(csv_weather_file, index_label="City_ID")