# Deliverable 1. Retrieve Weather Data.
---
1. Create a folder called `Weather_Database` to save all the files related with this deliverable.

2. Save the `Weather_Database_starter_code.ipynb` starter code to the `Weather_Database` folder and rename it as `Weather_Database.ipynb`.

3. Use the `np.random.uniform` function to generate a new set of 2,000 random latitudes and 2,000 longitudes.

4. Use the `citipy` module to get the nearest city for each latitude and longitude combination.

5. Import your OpenWeatherMap's API key and assemble the API call URL as a string variable. Recall to edit the `config.py` file to add your API key; also, it's critical to avoid publishing your API key on your GitHub repository.

6. Retrieve the following information from the API call:

    * Latitude and longitude

    * Maximum temperature

    * Percent humidity

    * Percent cloudiness

    * Wind speed

    * Weather description (for example, clouds, fog, light rain, clear sky)

7. Add the weather data to a new DataFrame.

8. Export the DataFrame as a CSV file, and save it as `WeatherPy_Database.csv` in the `Weather_Database` folder.
---

In [6]:
# Import initial libraries
import numpy as np
import pandas as pd
from citipy import citipy
import matplotlib.pyplot as plt

## Use the `np.random.uniform` function to generate a new set of 2,000 random latitudes and 2,000 longitudes.

In [7]:
# Create a set of random latitude and longitude combinations
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)

# Use the zip function to create an iterator of tuples containing the latitude and longitude combinations
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x22ccce49608>

In [8]:
# Add the latitudes and longitudes to a list
coordinates = list(lat_lngs)


## Use the `citipy` module to get the nearest city for each latitude and longitude combination.

In [9]:
# Create an empty list for holding the cities
cities = []

# Use a for loop to identify nearest city for each latitude and longitude combination using the citipy module
for coordinate in coordinates:
    # Use the citipy module to identify the nearest city to the current coordinate
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name
    
# If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
print(cities)

['samusu', 'kapaa', 'bluff', 'severo-yeniseyskiy', 'totskoye', 'chokurdakh', 'vaini', 'georgetown', 'surt', 'yuancheng', 'port macquarie', 'saint-francois', 'hermanus', 'ushuaia', 'cape town', 'illoqqortoormiut', 'jamestown', 'taolanaro', 'puerto ayora', 'sandwick', 'poum', 'naryan-mar', 'new norfolk', 'alakurtti', 'port blair', 'sribne', 'paamiut', 'amderma', 'port hueneme', 'sedelnikovo', 'utiroa', 'songjianghe', 'mahebourg', 'kahului', 'mataura', 'hihifo', 'airai', 'sena madureira', 'great falls', 'maralal', 'wanlaweyn', 'butaritari', 'hithadhoo', 'rongcheng', 'souillac', 'clyde river', 'lar', 'carnarvon', 'geraldton', 'longyearbyen', 'tsabong', 'lawrence', 'punta arenas', 'daxian', 'rikitea', 'bredasdorp', 'goderich', 'shieli', 'ribeira grande', 'kununurra', 'kropotkin', 'prince rupert', 'port elizabeth', 'novo aripuana', 'khatanga', 'palma', 'albany', 'bambous virieux', 'thompson', 'hilo', 'ye', 'college', 'kaka', 'westport', 'tulun', 'garowe', 'provideniya', 'harlingen', 'fuyu', 

## Import your OpenWeatherMap's API key and assemble the API call URL as a string variable. Recall to edit the `config.py` file to add your API key.

In [11]:
# Import the requests library
import requests

# Import the time library
import time

# Import the datetime module from the datetime library
from datetime import datetime

# Import the OpenWeatherMap's API key
from config import weather_api_key

In [12]:
# Assemble the OpenWeatherMap's API call
url = "http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key
print(url)

http://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=dfa734f566cafc5b29c79bc46a224cda


## Retrieve the following information from the API call.

- The latitude and longitude
- The Max temperature
- The % humidity
- The % cloudiness
- The Wind speed
- The Weather description, i.e., cloudy, fog, light rain, clear sky, etc. 

In [14]:
# Create an empty list to hold weather data for each city
city_data = []

# Print a message to indicate that the data retrieval starts
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters and set them to 1
record_count = 1
set_count = 1

# Loop through all the cities in our list to fetch weather data for each city
for i, city in enumerate(cities):
        
    # Group cities in sets of 50 for logging purposes
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        time.sleep(60)

    # Create an endpoint URL for each city
    city_url = url + "&q=" + city.replace(" ","+")
    
    # Log the url, record, and set numbers
    print(f"Processing Record {record_count} of Set {set_count} | {city}")

    # Add 1 to the record count
    record_count += 1

    # Run an API request for each of the cities
    try:
            city_weather = requests.get(city_url).json()
            # Parse out the needed data.
            city_lat = city_weather["coord"]["lat"]
            city_lng = city_weather["coord"]["lon"]
            city_max_temp = city_weather["main"]["temp_max"]
            city_humidity = city_weather["main"]["humidity"]
            city_clouds = city_weather["clouds"]["all"]
            city_wind = city_weather["wind"]["speed"]
            city_country = city_weather["sys"]["country"]
            city_weather_description = city_weather['weather'][0]['description']
            # Convert the date to ISO standard.
            city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
            # Append the city information into city_data list.
            city_data.append({"City": city.title(),
                              "Lat": city_lat,
                              "Lng": city_lng,
                              "Max Temp": city_max_temp,
                              "Humidity": city_humidity,
                              "Cloudiness": city_clouds,
                              "Wind Speed": city_wind,
                              "Country": city_country,
                              "Date": city_date,
                              "Current Description": city_weather_description})
    # If an error is experienced, skip the city
    except:
        print("City not found. Skipping...")
        pass

# Indicate that the data retrieval is complete 
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | samusu
City not found. Skipping...
Processing Record 2 of Set 1 | kapaa
Processing Record 3 of Set 1 | bluff
Processing Record 4 of Set 1 | severo-yeniseyskiy
Processing Record 5 of Set 1 | totskoye
Processing Record 6 of Set 1 | chokurdakh
Processing Record 7 of Set 1 | vaini
Processing Record 8 of Set 1 | georgetown
Processing Record 9 of Set 1 | surt
Processing Record 10 of Set 1 | yuancheng
Processing Record 11 of Set 1 | port macquarie
Processing Record 12 of Set 1 | saint-francois
Processing Record 13 of Set 1 | hermanus
Processing Record 14 of Set 1 | ushuaia
Processing Record 15 of Set 1 | cape town
Processing Record 16 of Set 1 | illoqqortoormiut
City not found. Skipping...
Processing Record 17 of Set 1 | jamestown
Processing Record 18 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 19 of Set 1 | puerto ayora
Processing Record 20 of Set 1 | sandwick
Processing Record 2

Processing Record 37 of Set 4 | sibolga
Processing Record 38 of Set 4 | marica
Processing Record 39 of Set 4 | hobart
Processing Record 40 of Set 4 | esso
Processing Record 41 of Set 4 | cabo san lucas
Processing Record 42 of Set 4 | umea
Processing Record 43 of Set 4 | ilka
City not found. Skipping...
Processing Record 44 of Set 4 | bitam
Processing Record 45 of Set 4 | belushya guba
City not found. Skipping...
Processing Record 46 of Set 4 | terrace
Processing Record 47 of Set 4 | barroualie
City not found. Skipping...
Processing Record 48 of Set 4 | svetlyy
Processing Record 49 of Set 4 | jinchang
Processing Record 50 of Set 4 | talnakh
Processing Record 1 of Set 5 | tuktoyaktuk
Processing Record 2 of Set 5 | coronel oviedo
Processing Record 3 of Set 5 | dhidhdhoo
Processing Record 4 of Set 5 | esperance
Processing Record 5 of Set 5 | henties bay
Processing Record 6 of Set 5 | smithers
Processing Record 7 of Set 5 | faya
Processing Record 8 of Set 5 | agadez
Processing Record 9 of S

Processing Record 26 of Set 8 | alugan
Processing Record 27 of Set 8 | batticaloa
Processing Record 28 of Set 8 | otjimbingwe
Processing Record 29 of Set 8 | teguise
Processing Record 30 of Set 8 | roma
Processing Record 31 of Set 8 | maraa
Processing Record 32 of Set 8 | ozernovskiy
Processing Record 33 of Set 8 | isangel
Processing Record 34 of Set 8 | aklavik
Processing Record 35 of Set 8 | teknaf
Processing Record 36 of Set 8 | srednekolymsk
Processing Record 37 of Set 8 | norman wells
Processing Record 38 of Set 8 | ginda
Processing Record 39 of Set 8 | broadstairs
Processing Record 40 of Set 8 | bilibino
Processing Record 41 of Set 8 | invermere
Processing Record 42 of Set 8 | ilulissat
Processing Record 43 of Set 8 | bulalacao
Processing Record 44 of Set 8 | pevek
Processing Record 45 of Set 8 | uyuni
Processing Record 46 of Set 8 | khor
Processing Record 47 of Set 8 | bermejo
Processing Record 48 of Set 8 | celestun
Processing Record 49 of Set 8 | quatre cocos
Processing Record

Processing Record 12 of Set 12 | bolsheustikinskoye
City not found. Skipping...
Processing Record 13 of Set 12 | axim
Processing Record 14 of Set 12 | malanje
Processing Record 15 of Set 12 | galiwinku
City not found. Skipping...
Processing Record 16 of Set 12 | camocim
Processing Record 17 of Set 12 | coquimbo
Processing Record 18 of Set 12 | santa marta
Processing Record 19 of Set 12 | marcona
City not found. Skipping...
Processing Record 20 of Set 12 | livingstone
Processing Record 21 of Set 12 | kokopo
Processing Record 22 of Set 12 | klaksvik
Processing Record 23 of Set 12 | yialos
City not found. Skipping...
Processing Record 24 of Set 12 | kieta
Processing Record 25 of Set 12 | muzhi
Processing Record 26 of Set 12 | lengshuijiang
Processing Record 27 of Set 12 | taber
Processing Record 28 of Set 12 | changping
Processing Record 29 of Set 12 | urucara
Processing Record 30 of Set 12 | vilia
Processing Record 31 of Set 12 | santa maria da vitoria
Processing Record 32 of Set 12 | ba

In [18]:
# Print the length of the city_data list to verify how many cities you have
len(city_data)

566

In [19]:
# Use the city_data list to create a new pandas DataFrame.
city_data_df = pd.DataFrame(city_data)
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date,Current Description
0,Kapaa,22.0752,-159.319,73.38,83,44,1.99,US,2022-12-20 14:58:47,scattered clouds
1,Bluff,-46.6,168.3333,48.2,76,40,11.48,NZ,2022-12-20 14:58:48,scattered clouds
2,Severo-Yeniseyskiy,60.3725,93.0408,-20.54,95,65,2.91,RU,2022-12-20 14:58:48,broken clouds
3,Totskoye,52.5248,52.7623,10.85,96,31,3.4,RU,2022-12-20 14:58:48,scattered clouds
4,Chokurdakh,70.6333,147.9167,-6.59,99,87,2.86,RU,2022-12-20 14:58:49,overcast clouds
5,Vaini,-21.2,-175.2,78.96,94,40,4.61,TO,2022-12-20 14:58:49,scattered clouds
6,Georgetown,5.4112,100.3354,82.33,85,20,5.75,MY,2022-12-20 14:56:55,few clouds
7,Surt,31.2089,16.5887,65.37,60,100,14.45,LY,2022-12-20 14:58:50,overcast clouds
8,Yuancheng,36.652,107.7896,26.01,43,1,16.55,CN,2022-12-20 14:58:50,clear sky
9,Port Macquarie,-31.4333,152.9167,57.88,83,30,7.11,AU,2022-12-20 14:58:50,scattered clouds


In [20]:
# Display sample data
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date,Current Description
0,Kapaa,22.0752,-159.319,73.38,83,44,1.99,US,2022-12-20 14:58:47,scattered clouds
1,Bluff,-46.6,168.3333,48.2,76,40,11.48,NZ,2022-12-20 14:58:48,scattered clouds
2,Severo-Yeniseyskiy,60.3725,93.0408,-20.54,95,65,2.91,RU,2022-12-20 14:58:48,broken clouds
3,Totskoye,52.5248,52.7623,10.85,96,31,3.4,RU,2022-12-20 14:58:48,scattered clouds
4,Chokurdakh,70.6333,147.9167,-6.59,99,87,2.86,RU,2022-12-20 14:58:49,overcast clouds
5,Vaini,-21.2,-175.2,78.96,94,40,4.61,TO,2022-12-20 14:58:49,scattered clouds
6,Georgetown,5.4112,100.3354,82.33,85,20,5.75,MY,2022-12-20 14:56:55,few clouds
7,Surt,31.2089,16.5887,65.37,60,100,14.45,LY,2022-12-20 14:58:50,overcast clouds
8,Yuancheng,36.652,107.7896,26.01,43,1,16.55,CN,2022-12-20 14:58:50,clear sky
9,Port Macquarie,-31.4333,152.9167,57.88,83,30,7.11,AU,2022-12-20 14:58:50,scattered clouds


In [21]:
# Display the DataFrame's column names using the columns Pandas function
city_data_df.columns

Index(['City', 'Lat', 'Lng', 'Max Temp', 'Humidity', 'Cloudiness',
       'Wind Speed', 'Country', 'Date', 'Current Description'],
      dtype='object')

In [22]:
city_data_df.count()

City                   566
Lat                    566
Lng                    566
Max Temp               566
Humidity               566
Cloudiness             566
Wind Speed             566
Country                566
Date                   566
Current Description    566
dtype: int64

In [23]:
# Create a list to reorder the column names as follows:
# "City", "Country", "Lat", "Lng", "Max Temp", "Humidity",  "Cloudiness", "Wind Speed",  "Current Description"
city_data_df = city_data_df[["City", "Country", "Lat", "Lng", "Max Temp", "Humidity",  "Cloudiness", "Wind Speed",  "Current Description"]]

# Recreate the DataFrame by using the new column order
city_data_df.count()

# Display sample data
city_data_df.head(10)

Unnamed: 0,City,Country,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Current Description
0,Kapaa,US,22.0752,-159.319,73.38,83,44,1.99,scattered clouds
1,Bluff,NZ,-46.6,168.3333,48.2,76,40,11.48,scattered clouds
2,Severo-Yeniseyskiy,RU,60.3725,93.0408,-20.54,95,65,2.91,broken clouds
3,Totskoye,RU,52.5248,52.7623,10.85,96,31,3.4,scattered clouds
4,Chokurdakh,RU,70.6333,147.9167,-6.59,99,87,2.86,overcast clouds
5,Vaini,TO,-21.2,-175.2,78.96,94,40,4.61,scattered clouds
6,Georgetown,MY,5.4112,100.3354,82.33,85,20,5.75,few clouds
7,Surt,LY,31.2089,16.5887,65.37,60,100,14.45,overcast clouds
8,Yuancheng,CN,36.652,107.7896,26.01,43,1,16.55,clear sky
9,Port Macquarie,AU,-31.4333,152.9167,57.88,83,30,7.11,scattered clouds


In [24]:
# Display the data types of each column by using the dtypes Pandas function
city_data_df.dtypes

City                    object
Country                 object
Lat                    float64
Lng                    float64
Max Temp               float64
Humidity                 int64
Cloudiness               int64
Wind Speed             float64
Current Description     object
dtype: object

## Export the DataFrame as a CSV file, and save it as `WeatherPy_Database.csv` in the `Weather_Database` folder.

In [29]:
# Set the output file name
output_data_file = "../Weather_Database/WeatherPy_Database.csv"


In [30]:
# Export the city_data DataFrame into a CSV file
city_data_df.to_csv(output_data_file, index_label="City_ID")