# Deliverable 1. Retrieve Weather Data.
---
1. Create a folder called `Weather_Database` to save all the files related to this deliverable.

2. Save the `Weather_Database_starter_code.ipynb` starter code to the `Weather_Database` folder and rename it as `Weather_Database.ipynb`.

3. Use the `np.random.uniform` function to generate a new set of 2,000 random latitudes and 2,000 longitudes.

4. Use the `citipy` module to get the nearest city for each latitude and longitude combination.

5. Import your OpenWeatherMap API key and assemble the API call URL as a string variable. Remember to edit the `config.py` file to add your API key; it is also critical to avoid publishing your API key to your GitHub repository.

6. Retrieve the following information from the API call:

    * Latitude and longitude

    * Maximum temperature

    * Percent humidity

    * Percent cloudiness

    * Wind speed

    * Weather description (for example, clouds, fog, light rain, clear sky)

7. Add the weather data to a new DataFrame.

8. Export the DataFrame as a CSV file, and save it as `WeatherPy_Database.csv` in the `Weather_Database` folder.
---

In [60]:
# Import initial libraries
import numpy as np
import pandas as pd
from citipy import citipy

## Use the `np.random.uniform` function to generate a new set of 2,000 random latitudes and 2,000 longitudes.

In [61]:
# Draw 2,000 random latitudes from [-90, 90) and 2,000 random longitudes from [-180, 180)
lats = np.random.uniform(low=-90.000, high=90.000, size=2000)
lngs = np.random.uniform(low=-180.000, high=180.000, size=2000)

# Use the zip function to create an iterator of (latitude, longitude) tuples.
# A zip object can be consumed only once, so it is created exactly once here.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x1ba344e0dc8>

In [62]:
# Materialize the zip iterator into a list of (latitude, longitude) tuples
coordinates = [*lat_lngs]

## Use the `citipy` module to get the nearest city for each latitude and longitude combination.

In [63]:
# Identify the nearest city for each latitude and longitude combination using the citipy module.
# dict.fromkeys keeps only the first occurrence of each city name and preserves the
# order in which cities were encountered, without rescanning a list for every coordinate.
cities = list(dict.fromkeys(
    citipy.nearest_city(lat, lng).city_name for lat, lng in coordinates
))

# Print the unique cities and display the city count to confirm sufficient count
print(cities)
len(cities)

['ushuaia', 'sentyabrskiy', 'barrow', 'mataura', 'clyde river', 'kaitangata', 'marsa matruh', 'taolanaro', 'kavaratti', 'mount isa', 'punta arenas', 'lorengau', 'sangar', 'pochutla', 'little current', 'nikolskoye', 'bluff', 'bathsheba', 'port alfred', 'mamallapuram', 'lasa', 'margate', 'atuona', 'hobart', 'nanortalik', 'xuanwu', 'jinchengjiang', 'meulaboh', 'hilo', 'teya', 'orgun', 'tsihombe', 'faanui', 'busselton', 'puerto ayora', 'nanchang', 'viedma', 'mahebourg', 'kapaa', 'tuktoyaktuk', 'vidalia', 'okha', 'severo-kurilsk', 'hermanus', 'saint george', 'katobu', 'ambilobe', 'yuncheng', 'paramonga', 'hithadhoo', 'lagoa', 'te anau', 'buala', 'qaanaaq', 'port elizabeth', 'khonuu', 'khatanga', 'barentsburg', 'albany', 'churapcha', 'kalmunai', 'ulaanbaatar', 'bredasdorp', 'polewali', 'rikitea', 'kiruna', 'micheweni', 'ribeira grande', 'cape town', 'dikson', 'mutoko', 'vaini', 'port-gentil', 'bethel', 'lompoc', 'klaksvik', 'butaritari', 'georgetown', 'lavrentiya', 'adrar', 'hambantota', 'so

721

## Import your OpenWeatherMap API key and assemble the API call URL as a string variable. Remember to edit the `config.py` file to add your API key.

In [64]:
# Import the requests library
import requests

# Import the time library
import time

# Import the datetime module from the datetime library
from datetime import datetime

# Import the OpenWeatherMap's API key
from config import weather_api_key

In [65]:
# Assemble the OpenWeatherMap's API call.
# HTTPS is used because the API key travels in the query string and would
# otherwise be sent in clear text. Units are Imperial.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

## Retrieve the following information from the API call.

- The latitude and longitude
- The Max temperature
- The % humidity
- The % cloudiness
- The Wind speed
- The Weather description, i.e., cloudy, fog, light rain, clear sky, etc. 

In [66]:
# Create an empty list to hold weather data for each city
city_data = []

# Maximum number of seconds to wait for a single API response, so that one
# stalled connection cannot hang the whole retrieval loop
REQUEST_TIMEOUT_SECONDS = 10

# Print a message to indicate that the data retrieval starts
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters and set them to 1
record_count = 1
set_count = 1

# Loop through all the cities in our list to fetch weather data for each city
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes; pause one second between sets
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        time.sleep(1)

    # Create an endpoint URL for each city
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the record and set numbers together with the city name
    print(f"Processing Record {record_count} of Set {set_count} | {city}")

    # Add 1 to the record count
    record_count += 1

    # Run an API request for each of the cities
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url, timeout=REQUEST_TIMEOUT_SECONDS).json()
        # Parse out the needed data.
        data = city_weather["weather"]
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_description = data[0]["description"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Description": city_description,
                          "Country": city_country,
                          "Date": city_date})

    # If the request fails or the response lacks an expected field, skip the city.
    # Only request/parsing errors are caught, so KeyboardInterrupt still stops the loop.
    except (requests.exceptions.RequestException, KeyError, IndexError, TypeError, ValueError):
        print("City not found. Skipping...")

# Indicate that the data retrieval is complete 
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | ushuaia
Processing Record 2 of Set 1 | sentyabrskiy
City not found. Skipping...
Processing Record 3 of Set 1 | barrow
Processing Record 4 of Set 1 | mataura
Processing Record 5 of Set 1 | clyde river
Processing Record 6 of Set 1 | kaitangata
Processing Record 7 of Set 1 | marsa matruh
Processing Record 8 of Set 1 | taolanaro
City not found. Skipping...
Processing Record 9 of Set 1 | kavaratti
Processing Record 10 of Set 1 | mount isa
Processing Record 11 of Set 1 | punta arenas
Processing Record 12 of Set 1 | lorengau
Processing Record 13 of Set 1 | sangar
Processing Record 14 of Set 1 | pochutla
Processing Record 15 of Set 1 | little current
Processing Record 16 of Set 1 | nikolskoye
Processing Record 17 of Set 1 | bluff
Processing Record 18 of Set 1 | bathsheba
Processing Record 19 of Set 1 | port alfred
Processing Record 20 of Set 1 | mamallapuram
Processing Record 21 of Set 1 | lasa
Processin

In [71]:
# Display the length of the city_data list to verify how many cities were retrieved
# (cities that were skipped during retrieval are not in the list)
len(city_data)

657

## Add the weather data to a new DataFrame.

In [82]:
# Build a new pandas DataFrame with one row per dictionary in city_data
city_data_df = pd.DataFrame(data=city_data)




In [83]:
# Display the first 10 rows as sample data
city_data_df.head(10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Description,Country,Date
0,Ushuaia,-54.8,-68.3,62.26,36,40,9.22,scattered clouds,AR,2023-01-07 19:25:23
1,Barrow,71.2906,-156.7887,-11.18,77,0,13.8,mist,US,2023-01-07 19:30:25
2,Mataura,-46.1927,168.8643,55.33,61,1,4.56,clear sky,NZ,2023-01-07 19:30:20
3,Clyde River,70.4692,-68.5914,-28.97,75,0,3.44,clear sky,CA,2023-01-07 19:30:42
4,Kaitangata,-46.2817,169.8464,55.56,68,0,8.81,clear sky,NZ,2023-01-07 19:31:53
5,Marsa Matruh,31.3525,27.2453,59.2,77,40,6.91,light rain,EG,2023-01-07 19:33:03
6,Kavaratti,10.5669,72.642,81.14,64,5,7.11,clear sky,IN,2023-01-07 19:33:46
7,Mount Isa,-20.7333,139.5,73.17,100,100,5.75,light intensity shower rain,AU,2023-01-07 19:31:06
8,Punta Arenas,-53.15,-70.9167,66.31,30,20,23.02,few clouds,CL,2023-01-07 19:30:08
9,Lorengau,-2.0226,147.2712,80.56,78,99,3.91,overcast clouds,PG,2023-01-07 19:31:12


In [84]:
# Display the DataFrame's column names using the pandas `columns` attribute
city_data_df.columns

Index(['City', 'Lat', 'Lng', 'Max Temp', 'Humidity', 'Cloudiness',
       'Wind Speed', 'Description', 'Country', 'Date'],
      dtype='object')

In [85]:
# Display the data type of each column using the pandas `dtypes` attribute
city_data_df.dtypes

City            object
Lat            float64
Lng            float64
Max Temp       float64
Humidity         int64
Cloudiness       int64
Wind Speed     float64
Description     object
Country         object
Date            object
dtype: object

In [86]:
# Create a list to reorder the column names as follows:
# "City", "Country", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed", "Description", "Date"
new_column_order = ["City", "Country", "Lat", "Lng", "Max Temp", "Humidity", "Cloudiness", "Wind Speed", "Description", "Date"]

# Recreate the DataFrame by using the new column order
city_data_df = city_data_df[new_column_order]

# Display sample data
city_data_df.head(10)

Unnamed: 0,City,Country,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Description,Date
0,Ushuaia,AR,-54.8,-68.3,62.26,36,40,9.22,scattered clouds,2023-01-07 19:25:23
1,Barrow,US,71.2906,-156.7887,-11.18,77,0,13.8,mist,2023-01-07 19:30:25
2,Mataura,NZ,-46.1927,168.8643,55.33,61,1,4.56,clear sky,2023-01-07 19:30:20
3,Clyde River,CA,70.4692,-68.5914,-28.97,75,0,3.44,clear sky,2023-01-07 19:30:42
4,Kaitangata,NZ,-46.2817,169.8464,55.56,68,0,8.81,clear sky,2023-01-07 19:31:53
5,Marsa Matruh,EG,31.3525,27.2453,59.2,77,40,6.91,light rain,2023-01-07 19:33:03
6,Kavaratti,IN,10.5669,72.642,81.14,64,5,7.11,clear sky,2023-01-07 19:33:46
7,Mount Isa,AU,-20.7333,139.5,73.17,100,100,5.75,light intensity shower rain,2023-01-07 19:31:06
8,Punta Arenas,CL,-53.15,-70.9167,66.31,30,20,23.02,few clouds,2023-01-07 19:30:08
9,Lorengau,PG,-2.0226,147.2712,80.56,78,99,3.91,overcast clouds,2023-01-07 19:31:12


In [87]:
# Display the data type of each column by using the pandas `dtypes` attribute
city_data_df.dtypes


City            object
Country         object
Lat            float64
Lng            float64
Max Temp       float64
Humidity         int64
Cloudiness       int64
Wind Speed     float64
Description     object
Date            object
dtype: object

## Export the DataFrame as a CSV file, and save it as `WeatherPy_Database.csv` in the `Weather_Database` folder.

In [91]:
# Local import keeps this cell runnable on its own
from pathlib import Path

# Set the output file name
# NOTE(review): the deliverable text asks for the CSV in the `Weather_Database` folder,
# but this path writes under `weather_data/` - confirm the intended location.
output_data_file = "weather_data/WeatherPy_Database.csv"

# Create the destination folder if it does not exist yet; to_csv does not create it
Path(output_data_file).parent.mkdir(parents=True, exist_ok=True)

# Export the City_Data into a CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")