# Deliverable 1. Retrieve Weather Data.
---
1. Create a folder called `Weather_Database` to save all the files related with this deliverable.

2. Save the `Weather_Database_starter_code.ipynb` starter code to the `Weather_Database` folder and rename it as `Weather_Database.ipynb`.

3. Use the `np.random.uniform` function to generate a new set of 2,000 random latitudes and 2,000 longitudes.

4. Use the `citipy` module to get the nearest city for each latitude and longitude combination.

5. Import your OpenWeatherMap's API key and assemble the API call URL as a string variable. Recall to edit the `config.py` file to add your API key; also, it's critical to avoid publishing your API key on your GitHub repository.

6. Retrieve the following information from the API call:

    * Latitude and longitude

    * Maximum temperature

    * Percent humidity

    * Percent cloudiness

    * Wind speed

    * Weather description (for example, clouds, fog, light rain, clear sky)

7. Add the weather data to a new DataFrame.

8. Export the DataFrame as a CSV file, and save it as `WeatherPy_Database.csv` in the `Weather_Database` folder.
---

In [14]:
# Import initial libraries
import numpy as np
import pandas as pd
from citipy import citipy

## Use the `np.random.uniform` function to generate a new set of 2,000 random latitudes and 2,000 longitudes.

In [15]:
# Create a set of random latitude and longitude combinations
lats = np.random.uniform(-90, 90, 2000)
lngs = np.random.uniform(-180, 180, 2000)

# Use the zip function to create an iterator of tuples containing the latitude and longitude combinations
lat_lngs = zip(lats, lngs)

In [16]:
# Add the latitudes and longitudes to a list
coordinates = list(lat_lngs)

In [17]:
coordinates

[(71.28155523719133, -141.60515509844456),
 (7.574626744032329, 31.261068916119058),
 (-32.94176116127838, 150.6459026942547),
 (6.684240025600616, 76.19162681989047),
 (69.33107393755253, 136.41680481566425),
 (10.813336711310683, 86.39748055015849),
 (51.996359071125426, 34.284937618376404),
 (66.67524655624158, -24.669049138994467),
 (41.616802685703846, -146.47095108515936),
 (62.84614606929682, -81.15015380644851),
 (66.57700971474878, -20.85521609587326),
 (55.21400672643745, -121.04437543617158),
 (72.22664296137987, -65.55329937665023),
 (-50.935095913413825, -116.47458443810137),
 (-78.3193637633523, 75.92047465658169),
 (48.11995539587116, -81.94003612131698),
 (21.36148157121822, -146.9795395517306),
 (56.58823539791973, -29.312958395154993),
 (66.05202061403105, -175.81977358119417),
 (46.6839470904454, -37.646178413142565),
 (53.999338811039934, -138.96630756037155),
 (89.1793229145087, -174.87420839981948),
 (31.068347930626672, 108.94212349682198),
 (-29.01574537923139, 

## Use the `citipy` module to get the nearest city for each latitude and longitude combination.

In [18]:
# Create an empty list for holding the cities
cities = []
countries = []
city_country = []

# Use a for loop to identify nearest city for each latitude and longitude combination using the citipy module
for coordinate in coordinates:
    # Use the citipy module to identify the nearest city to the current coordinate
    city = citipy.nearest_city(coordinate[0], coordinate[1]).city_name
    country = citipy.nearest_city(coordinate[0], coordinate[1]).country_code
  
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)
        countries.append(country)
        city_country.append(f'{city},{country}')


# Print the city count to confirm sufficient count
print(len(cities))
print(len(countries))
city_country

749
749


['aklavik,ca',
 'yirol,sd',
 'singleton,au',
 'manavalakurichi,in',
 'ust-kuyga,ru',
 'batticaloa,lk',
 'sevsk,ru',
 'bolungarvik,is',
 'kodiak,us',
 'attawapiskat,ca',
 'skagastrond,is',
 'dawson creek,ca',
 'clyde river,ca',
 'rikitea,pf',
 'busselton,au',
 'timmins,ca',
 'hilo,us',
 'grindavik,is',
 'provideniya,ru',
 'ribeira grande,pt',
 'sitka,us',
 'mys shmidta,ru',
 'wanxian,cn',
 'coquimbo,cl',
 'leeds,us',
 'barrow,us',
 'evensk,ru',
 'huarmey,pe',
 'te anau,nz',
 'praia da vitoria,pt',
 'puerto el triunfo,sv',
 'ushuaia,ar',
 'kavieng,pg',
 'pevek,ru',
 'palabuhanratu,id',
 'tessalit,ml',
 'cherskiy,ru',
 'chokurdakh,ru',
 'chuy,uy',
 'ust-kulom,ru',
 'aflu,dz',
 'albany,au',
 'meadow lake,ca',
 'natal,br',
 'srednekolymsk,ru',
 'hasaki,jp',
 'cidreira,br',
 'vaini,to',
 'taolanaro,mg',
 'cochabamba,bo',
 'east london,za',
 'killybegs,ie',
 'mikhaylovskoye,ru',
 'souillac,mu',
 'isangel,vu',
 'hamilton,bm',
 'barentsburg,sj',
 'adre,td',
 'kroya,id',
 'tasiilaq,gl',
 'dikson

## Import your OpenWeatherMap's API key and assemble the API call URL as a string variable. Recall to edit the `config.py` file to add your API key.

In [19]:
# Import the requests library
import requests

# Import the time library
import time

# Import the datetime module from the datetime library
from datetime import datetime

# Import the OpenWeatherMap's API key
from config import weather_api_key

In [20]:
# Assemble the OpenWeatherMap's API call
url = f'https://api.openweathermap.org/data/2.5/weather?units=Imperial&appid={weather_api_key}'

## Retrieve the following information from the API call.

- The latitude and longitude
- The Max temperature
- The % humidity
- The % cloudiness
- The Wind speed
- The Weather description, i.e., cloudy, fog, light rain, clear sky, etc. 

In [21]:
# Create an empty list to hold weather data for each city
city_data = []

# Print a message to indicate that the data retrieval starts
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters and set them to 1
record_count = 1
set_count = 1

# Loop through all the cities in our list to fetch weather data for each city
for i, city in enumerate(city_country):
        
# Group cities in sets of 50 for logging purposes
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
        time.sleep(60)

    # Create an endpoint URL for each city
    city_url = url + "&q=" + city.replace(" ","+")
    
    # Log the url, record, and set numbers
    print(f"Processing Record {record_count} of Set {set_count} | {city}")

    # Add 1 to the record count
    record_count += 1

    # Run an API request for each of the cities
    try:
        city_weather = requests.get(city_url).json()
        # Parse out the latitude, longitude, max temp, humidity, cloudiness, wind, country, and weather description
        city_name = city_weather['name']
        city_latitude = city_weather['coord']['lat']
        city_longitude = city_weather['coord']['lon']
        city_max_temp = city_weather['main']['temp_max']
        city_humidity = city_weather['main']['humidity']
        city_cloudiness = city_weather['clouds']['all']
        city_wind = city_weather['wind']['speed']
        city_countri = city_weather['sys']['country']
        city_weather_description = city_weather['weather'][0]['description']
            
        # Append the city information into the city_data list
        city_data.append({
            'City': city_name,
            'Lat': city_latitude,
            'Lon': city_longitude,
            'Max Temp': city_max_temp,
            'Humidity': city_humidity,
            'Cloudiness': city_cloudiness,
            'Wind': city_wind,
            'Country': city_countri,
            'Weather Description': city_weather_description})
    
    # If an error is experienced, skip the city
    except:
        print("City not found. Skipping...")
        pass

# Indicate that the data retrieval is complete 
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")
print(city_url)

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | aklavik,ca
Processing Record 2 of Set 1 | yirol,sd
City not found. Skipping...
Processing Record 3 of Set 1 | singleton,au
Processing Record 4 of Set 1 | manavalakurichi,in
Processing Record 5 of Set 1 | ust-kuyga,ru
Processing Record 6 of Set 1 | batticaloa,lk
Processing Record 7 of Set 1 | sevsk,ru
Processing Record 8 of Set 1 | bolungarvik,is
City not found. Skipping...
Processing Record 9 of Set 1 | kodiak,us
Processing Record 10 of Set 1 | attawapiskat,ca
City not found. Skipping...
Processing Record 11 of Set 1 | skagastrond,is
City not found. Skipping...
Processing Record 12 of Set 1 | dawson creek,ca
Processing Record 13 of Set 1 | clyde river,ca
Processing Record 14 of Set 1 | rikitea,pf
Processing Record 15 of Set 1 | busselton,au
Processing Record 16 of Set 1 | timmins,ca
Processing Record 17 of Set 1 | hilo,us
Processing Record 18 of Set 1 | grindavik,is
Processing Record 19 of Set 1 

In [26]:
# Print the length of the city_data list to verify how many cities you have
len(city_data)

662

## Add the weather data to a new DataFrame.

In [27]:
# Use the city_data list to create a new pandas DataFrame.
city_data_df = pd.DataFrame(city_data)

In [28]:
# Display sample data
city_data_df.head(10)

Unnamed: 0,City,Lat,Lon,Max Temp,Humidity,Cloudiness,Wind,Country,Weather Description
0,Aklavik,68.2191,-135.0107,-13.0,77,100,8.05,CA,overcast clouds
1,Singleton,-32.5667,151.1833,64.33,58,97,7.27,AU,overcast clouds
2,Manavālakurichi,8.1333,77.3,77.32,74,100,12.33,IN,overcast clouds
3,Ust-Kuyga,70.0167,135.6,-46.41,100,67,1.7,RU,broken clouds
4,Batticaloa,7.7102,81.6924,76.64,77,100,4.97,LK,overcast clouds
5,Sevsk,52.1491,34.4926,32.83,99,100,4.47,RU,overcast clouds
6,Saint Paul Harbor,57.79,-152.4072,29.71,40,0,11.5,US,clear sky
7,Dawson Creek,55.7666,-120.2362,28.04,54,0,6.91,CA,clear sky
8,Clyde River,70.4692,-68.5914,3.43,85,100,13.8,CA,light snow
9,Rikitea,-23.1203,-134.9692,76.37,78,13,16.53,PF,few clouds


In [32]:
# Display the DataFrame's column names using the columns Pandas function
city_data_df.columns

Index(['City', 'Lat', 'Lon', 'Max Temp', 'Humidity', 'Cloudiness', 'Wind',
       'Country', 'Weather Description'],
      dtype='object')

In [37]:
# Create a list to reorder the column names as follows:
# "City", "Country", "Lat", "Lng", "Max Temp", "Humidity",  "Cloudiness", "Wind Speed",  "Current Description"
city_data_df = city_data_df.rename(columns={'Weather Description': 'Current Description', 'Wind': 'Wind Speed', 'Lon':'Lng'})
reorder = ["City", "Country", "Lat", "Lng", "Max Temp", "Humidity",  "Cloudiness", "Wind Speed",  "Current Description"]

# Recreate the DataFrame by using the new column order
city_data_df = city_data_df[reorder]

# Display sample data
city_data_df

Unnamed: 0,City,Country,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Current Description
0,Aklavik,CA,68.2191,-135.0107,-13.00,77,100,8.05,overcast clouds
1,Singleton,AU,-32.5667,151.1833,64.33,58,97,7.27,overcast clouds
2,Manavālakurichi,IN,8.1333,77.3000,77.32,74,100,12.33,overcast clouds
3,Ust-Kuyga,RU,70.0167,135.6000,-46.41,100,67,1.70,broken clouds
4,Batticaloa,LK,7.7102,81.6924,76.64,77,100,4.97,overcast clouds
...,...,...,...,...,...,...,...,...,...
657,Lensk,RU,60.7253,114.9278,0.14,93,100,11.90,overcast clouds
658,Cam Ranh,VN,11.9214,109.1591,75.16,73,20,8.05,few clouds
659,Pitsunda,GE,43.1592,40.3378,51.98,70,87,5.12,light rain
660,Mao,TD,14.1212,15.3103,67.98,11,0,11.74,clear sky


In [38]:
# Display the data types of each column by using the dtypes Pandas function
city_data_df.dtypes

City                    object
Country                 object
Lat                    float64
Lng                    float64
Max Temp               float64
Humidity                 int64
Cloudiness               int64
Wind Speed             float64
Current Description     object
dtype: object

## Export the DataFrame as a CSV file, and save it as `WeatherPy_Database.csv` in the `Weather_Database` folder.

In [45]:
# Set the output file name
output_data_file = "/Users/mattzabriskie/Desktop/Bootcamp/repos/World_Weather_Analysis/Weather_Database/Starter_Code/WeatherPy_Database.csv"

# Export the city_data DataFrame into a CSV file
city_data_df.to_csv(output_data_file, index_label="City_ID")