# 6.1.4 Create Latitude and Longitude Combinations

In [27]:
# Import the dependencies.
import os

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [28]:
# Add the code that generates the latitudes and longitudes
#     first, they need to be stored for later access
#     declare each array as a variable since an array of latitudes and longitudes is being created.

# To ensure enough lats and longs are created, begin with 1500
# Pack the lats and longs as pairs and zip them (lat_lngs) with the "zip()" function.
    # zip object packs each pair of lats lngs having the same index in their respective array into a tuple
        # Example: if there are 1500 latitudes and longitudes, there will be 1500 tuples of paired latitudes and longitudes
        #      where each latitude and longitude in a tuple can be accessed by the index of 0 and 1 respectively.
        
        # **A zip object is an iterator that can only be consumed once; after it has been unpacked it is empty.
        # **Be sure to unpack the latitudes and longitudes into the coordinates list before moving on.

In [29]:
# Draw random latitudes and longitudes (one array each, same length) and pair them by index with "zip()".
sample_size = 1500
lats = np.random.uniform(-90.000, 90.000, sample_size)
lngs = np.random.uniform(-180.000, 180.000, sample_size)
# Each element produced by the zip object is a (latitude, longitude) tuple.
lat_lngs = zip(lats, lngs)
lat_lngs

<zip at 0x25064015680>

In [30]:
# Add the latitudes and longitudes to a list.
# list() consumes the zip object, producing a list of (latitude, longitude) tuples
# that can be iterated as many times as needed.
coordinates = list(lat_lngs)

In [31]:
# Once ordered pairs have been created and put into a list(array)
#      iterate through the list of tuples and find the nearest city to the coordinates.

# 6.1.5 Generate Random World Cities

In [32]:
# Match coordinates up with cities
    # With the list of random latitudes and longitudes, use the coordinates in lat_lngs tuple to find the nearest city
    #      using Python's "citipy module".

# Install (using "pip install citipy" from the PythonData Anaconda Prompt), import, and test the "citipy" module.

In [33]:
# Use the citipy module to determine city based on latitude and longitude.
from citipy import citipy

In [34]:
# Create a list for holding the cities[].
# Create a for loop that will do the following:
    # Iterate through the coordinates' zipped tuple.
    # Use citipy.nearest_city() and inside the parentheses of nearest_city(),
    #      add the latitude and longitude in this format: coordinate[0], coordinate[1].
    # To print the city name, chain the city_name to the nearest_city() function.
    # To print the country name, chain the country_code to the nearest_city() function.

In [35]:
# Start with an empty list of city names.
cities = []
# Look up the nearest city for every (latitude, longitude) pair.
for lat, lng in coordinates:
    nearest = citipy.nearest_city(lat, lng)
    city = nearest.city_name

    # Keep only the first occurrence of each city name.
    if city not in cities:
        cities.append(city)
# Show how many unique cities were found to confirm there are enough.
len(cities)

633

## Recap

- Create a cities list to store city names.
- Iterate through the coordinates, as in our practice, and retrieve the nearest city using the latitude and longitude pair.
- Add a decision statement with the logical operator not in to determine whether the found city is already in the cities list. If not, use the append() function to add it.  
    - This is done because several of the 1,500 latitude and longitude pairs may resolve to the same nearest city, which would produce duplicate cities; only the unique cities should be captured.

### NOTE
The citipy module finds the nearest city to the latitude and longitude pair with a population of 500 or more.

# FINDING  
When the code block is run, there should be slightly more than 500 unique cities. If there are fewer than 500, the "size" argument of the "np.random.uniform()" function must be increased.

# 6.2.6 Get the City Weather Data (cont'd from API_Practice notebook)
## Import Dependencies, and Initialize an Empty List and Counters  
- Import your Requests Library.  
- Import the weather_api_key.  
- Build the basic URL for the OpenWeatherMap with weather_api_key added to the URL.  
- Import the datetime module:  
- Declare an empty list at the top of the code block "city_data = []"  
- Add a print statement that references the beginning of the logging  
- Create counters for the record numbers, 1-50  
    - set the counter  

In [36]:
# Import the requests library.
import requests

# Import the API key.
from config import weather_api_key

In [37]:
# Starting URL for Weather Map API Call.
# original URL structure from weathermap site: api.openweathermap.org/data/2.5/weather?q={city name}&appid={API key}
# HTTPS is used so the API key carried in the query string is not sent in clear text.
url = "https://api.openweathermap.org/data/2.5/weather?units=Imperial&APPID=" + weather_api_key

In [38]:
# Import the datetime module from the datetime library.
from datetime import datetime

In [39]:
# Retrieve the current weather for every city in `cities` and collect one
# dictionary per successfully retrieved city in `city_data`.
# Both counters start at 1 so the first log line reads "Record 1 of Set 1".

# Create an empty list to hold the weather data.
city_data = []
# Print the beginning of the logging.
print("Beginning Data Retrieval     ")
print("-----------------------------")

# Create counters.
record_count = 1
set_count = 1

# Seconds to wait for the API before giving up on a single city, so one
# stalled connection cannot hang the whole run.
request_timeout = 10

# Loop through all the cities in the list.
# enumerate() yields both the index (used to group the log in sets of 50) and
# the city name, so no index lookup such as cities[i] inside a
# "for i in range(len(cities))" loop is needed.
for i, city in enumerate(cities):

    # Group cities in sets of 50 for logging purposes: every 50th city starts
    # a new set and restarts the record numbering.
    if (i % 50 == 0 and i >= 50):
        set_count += 1
        record_count = 1
    # Create endpoint URL with each city.
    city_url = url + "&q=" + city.replace(" ","+")

    # Log the URL, record, and set numbers and the city.
    print(f"Processing Record {record_count} of Set {set_count} | {city}")
    # Add 1 to the record count.
    record_count += 1

    # Run an API request for each of the cities using the try-except statement.
    try:
        # Parse the JSON and retrieve data.
        city_weather = requests.get(city_url, timeout=request_timeout).json()
        # Parse out the needed data.
        city_lat = city_weather["coord"]["lat"]
        city_lng = city_weather["coord"]["lon"]
        city_max_temp = city_weather["main"]["temp_max"]
        city_humidity = city_weather["main"]["humidity"]
        city_clouds = city_weather["clouds"]["all"]
        city_wind = city_weather["wind"]["speed"]
        city_country = city_weather["sys"]["country"]
        # Convert the date to ISO standard.
        city_date = datetime.utcfromtimestamp(city_weather["dt"]).strftime('%Y-%m-%d %H:%M:%S')
        # Append the city information into city_data list.
        city_data.append({"City": city.title(),
                          "Lat": city_lat,
                          "Lng": city_lng,
                          "Max Temp": city_max_temp,
                          "Humidity": city_humidity,
                          "Cloudiness": city_clouds,
                          "Wind Speed": city_wind,
                          "Country": city_country,
                          "Date": city_date})

    # The response JSON lacks one of the expected fields (typically because
    # the API did not recognize the city): skip the city.
    except KeyError:
        print("City not found. Skipping...")
    # Network failure, timeout, or a body that is not valid JSON: skip the city.
    # Only the exception type is printed, because the exception message can
    # include the request URL, which contains the API key.
    # Unlike a bare "except:", this still lets KeyboardInterrupt stop the loop.
    except (requests.exceptions.RequestException, ValueError) as error:
        print(f"Request failed ({type(error).__name__}). Skipping...")

# Indicate that Data Loading is complete.
print("-----------------------------")
print("Data Retrieval Complete      ")
print("-----------------------------")

Beginning Data Retrieval     
-----------------------------
Processing Record 1 of Set 1 | hilo
Processing Record 2 of Set 1 | butaritari
Processing Record 3 of Set 1 | kloulklubed
Processing Record 4 of Set 1 | ushuaia
Processing Record 5 of Set 1 | tiksi
Processing Record 6 of Set 1 | turayf
Processing Record 7 of Set 1 | hithadhoo
Processing Record 8 of Set 1 | toungoo
City not found. Skipping...
Processing Record 9 of Set 1 | toba
Processing Record 10 of Set 1 | severo-kurilsk
Processing Record 11 of Set 1 | ogdensburg
Processing Record 12 of Set 1 | ghatsila
Processing Record 13 of Set 1 | saint anthony
Processing Record 14 of Set 1 | le mars
Processing Record 15 of Set 1 | cayenne
Processing Record 16 of Set 1 | naral
City not found. Skipping...
Processing Record 17 of Set 1 | pacific grove
Processing Record 18 of Set 1 | mahebourg
Processing Record 19 of Set 1 | hermanus
Processing Record 20 of Set 1 | upernavik
Processing Record 21 of Set 1 | bethel
Processing Record 22 of Set 

Processing Record 36 of Set 4 | cidreira
Processing Record 37 of Set 4 | havoysund
Processing Record 38 of Set 4 | yellowknife
Processing Record 39 of Set 4 | riga
Processing Record 40 of Set 4 | rawannawi
City not found. Skipping...
Processing Record 41 of Set 4 | colares
Processing Record 42 of Set 4 | labuhan
Processing Record 43 of Set 4 | jardim
Processing Record 44 of Set 4 | vostok
Processing Record 45 of Set 4 | waipawa
Processing Record 46 of Set 4 | asau
Processing Record 47 of Set 4 | amderma
City not found. Skipping...
Processing Record 48 of Set 4 | torbay
Processing Record 49 of Set 4 | brindisi
Processing Record 50 of Set 4 | broken hill
Processing Record 1 of Set 5 | ochakiv
Processing Record 2 of Set 5 | ludvika
Processing Record 3 of Set 5 | lahij
Processing Record 4 of Set 5 | umzimvubu
City not found. Skipping...
Processing Record 5 of Set 5 | ngukurr
City not found. Skipping...
Processing Record 6 of Set 5 | tsabong
Processing Record 7 of Set 5 | san nicolas
Proces

Processing Record 27 of Set 8 | thiers
Processing Record 28 of Set 8 | gouloure
Processing Record 29 of Set 8 | yingcheng
Processing Record 30 of Set 8 | ryzdvyanyy
Processing Record 31 of Set 8 | sao felix do xingu
Processing Record 32 of Set 8 | berlevag
Processing Record 33 of Set 8 | arequipa
Processing Record 34 of Set 8 | auki
Processing Record 35 of Set 8 | guilin
Processing Record 36 of Set 8 | nilagiri
Processing Record 37 of Set 8 | florence
Processing Record 38 of Set 8 | mayo
Processing Record 39 of Set 8 | musiri
Processing Record 40 of Set 8 | oyama
Processing Record 41 of Set 8 | bambanglipuro
Processing Record 42 of Set 8 | urucara
Processing Record 43 of Set 8 | palafrugell
Processing Record 44 of Set 8 | usinsk
Processing Record 45 of Set 8 | san juan
Processing Record 46 of Set 8 | rundu
Processing Record 47 of Set 8 | itarema
Processing Record 48 of Set 8 | nata
Processing Record 49 of Set 8 | ukiah
Processing Record 50 of Set 8 | san joaquin
Processing Record 1 of 

Processing Record 15 of Set 12 | loja
Processing Record 16 of Set 12 | lai
Processing Record 17 of Set 12 | bucerias
Processing Record 18 of Set 12 | tabory
Processing Record 19 of Set 12 | morgan city
Processing Record 20 of Set 12 | san vicente
Processing Record 21 of Set 12 | kamenskoye
City not found. Skipping...
Processing Record 22 of Set 12 | portland
Processing Record 23 of Set 12 | tirat karmel
Processing Record 24 of Set 12 | filadelfia
Processing Record 25 of Set 12 | daru
Processing Record 26 of Set 12 | aksu
Processing Record 27 of Set 12 | xingyi
Processing Record 28 of Set 12 | pundaguitan
Processing Record 29 of Set 12 | moron
Processing Record 30 of Set 12 | dawlatabad
Processing Record 31 of Set 12 | gazanjyk
Processing Record 32 of Set 12 | bardiyah
Processing Record 33 of Set 12 | paamiut
Processing Record 34 of Set 12 | namtsy
Processing Record 35 of Set 12 | batagay-alyta
Processing Record 36 of Set 12 | lakhipur
Processing Record 37 of Set 12 | chinhoyi
Processin

In [40]:
# Number of cities for which weather data was successfully collected.
print(len(city_data))

581


### **NOTE**  
When retrieving data from an API, or even when scraping a webpage, make sure there is data to parse.  
If not, the script might stop at that moment and not finish getting all the data we need.  

## Handle API Request Errors with try-except Blocks  
This prevents the API request from stopping prematurely if the request does not yield a valid response.  
If the response is not valid, the code will fail to find the first item requested, skip that city, and continue with the next one.  
The syntax for the "try-except" statement is similar to the "if-else" statement.  

After the record_count +=1 code line add the "try" block.  

After adding a "try" block:  
    - Parse the JSON file.  
    - Assign variables for each piece of data needed.  
    - Add the data to the city_data list in a dictionary format.  

### **IMPORTANT**
Generally, it isn't good coding practice to add the pass statement to the except block.  
Ideally, each error should be caught and handled as it happens, with a specific response  
(e.g., add another try block or print out the error).  

# 6.2.7 Create a DataFrame of City Weather Data  
Convert to DataFrame  
Export to csv file

In [41]:
# Build a Pandas DataFrame with one row per dictionary in city_data.
city_data_df = pd.DataFrame(data=city_data)
# Preview the first ten rows.
city_data_df.head(n=10)

Unnamed: 0,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,Hilo,19.7297,-155.09,76.62,94,90,6.91,US,2021-07-24 17:29:41
1,Butaritari,3.0707,172.7902,83.35,73,6,16.15,KI,2021-07-24 17:29:42
2,Kloulklubed,7.0419,134.2556,82.9,79,100,12.39,PW,2021-07-24 17:29:42
3,Ushuaia,-54.8,-68.3,38.82,87,40,5.75,AR,2021-07-24 17:29:42
4,Tiksi,71.6872,128.8694,39.61,91,98,6.13,RU,2021-07-24 17:29:43
5,Turayf,31.6725,38.6637,88.05,33,0,9.22,SA,2021-07-24 17:29:43
6,Hithadhoo,-0.6,73.0833,82.72,77,55,12.3,MV,2021-07-24 17:29:43
7,Toba,34.4833,136.85,77.0,81,29,1.32,JP,2021-07-24 17:29:44
8,Severo-Kurilsk,50.6789,156.125,53.91,96,76,2.44,RU,2021-07-24 17:29:44
9,Ogdensburg,44.6942,-75.4863,81.45,54,1,8.05,US,2021-07-24 17:29:44


In [42]:
# Reorder the DataFrame columns: identifying fields first, then coordinates, then measurements.
new_column_order = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]
# Select all rows and the columns in the new order.
city_data_df = city_data_df.loc[:, new_column_order]
city_data_df

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Hilo,US,2021-07-24 17:29:41,19.7297,-155.0900,76.62,94,90,6.91
1,Butaritari,KI,2021-07-24 17:29:42,3.0707,172.7902,83.35,73,6,16.15
2,Kloulklubed,PW,2021-07-24 17:29:42,7.0419,134.2556,82.90,79,100,12.39
3,Ushuaia,AR,2021-07-24 17:29:42,-54.8000,-68.3000,38.82,87,40,5.75
4,Tiksi,RU,2021-07-24 17:29:43,71.6872,128.8694,39.61,91,98,6.13
...,...,...,...,...,...,...,...,...,...
576,Mulege,MX,2021-07-24 17:32:29,26.8833,-111.9833,92.89,41,100,6.49
577,Linhai,CN,2021-07-24 17:32:30,28.8500,121.1167,76.93,84,100,19.71
578,Betare Oya,CM,2021-07-24 17:32:30,5.6000,14.0833,69.69,89,83,3.18
579,Wangkui,CN,2021-07-24 17:32:30,46.8333,126.5000,68.95,95,100,10.04


In [43]:
# Create the output file (CSV).
output_data_file = "weather_data/cities.csv"
# Make sure the target folder exists first; to_csv() does not create missing
# directories and would otherwise fail with an OSError.
os.makedirs(os.path.dirname(output_data_file), exist_ok=True)
# Export the City_Data into a CSV, labelling the index column "City_ID".
city_data_df.to_csv(output_data_file, index_label="City_ID")