In [7]:
# WeatherPy

### Analysis
#* As expected, the weather becomes significantly warmer as one approaches the equator (0 Deg. Latitude). More interestingly, however, is the fact that the southern hemisphere tends to be warmer this time of year than the northern hemisphere. This may be due to the tilt of the earth.
#* There is no strong relationship between latitude and cloudiness. However, it is interesting to see that a strong band of cities sits at 0, 80, and 100% cloudiness.
#* There is no strong relationship between latitude and wind speed. However, in northern hemispheres there is a flurry of cities with over 20 mph of wind.


#### Note
#* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [21]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
import json
import os
import datetime
import time
from pprint import pprint
# Import API key
# import api_keys
from api_keys import api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
output_data_file = os.path.join("output_data","cities.csv")

# Range of latitudes and longitudes
lat_range = (-90, 90)
lng_range = (-180, 180)


In [9]:
api_key

'060a1f5e08d612b9846c0c45534ae537'

In [10]:
citipy

<module 'citipy.citipy' from 'C:\\Users\\Vijayalaskmi\\Anaconda3\\lib\\site-packages\\citipy\\citipy.py'>

In [11]:
coordinates = [(200, 200), (23, 200), (42, 100)]

## Generate Cities List
Your objective is to build a series of scatter plots to showcase the following relationships:


1. Temperature (F) vs. Latitude

2. Humidity (%) vs. Latitude

3. Cloudiness (%) vs. Latitude

4. Wind Speed (mph) vs. Latitude

In [12]:
# List for holding lat_lngs and cities
# n = 500
lat_lngs = []
cities = []

# Create a set of random lat and lng combinations
lats = np.random.uniform(low=-90.000, high=90.000, size=1500)
lngs = np.random.uniform(low=-180.000, high=180.000, size=1500)
lat_lngs = zip(lats, lngs)

# Identify nearest city for each lat, lng combination
for lat_lng in lat_lngs:
    city = citipy.nearest_city(lat_lng[0], lat_lng[1]).city_name
    
    # If the city is unique, then add it to a our cities list
    if city not in cities:
        cities.append(city)

# Print the city count to confirm sufficient count
len(cities)
cities

['northam',
 'albany',
 'hobart',
 'grand gaube',
 'port augusta',
 'ambilobe',
 'sistranda',
 'solovetskiy',
 'bonga',
 'clyde river',
 'zwedru',
 'ilulissat',
 'sumbe',
 'rikitea',
 'bethel',
 'azimur',
 'huallanca',
 'opatija',
 'atuona',
 'sumbawa',
 'warqla',
 'haibowan',
 'tomatlan',
 'aksu',
 'dunhua',
 'sola',
 'chuy',
 'tumannyy',
 'port alfred',
 'atambua',
 'berdsk',
 'ushuaia',
 'puerto ayora',
 'kodiak',
 'sao filipe',
 'arlit',
 'barentsburg',
 'mount gambier',
 'severo-kurilsk',
 'fortuna',
 'kodinsk',
 'polunochnoye',
 'ribeira grande',
 'alghero',
 'nicolas bravo',
 'olinda',
 'ellensburg',
 'oksfjord',
 'pasni',
 'tsihombe',
 'lavrentiya',
 'ponta do sol',
 'shubarkuduk',
 'butaritari',
 'mataura',
 'ponferrada',
 'vila velha',
 'khatanga',
 'saint anthony',
 'praya',
 'edd',
 'kahului',
 'bonham',
 'east london',
 'henties bay',
 'illoqqortoormiut',
 'longyearbyen',
 'arraial do cabo',
 'barrow',
 'ranghulu',
 'omboue',
 'hovd',
 'busselton',
 'komsomolskiy',
 'nyrob

In [13]:
for each in enumerate(cities):
    print(each)

(0, 'northam')
(1, 'albany')
(2, 'hobart')
(3, 'grand gaube')
(4, 'port augusta')
(5, 'ambilobe')
(6, 'sistranda')
(7, 'solovetskiy')
(8, 'bonga')
(9, 'clyde river')
(10, 'zwedru')
(11, 'ilulissat')
(12, 'sumbe')
(13, 'rikitea')
(14, 'bethel')
(15, 'azimur')
(16, 'huallanca')
(17, 'opatija')
(18, 'atuona')
(19, 'sumbawa')
(20, 'warqla')
(21, 'haibowan')
(22, 'tomatlan')
(23, 'aksu')
(24, 'dunhua')
(25, 'sola')
(26, 'chuy')
(27, 'tumannyy')
(28, 'port alfred')
(29, 'atambua')
(30, 'berdsk')
(31, 'ushuaia')
(32, 'puerto ayora')
(33, 'kodiak')
(34, 'sao filipe')
(35, 'arlit')
(36, 'barentsburg')
(37, 'mount gambier')
(38, 'severo-kurilsk')
(39, 'fortuna')
(40, 'kodinsk')
(41, 'polunochnoye')
(42, 'ribeira grande')
(43, 'alghero')
(44, 'nicolas bravo')
(45, 'olinda')
(46, 'ellensburg')
(47, 'oksfjord')
(48, 'pasni')
(49, 'tsihombe')
(50, 'lavrentiya')
(51, 'ponta do sol')
(52, 'shubarkuduk')
(53, 'butaritari')
(54, 'mataura')
(55, 'ponferrada')
(56, 'vila velha')
(57, 'khatanga')
(58, 'sai

cities

In [14]:
# Save config information
url = "http://api.openweathermap.org/data/2.5/weather?"
units = "metric"
query_url = f"{url}appid={api_key}&units={units}&q="

In [15]:
query_url
units

'metric'

In [16]:

lat = []
temp = []
humid = []
lngtude = []
wind = []
city = []
date = []
max.temp = []
cloudiness = []
dtype = []

print(f"Beginning Data Retrieval  ")
print("----------------------------")
# Loop through the list of cities and perform a request for data on each
#for city in cities:
for index, each in enumerate(cities):

    response = requests.get(query_url + each).json()
    try:
        lat.append(response['coord']['lat'])
        lngtude.append(response['coord']['lngtude'])
        temp.append(response['main']['temp'])
        humid.append(response['main']['humid'])
        wind.append(response['wind']['speed'])
        print(f"Processing Record {index} of Set 1 | {each}")
    
    
    
    except (KeyError, IndexError):
        print("Missing field/result... skipping.")

print(f"The latitude information received is: {lat}")
print(f"The temperature information received is: {temp}")
print("----------------------------")
print("Data Retrieval Complete  ")
print("----------------------------")




Beginning Data Retrieval  
----------------------------
Processing Record 0 of Set 1 | northam
Processing Record 1 of Set 1 | albany
Processing Record 2 of Set 1 | hobart
Processing Record 3 of Set 1 | grand gaube
Processing Record 4 of Set 1 | port augusta
Processing Record 5 of Set 1 | ambilobe
Processing Record 6 of Set 1 | sistranda
Missing field/result... skipping.
Processing Record 8 of Set 1 | bonga
Processing Record 9 of Set 1 | clyde river
Processing Record 10 of Set 1 | zwedru
Processing Record 11 of Set 1 | ilulissat
Processing Record 12 of Set 1 | sumbe
Processing Record 13 of Set 1 | rikitea
Processing Record 14 of Set 1 | bethel
Missing field/result... skipping.
Processing Record 16 of Set 1 | huallanca
Processing Record 17 of Set 1 | opatija
Processing Record 18 of Set 1 | atuona
Missing field/result... skipping.
Missing field/result... skipping.
Missing field/result... skipping.
Processing Record 22 of Set 1 | tomatlan
Processing Record 23 of Set 1 | aksu
Processing Rec

Processing Record 201 of Set 1 | bonthe
Processing Record 202 of Set 1 | talnakh
Processing Record 203 of Set 1 | torbay
Processing Record 204 of Set 1 | sin-le-noble
Processing Record 205 of Set 1 | poum
Processing Record 206 of Set 1 | altamira
Processing Record 207 of Set 1 | leningradskiy
Missing field/result... skipping.
Processing Record 209 of Set 1 | lorengau
Processing Record 210 of Set 1 | sorong
Processing Record 211 of Set 1 | greenville
Processing Record 212 of Set 1 | polyarnyy
Processing Record 213 of Set 1 | byron bay
Processing Record 214 of Set 1 | port elizabeth
Missing field/result... skipping.
Processing Record 216 of Set 1 | volot
Processing Record 217 of Set 1 | lagoa
Processing Record 218 of Set 1 | puerto madryn
Processing Record 219 of Set 1 | tarauaca
Processing Record 220 of Set 1 | valparaiso
Processing Record 221 of Set 1 | thompson
Processing Record 222 of Set 1 | baoning
Processing Record 223 of Set 1 | asyut
Processing Record 224 of Set 1 | glomfjord
Pr

Processing Record 401 of Set 1 | kontagora
Processing Record 402 of Set 1 | harper
Processing Record 403 of Set 1 | kalianget
Processing Record 404 of Set 1 | teguldet
Missing field/result... skipping.
Processing Record 406 of Set 1 | san antonio de los banos
Processing Record 407 of Set 1 | chuari khas
Processing Record 408 of Set 1 | alice springs
Processing Record 409 of Set 1 | oussouye
Missing field/result... skipping.
Processing Record 411 of Set 1 | posse
Processing Record 412 of Set 1 | los andes
Processing Record 413 of Set 1 | iquique
Missing field/result... skipping.
Processing Record 415 of Set 1 | shimoda
Processing Record 416 of Set 1 | suvorovo
Processing Record 417 of Set 1 | flin flon
Processing Record 418 of Set 1 | bathurst
Processing Record 419 of Set 1 | nuzvid
Processing Record 420 of Set 1 | saurimo
Processing Record 421 of Set 1 | ketchikan
Processing Record 422 of Set 1 | tailai
Processing Record 423 of Set 1 | karratha
Missing field/result... skipping.
Process

Processing Record 601 of Set 1 | sarrebourg
Processing Record 602 of Set 1 | saint-joseph
Processing Record 603 of Set 1 | nago
Processing Record 604 of Set 1 | albacete
Processing Record 605 of Set 1 | reserva
Processing Record 606 of Set 1 | baculin
Processing Record 607 of Set 1 | paamiut
Processing Record 608 of Set 1 | beloha
Processing Record 609 of Set 1 | albanel
Processing Record 610 of Set 1 | anadyr
Processing Record 611 of Set 1 | bristol
Processing Record 612 of Set 1 | yeppoon
Processing Record 613 of Set 1 | trelew
Processing Record 614 of Set 1 | santa rosa
Processing Record 615 of Set 1 | kieta
Processing Record 616 of Set 1 | petaluma
Processing Record 617 of Set 1 | kamen-rybolov
Processing Record 618 of Set 1 | magdalena
The latitude information received is: [51.04, 42.65, -42.88, -20.01, -32.49, -13.19, 63.73, 7.26, 70.47, 6.07, 69.22, -11.2, -23.12, 60.79, -9.9, 45.33, -9.8, 19.93, 52.04, 43.37, 58.89, -33.69, -33.59, -9.11, 54.76, -54.81, -0.74, 39.95, 14.9, 18.7

In [17]:

# Remove any cities that have NaN values
weather_df = weather_df.dropna(how='any')

print(f"The data frame contains {len(weather_df['City'])} unique cities.")

NameError: name 'weather_df' is not defined

In [18]:
# # Assemble everything into a data frame
# weather_df = pd.DataFrame({"City": cities,
#                            "Latitude": lats,
#                            "Longitude": lngs,
#                            #"
Humidity": humidity,
#                            #"Max Temp": temperature,
#                            #"Cloudiness": cloudiness,
#                            #"Wind Speed": wind_speed,
#                            #"Date": dates,
#                            #"Country": country_codes
#                           })
# weather_df


SyntaxError: EOL while scanning string literal (<ipython-input-18-72329e58c23c>, line 6)

In [19]:
# Save Data to csv
cities_pd.to_csv("cities_Output.csv")

# Visualize to confirm airport data appears
cities_pd.head(10)
                        

NameError: name 'cities_pd' is not defined

In [20]:
# create a data frame from cities, lat, and temp
weather_dict = {
    "city": cities,
    "lat": lat,
    "temp": temp
}
weather_data = pd.DataFrame(weather_dict)
weather_data.head()

ValueError: arrays must all be same length

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it'sbeing processed (with the city number and city name).


### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

### Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

#### Latitude vs. Temperature Plot

In [None]:
# #Create Scatter Plot, label and save it to a png in the Output folder, then display the plot
# plt.scatter(latitudelist, temperaturelist, marker="o", facecolors="red", edgecolors="black", alpha=0.75)
# plt.xlabel("Latitude (Degrees)")
# plt.ylabel("Temperature (Fahrenheit)")
# plt.title("City Latitude vs Average Temperature on 4/4/2018")
# plt.savefig("Output/Latitude_vs_Temperature")
# #plt.grid()
# plt.show()




In [None]:
# plt.scatter(urban_data, urban_avg_fare, s=urban_dr_count*.4, c="coral", alpha=.85,edgecolor="black",linewidths=1)
# plt.scatter(suburban_data, suburban_avg_fare, s=suburban_dr_count*.9, c="lightskyblue", alpha=1,edgecolor="black",linewidths=1)
# plt.scatter(rural_data, rural_avg_fare, s=rural_dr_count, c="gold", alpha=1,edgecolor="black",linewidths=1)
# plt.title("City Latitude vs. Max Temperature(10/06/2018)")
# plt.xlabel("Latitude")
# plt.ylabel("Max Temperature(F)")
# plt.legend(('Urban','Suburban','Rural'),loc = "upper right",title = "City Type",markerscale=.4)
# plt.text(45,35,"Notes:\nCircle size correlates with driver count per City")
# plt.grid(True)

# plt.show()

In [None]:
# plt.scatter("s=*.2, c="blue",edgecolor="black,linewidths=1)
# plt.title("City Latitude vs. Humiditym(10/06/2018)")
# plt.xlabel("Latitude")
# plt.ylabel("Humidity(%)")
# plt.grid(True)
# plt.show()

#### Latitude vs. Humidity Plot

In [None]:

# plt.scatter("s=*.2, c="blue",edgecolor="black,linewidths=1)
# plt.title("City Latitude vs. Cloudiness(10/06/2018)")
# plt.xlabel("latitude")
# plt.ylabel("Cloudiness(%)")
# plt.grid(True)
# plt.show()

#### Latitude vs. Cloudiness Plot

#### Latitude vs. Wind Speed Plot

In [None]:
# plt.scatter("s=*.2, c="blue",edgecolor="black,linewidths=1)
# plt.title("City Latitude vs. wind Speed(10/06/2018)")
# plt.xlabel("Latitude")
# plt.ylabel("Wind Speed(mph)")
# plt.grid(True)
# plt.show()