# WeatherPy
----

#### Note
* Instructions have been included for each segment. You do not have to follow them exactly, but they are included to help you think through the steps.

In [37]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import requests
import time
from scipy.stats import linregress


# Import API key
from api_keys import weather_api_key

# Incorporated citipy to determine city based on latitude and longitude
from citipy import citipy

# Output File (CSV)
# Stored as a single path string so it can be handed directly to file
# writers/readers; a tuple of path parts is not accepted as a file path.
output_data_file = "../output_data/cities.csv"

# Range of latitudes and longitudes used when sampling random coordinates
# NOTE(review): this window is much narrower than the whole globe
# ((-90, 90) / (-180, 180)) -- confirm the restriction is intentional.
lat_range = (-10, 10)
lng_range = (-5, 5)

## Generate Cities List

In [38]:
# Draw 1500 random latitudes, then 1500 random longitudes, inside the configured ranges
lats = np.random.uniform(*lat_range, size=1500)
lngs = np.random.uniform(*lng_range, size=1500)

# Pair the samples up into (lat, lng) coordinates
lat_lngs = zip(lats, lngs)

# Look up the nearest city for every coordinate, keeping each name only once
# (first-seen order is preserved)
cities = []
for lat_lng in lat_lngs:
    latitude, longitude = lat_lng
    city = citipy.nearest_city(latitude, longitude).city_name

    # Skip names that are already in our cities list
    if city in cities:
        continue
    cities.append(city)

# Show the city count to confirm there are enough cities
len(cities)

147

### Perform API Calls
* Perform a weather check on each city using a series of successive API calls.
* Include a print log of each city as it's being processed (with the city number and city name).


In [39]:
# Base endpoint of the OpenWeatherMap current-weather API
url = "http://api.openweathermap.org/data/2.5/weather?"

# Unit system requested from the API
unit = "imperial"

# Request prefix; the city name is appended after "&q=" for each lookup
query_url = url + "appid=" + weather_api_key + "&units=" + unit + "&q="

# Show the shape of the request without writing the secret API key into the
# notebook output (saved outputs are shared together with the notebook).
print(url + "appid=" + "<REDACTED>" + "&units=" + unit + "&q=")



http://api.openweathermap.org/data/2.5/weather?appid=<REDACTED>&units=imperial&q=


In [40]:
# Position of the current record inside its batch, and the batch number.
# The batch counter is not called `set` so the builtin `set` type stays usable
# in the rest of the notebook.
x = 0
record_set = 1

# One list per collected field; the lists are kept the same length so they can
# later be combined column-wise.
# NOTE: city_no is initialised here but never filled by this cell.
temp = []
humd = []
cloud = []
wind_spd = []
lat = []
lon = []
city_ = []
city_no = []
country = []
max_t = []
date = []


print('''
-----------------------------

Data Retrieval Begin

-----------------------------''')


for city in cities:
    # Fetch the weather for this city. The timeout stops one stalled
    # connection from hanging the whole run; failed requests are skipped.
    try:
        city_data = requests.get(query_url + city, timeout=10).json()
    except (requests.exceptions.RequestException, ValueError) as err:
        print(f"request failed for {city}: {err}")
        continue

    # Read every field BEFORE touching the result lists: if any key is
    # missing, nothing is appended and the lists stay aligned.
    try:
        record = (
            city_data["name"],
            city_data["sys"]["country"],
            city_data["dt"],
            city_data["coord"]["lat"],
            city_data["coord"]["lon"],
            city_data["main"]["temp"],
            city_data["main"]["temp_max"],
            city_data["main"]["humidity"],
            city_data["clouds"]["all"],
            city_data["wind"]["speed"],
        )
    except KeyError:
        print("not found")
        continue

    (name_v, country_v, date_v, lat_v, lon_v,
     temp_v, max_t_v, humd_v, cloud_v, wind_v) = record
    city_.append(name_v)
    country.append(country_v)
    date.append(date_v)
    lat.append(lat_v)
    lon.append(lon_v)
    temp.append(temp_v)
    max_t.append(max_t_v)
    humd.append(humd_v)
    cloud.append(cloud_v)
    wind_spd.append(wind_v)

    # After 50 records start a new batch and pause for a minute before
    # continuing; otherwise just advance the in-batch counter.
    if x == 50:
        x = 1
        record_set += 1
        time.sleep(60)
    else:
        x += 1

    print(f"Processing record {x} of set {record_set} | {city}.")

print('''
-----------------------------
     Data Retrieval End
-----------------------------''')



-----------------------------

Data Retrieval Begin

-----------------------------
Processing record 1 of set 1 | takoradi.
Processing record 2 of set 1 | jamestown.
Processing record 3 of set 1 | mumford.
Processing record 4 of set 1 | begoro.
Processing record 5 of set 1 | omboue.
Processing record 6 of set 1 | kontagora.
Processing record 7 of set 1 | bibiani.
Processing record 8 of set 1 | grand-lahou.
Processing record 9 of set 1 | adzope.
Processing record 10 of set 1 | axim.
Processing record 11 of set 1 | san-pedro.
Processing record 12 of set 1 | kintampo.
Processing record 13 of set 1 | anloga.
Processing record 14 of set 1 | tabou.
Processing record 15 of set 1 | bonoua.
Processing record 16 of set 1 | gamba.
not found
Processing record 17 of set 1 | georgetown.
Processing record 18 of set 1 | cape coast.
Processing record 19 of set 1 | ogbomosho.
Processing record 20 of set 1 | bouna.
Processing record 21 of set 1 | port-gentil.
Processing record 22 of set 1 | anyama.
Proc

In [44]:
# Number of entries collected in the city_ list
len(city_)

142

NameError: name 'value' is not defined

### Convert Raw Data to DataFrame
* Export the city data into a .csv.
* Display the DataFrame

In [45]:
# Column headers of the city table, paired position-by-position with the
# lists that hold the collected values
column_names = [
    "City", "Country", "Date",
    "Lat", "Lng",
    "Max Temp", "Humidity", "Cloudiness", "Wind Speed",
]
column_values = [
    city_, country, date,
    lat, lon,
    max_t, humd, cloud, wind_spd,
]

# Header -> values mapping, then the DataFrame built from it
city_dict = dict(zip(column_names, column_values))
city_data_df = pd.DataFrame(city_dict)

# Non-null count per column
city_data_df.count()

City          142
Country       142
Date          142
Lat           142
Lng           142
Max Temp      142
Humidity      142
Cloudiness    142
Wind Speed    142
dtype: int64

In [49]:
# Preview the first rows of the city DataFrame
city_data_df.head()

Unnamed: 0,City,Country,Date,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed
0,Takoradze,GH,1612122438,4.8845,-1.7554,79.83,85,76,11.16
1,Jamestown,US,1612122409,42.0970,-79.2353,32.00,74,90,12.66
2,Mumford,GH,1612122208,5.2618,-0.7590,81.05,83,100,12.82
3,Begoro,GH,1612122461,6.3871,-0.3774,77.90,72,2,5.68
4,Omboué,GA,1612122442,-1.5746,9.2618,78.40,84,100,3.85
...,...,...,...,...,...,...,...,...,...
95,Ayamé,CI,1612122455,5.6083,-3.1563,77.43,86,2,5.97
96,Daoukro,CI,1612122481,7.0591,-3.9631,83.59,48,16,2.82
97,Sapele,NG,1612122811,5.8941,5.6767,81.43,73,0,5.91
98,Abeokuta,NG,1612122482,7.1500,3.3500,84.20,79,20,9.22


In [50]:
# Non-null count for every column of the city DataFrame
city_data_df.count()

City          142
Country       142
Date          142
Lat           142
Lng           142
Max Temp      142
Humidity      142
Cloudiness    142
Wind Speed    142
dtype: int64

In [51]:
# Total number of rows in the city DataFrame
len(city_data_df)

142

## Inspect the data and remove the cities where the humidity > 100%.
----
Skip this step if there are no cities that have humidity > 100%. 

In [None]:
#  Get the indices of cities that have humidity over 100%.


In [None]:
# Make a new DataFrame equal to the city data to drop all humidity outliers by index.
# Passing "inplace=False" will make a copy of the city_data DataFrame, which we call "clean_city_data".


## Plotting the Data
* Use proper labeling of the plots using plot titles (including date of analysis) and axes labels.
* Save the plotted figures as .pngs.

## Latitude vs. Temperature Plot

## Latitude vs. Humidity Plot

## Latitude vs. Cloudiness Plot

## Latitude vs. Wind Speed Plot

## Linear Regression

####  Northern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Southern Hemisphere - Max Temp vs. Latitude Linear Regression

####  Northern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Humidity (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Southern Hemisphere - Cloudiness (%) vs. Latitude Linear Regression

####  Northern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression

####  Southern Hemisphere - Wind Speed (mph) vs. Latitude Linear Regression