# VacationPy
---

## Starter Code to Import Libraries and Load the Weather and Coordinates Data

In [1]:
# Dependencies and Setup
import hvplot.pandas
import pandas as pd
import requests

# Import API key
from api_keys import geoapify_key

In [2]:
# Load the CSV file created in Part 1 into a Pandas DataFrame.
# The path is relative, so it resolves against the notebook's working directory.
city_data_df = pd.read_csv("output_data/cities.csv")

# Display sample data: the first five rows, shown as the cell's output
city_data_df.head()

Unnamed: 0,City_ID,City,Lat,Lng,Max Temp,Humidity,Cloudiness,Wind Speed,Country,Date
0,0,thompson,55.7435,-97.8558,-3.91,93,100,1.54,CA,1731337385
1,1,saipan,15.1355,145.701,27.03,91,20,0.89,MP,1731337374
2,2,west island,-12.1568,96.8225,26.99,83,100,5.14,CC,1731337312
3,3,port-aux-francais,-49.35,70.2167,4.86,90,91,6.46,TF,1731337388
4,4,lebu,-37.6167,-73.65,14.26,67,20,4.25,CL,1731337389


---

### Step 1: Create a map that displays a point for every city in the `city_data_df` DataFrame. The size of the point should be the humidity in each city.

In [4]:
import hvplot.pandas

# Step 1: plot one point per city in `city_data_df`.
# Marker size follows the "Humidity" column and marker colour the "City" column.
#
# NOTE: `size_max` is intentionally not passed. It is not one of hvPlot's
# plotting options, so it never limited the marker size; use `scale` if the
# markers need to be resized.
map_plot = city_data_df.hvplot.points(
    x='Lng',            # longitude column
    y='Lat',            # latitude column
    size='Humidity',
    color='City',
    title="City Humidity Map",
    geo=True,           # treat x/y as geographic coordinates
    tiles='OSM',        # OpenStreetMap background tiles
    colorbar=True,
    width=800,
    height=600,
)

# Display the map
map_plot




### Step 2: Narrow down the `city_data_df` DataFrame to find your ideal weather condition

In [45]:
import pandas as pd
import requests
import hvplot.pandas  # Import for interactive plotting
from api_keys import geoapify_key  # Assuming your API key is stored here

# Re-read the weather table exported by the previous part of the project
city_data_df = pd.read_csv("output_data/cities.csv")

# Plain-text preview of the first rows
print(city_data_df.head())

# Interactive map: one semi-transparent point per city over OpenStreetMap
# tiles, sized by humidity and coloured by city name.
map_plot = city_data_df.hvplot.points(
    x="Lng",
    y="Lat",
    geo=True,
    tiles="OSM",
    size="Humidity",
    scale=1,
    color="City",
    alpha=0.5,
    frame_width=700,
    frame_height=500,
)

# NOTE(review): further statements follow in this cell, so this bare expression
# is evaluated but not rendered; only a cell's final expression is displayed.
map_plot

# Thresholds describing the ideal weather
ideal_temp_min = 21       # lower temperature bound in Celsius (exclusive)
ideal_temp_max = 27       # upper temperature bound in Celsius (exclusive)
max_wind_speed = 4.5      # wind speed must stay below this value (m/s)
cloudiness_required = 0   # cloudiness must equal this value (clear sky)

# One boolean mask per criterion, combined into a single row selector
temp_in_range = (
    (city_data_df["Max Temp"] > ideal_temp_min)
    & (city_data_df["Max Temp"] < ideal_temp_max)
)
wind_is_calm = city_data_df["Wind Speed"] < max_wind_speed
sky_is_clear = city_data_df["Cloudiness"] == cloudiness_required

# Keep the matching cities, then discard rows that contain missing values
ideal_weather_cities = city_data_df.loc[temp_in_range & wind_is_calm & sky_is_clear].dropna()

# Plain-text preview of the matches
print(ideal_weather_cities.head())

# Hotel table: the location and humidity columns plus an empty "Hotel Name"
# column that the hotel search fills in. `assign` returns a new DataFrame, so
# `ideal_weather_cities` itself is left untouched.
hotel_columns = ["City", "Country", "Lat", "Lng", "Humidity"]
hotel_df = ideal_weather_cities[hotel_columns].assign(**{"Hotel Name": ""})

# Hotel search radius in metres (10 km)
search_radius = 10000

# Start searching for hotels near each city
print("Starting hotel search...")

# Loop through each row in the DataFrame
for index, row in hotel_df.iterrows():
    latitude = row["Lat"]
    longitude = row["Lng"]
    
    # Define the parameters for the API request
    params = {
        "categories": "accommodation.hotel",
        "filter": f"circle:{longitude},{latitude},{search_radius}",
        "bias": f"proximity:{longitude},{latitude}",
        "limit": 1,  # Get only the closest hotel
        "apiKey": geoapify_key
    }
    
    # Make a request to the Geoapify AP


   City_ID               City      Lat       Lng  Max Temp  Humidity  \
0        0           thompson  55.7435  -97.8558     -3.91        93   
1        1             saipan  15.1355  145.7010     27.03        91   
2        2        west island -12.1568   96.8225     26.99        83   
3        3  port-aux-francais -49.3500   70.2167      4.86        90   
4        4               lebu -37.6167  -73.6500     14.26        67   

   Cloudiness  Wind Speed Country        Date  
0         100        1.54      CA  1731337385  
1          20        0.89      MP  1731337374  
2         100        5.14      CC  1731337312  
3          91        6.46      TF  1731337388  
4          20        4.25      CL  1731337389  
     City_ID                    City      Lat       Lng  Max Temp  Humidity  \
45        45                 isangel -19.5500  169.2667     22.69        88   
110      110  hawaiian paradise park  19.5933 -154.9731     21.61        73   
205      205             port isabel  26.0

### Step 3: Create a new DataFrame called `hotel_df`.

In [46]:

# Build a Northern Hemisphere subset of `city_data_df` (latitude >= 0).
# Only the presence of the 'Lat' column is checked; its dtype is not validated.
if 'Lat' not in city_data_df.columns:
    print("'Lat' column is missing in the DataFrame.")
else:
    # Rows on or above the equator
    northern_hemi_df = city_data_df.loc[city_data_df["Lat"] >= 0]

    # Plain-text preview of the first rows of the subset
    print("Sample data from Northern Hemisphere:")
    print(northern_hemi_df.head())


Sample data from Northern Hemisphere:
   City_ID            City      Lat       Lng  Max Temp  Humidity  Cloudiness  \
0        0        thompson  55.7435  -97.8558     -3.91        93         100   
1        1          saipan  15.1355  145.7010     27.03        91          20   
6        6  island harbour  50.7240   -1.2758     12.79        66         100   
7        7           utrik  11.2278  169.8474     28.17        80          43   
8        8       jamestown  42.0970  -79.2353     10.57        83         100   

   Wind Speed Country        Date  
0        1.54      CA  1731337385  
1        0.89      MP  1731337374  
6        1.79      GB  1731337392  
7        7.81      MH  1731337393  
8        7.20      US  1731337394  


In [47]:
# Inspect `filtered_cities` before building the hotel table: its
# (rows, columns) shape, its first rows, and its column labels.
# NOTE(review): `filtered_cities` is not assigned in any cell visible above
# this one. Confirm it is defined earlier on a fresh Restart & Run All.
for summary in (filtered_cities.shape, filtered_cities.head(), filtered_cities.columns):
    print(summary)

# Keep only the columns used by the hotel search and the final map. The copy
# means later writes to `hotel_df` do not touch `filtered_cities`.
hotel_df = filtered_cities.loc[:, ['City', 'Country', 'Lat', 'Lng', 'Humidity']].copy()

# Add an empty column, "Hotel Name," 



(77, 10)
    City_ID               City      Lat       Lng  Max Temp  Humidity  \
32       32    arraial do cabo -22.9661  -42.0278     26.98        50   
53       53              crane  31.3974 -102.3501     15.69        41   
63       63           beinamar   8.6698   15.3813     33.50        22   
79       79  capilla del monte -30.8609  -64.5251     19.49        33   
83       83          iranshahr  27.2025   60.6848     28.19        18   

    Cloudiness  Wind Speed Country        Date  
32           0        7.72      BR  1731337423  
53           6        2.17      US  1731337446  
63           8        2.71      TD  1731337457  
79          54        1.34      AR  1731337475  
83           0        2.06      IR  1731337480  
Index(['City_ID', 'City', 'Lat', 'Lng', 'Max Temp', 'Humidity', 'Cloudiness',
       'Wind Speed', 'Country', 'Date'],
      dtype='object')


### Step 4: For each city, use the Geoapify API to find the first hotel located within 10,000 metres of your coordinates.

In [62]:
import requests
import pandas as pd

# Ensure that geoapify_key is correctly imported
from api_keys import geoapify_key  # Ensure that the geoapify_key is available in api_keys.py

# Geoapify Places endpoint. It is the same for every city, so it is defined
# once here instead of on every loop iteration.
base_url = "https://api.geoapify.com/v2/places"

# Search radius around each city, in metres (10 km)
radius = 10000

# Query parameters shared by every request. "filter" and "bias" depend on the
# city and are filled in inside the loop.
params = {
    "categories": "accommodation.hotel",  # restrict results to hotels
    "limit": 1,  # only the first result is read below, so request just one
    "apiKey": geoapify_key,
}

# Print a message to follow up the hotel search
print("Starting hotel search...")

# Look up one hotel per row of hotel_df and store its name in "Hotel Name"
for index, row in hotel_df.iterrows():
    latitude = row["Lat"]
    longitude = row["Lng"]

    # Print the coordinates for debugging
    print(f"Searching for hotels near: Latitude {latitude}, Longitude {longitude}")

    # Geoapify takes coordinates as longitude,latitude: restrict the search to
    # a circle around the city and rank results by distance from its centre.
    params["filter"] = f"circle:{longitude},{latitude},{radius}"
    params["bias"] = f"proximity:{longitude},{latitude}"

    # Make the API request and decode the JSON body
    response = requests.get(base_url, params=params)
    name_address = response.json()

    # Store the first hotel's name. A missing "features" key, an empty result
    # list, or a feature without a "name" property all fall back to the
    # placeholder text.
    try:
        hotel_df.loc[index, "Hotel Name"] = name_address["features"][0]["properties"]["name"]
    except (KeyError, IndexError):
        hotel_df.loc[index, "Hotel Name"] = "No hotel found"

    # Log the search result for this city
    print(f"{hotel_df.loc[index, 'City']} - nearest hotel: {hotel_df.loc[index, 'Hotel Name']}")

# Display the updated DataFrame with hotel names
hotel_df
    


Starting hotel search...
Searching for hotels near: Latitude -22.9661, Longitude -42.0278
arraial do cabo - nearest hotel: No hotel found
Searching for hotels near: Latitude 31.3974, Longitude -102.3501
crane - nearest hotel: No hotel found
Searching for hotels near: Latitude 8.6698, Longitude 15.3813
beinamar - nearest hotel: No hotel found
Searching for hotels near: Latitude -30.8609, Longitude -64.5251
capilla del monte - nearest hotel: Hospedaje Galicia
Searching for hotels near: Latitude 27.2025, Longitude 60.6848
iranshahr - nearest hotel: هتل قصِر
Searching for hotels near: Latitude 4.6167, Longitude -61.1333
santa elena de uairen - nearest hotel: Posada Villa Fairmont
Searching for hotels near: Latitude -26.4833, Longitude 17.15
bethanie - nearest hotel: No hotel found
Searching for hotels near: Latitude 22.6783, Longitude -3.9836
taoudenni - nearest hotel: No hotel found
Searching for hotels near: Latitude 38.4167, Longitude 77.2406
shache - nearest hotel: 莎车新盛宾馆
Searching for

Unnamed: 0,City,Country,Lat,Lng,Humidity,Hotel Name
32,arraial do cabo,BR,-22.9661,-42.0278,50,No hotel found
53,crane,US,31.3974,-102.3501,41,No hotel found
63,beinamar,TD,8.6698,15.3813,22,No hotel found
79,capilla del monte,AR,-30.8609,-64.5251,33,Hospedaje Galicia
83,iranshahr,IR,27.2025,60.6848,18,هتل قصِر
...,...,...,...,...,...,...
542,omoku,NG,5.3435,6.6532,33,Royal Fortress Hotels
553,iskenderun,TR,36.5872,36.1735,48,aykut palace
554,adrar,MR,20.5022,-10.0711,9,No hotel found
569,al faw,IQ,29.9776,48.4741,35,No hotel found


### Step 5: Add the hotel name and the country as additional information in the hover message for each city in the map.

In [65]:
%%capture --no-display
# Map the cities in `hotel_df`: marker size follows "Humidity", marker colour
# follows "City", and the hover tooltip also lists the hotel name and country.
#
# NOTE: `size_max` is intentionally not passed. It is not one of hvPlot's
# plotting options, so it never limited the marker size; use `scale` if the
# markers need to be resized.
Map_city = hotel_df.hvplot.points(
    x='Lng',            # longitude column
    y='Lat',            # latitude column
    size='Humidity',
    color='City',
    title="city_picture Map",
    geo=True,           # treat x/y as geographic coordinates
    tiles='OSM',        # OpenStreetMap background tiles
    colorbar=True,
    width=800,
    height=600,
    # Hover columns must match the DataFrame labels exactly: the hotel column
    # is "Hotel Name" (with a space), not "Hotel_Name".
    hover_cols=["Hotel Name", "Country"],
)
# Display the map
Map_city

