In [0]:
from pyspark.sql.functions import *

In [0]:
def csv_to_df(filename):
    """has one argument which expects a csv filename.
       This function loads the data in the file into 
       a dataframe and then displays the dataframe"""
    # File location and type
    file_location = "/FileStore/tables/" + filename
    file_type = "csv"
    # CSV options
    infer_schema = "true"
    first_row_is_header = "true"
    delimiter = ","
    # The applied options are for CSV files. For other file types, these will be ignored.
    df = spark.read.format(file_type) \
         .option("inferSchema", infer_schema) \
         .option("header", first_row_is_header) \
         .option("sep", delimiter) \
         .option("multiline","True") \
         .option("escape","\"") \
         .load(file_location)
    return df

In [0]:
df_1000_listings = csv_to_df("listings.csv")
display(df_1000_listings)

id,name,host_id,host_name,neighbourhood_group,neighbourhood,latitude,longitude,room_type,price,minimum_nights,number_of_reviews,last_review,reviews_per_month,calculated_host_listings_count,availability_365,number_of_reviews_ltm,license
5136,"Spacious Brooklyn Duplex, Patio + Garden",7378,Rebecca,Brooklyn,Sunset Park,40.66265,-73.99454,Entire home/apt,275,21,3,2022-08-10,0.03,1,267,1,
5203,Cozy Clean Guest Room - Family Apt,7490,MaryEllen,Manhattan,Upper West Side,40.8038,-73.96751,Private room,75,2,118,2017-07-21,0.73,1,0,0,
5121,BlissArtsSpace!,7356,Garon,Brooklyn,Bedford-Stuyvesant,40.68535,-73.95512,Private room,60,30,50,2019-12-02,0.3,2,322,0,
5178,Large Furnished Room Near B'way,8967,Shunichi,Manhattan,Midtown,40.76457,-73.98317,Private room,68,2,559,2022-11-20,3.38,1,79,50,
2595,Skylit Midtown Castle,2845,Jennifer,Manhattan,Midtown,40.75356,-73.98559,Entire home/apt,175,30,49,2022-06-21,0.31,3,365,1,
6872,Uptown Sanctuary w/ Private Bath (Month to Month),16104,Kae,Manhattan,East Harlem,40.80107,-73.94255,Private room,65,30,1,2022-06-05,0.16,2,300,1,
5803,"Lovely Room 1 in BEST AREA; Legal Rental, Spotless",9744,Laurie,Brooklyn,South Slope,40.66801,-73.98784,Private room,124,4,218,2022-10-10,1.31,3,163,14,
6848,Only 2 stops to Manhattan studio,15991,Allen & Irina,Brooklyn,Williamsburg,40.70935,-73.95342,Entire home/apt,68,30,187,2022-11-02,1.13,1,151,5,
7097,Perfect for Your Parents: Privacy + Garden,17571,Jane,Brooklyn,Fort Greene,40.691233,-73.972702,Entire home/apt,220,3,316,2022-10-29,2.01,2,38,36,
6990,UES Beautiful Blue Room,16800,Cyn,Manhattan,East Harlem,40.78778,-73.94759,Private room,62,30,242,2022-10-21,1.52,1,308,8,


In [0]:
from pyspark.sql.types import IntegerType
from pyspark.sql.functions import udf

@udf(returnType=IntegerType())
def summarize_sentiment(sum):
    x = 0
    if sum >= 1.75:
        return 2
    elif sum < 1.75 and sum >= 1.5:
        return 1
    else:
        return 0

In [0]:
df_1000_reviews = csv_to_df("labelled_reviews_v1.csv")
df_1000_reviews = df_1000_reviews.groupBy('listing_id').agg(mean("labelled_sentiment").alias("mean_prediction"))
df_1000_reviews = df_1000_reviews.withColumn('derived_summarize_sentiment', summarize_sentiment(df_1000_reviews['mean_prediction']))
df_1000_reviews = df_1000_reviews.drop("mean_prediction")
display(df_1000_reviews)

listing_id,derived_summarize_sentiment
34071682,2
1217318,2
46280898,2
51864768,2
43265776,1
36318290,2
38674685,2
34116613,1
20970822,2
49946969,2


In [0]:
df_50 = df_1000_listings.join(df_1000_reviews, df_1000_listings.id == df_1000_reviews.listing_id , "inner")

In [0]:
df_50 = df_50.withColumnRenamed("host_neighbourhood", "neighbourhood_group")
df_50 = df_50.select("id","price","neighbourhood_group","room_type","number_of_reviews","availability_365","derived_summarize_sentiment")
display(df_50)

id,price,neighbourhood_group,room_type,number_of_reviews,availability_365,derived_summarize_sentiment
1217318,90,Brooklyn,Private room,724,87,2
3798941,93,Brooklyn,Private room,723,63,2
6949526,163,Brooklyn,Entire home/apt,348,286,2
12171671,100,Manhattan,Private room,504,83,2
20970822,109,Brooklyn,Entire home/apt,578,272,2
22431770,482,Manhattan,Hotel room,569,357,2
24392338,166,Manhattan,Entire home/apt,518,216,2
25042316,136,Brooklyn,Entire home/apt,526,77,2
26743923,473,Manhattan,Hotel room,313,324,2
32284910,60,Queens,Private room,435,110,2


In [0]:
df_research_listings = csv_to_df("research_million_listing.csv")
display(df_research_listings)

id,listing_url,scrape_id,last_scraped,name,summary,space,description,experiences_offered,neighborhood_overview,notes,transit,access,interaction,house_rules,thumbnail_url,medium_url,picture_url,xl_picture_url,host_id,host_url,host_name,host_since,host_location,host_about,host_response_time,host_response_rate,host_acceptance_rate,host_is_superhost,host_thumbnail_url,host_picture_url,host_neighbourhood,host_listings_count,host_total_listings_count,host_verifications,host_has_profile_pic,host_identity_verified,street,neighbourhood,neighbourhood_cleansed,neighbourhood_group_cleansed,city,state,zipcode,market,smart_location,country_code,country,latitude,longitude,is_location_exact,property_type,room_type,accommodates,bathrooms,bedrooms,beds,bed_type,amenities,square_feet,price,weekly_price,monthly_price,security_deposit,cleaning_fee,guests_included,extra_people,minimum_nights,maximum_nights,calendar_updated,has_availability,availability_30,availability_60,availability_90,availability_365,calendar_last_scraped,number_of_reviews,first_review,last_review,review_scores_rating,review_scores_accuracy,review_scores_cleanliness,review_scores_checkin,review_scores_communication,review_scores_location,review_scores_value,requires_license,license,jurisdiction_names,instant_bookable,is_business_travel_ready,cancellation_policy,require_guest_profile_picture,require_guest_phone_verification,calculated_host_listings_count,reviews_per_month
2515,https://www.airbnb.com/rooms/2515,20180908060534,2018-09-08,Stay at Chez Chic budget room #1,Step into our artistic spacious apartment and enjoy your artistic Guest room with original artwork from NY artists. Shared with my little family however we often out and you won't see us much. across the street from Central Park - the busy city minutes away but sleeping in quiet at night!,"-PLEASE BOOK DIRECTLY. NO NEED TO SEND A REQUEST FOR DATES CALENDAR IS UP TO DATE ALL AIRBNB RESERVATIONS WILL BE HONORED Nice, comfortable, and clean private guest room with shared bathroom (2 people max) - full size bed. In very nice apartment on central Park North 4th floor walk-up. same place as Chez chic #2, max capacity of the rooms 2 people). You will share the apt with me and my little family. Daily cleaning in common areas. Located one block from Subway 2/3,B/C on 110th street, Bus M1,2,3,4 at the corner, central park across the street. Your room: full size bed (sleeps two), desk, Digital Tv/DVD, wifi internet, A/C, closet and desk. Sheets/Towels provided. Iron/air dryer provided. Separate Full bathroom shared with guestroom room #2. Access to the Kitchen from 8AM weekdays or anytime during the weekend and light cooking, access to kitchen at all times but no cooking in the evening. The apartment: spacious newly renovated, hardwood floors,3BD, 2Bath apartment with Living room","Step into our artistic spacious apartment and enjoy your artistic Guest room with original artwork from NY artists. Shared with my little family however we often out and you won't see us much. across the street from Central Park - the busy city minutes away but sleeping in quiet at night! -PLEASE BOOK DIRECTLY. NO NEED TO SEND A REQUEST FOR DATES CALENDAR IS UP TO DATE ALL AIRBNB RESERVATIONS WILL BE HONORED Nice, comfortable, and clean private guest room with shared bathroom (2 people max) - full size bed. In very nice apartment on central Park North 4th floor walk-up. same place as Chez chic #2, max capacity of the rooms 2 people). You will share the apt with me and my little family. Daily cleaning in common areas. Located one block from Subway 2/3,B/C on 110th street, Bus M1,2,3,4 at the corner, central park across the street. Your room: full size bed (sleeps two), desk, Digital Tv/DVD, wifi internet, A/C, closet and desk. Sheets/Towels provided. Iron/air dryer provided. Separate F",none,,Please no cooking at night but you can warm up food in the microwave and use the kitchen,Subway 2.3.B.C. at 110th street around the corner and bus M.2.3.4 at the corner,"Guests will have their PRIVATE BATHROOM (NOTE: Shared between June 22-Aug 22) (shared with 2nd guestroom if there are guests), and the kitchen","We will have a list of Harlem restaurants and points of interest ready for you, as well as a subway map of NYC and pratical infos.",no-smoking/please take off your shoes: cleaning fees $40,,,https://a0.muscache.com/im/pictures/d0489e42-4333-4360-911f-413d503fe146.jpg?aki_policy=large,,2758,https://www.airbnb.com/users/show/2758,Steph,2008-09-06,"New York, New York, United States",loves to host and welcome travelers from around the world in our family Apt.,within a few hours,93%,,f,https://a0.muscache.com/im/users/2758/profile_pic/1338267836/original.jpg?aki_policy=profile_small,https://a0.muscache.com/im/users/2758/profile_pic/1338267836/original.jpg?aki_policy=profile_x_medium,Harlem,3,3,"['email', 'phone', 'facebook', 'reviews', 'jumio', 'offline_government_id', 'government_id']",t,t,"New York, NY, United States",Harlem,Harlem,Manhattan,New York,NY,10026,New York,"New York, NY",US,United States,40.79920479936168,-73.95367574543542,t,Apartment,Private room,3,1.0,1.0,2,Real Bed,"{TV,""Cable TV"",Internet,Wifi,""Air conditioning"",Kitchen,""Free street parking"",""Buzzer/wireless intercom"",Heating,""Family/kid friendly"",""Smoke detector"",""Carbon monoxide detector"",""Fire extinguisher"",Essentials,Shampoo,""Lock on bedroom door"",Hangers,""Hair dryer"",Iron,""Laptop friendly workspace"",""Children’s books and toys"",""Window guards"",""Pack ’n Play/travel crib"",""Hot water"",Microwave,""Coffee maker"",Refrigerator,""Dishes and silverware"",""Cooking basics"",Oven,Stove,""Host greets you""}",,$59.00,$720.00,"$1,690.00",$0.00,$60.00,2,$39.00,2,21,4 days ago,t,6,26,52,317,2018-09-08,170,2008-10-13,2018-07-05,93.0,9.0,9.0,10.0,9.0,9.0,9.0,f,,,f,f,strict_14_with_grace_period,f,f,3,1.41
2539,https://www.airbnb.com/rooms/2539,20180908060534,2018-09-08,Clean & quiet apt home by the park,Renovated apt home in elevator building.,"Spacious, renovated, and clean apt home, one block to F train, 25 minutes to lower Manhatten","Renovated apt home in elevator building. Spacious, renovated, and clean apt home, one block to F train, 25 minutes to lower Manhatten Close to Prospect Park and Historic Ditmas Park Very close to F and G trains and Express bus into NY. The B and Q are closeby also. If this room is unavailable on your desired dates, check out our other rooms, such as: https://www.airbnb.com/rooms/10267242",none,Close to Prospect Park and Historic Ditmas Park,"If this room is unavailable on your desired dates, check out our other rooms, such as: https://www.airbnb.com/rooms/10267242",Very close to F and G trains and Express bus into NY. The B and Q are closeby also.,,,"-The security and comfort of all our guests is important to us! Therefore, no one is permitted to check in without first emailing or texting a clear picture ID, acceptable to manager. Instructions will be provided in the house manual. -No eating, drinking or storage of food in the room. -No smoking. -Illicit drug use is strictly forbidden. -Quiet hours after 10pm and before 8am, This is respectful for our neighbors and other guests. -Please clean up after yourself when using the kitchen and bath. -Please lock the doors and close the windows when exiting the home. -Please indicate and pay for the correct number of guests. Failure to do so will cancel your reservation with no refund due. -Please remove your shoes when entering the apt home. Thanks for choosing our home!",,,https://a0.muscache.com/im/pictures/3949d073-a02e-4ebc-aa9c-ac74f00eaa1f.jpg?aki_policy=large,,2787,https://www.airbnb.com/users/show/2787,John,2008-09-07,"New York, New York, United States","Educated professional living in Brooklyn. I love meeting new people, running, hiking, fine foods, traveling, etc. One of my favorite trips was spending New Year's Eve in London on the Thames River. Big Ben, spectacular fireworks and light show; and fun times with a good crowd of international tourists. A most memorable night and trip! Also, I generally approach life with a positive attitude. I look forward to meeting you.",within an hour,100%,,t,https://a0.muscache.com/im/pictures/8674565a-758d-476b-a580-4d99ea9baab9.jpg?aki_policy=profile_small,https://a0.muscache.com/im/pictures/8674565a-758d-476b-a580-4d99ea9baab9.jpg?aki_policy=profile_x_medium,Gravesend,8,8,"['email', 'phone', 'reviews', 'kba']",t,t,"Brooklyn , NY, United States",Kensington,Kensington,Brooklyn,Brooklyn,NY,11218,New York,"Brooklyn , NY",US,United States,40.64748608166989,-73.97236954007958,f,Apartment,Private room,4,1.0,1.0,3,Real Bed,"{TV,""Cable TV"",Internet,""Wheelchair accessible"",Kitchen,""Free parking on premises"",Breakfast,Elevator,""Free street parking"",""Buzzer/wireless intercom"",Heating,""Suitable for events"",Washer,Dryer,""Smoke detector"",""Carbon monoxide detector"",""First aid kit"",""Safety card"",""Fire extinguisher"",Essentials,Shampoo,""24-hour check-in"",Hangers,""Hair dryer"",Iron,""Laptop friendly workspace"",""translation missing: en.hosting_amenity_49"",""translation missing: en.hosting_amenity_50"",""Self check-in"",Keypad,""Outlet covers"",""Hot water"",""Bed linens"",""Extra pillows and blankets"",Microwave,""Coffee maker"",Refrigerator,""Dishes and silverware"",""Cooking basics"",Oven,Stove,""Luggage dropoff allowed"",""Long term stays allowed"",""Cleaning before checkout""}",,$149.00,$299.00,$999.00,$100.00,$25.00,1,$25.00,1,730,yesterday,t,30,60,90,365,2018-09-08,8,2015-12-04,2018-07-17,98.0,10.0,10.0,10.0,10.0,10.0,10.0,f,,,f,f,moderate,f,f,8,0.24
2595,https://www.airbnb.com/rooms/2595,20180908060534,2018-09-08,Skylit Midtown Castle,"Find your romantic getaway to this beautiful, spacious skylit studio in the heart of Midtown, Manhattan. STUNNING SKYLIT STUDIO / 1 BED + SINGLE / FULL BATH / FULL KITCHEN / FIREPLACE / CENTRALLY LOCATED / WiFi + APPLE TV / SHEETS + TOWELS","- Spacious (500+ft²), immaculate and nicely furnished & designed studio. - Tuck yourself into the ultra comfortable bed under the skylight. Fall in love with a myriad of bright lights in the city night sky. - Single-sized bed/convertible floor mattress with luxury bedding (available upon request). - Gorgeous pyramid skylight with amazing diffused natural light, stunning architectural details, soaring high vaulted ceilings, exposed brick, wood burning fireplace, floor seating area with natural zafu cushions, modern style mixed with eclectic art & antique treasures, large full bath, newly renovated kitchen, air conditioning/heat, high speed WiFi Internet, and Apple TV. - Centrally located in the heart of Midtown Manhattan just a few blocks from all subway connections in the very desirable Midtown location a few minutes walk to Times Square, the Theater District, Bryant Park and Herald Square. - The Midtown Castle is a uniquely charming Dutch Colonial survivor from the 1890s. - This is","Find your romantic getaway to this beautiful, spacious skylit studio in the heart of Midtown, Manhattan. STUNNING SKYLIT STUDIO / 1 BED + SINGLE / FULL BATH / FULL KITCHEN / FIREPLACE / CENTRALLY LOCATED / WiFi + APPLE TV / SHEETS + TOWELS - Spacious (500+ft²), immaculate and nicely furnished & designed studio. - Tuck yourself into the ultra comfortable bed under the skylight. Fall in love with a myriad of bright lights in the city night sky. - Single-sized bed/convertible floor mattress with luxury bedding (available upon request). - Gorgeous pyramid skylight with amazing diffused natural light, stunning architectural details, soaring high vaulted ceilings, exposed brick, wood burning fireplace, floor seating area with natural zafu cushions, modern style mixed with eclectic art & antique treasures, large full bath, newly renovated kitchen, air conditioning/heat, high speed WiFi Internet, and Apple TV. - Centrally located in the heart of Midtown Manhattan just a few blocks from all s",none,"Centrally located in the heart of Manhattan just a few blocks from all subway connections in the very desirable Midtown location a few minutes walk to Times Square, the Theater District, Bryant Park and Herald Square.",,"Apartment is located on 37th Street between 5th & 6th Avenue, just a few blocks from all subway connections. Closest Subways (in order of proximity to apartment (Website hidden by Airbnb) W: 34th Street & 6th Avenu (Website hidden by Airbnb) 3: 34th Street & 7th Avenue 7: 42nd & 5th Avenu (Website hidden by Airbnb) S: 42nd Street between Park & Lexington Avenue (Website hidden by Airbnb) E: 34th Street and 8th Avenue If coming by car, there is a parking garage on the block and free street parking.","Guests have full access to the kitchen, bathroom and living spaces. The closets are private/off limits.","I am a Sound Therapy Practitioner and Kundalini Yoga & Meditation teacher. I work with energy and sound for relaxation and healing, using Symphonic gong, singing bowls, tuning forks, drums, voice and other instruments. Sound relaxation sessions and/or personalized Kundalini Yoga sessions are available in the space upon request. Individual, couples or group sessions available. Licensed acupuncture and massage also available upon request. Please inquire. I welcome my guests at the apartment for check-in, or alternatively, a self check-in can be arranged. Once you are settled in, I am just a phone call, text or email away, should you have any questions, concerns or issues during your stay. My desire is that you have a smooth arrival and amazing stay here.","Make yourself at home, respect the space and the neighbors. No pets, no smoking and no unauthorized guests.",,,https://a0.muscache.com/im/pictures/f028bdf9-eaa3-4ce0-b441-e9f18df4709b.jpg?aki_policy=large,,2845,https://www.airbnb.com/users/show/2845,Jennifer,2008-09-09,"New York, New York, United States","A New Yorker since 2000! My passion is creating beautiful, unique spaces where unforgettable memories are made. It's my pleasure to host people from around the world and meet new faces. Welcome travelers! I am a Sound Therapy Practitioner and Kundalini Yoga & Meditation teacher. I work with energy and sound for relaxation and healing, using Symphonic gong, singing bowls, tuning forks, drums, voice and other instruments.",within a day,79%,,f,https://a0.muscache.com/im/users/2845/profile_pic/1259095067/original.jpg?aki_policy=profile_small,https://a0.muscache.com/im/users/2845/profile_pic/1259095067/original.jpg?aki_policy=profile_x_medium,Midtown,5,5,"['email', 'phone', 'reviews', 'kba', 'work_email']",t,t,"New York, NY, United States",Midtown,Midtown,Manhattan,New York,NY,10018,New York,"New York, NY",US,United States,40.75362072657246,-73.98377381114605,f,Apartment,Entire home/apt,2,1.0,0.0,1,Real Bed,"{TV,Wifi,""Air conditioning"",Kitchen,""Paid parking off premises"",""Free street parking"",""Indoor fireplace"",Heating,""Family/kid friendly"",""Smoke detector"",""Carbon monoxide detector"",""Fire extinguisher"",Essentials,Shampoo,""Lock on bedroom door"",Hangers,""Hair dryer"",Iron,""Laptop friendly workspace"",""Self check-in"",Keypad,""Private living room"",Bathtub,""Hot water"",""Bed linens"",""Extra pillows and blankets"",""Ethernet connection"",""Coffee maker"",Refrigerator,""Dishes and silverware"",""Cooking basics"",Oven,Stove,""Luggage dropoff allowed"",""Long term stays allowed"",""Cleaning before checkout""}",,$225.00,"$1,995.00",,$350.00,$100.00,2,$0.00,1,1125,today,t,16,46,76,341,2018-09-08,34,2009-11-21,2018-06-29,94.0,9.0,9.0,9.0,10.0,10.0,9.0,f,,,f,f,strict_14_with_grace_period,t,t,2,0.32
3330,https://www.airbnb.com/rooms/3330,20180908060534,2018-09-08,++ Brooklyn Penthouse Guestroom ++,"This is a spacious, clean, furnished master bedroom with PRIVATE bathroom and rooftop deck in one of Brooklyn's most vibrant neighborhoods, our beloved, East Williamsburg! Stay as the locals do and share our 3 bedroom, 2-story apartment! See u soon!","Room Features: - clean, hardwood floors - 2 large windows with sliding glass doors providing access to private rooftop deck - clean private bathroom with tub - comfy, cozy, queen sized bed with fresh sheets - full length mirror - dresser - hangers for clothes - fresh bath towels included with stay Apartment Features: - open living room with lots of natural light - basic cable/Netflix/ HBO Go on TV - high ceilings - dishwasher/microwave/gas stove - pots and pans for cooking / dishes & utensils - 2 quiet, working roommates (lovely ladies in their early 30s) Building: - 4 story - elevator - laundry facility in basement - 1 block from Montrose Ave stop on L train - friendly neighbors Ideal For: - someone on vacation looking for a great deal - someone in transition, moving, or exploring williamsburg - someone who wants hotel comfort, but not hotel rates - someone who is clean and will not smoke/do drugs in the apartment - someone who prefers to stay at least a week - couples welcome! no","This is a spacious, clean, furnished master bedroom with PRIVATE bathroom and rooftop deck in one of Brooklyn's most vibrant neighborhoods, our beloved, East Williamsburg! Stay as the locals do and share our 3 bedroom, 2-story apartment! See u soon! Room Features: - clean, hardwood floors - 2 large windows with sliding glass doors providing access to private rooftop deck - clean private bathroom with tub - comfy, cozy, queen sized bed with fresh sheets - full length mirror - dresser - hangers for clothes - fresh bath towels included with stay Apartment Features: - open living room with lots of natural light - basic cable/Netflix/ HBO Go on TV - high ceilings - dishwasher/microwave/gas stove - pots and pans for cooking / dishes & utensils - 2 quiet, working roommates (lovely ladies in their early 30s) Building: - 4 story - elevator - laundry facility in basement - 1 block from Montrose Ave stop on L train - friendly neighbors Ideal For: - someone on vacation looking for a great deal",none,"Location is GREAT!! Right off the L train in the best neighborhood in the five boroughs: Williamsburg (recognized as one of the best neighborhoods in New York City by TimeOut Magazine New York) You will be walking distance to all the best bars, restaurants and music venues in Brooklyn. Several Supermarkets and bodegas are all within short walking distance.",We would very much appreciate it if you give us details as to when you will get into Brooklyn as soon as possible after you book the place so we can plan accordingly to get you your key without any delay.,"You will be STEPS AWAY FROM THE L TRAIN. Hop on the L and get in to Manhattan in ten minutes. 15 minutes to the the East Village, Union Square, and Greenwich Village. You can also get to all the great NYC sites like the Empire State Building, Times Square, and the Statue of Liberty on this train right outside your front door. Our place is short walking distance to the J, M, Z trains at Union/Broadway as well as several bus routes. Free parking on the street, just pay attention to the signs!","The apartment is equipped with full kitchen (microwave oven, stove, toaster oven, pots, pans, etc.) and refrigerator for your use, large bathroom, a comfortable separate dining room, living room, and a private rooftop deck!","I will likely not be around as my room (Penthouse Guestroom) is typically only available when I am away. However, I am always reachable via text/email.",Guests should be respectful of the home and the neighbors. Love thy neighbor :),,,https://a0.muscache.com/im/pictures/41842659/5dd0ed5c_original.jpg?aki_policy=large,,4177,https://www.airbnb.com/users/show/4177,Jbee,2008-11-09,"New York, New York, United States",From Brooklyn with love.,within a day,100%,,f,https://a0.muscache.com/im/pictures/91fc9357-9073-4f37-bf88-e52dce0c3bcb.jpg?aki_policy=profile_small,https://a0.muscache.com/im/pictures/91fc9357-9073-4f37-bf88-e52dce0c3bcb.jpg?aki_policy=profile_x_medium,East Williamsburg,5,5,"['email', 'phone', 'reviews', 'kba']",t,t,"Brooklyn, NY, United States",Williamsburg,Williamsburg,Brooklyn,Brooklyn,NY,11206,New York,"Brooklyn, NY",US,United States,40.70855778333159,-73.94236227640226,t,Apartment,Private room,2,1.0,1.0,1,Real Bed,"{TV,Internet,Wifi,""Wheelchair accessible"",Kitchen,""Pets live on this property"",Elevator,""Free street parking"",""Buzzer/wireless intercom"",Heating,Washer,Dryer,""Smoke detector"",""Carbon monoxide detector"",Essentials,Shampoo,""Lock on bedroom door"",Hangers,""Hair dryer"",""Laptop friendly workspace"",""translation missing: en.hosting_amenity_49"",""translation missing: en.hosting_amenity_50"",""Hot water"",""Long term stays allowed"",Other}",,$70.00,$650.00,"$1,900.00",$150.00,$125.00,2,$50.00,5,730,6 days ago,t,7,14,40,298,2018-09-08,33,2010-01-04,2018-06-15,97.0,10.0,10.0,10.0,10.0,10.0,10.0,f,,,f,f,strict_14_with_grace_period,f,f,3,0.31
3647,https://www.airbnb.com/rooms/3647,20180908060534,2018-09-08,THE VILLAGE OF HARLEM....NEW YORK !,,WELCOME TO OUR INTERNATIONAL URBAN COMMUNITY This Spacious 1 bedroom is with Plenty of Windows with a View....... Sleeps.....Four Adults.....two in the Livingrm. with (2) Sofa-beds. (Website hidden by Airbnb) two in the Bedrm.on a very Comfortable Queen Size Bed... A Complete Bathrm.....With Shower and Bathtub....... Fully Equipped with Linens & Towels........ Spacious Living Room......Flat ScreenTelevision.....DVD Player with Movies available for your viewing during your stay............................................................................. Dining Area.....for Morning Coffee or Tea..................................................... The Kitchen Area is Modern with Granite Counter Top... includes the use of a Coffee Maker...Microwave to Heat up a Carry Out/In Meal.... Not suited for a Gourmet Cook...or Top Chef......Sorry!!!! . This Flat is located in HISTORIC HARLEM.... near the Appollo Theater and The Museum Mile...on Fifth Avenue. Sylvia's World Famous Resturant...loca,WELCOME TO OUR INTERNATIONAL URBAN COMMUNITY This Spacious 1 bedroom is with Plenty of Windows with a View....... Sleeps.....Four Adults.....two in the Livingrm. with (2) Sofa-beds. (Website hidden by Airbnb) two in the Bedrm.on a very Comfortable Queen Size Bed... A Complete Bathrm.....With Shower and Bathtub....... Fully Equipped with Linens & Towels........ Spacious Living Room......Flat ScreenTelevision.....DVD Player with Movies available for your viewing during your stay............................................................................. Dining Area.....for Morning Coffee or Tea..................................................... The Kitchen Area is Modern with Granite Counter Top... includes the use of a Coffee Maker...Microwave to Heat up a Carry Out/In Meal.... Not suited for a Gourmet Cook...or Top Chef......Sorry!!!! . This Flat is located in HISTORIC HARLEM.... near the Appollo Theater and The Museum Mile...on Fifth Avenue. Sylvia's World Famous Resturant...loca,none,,,,,,Upon arrival please have a legibile copy of your Passport and / or State Photo. ID. as well as your confirmation letter. Please NO SMOKING ...LOUD TALKING or PARTIES of any kind. Security Deposit and Cleaning Fees in CASH at time of arrival. Security deposit will be refunded within 72hrs pending no damages. .Cleaning fees are non-refundable. At Check Out... Please dispose of all trash/garbage in the bins located outside behind the entrance stairs. Please place all dirty linens and towels in the dirty laundry bin. Please don't leave any dishes in the sink and dispose of all Plastic Dishes/Plastic Culinary. If you need a late check-out please contact the Emergency Contact Telephone Numbers that are listed in the Flat. PLEASE LEAVE ALL KEYS IN THE FLAT and BE CERTAIN THE DOORS ARE LOCKED. WE HOPE YOU ENJOYED YOUR STAY and will write positve comments and will visit again.,,,https://a0.muscache.com/im/pictures/838341/9b3c66f3_original.jpg?aki_policy=large,,4632,https://www.airbnb.com/users/show/4632,Elisabeth,2008-11-25,"New York, New York, United States","Make Up Artist National/ (Website hidden by Airbnb) Production. I m curently working with a Production Company in WDC and Coordinated a ""Day Of Service "" for the Presidential Innaugration 2013. I can't live without Starbucks and Oprah's Chai Tea Latte...and my circle of of great friends world wide. ""BLESS ME INTO USEFULLNESS"" is my daily prayer. I",,,,f,https://a0.muscache.com/im/users/4632/profile_pic/1328402497/original.jpg?aki_policy=profile_small,https://a0.muscache.com/im/users/4632/profile_pic/1328402497/original.jpg?aki_policy=profile_x_medium,Harlem,1,1,"['email', 'phone', 'google', 'reviews', 'jumio', 'government_id']",t,t,"New York, NY, United States",Harlem,Harlem,Manhattan,New York,NY,10027,New York,"New York, NY",US,United States,40.809017849055714,-73.94190208041947,t,Apartment,Private room,2,1.0,1.0,1,Pull-out Sofa,"{""Cable TV"",Internet,Wifi,""Air conditioning"",Kitchen,""Buzzer/wireless intercom"",Heating,""Smoke detector"",""Carbon monoxide detector"",""translation missing: en.hosting_amenity_49"",""translation missing: en.hosting_amenity_50""}",,$150.00,,,$200.00,$75.00,2,$20.00,3,7,24 months ago,t,30,60,90,365,2018-09-08,0,,,,,,,,,,f,,,f,f,strict_14_with_grace_period,t,t,1,
3831,https://www.airbnb.com/rooms/3831,20180908060534,2018-09-08,Cozy Entire Floor of Brownstone,"Urban retreat: enjoy 500 s.f. floor in 1899 brownstone, with new flooring throughout (completed Aug. 2015 through Sept. 2015), roomy bdrm, & upgraded kitchen & bathroom (completed Oct. 2015). It's sunny and loaded with everything you need!","Greetings! We own a double-duplex brownstone in Clinton Hill on Gates near Classon Avenue - (7 blocks to C train, 5 blocks to G train, minutes to all), in which we host on the entire top floor of the upper duplex. This is more of an efficiency set-up: it is the top floor on a two-family, double duplex brownstone, the top floor for our guests consists of a sizable bedroom, full bath and eat-in kitchen for your exclusive use. Our family occupies the floors below. You go through a common hallway and staircase, to get to the top floor (2 easy flights up from the main entrance), but not through any rooms, so it is a fairly private set-up. - Clinton Hill, Gates Avenue near Classon Ave. (1 mi. or less to Williamsburg, Park Slope, Prospect Heights, downtown, Ft. Greene, Bed-Stuy, Bushwick; 20 mins to Manhattan) - includes FiOS, heat (or A/C), hot water, and electricity all included - furnished with two twin beds (convertible into a king bed), one rollaway twin bed and one inflatable m","Urban retreat: enjoy 500 s.f. floor in 1899 brownstone, with new flooring throughout (completed Aug. 2015 through Sept. 2015), roomy bdrm, & upgraded kitchen & bathroom (completed Oct. 2015). It's sunny and loaded with everything you need! Greetings! We own a double-duplex brownstone in Clinton Hill on Gates near Classon Avenue - (7 blocks to C train, 5 blocks to G train, minutes to all), in which we host on the entire top floor of the upper duplex. This is more of an efficiency set-up: it is the top floor on a two-family, double duplex brownstone, the top floor for our guests consists of a sizable bedroom, full bath and eat-in kitchen for your exclusive use. Our family occupies the floors below. You go through a common hallway and staircase, to get to the top floor (2 easy flights up from the main entrance), but not through any rooms, so it is a fairly private set-up. - Clinton Hill, Gates Avenue near Classon Ave. (1 mi. or less to Williamsburg, Park Slope, Prospect Heights,",none,Just the right mix of urban center and local neighborhood; close to all but enough quiet for a calming walk.,"My husband, Tivon, is NYC-licensed For-Hire-Vehicle driver with a luxury SUV available to/from all NYC airports and other destinations. Free birthday cake for guests staying with us during their birthday - send me flavor request and picture that you would like on the cake!","B52 bus for a 10-minute ride to downtown Brooklyn is a few yards away on the corner; G train/Classon Avenue is 5 blocks away; C train is about 6 blocks to either the Clinton/Washington stop or Franklin Avenue stop. There is on-street parking, alternate side is twice per week on the immediate block but only once per week on Classon. From LaGuardia Airport, a taxi will cost $30-$35, but there is also a bus that will put you at the Jackson Heights subway station, and from there it's about 5 stops to catch the G train, which stops 5 blocks away. From JFK, the taxi is closer to $40, but the AirTran can get you conveniently to the A/C line and the C train is about 6 blocks from here. From JFK via subway/metro/train: From JFK take the AirTrain to Howard Beach to catch the A train toward Brooklyn/Manhattan. Take the A train to Utica Avenue and go across that same platform to catch the C local train (you could also transfer at Nostrand but you would have to carry luggage downstairs to cat","You will have exclusive use of and access to: a sizable private room as described in ""The Space"" section, furnished with two twin beds (which we will combine into one king bed upon request) and optional rollaway twin and/or inflatable beds, and other small furnishings; full private bath and private eat-in kitchen both renovated in Fall 2015; sizable dining table in sun-filled kitchen area doubles as a great desk space; alcove perfect for vertical bike storage (2 Racor B-1R Solo Vertical Bike Rack hooks) Upon request you may also have some use of the livingroom on the floor just below.","We'll be around, but since you have the top floor to yourself, most of the interaction is on the way in or out - we're open to socializing and did so frequently with our last long-term guests, so it's really up to you",Smoking - outside please; pets allowed but please contact me first for arrangements,,,https://a0.muscache.com/im/pictures/e49999c2-9fd5-4ad5-b7cc-224deac989aa.jpg?aki_policy=large,,4869,https://www.airbnb.com/users/show/4869,LisaRoxanne,2008-12-07,"New York, New York, United States",Laid-back bi-coastal actor/professor/attorney.,within an hour,100%,,f,https://a0.muscache.com/im/users/4869/profile_pic/1371927771/original.jpg?aki_policy=profile_small,https://a0.muscache.com/im/users/4869/profile_pic/1371927771/original.jpg?aki_policy=profile_x_medium,Clinton Hill,1,1,"['email', 'phone', 'reviews', 'kba', 'work_email']",t,t,"Brooklyn, NY, United States",Clinton Hill,Clinton Hill,Brooklyn,Brooklyn,NY,11238,New York,"Brooklyn, NY",US,United States,40.68513770564301,-73.95975749881096,t,Guest suite,Entire home/apt,3,1.0,1.0,3,Real Bed,"{TV,""Cable TV"",Internet,Wifi,""Air conditioning"",Kitchen,""Pets allowed"",""Free street parking"",Heating,""Family/kid friendly"",""Smoke detector"",""Carbon monoxide detector"",""Fire extinguisher"",Essentials,Shampoo,""Lock on bedroom door"",""24-hour check-in"",Hangers,""Hair dryer"",Iron,""Laptop friendly workspace"",""Self check-in"",Lockbox,Bathtub,""High chair"",""Stair gates"",""Children’s books and toys"",""Pack ’n Play/travel crib"",""Hot water"",""Luggage dropoff allowed"",""Long term stays allowed""}",500.0,$89.00,$575.00,"$2,100.00",$500.00,,1,$0.00,1,730,today,t,0,0,2,182,2018-09-08,211,2014-09-30,2018-08-31,91.0,9.0,9.0,10.0,10.0,9.0,9.0,f,,,f,f,moderate,f,f,1,4.4
4484,https://www.airbnb.com/rooms/4484,20180908060534,2018-09-08,DowntownRoom,"My place is close to Katz's Delicatessen, State of New York- East River State Park, restaurants, bars, everything you want in downtown Manhattan.. You’ll love my place because of the location and the neighborhood. My place is good for couples, solo adventurers, and business travelers.","Rent the second bedroom in my cozy, friendly apartment. With wood floors, quality mattress, comfortable duvet, TV. The apt is on 4th St. between Aves. C & D, a quiet block of a vibrant, interesting neighborhood full of bars, restaurants, gardens, parks, theaters, and performance spaces --including around the corner, the famous Nuyorican Poets Cafe. In walking distance to West Village, Soho, Lower East Side. Looking forward to hosting you!","My place is close to Katz's Delicatessen, State of New York- East River State Park, restaurants, bars, everything you want in downtown Manhattan.. You’ll love my place because of the location and the neighborhood. My place is good for couples, solo adventurers, and business travelers. Rent the second bedroom in my cozy, friendly apartment. With wood floors, quality mattress, comfortable duvet, TV. The apt is on 4th St. between Aves. C & D, a quiet block of a vibrant, interesting neighborhood full of bars, restaurants, gardens, parks, theaters, and performance spaces --including around the corner, the famous Nuyorican Poets Cafe. In walking distance to West Village, Soho, Lower East Side. Looking forward to hosting you!",none,,,,,,- Please take off your shoes at the door and keep reasonably quiet after 10pm. - No smoking or drugs.,,,https://a0.muscache.com/im/pictures/f7be821c-e2a0-4c8f-b329-1bc0a075d05c.jpg?aki_policy=large,,5688,https://www.airbnb.com/users/show/5688,Robin,2008-12-28,"New York, New York, United States","I am a journalist who loves travel, music, art, and politics. I also love New York, where I've been living for about 10 years, and I love to show it off to visitors. Looking forward to hosting your next trip to NYC!",a few days or more,33%,,f,https://a0.muscache.com/im/users/5688/profile_pic/1259097412/original.jpg?aki_policy=profile_small,https://a0.muscache.com/im/users/5688/profile_pic/1259097412/original.jpg?aki_policy=profile_x_medium,Alphabet City,1,1,"['email', 'phone', 'reviews', 'kba']",t,t,"New York, NY, United States",Alphabet City,East Village,Manhattan,New York,NY,10009,New York,"New York, NY",US,United States,40.72066466596736,-73.9798430342775,t,Apartment,Entire home/apt,2,1.0,2.0,2,Real Bed,"{Internet,Wifi,Kitchen,Breakfast,Heating,""Smoke detector"",""Carbon monoxide detector"",""Safety card"",Essentials}",,$85.00,,,$150.00,$20.00,2,$20.00,1,730,6 months ago,t,0,0,0,62,2018-09-08,3,2018-03-22,2018-03-31,100.0,10.0,10.0,9.0,10.0,9.0,10.0,f,,,f,f,moderate,f,f,1,0.53
5022,https://www.airbnb.com/rooms/5022,20180908060534,2018-09-08,Entire Apt: Spacious Studio/Loft by central park,,"Loft apartment with high ceiling and wood flooring located 10 minutes away from Central Park in Harlem - 1 block away from 6 train and 3 blocks from 2 & 3 line. This is in a recently renovated building which includes elevator, trash shoot. marble entrance and laundromat in the basement. The apartment is a spacious loft studio. The seating area and sleeping area is divided by a bookcase. There is a long hallway entrance where the bathroom and closet for your clothes is situated. The apartment is in mint condition, the walls have been freshly painted a few months ago. Supermarket, and 24 hour convenience store less than 1 block away. 1 block away from Hot Yoga Studio and NY Sports club facility. Perfect for anyone wanting to stay in Manhattan but get more space. 10 minutes away from midtown and 15 minutes away from downtown. The neighborhood is lively and diverse. You will need to travel at least 10 blocks to find cafe's, restaurants etc.. There are a few restaurants on 100 street on","Loft apartment with high ceiling and wood flooring located 10 minutes away from Central Park in Harlem - 1 block away from 6 train and 3 blocks from 2 & 3 line. This is in a recently renovated building which includes elevator, trash shoot. marble entrance and laundromat in the basement. The apartment is a spacious loft studio. The seating area and sleeping area is divided by a bookcase. There is a long hallway entrance where the bathroom and closet for your clothes is situated. The apartment is in mint condition, the walls have been freshly painted a few months ago. Supermarket, and 24 hour convenience store less than 1 block away. 1 block away from Hot Yoga Studio and NY Sports club facility. Perfect for anyone wanting to stay in Manhattan but get more space. 10 minutes away from midtown and 15 minutes away from downtown. The neighborhood is lively and diverse. You will need to travel at least 10 blocks to find cafe's, restaurants etc.. There are a few restaurants on 100 street on",none,,,,,,Please be considerate when staying in the apartment. This is a low key building and it's important guest are respectful. You can come and go as you please I just ask that you keep a low profile. 1) Please be respectful of neighbors - no loud music after 10pm and keep a low profile 2) Do not open the door for anyone 3) Please keep the apt clean 4) No access to mailbox - please forward personal mail to job or school,,,https://a0.muscache.com/im/pictures/feb453bd-fdec-405c-8bfa-3f6963d827e9.jpg?aki_policy=large,,7192,https://www.airbnb.com/users/show/7192,Laura,2009-01-29,"Miami, Florida, United States",I have been a NYer for almost 10 years. I came to NY to study and never left. I work in the advertising industry and love to eat peanut butter & jelly sandwiches.,within a few hours,100%,,f,https://a0.muscache.com/im/users/7192/profile_pic/1325651676/original.jpg?aki_policy=profile_small,https://a0.muscache.com/im/users/7192/profile_pic/1325651676/original.jpg?aki_policy=profile_x_medium,East Harlem,1,1,"['email', 'phone', 'facebook', 'reviews', 'kba']",t,t,"New York, NY, United States",,East Harlem,Manhattan,New York,NY,10029,New York,"New York, NY",US,United States,40.79851419295301,-73.94399070712562,t,Apartment,Entire home/apt,1,1.0,,1,Real Bed,"{Internet,Wifi,""Air conditioning"",Kitchen,Elevator,""Free street parking"",""Buzzer/wireless intercom"",Heating,Washer,Dryer,""Smoke detector"",""Carbon monoxide detector"",Essentials,Shampoo,""Hair dryer"",""Hot water"",""Host greets you""}",,$80.00,$600.00,"$1,600.00",$100.00,$80.00,1,$20.00,5,120,6 weeks ago,t,0,5,35,35,2018-09-08,7,2012-03-20,2018-07-23,94.0,10.0,9.0,10.0,10.0,9.0,10.0,f,,,f,f,strict_14_with_grace_period,t,t,1,0.09
5099,https://www.airbnb.com/rooms/5099,20180908060534,2018-09-08,Large Cozy 1 BR Apartment In Midtown East,"My large 1 bedroom apartment is true New York City living. The apt is in midtown on the east side and centrally located, just a 10-minute walk from Grand Central Station, Empire State Building, Times Square. The kitchen and living room are large and bright with Apple TV. I have a new Queen Bed that sleeps 2 people, and a Queen Aero Bed that can sleep 2 people in the living room. The apartment is located on the 5th floor of a walk up - no elevator (lift).","I have a large 1 bedroom apartment centrally located in Midtown East. A 10 minute walk from Grand Central Station, Times Square, Empire State Building and all major subway and bus lines. The apartment is located on the 5th floor of a pre-war walk up building-no elevator/lift. The apartment is bright with has high ceilings and flow through rooms. A spacious, cozy living room with Netflix and Apple TV. A large bright kitchen to sit and enjoy coffee or tea. The bedroom is spacious with a comfortable queen size bed that sleeps 2. I have a comfortable queen size aero bed that fits in the living room and sleeps 2. It can be tucked away for living space and opened when ready for bed. I'd be happy to give you tips and advice on the best ways to experience the most of NYC. The apartment's location is great for sightseeing. ** Check out my listing guidebook ** If you would like to stay local in the area, there is a very long & famous strip of bars and restaurants along 3rd Avenue, which","My large 1 bedroom apartment is true New York City living. The apt is in midtown on the east side and centrally located, just a 10-minute walk from Grand Central Station, Empire State Building, Times Square. The kitchen and living room are large and bright with Apple TV. I have a new Queen Bed that sleeps 2 people, and a Queen Aero Bed that can sleep 2 people in the living room. The apartment is located on the 5th floor of a walk up - no elevator (lift). I have a large 1 bedroom apartment centrally located in Midtown East. A 10 minute walk from Grand Central Station, Times Square, Empire State Building and all major subway and bus lines. The apartment is located on the 5th floor of a pre-war walk up building-no elevator/lift. The apartment is bright with has high ceilings and flow through rooms. A spacious, cozy living room with Netflix and Apple TV. A large bright kitchen to sit and enjoy coffee or tea. The bedroom is spacious with a comfortable queen size bed that sleeps 2. I",none,"My neighborhood in Midtown East is called Murray Hill. The area is very centrally located with easy access to explore . The apartment is about 5 blocks (7 minute walk) to the United Nations and Grand Central Station the main and most historic train station. Grand Central will give you access to every train in the city. The apartment is also very close to main attractions, It's about a 10 minute walk to both the Empire State Building and Times Square. There's a great shopping area with dozens of stores including H&M, Zara, The Gap, BeBe and the world famous Macy's department store. These shops are a 10 minute walk up East 34th Street from 5th avenue and 8th avenue. If you would like to stay local in the area, there is a very long & famous strip of bars and restaurants along 3rd avenue, which is just around the corner from the apartment. It's commonly known as the 3rd avenue strip.","Read My Full Listing For All Information. New York City really is the city that doesn't sleep. There's a constant flow of people, bikes and cars. The city can be noisy at times, if you're a light sleeper, ear plugs would help. Check out my local guide book for things to do.","From the apartment is a 10 minute walk to Grand Central Station on East 42nd Street, a 10 minute walk to the Empire State Building on East 34th Street and 5th Avenue, a 10 minute walk to Times Square on West 42 Street and about 20 minutes walk to Central Park on 59th Street. Depending on how long you are staying, I would recommend a 7 day unlimited metro card. This allows you to travel unlimited all day and night on any train or bus in and outside of the city. Grand Central Station is the main NYC train station. You can find any train connection and get anywhere in Manhattan from Grand Central Station. You can get to Brooklyn, Queens, The Bronx and Staten Island from Grand Central Station The M15 bus is around the corner on 2nd avenue. This bus will take you from uptown Harlem to the East Village and South Street Seaport. It will also take you to the Staten Island ferry and Statue of Liberty and everywhere in between along the east side. The M101 bus is just up the street on 3rd aven",I will meet you upon arrival.,"I usually check in with guests via text or email. I'm available by text, email or phone call with any questions, suggestions or to help out.",• Check-in time is 2PM. • Check-out time is 12 PM. Please be respectful of the space and leave the apartment in the condition you were welcomed into.,,,https://a0.muscache.com/im/pictures/0790b1a5-8981-41cc-a370-fa2b982a8803.jpg?aki_policy=large,,7322,https://www.airbnb.com/users/show/7322,Chris,2009-02-02,"New York, New York, United States","I'm an artist, writer, traveler, and a native new yorker. Welcome to my city.",within a day,64%,,f,https://a0.muscache.com/im/pictures/user/26745d24-d818-4bf5-8f9e-26b097121ba7.jpg?aki_policy=profile_small,https://a0.muscache.com/im/pictures/user/26745d24-d818-4bf5-8f9e-26b097121ba7.jpg?aki_policy=profile_x_medium,Flatiron District,1,1,"['email', 'phone', 'reviews', 'jumio', 'government_id']",t,f,"New York, NY, United States",,Murray Hill,Manhattan,New York,NY,10016,New York,"New York, NY",US,United States,40.74767176908579,-73.97499733931186,f,Apartment,Entire home/apt,2,1.0,1.0,1,Real Bed,"{TV,""Cable TV"",Internet,Wifi,Kitchen,""Buzzer/wireless intercom"",Heating,""Smoke detector"",""Carbon monoxide detector"",""Fire extinguisher"",Essentials,Shampoo,Hangers,""Hair dryer"",Iron,""Laptop friendly workspace"",""translation missing: en.hosting_amenity_49"",""translation missing: en.hosting_amenity_50"",""Hot water"",""Bed linens"",""Extra pillows and blankets"",""Host greets you""}",,$185.00,,,$300.00,$125.00,2,$75.00,2,16,today,t,5,27,52,322,2018-09-08,65,2009-04-20,2018-01-01,87.0,9.0,9.0,10.0,10.0,9.0,9.0,f,,,f,f,strict_14_with_grace_period,t,t,1,0.57
5121,https://www.airbnb.com/rooms/5121,20180908060534,2018-09-08,BlissArtsSpace!,,"HELLO EVERYONE AND THANKS FOR VISITING BLISS ART SPACE! Thank you all for your support. I've traveled a lot in the last year few years, to the U.K. Germany, Italy and France! Loved Paris and Calabria! Highly recommend all these places. Things are a little busy this past month, so, please forgive me if I don't reply quickly. I am also in a moment where I don't wish to be in front of the computer 24/7. But I will answer as soon as I can : ) One room available for rent in a 2 bedroom apt in Bklyn. We share a common space with kitchen. I am an artist(painter, filmmaker) and curator who is working in the film industry while I'm building my art event production businesses. Price above is nightly for one person. Monthly rates available. Price is $875 per month for one person. Utilities not included, they are about 50 bucks, payable when the bill arrives mid month. Couples rates are slightly more for monthly and 90$ per night short term. If you are a couple please Iet me know and I’ll gi","HELLO EVERYONE AND THANKS FOR VISITING BLISS ART SPACE! Thank you all for your support. I've traveled a lot in the last year few years, to the U.K. Germany, Italy and France! Loved Paris and Calabria! Highly recommend all these places. Things are a little busy this past month, so, please forgive me if I don't reply quickly. I am also in a moment where I don't wish to be in front of the computer 24/7. But I will answer as soon as I can : ) One room available for rent in a 2 bedroom apt in Bklyn. We share a common space with kitchen. I am an artist(painter, filmmaker) and curator who is working in the film industry while I'm building my art event production businesses. Price above is nightly for one person. Monthly rates available. Price is $875 per month for one person. Utilities not included, they are about 50 bucks, payable when the bill arrives mid month. Couples rates are slightly more for monthly and 90$ per night short term. If you are a couple please Iet me know and I’ll gi",none,,,,,,,,,https://a0.muscache.com/im/pictures/2090980c-b68e-4349-a874-4818402923e7.jpg?aki_policy=large,,7356,https://www.airbnb.com/users/show/7356,Garon,2009-02-03,"New York, New York, United States","I am an artist(painter, filmmaker) and curator who is working in the film industry while I'm building my business. I am extremely easy going and would like that you are the laid back and enjoy life kind of person. I also ask that you are open, honest and easy to communicate with as this is how I like to live my life.And of course creative people are very welcome!",,,,f,https://a0.muscache.com/im/pictures/72a61bea-cfb1-45b6-abbb-85bdbd790b32.jpg?aki_policy=profile_small,https://a0.muscache.com/im/pictures/72a61bea-cfb1-45b6-abbb-85bdbd790b32.jpg?aki_policy=profile_x_medium,Bedford-Stuyvesant,1,1,"['email', 'phone', 'facebook', 'reviews']",t,f,"Brooklyn, NY, United States",,Bedford-Stuyvesant,Brooklyn,Brooklyn,NY,11216,New York,"Brooklyn, NY",US,United States,40.68688196488969,-73.95595708619274,f,Apartment,Private room,2,,1.0,1,Futon,"{Wifi,""Air conditioning"",Kitchen,""Pets live on this property"",Cat(s),Heating}",,$60.00,,,,,1,$30.00,45,730,8 months ago,t,30,60,90,365,2018-09-08,51,2009-05-28,2017-10-05,90.0,8.0,8.0,10.0,10.0,9.0,9.0,f,,,f,f,strict_14_with_grace_period,f,f,1,0.45


In [0]:
df_research_nikhil = csv_to_df("Nikhil_166_listing.csv")
df_research_nikhil = df_research_nikhil.drop("mean_prediction")
display(df_research_nikhil)

listing_id,derived_summarize_sentiment
30222,2
68974,2
275976,2
66741,2
152263,2
2515,2
20299,2
255601,2
424767,2
322037,2


In [0]:
df_research_doug = csv_to_df("doug_169_listing.csv")
df_research_doug = df_research_doug.drop("mean_prediction")
display(df_research_doug)

listing_id,derived_summarize_sentiment
29414,2
491123,2
278197,2
407469,2
205485,2
44221,2
70095,2
158176,2
248871,2
502429,2


In [0]:
df_research_hannah = csv_to_df("hannah_165_listing.csv")
df_research_hannah = df_research_hannah.drop("mean_prediction")
display(df_research_hannah)

listing_id,derived_summarize_sentiment
26785,2
546383,2
550297,2
58059,2
467634,2
506121,2
5178,2
31994,2
476983,2
27024,2


In [0]:
df_research_users_listing = df_research_nikhil.union(df_research_doug).union(df_research_hannah)
display(df_research_users_listing)

listing_id,derived_summarize_sentiment
30222,2
68974,2
275976,2
66741,2
152263,2
2515,2
20299,2
255601,2
424767,2
322037,2


In [0]:
df_research_data = df_research_listings.join(df_research_users_listing, df_research_listings.id == df_research_users_listing.listing_id , "inner")

In [0]:
df_research_data = df_research_data.withColumnRenamed("host_neighbourhood", "neighbourhood_group")
df_500 = df_research_data.select("id","price","neighbourhood_group","room_type","number_of_reviews","availability_365","derived_summarize_sentiment")
display(df_500)

id,price,neighbourhood_group,room_type,number_of_reviews,availability_365,derived_summarize_sentiment
2515,$59.00,Harlem,Private room,170,317,2
3831,$89.00,Clinton Hill,Entire home/apt,211,182,2
5172,$129.00,Murray Hill,Entire home/apt,78,0,2
5178,$79.00,Hell's Kitchen,Private room,394,195,2
5203,$79.00,Upper West Side,Private room,118,0,2
5238,$120.00,Lower East Side,Entire home/apt,148,229,2
5803,$88.00,Park Slope,Private room,157,318,2
6021,$85.00,Upper West Side,Private room,90,345,2
6848,$140.00,Williamsburg,Entire home/apt,102,262,2
6990,$75.00,East Harlem,Private room,228,270,2


In [0]:
df = df_500.union(df_50)
display(df)

id,price,neighbourhood_group,room_type,number_of_reviews,availability_365,derived_summarize_sentiment
2515,$59.00,Harlem,Private room,170,317,2
3831,$89.00,Clinton Hill,Entire home/apt,211,182,2
5172,$129.00,Murray Hill,Entire home/apt,78,0,2
5178,$79.00,Hell's Kitchen,Private room,394,195,2
5203,$79.00,Upper West Side,Private room,118,0,2
5238,$120.00,Lower East Side,Entire home/apt,148,229,2
5803,$88.00,Park Slope,Private room,157,318,2
6021,$85.00,Upper West Side,Private room,90,345,2
6848,$140.00,Williamsburg,Entire home/apt,102,262,2
6990,$75.00,East Harlem,Private room,228,270,2


In [0]:
from pyspark.sql.functions import regexp_replace, col

df = df.withColumn("price", regexp_replace(col("price"), "\$", "").cast("integer"))
display(df)

id,price,neighbourhood_group,room_type,number_of_reviews,availability_365,derived_summarize_sentiment
2515,59,Harlem,Private room,170,317,2
3831,89,Clinton Hill,Entire home/apt,211,182,2
5172,129,Murray Hill,Entire home/apt,78,0,2
5178,79,Hell's Kitchen,Private room,394,195,2
5203,79,Upper West Side,Private room,118,0,2
5238,120,Lower East Side,Entire home/apt,148,229,2
5803,88,Park Slope,Private room,157,318,2
6021,85,Upper West Side,Private room,90,345,2
6848,140,Williamsburg,Entire home/apt,102,262,2
6990,75,East Harlem,Private room,228,270,2


In [0]:
from pyspark.ml import Pipeline
from pyspark.ml.feature import StringIndexer, OneHotEncoder

str_cols= ["neighbourhood_group", "room_type"]
stages = [] 

for c in str_cols:
    stringIndexer = StringIndexer(inputCol=c, outputCol=c + "_index")
    encoder = OneHotEncoder(inputCols=[stringIndexer.getOutputCol()], \
            outputCols=[c + "_vec"])    
    stages += [stringIndexer, encoder] 

In [0]:
from pyspark.ml.feature import VectorAssembler


num_cols = ["number_of_reviews", "availability_365", "derived_summarize_sentiment"]
assemblerInputs = [c + "_vec" for c in str_cols] + num_cols
assembler = VectorAssembler(inputCols=assemblerInputs, outputCol="features")
stages += [assembler]
print(stages)

pipeline = Pipeline(stages=stages)
df = pipeline.fit(df).transform(df)

[StringIndexer_635b03dc46e2, OneHotEncoder_5999bb5492f6, StringIndexer_e57ce923b79a, OneHotEncoder_cd9a147d298d, VectorAssembler_f6bdf8bed88a]


In [0]:
train, test = df.randomSplit([0.70, 0.30])

#Price Prediction Model using Linear Regression

In [0]:
from pyspark.ml.feature import StandardScaler

# Fit scaler to train dataset
scaler = StandardScaler().setInputCol('features').setOutputCol('scaled')
scaler_model = scaler.fit(train)

# Scale train and test features
scaled_train = scaler_model.transform(train)
scaled_test = scaler_model.transform(test)

In [0]:
from pyspark.ml.regression import LinearRegression

lr = LinearRegression(featuresCol='scaled', labelCol='price')
lr_model = lr.fit(scaled_train)

In [0]:
train_predictions = lr_model.transform(scaled_train)
test_predictions = lr_model.transform(scaled_test)

In [0]:
display(test_predictions)

id,price,neighbourhood_group,room_type,number_of_reviews,availability_365,derived_summarize_sentiment,neighbourhood_group_index,neighbourhood_group_vec,room_type_index,room_type_vec,features,scaled,prediction
3831,89,Clinton Hill,Entire home/apt,211,182,2,9.0,"Map(vectorType -> sparse, length -> 83, indices -> List(9), values -> List(1.0))",0.0,"Map(vectorType -> sparse, length -> 3, indices -> List(0), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(9, 83, 86, 87, 88), values -> List(1.0, 1.0, 211.0, 182.0, 2.0))","Map(vectorType -> sparse, length -> 89, indices -> List(9, 83, 86, 87, 88), values -> List(5.864439237311455, 1.99834348903721, 1.2417429511894456, 1.5878747386241157, 7.578118028945951))",207.29595742237657
5172,129,Murray Hill,Entire home/apt,78,0,2,46.0,"Map(vectorType -> sparse, length -> 83, indices -> List(46), values -> List(1.0))",0.0,"Map(vectorType -> sparse, length -> 3, indices -> List(0), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(46, 83, 86, 88), values -> List(1.0, 1.0, 78.0, 2.0))","Map(vectorType -> sparse, length -> 89, indices -> List(46, 83, 86, 88), values -> List(19.183326093250876, 1.99834348903721, 0.4590329393022595, 7.578118028945951))",185.3716921368772
5178,79,Hell's Kitchen,Private room,394,195,2,13.0,"Map(vectorType -> sparse, length -> 83, indices -> List(13), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(13, 84, 86, 87, 88), values -> List(1.0, 1.0, 394.0, 195.0, 2.0))","Map(vectorType -> sparse, length -> 89, indices -> List(13, 84, 86, 87, 88), values -> List(6.847951843029012, 2.0039507824953517, 2.3187048472447467, 1.7012943628115527, 7.578118028945951))",128.81122129689837
5803,88,Park Slope,Private room,157,318,2,6.0,"Map(vectorType -> sparse, length -> 83, indices -> List(6), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(6, 84, 86, 87, 88), values -> List(1.0, 1.0, 157.0, 318.0, 2.0))","Map(vectorType -> sparse, length -> 89, indices -> List(6, 84, 86, 87, 88), values -> List(5.220249886559793, 2.0039507824953517, 0.9239509162878814, 2.774418499354224, 7.578118028945951))",104.90583509150603
6021,85,Upper West Side,Private room,90,345,2,4.0,"Map(vectorType -> sparse, length -> 83, indices -> List(4), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(4, 84, 86, 87, 88), values -> List(1.0, 1.0, 90.0, 345.0, 2.0))","Map(vectorType -> sparse, length -> 89, indices -> List(4, 84, 86, 87, 88), values -> List(5.864439237311455, 2.0039507824953517, 0.5296533915026072, 3.0099823342050547, 7.578118028945951))",114.27306921011854
7097,215,Fort Greene,Entire home/apt,163,320,2,12.0,"Map(vectorType -> sparse, length -> 83, indices -> List(12), values -> List(1.0))",0.0,"Map(vectorType -> sparse, length -> 3, indices -> List(0), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(12, 83, 86, 87, 88), values -> List(1.0, 1.0, 163.0, 320.0, 2.0))","Map(vectorType -> sparse, length -> 89, indices -> List(12, 83, 86, 87, 88), values -> List(6.847951843029012, 1.99834348903721, 0.9592611423880552, 2.7918676723061377, 7.578118028945951))",204.77714124062933
7322,140,Chelsea,Private room,246,0,2,17.0,"Map(vectorType -> sparse, length -> 83, indices -> List(17), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(17, 84, 86, 88), values -> List(1.0, 1.0, 246.0, 2.0))","Map(vectorType -> sparse, length -> 89, indices -> List(17, 84, 86, 88), values -> List(6.847951843029012, 2.0039507824953517, 1.4477192701071262, 7.578118028945951))",86.51749994650179
8024,130,Park Slope,Private room,115,324,2,6.0,"Map(vectorType -> sparse, length -> 83, indices -> List(6), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(6, 84, 86, 87, 88), values -> List(1.0, 1.0, 115.0, 324.0, 2.0))","Map(vectorType -> sparse, length -> 89, indices -> List(6, 84, 86, 87, 88), values -> List(5.220249886559793, 2.0039507824953517, 0.6767793335866646, 2.8267660182099643, 7.578118028945951))",103.34140803532594
9668,50,Hamilton Heights,Private room,222,339,2,14.0,"Map(vectorType -> sparse, length -> 83, indices -> List(14), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(14, 84, 86, 87, 88), values -> List(1.0, 1.0, 222.0, 339.0, 2.0))","Map(vectorType -> sparse, length -> 89, indices -> List(14, 84, 86, 87, 88), values -> List(6.142079425146217, 2.0039507824953517, 1.306478365706431, 2.9576348153493144, 7.578118028945951))",114.99451244413532
9704,52,Harlem,Private room,73,307,2,3.0,"Map(vectorType -> sparse, length -> 83, indices -> List(3), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(3, 84, 86, 87, 88), values -> List(1.0, 1.0, 73.0, 307.0, 2.0))","Map(vectorType -> sparse, length -> 89, indices -> List(3, 84, 86, 87, 88), values -> List(4.630060509049565, 2.0039507824953517, 0.429607750885448, 2.6784480481187005, 7.578118028945951))",83.11643720086717


In [0]:
display(train_predictions.select('price', 'prediction'))

price,prediction
59,90.74586073334822
79,57.90878495722878
120,176.97585051757696
140,195.33288861326403
75,83.07985368625744
49,81.53061899458754
120,170.85396378154613
55,117.68337690428524
70,77.8940056049648
88,101.01824782464558


In [0]:
from pyspark.ml.evaluation import RegressionEvaluator

evaluator = RegressionEvaluator(labelCol="price", predictionCol="prediction", metricName="rmse")
rmse_train = evaluator.evaluate(train_predictions)
rmse_test = evaluator.evaluate(train_predictions)
print("Train Root Mean Squared Error (RMSE): %g" % evaluator.evaluate(train_predictions))
print("Test Root Mean Squared Error (RMSE):  %g" % evaluator.evaluate(test_predictions))

evaluator = RegressionEvaluator(predictionCol="prediction", labelCol="price", metricName="r2")
print("Train R2:", evaluator.evaluate(train_predictions))
print("Test R2:", evaluator.evaluate(test_predictions))

Train Root Mean Squared Error (RMSE): 87.2503
Test Root Mean Squared Error (RMSE):  109.944
Train R2: 0.6046595003641313
Test R2: 0.24757778844767586


#Price Prediction Model using Decision Tree

In [0]:
from pyspark.ml.regression import DecisionTreeRegressor

dt = DecisionTreeRegressor(featuresCol="features", labelCol="price")
model = dt.fit(train)
train_predictions = model.transform(train)
test_predictions = model.transform(test)
 
display(test_predictions.select('price', 'prediction'))
 
evaluator = RegressionEvaluator(labelCol="price", predictionCol="prediction", metricName="rmse")
print("Train Root Mean Squared Error (RMSE): %g" % evaluator.evaluate(train_predictions))
print("Test Root Mean Squared Error (RMSE): %g" % evaluator.evaluate(test_predictions))
 
evaluator = RegressionEvaluator(labelCol="price", predictionCol="prediction", metricName="r2")
print("r2 on train data = %g" % evaluator.evaluate(train_predictions))
print("r2 on test data = %g" % evaluator.evaluate(test_predictions))

price,prediction
89,165.73043478260868
129,165.73043478260868
79,84.11643835616438
88,84.11643835616438
85,84.11643835616438
215,207.86666666666667
140,84.11643835616438
130,84.11643835616438
50,84.11643835616438
52,84.11643835616438


Train Root Mean Squared Error (RMSE): 67.1974
Test Root Mean Squared Error (RMSE): 117.935
r2 on train data = 0.7655
r2 on test data = 0.134216


In [0]:
display(test_predictions)

id,price,neighbourhood_group,room_type,number_of_reviews,availability_365,derived_summarize_sentiment,neighbourhood_group_index,neighbourhood_group_vec,room_type_index,room_type_vec,features,prediction
3831,89,Clinton Hill,Entire home/apt,211,182,2,9.0,"Map(vectorType -> sparse, length -> 83, indices -> List(9), values -> List(1.0))",0.0,"Map(vectorType -> sparse, length -> 3, indices -> List(0), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(9, 83, 86, 87, 88), values -> List(1.0, 1.0, 211.0, 182.0, 2.0))",165.73043478260868
5172,129,Murray Hill,Entire home/apt,78,0,2,46.0,"Map(vectorType -> sparse, length -> 83, indices -> List(46), values -> List(1.0))",0.0,"Map(vectorType -> sparse, length -> 3, indices -> List(0), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(46, 83, 86, 88), values -> List(1.0, 1.0, 78.0, 2.0))",165.73043478260868
5178,79,Hell's Kitchen,Private room,394,195,2,13.0,"Map(vectorType -> sparse, length -> 83, indices -> List(13), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(13, 84, 86, 87, 88), values -> List(1.0, 1.0, 394.0, 195.0, 2.0))",84.11643835616438
5803,88,Park Slope,Private room,157,318,2,6.0,"Map(vectorType -> sparse, length -> 83, indices -> List(6), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(6, 84, 86, 87, 88), values -> List(1.0, 1.0, 157.0, 318.0, 2.0))",84.11643835616438
6021,85,Upper West Side,Private room,90,345,2,4.0,"Map(vectorType -> sparse, length -> 83, indices -> List(4), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(4, 84, 86, 87, 88), values -> List(1.0, 1.0, 90.0, 345.0, 2.0))",84.11643835616438
7097,215,Fort Greene,Entire home/apt,163,320,2,12.0,"Map(vectorType -> sparse, length -> 83, indices -> List(12), values -> List(1.0))",0.0,"Map(vectorType -> sparse, length -> 3, indices -> List(0), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(12, 83, 86, 87, 88), values -> List(1.0, 1.0, 163.0, 320.0, 2.0))",207.86666666666667
7322,140,Chelsea,Private room,246,0,2,17.0,"Map(vectorType -> sparse, length -> 83, indices -> List(17), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(17, 84, 86, 88), values -> List(1.0, 1.0, 246.0, 2.0))",84.11643835616438
8024,130,Park Slope,Private room,115,324,2,6.0,"Map(vectorType -> sparse, length -> 83, indices -> List(6), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(6, 84, 86, 87, 88), values -> List(1.0, 1.0, 115.0, 324.0, 2.0))",84.11643835616438
9668,50,Hamilton Heights,Private room,222,339,2,14.0,"Map(vectorType -> sparse, length -> 83, indices -> List(14), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(14, 84, 86, 87, 88), values -> List(1.0, 1.0, 222.0, 339.0, 2.0))",84.11643835616438
9704,52,Harlem,Private room,73,307,2,3.0,"Map(vectorType -> sparse, length -> 83, indices -> List(3), values -> List(1.0))",1.0,"Map(vectorType -> sparse, length -> 3, indices -> List(1), values -> List(1.0))","Map(vectorType -> sparse, length -> 89, indices -> List(3, 84, 86, 87, 88), values -> List(1.0, 1.0, 73.0, 307.0, 2.0))",84.11643835616438


#Price Prediction Model using GradientBoosting

In [0]:
from pyspark.ml import Pipeline
from pyspark.ml.regression import GBTRegressor
from pyspark.ml.feature import VectorIndexer
from pyspark.ml.evaluation import RegressionEvaluator
 
 
gbt = GBTRegressor(featuresCol="features", labelCol="price",maxIter=10)
model = gbt.fit(train)
train_predictions = model.transform(train)
test_predictions = model.transform(test)

display(test_predictions.select('price', 'prediction'))
 
evaluator = RegressionEvaluator(labelCol="price", predictionCol="prediction", metricName="rmse")
print("Train Root Mean Squared Error (RMSE): %g" % evaluator.evaluate(train_predictions))
print("Test Root Mean Squared Error (RMSE): %g" % evaluator.evaluate(test_predictions))
 
evaluator = RegressionEvaluator(labelCol="price", predictionCol="prediction", metricName="r2")
print("r2 on train data = %g" % evaluator.evaluate(train_predictions))
print("r2 on test data = %g" % evaluator.evaluate(test_predictions))


price,prediction
89,163.16272537964252
129,167.49513910291697
79,81.54872895319821
88,84.05148085549449
85,83.93493574407836
215,207.8017091659968
140,159.5112545413384
130,83.93493574407836
50,79.60252202080392
52,88.09320465991011


Train Root Mean Squared Error (RMSE): 59.7263
Test Root Mean Squared Error (RMSE): 117.697
r2 on train data = 0.814746
r2 on test data = 0.137709


#Manpulating HyperParameters for Linear Regression

In [0]:
from pyspark.ml.tuning import ParamGridBuilder, CrossValidator

temp_train = scaled_train.withColumn('label', scaled_train["price"])
temp_test= scaled_test.withColumn('label', scaled_test["price"])

lr = LinearRegression(featuresCol='scaled', labelCol='price')
# Define a grid of hyperparameters to search over
paramGrid = ParamGridBuilder() \
    .addGrid(lr.regParam, [ 3.0, 5.0, 6.0]) \
    .addGrid(lr.elasticNetParam, [0.3, 0.7, 1.0]) \
    .addGrid(lr.maxIter, [10, 50, 100]) \
    .build()

# Use CrossValidator to perform cross-validation and find the best hyperparameters
evaluator = RegressionEvaluator(metricName="rmse")
crossval = CrossValidator(estimator=lr,
                          estimatorParamMaps=paramGrid,
                          evaluator=evaluator,
                          numFolds=5)
cvModel = crossval.fit(temp_train)

# Make predictions on the test data using the best model
train_predictions = cvModel.transform(temp_train)
test_predictions = cvModel.transform(temp_test)

In [0]:
evaluator = RegressionEvaluator(predictionCol="prediction", labelCol="label", metricName="rmse")
train_rmse = evaluator.evaluate(train_predictions)
train_r2 = evaluator.evaluate(train_predictions, {evaluator.metricName: "r2"})
test_rmse = evaluator.evaluate(test_predictions)
test_r2 = evaluator.evaluate(test_predictions, {evaluator.metricName: "r2"})

# Print the best hyperparameters and the test performance metrics
best = cvModel.bestModel
print('Best Param (regParam): ', best._java_obj.getRegParam())
print('Best Param (MaxIter): ', best._java_obj.getMaxIter())
print('Best Param (elasticNetParam): ', best._java_obj.getElasticNetParam())
print("Train RMSE: ", train_rmse)
print("Test RMSE: ", test_rmse)
print("Train R2: ", train_r2)
print("Test R2: ", test_r2)

Best Param (regParam):  3.0
Best Param (MaxIter):  10
Best Param (elasticNetParam):  1.0
Train RMSE:  90.0250257713051
Test RMSE:  105.21542054874354
Train R2:  0.5791144371062772
Test R2:  0.3109023926854936


In [0]:
# .addGrid(lr.regParam, [0.01, 0.1, 1.0]) \
# .addGrid(lr.elasticNetParam, [0.0, 0.5, 1.0]) \
# .addGrid(lr.maxIter, [10, 100, 1000]) \

In [0]:
# Train Root Mean Squared Error (RMSE): 84.2314
# Test Root Mean Squared Error (RMSE):  108.466
# Train R2: 0.626229093988184
# Test R2: 0.2933285498729584