In [278]:
import pandas as pd
import pickle

from sklearn.preprocessing import MinMaxScaler

# Render full cell contents (e.g. long product descriptions) without truncation.
pd.options.display.max_colwidth = None

In [279]:
# Load the three gzip-compressed, record-oriented JSON files in one pass:
# products, interim reviews, and processed reviews (in that order).
df_products, df_interim_reviews, df_processed_reviews = (
    pd.read_json(json_path, orient="records", compression="gzip")
    for json_path in (
        '../../../data/interim/final/products.json.gz',
        '../../../data/interim/final/reviews.json.gz',
        '../../../data/processed/reviews.json.gz',
    )
)

In [280]:
# Attach the cleaned review text to a *new* frame so the interim reviews loaded
# from disk are not mutated through an alias. The column is aligned on the row index.
# NOTE(review): assumes the interim and processed review files share the same
# row index/order -- confirm, otherwise texts end up on the wrong rows or as NaN.
df_reviews = df_interim_reviews.assign(
    processed_review_text=df_processed_reviews['cleaned_review']
)

# Only the join key and the review text are used downstream, so project the
# columns before merging instead of joining every column and discarding them.
# validate='one_to_many' still asserts that product_id is unique in df_products.
df_products_reviews = df_products[['product_id']].merge(
    df_reviews[['product_id', 'processed_review_text']],
    how='inner',
    on='product_id',
    validate='one_to_many',
)

In [281]:
# Load the tuned sentiment model. The context manager closes the file handle
# deterministically instead of leaving it to the garbage collector.
# NOTE(review): pickle.load can execute arbitrary code embedded in the file --
# only load model artifacts that come from a trusted source.
with open('../../../models/sentiment_analysis/hyperparameter_tuning/logistic_regression_with_tfidf_vectorizer.pkl', 'rb') as model_file:
    model = pickle.load(model_file)

In [282]:
def predict_mean_sentiment(product_id:str):
    """Return the mean predicted sentiment over all reviews of one product.

    Selects the rows of ``df_products_reviews`` whose ``product_id`` matches,
    passes their ``processed_review_text`` values to ``predict_sentiment`` and
    averages the predictions.

    Returns ``0`` when the product has no reviews or when no prediction is
    produced.
    """
    is_product = df_products_reviews['product_id'] == product_id
    texts = df_products_reviews.loc[is_product, 'processed_review_text'].tolist()
    if not texts:
        return 0

    predictions = predict_sentiment(texts)
    return 0 if predictions is None else predictions.mean()

def predict_sentiment(features:list):
    """Run the loaded ``model`` over a batch of review texts.

    Returns ``None`` for an empty batch; otherwise returns whatever
    ``model.predict`` produces for ``features``.
    """
    if len(features) > 0:
        return model.predict(features)
    return None

In [283]:
# Work on an independent copy of the first 50 products so that adding columns
# below does not touch df_products.
df_test = df_products.head(50).copy()

In [284]:
# Score every product in the sample by the mean predicted sentiment of its reviews.
df_test['mean_sentiment_score'] = df_test['product_id'].map(predict_mean_sentiment)

In [285]:
# Rescale the mean sentiment scores to the 1-5 range. The bounds are learned
# from the scores present in df_test, so the result is relative to this sample.
scaler = MinMaxScaler(feature_range=(1, 5))
df_test['mean_sentiment_score'] = scaler.fit_transform(df_test[['mean_sentiment_score']])

In [286]:
# Rank the sample from highest to lowest rescaled sentiment and show the top 50 rows.
ranked_by_sentiment = df_test.sort_values(by='mean_sentiment_score', ascending=False)
ranked_by_sentiment.head(50)

Unnamed: 0,product_id,name,description,price,image_url,mean_sentiment_score
0,B00001W0DG,Sony MDR-V500DJ Monitor Series Headphones with Swivel Earcups (Discontinued by Manufacturer),"Revel in high-quality audio with the MDR-V500DJ Studio Monitor Series DJ headphones. Featuring reversible earcups with remix applications, these comfortable headphones are the ideal DJ companion.",6.61,[https://images-na.ssl-images-amazon.com/images/I/21UDx%2BHFMJL.jpg],5.0
36,B0007CZ2UO,Olympus Camedia C5500 5.1MP Digital Camera with 5x Optical Zoom,"This Olympus Sport Zoom digital camera is as durable as it is functional. Features 5x optical and 4x digital zooms (20x total zoom); 5.1MP CCD; 2"" TFT LCD; 15 selectable shooting modes; QuickTime movie mode with audio; 7.939.5mm lens (38190mm 35mm equivalent); PicBridge compatibility allowing you to print without a PC; 16MB xD-Picture Card; and much more. Imported. 4Wx5Lx3-3-1/4H"".",28.0,"[https://images-na.ssl-images-amazon.com/images/I/41C8HSNCDSL.jpg, https://images-na.ssl-images-amazon.com/images/I/5114BH1383L.jpg, https://images-na.ssl-images-amazon.com/images/I/511ZGP80VJL.jpg, https://images-na.ssl-images-amazon.com/images/I/411CJ8M97VL.jpg, https://images-na.ssl-images-amazon.com/images/I/51K7YXMNH3L.jpg]",5.0
26,B0002AHQKU,Fujifilm Finepix E510 5MP Digital Camera with 5.2x Optical Zoom,"This Fuji Finepix digital camera has a 5.2MP sensor that captures enough detail to give you quality 13x17"" enlargements. Get great close-ups with a 3.2x optical zoom and 4.1x digital zoom. Camera also features 4 preprogrammed scene modes; a 2"" TFT LCD monitor; PictBridge compatibility; and one 16MB XD picture card.",14.99,[https://images-na.ssl-images-amazon.com/images/I/41437QW84NL.jpg],5.0
30,B0002R283S,Panasonic Lumix DMC-FX7S 5MP Digital Camera with 3x Image Stabilized Optical Zoom (Silver),"Panasonic DMC-FX7 LUMIX Digital Camera - At less than 1-inch deep, this Panasonic Lumix digital-camera has a metal body for dependability and a Leica Elmarit Vario lens for optic excellence. A rather remarkable new feature is OIS (Optical Image Stabilizer) that helps keep images stable despite the jitter from normal hand movements - a really popular feature that was introduced on camcorders. Speaking of camcorders, this camera can shoot still pictures as well as video/movie images - with or without sound. All images are stored on replaceable and reusable SecureDigital SD memory. 2.5 LCD Viewer built-in Burst Shooting Mode - 3.3fps Selectable Shooting Modes including Simple Mode Exposure Compensation with Auto Exposure Bracketing Audio Dubbing Light Metering - Intelligent Multiple / Spot Mode Self Timer (2, 10 seconds) Motion Image Recording QVGA (320 x 240 pixels) Built-in Multimode Automatic Electronic-Flash Is PictBridge compatible for printing images without requiring a computer Unit Dimensions (H x W x D) - 1.97'' x 3.70'' x 0.95'' / Weight - 0.30 lbs We advise buying an optional 256MB or higher SD card for more flexible use.",48.0,"[https://images-na.ssl-images-amazon.com/images/I/41036SZJ42L.jpg, https://images-na.ssl-images-amazon.com/images/I/416W4DEXHXL.jpg, https://images-na.ssl-images-amazon.com/images/I/41M9ZR2TK8L.jpg, https://images-na.ssl-images-amazon.com/images/I/31QJ3T4A97L.jpg, https://images-na.ssl-images-amazon.com/images/I/21228WK3AEL.jpg, https://images-na.ssl-images-amazon.com/images/I/41XDDC392NL.jpg]",5.0
13,B00006N21O,Nikon Coolpix 2000 2MP Digital Camera w/ 3x Optical Zoom,"You can shoot, send, share or save your photos with the touch of a button using the Nikon CoolPix 2000 digital camera. The CoolPix 2000 features a 3x Zoom-Nikkor lens with 2.0 effective megapixels; automatic focus, exposure and flash; 5 automatic scene modes for better pictures; and image playback with quick review to delete all or selected frames. Other features include one-touch upload to your Mac or PC; easy-to-use design; and movie mode. Camera comes with high-speed memory card, USB cable, video cable, strap, CD-ROM reference manual and quick-start guide. Imported. 7-3/4Lx6Wx3-3/4D"". Order now for a $50 manufacturer's mail-in rebate. View larger image for complete rebate details and printable coupon. Rebate requires coupon and packing slip receipt.",49.95,"[https://images-na.ssl-images-amazon.com/images/I/51GJS3VVA4L.jpg, https://images-na.ssl-images-amazon.com/images/I/41QSHC69KQL.jpg]",5.0
32,B00064OB3M,Canon Powershot SD20 5MP Ultra Compact Digital Camera (Garnet) (OLD MODEL),"Urban, smart and super slim, the PowerShot SD20 Digital ELPH is perfectly at home in all the right places. You can even pick the color that matches your taste and personality because the SD20 is available in 4 colors: Garnet, Midnight Blue, Zen Gray and Silver. It's a camera that's handsome enough to pose as a fashion accessory. But it's more than just a pretty model, inside it's got the high resolution and advanced performance to get your pictures noticed. Exclusive Canon DIGIC Image Processor and iSAPS Technology for faster processing speed, excellent image quality and crisp vibrant colors 5 New Scene Modes and the Print/Share Button for greater ease of use High-precision 9-point AF for sharp photos every time and Intelligent Orientation Sensor automatically rotates images for playback Built-in Electronic AutoFlash Images are stored on SD SecureDigital Media-Card and may be transferred to a Windows PC or Macintosh computer using built-in USB port (bundled software is included) 1.5 LCD Screen Program AutoExposure modes Shooting Modes - Auto, Manual, Portrait, Night Snapshot, Indoor, Underwater, Macro, Stitch Assist, Movies (Video images) Canon Direct Print modes to compatible Canon printer Dimensions (W x H x D) - 3.56 x 1.85 x 0.73 inch / Weighs about 4 ounces without battery",12.37,"[https://images-na.ssl-images-amazon.com/images/I/41TZNFB7ZVL.jpg, https://images-na.ssl-images-amazon.com/images/I/41P7KNT24ML.jpg, https://images-na.ssl-images-amazon.com/images/I/41ZVQA40HWL.jpg, https://images-na.ssl-images-amazon.com/images/I/4181SHYCNHL.jpg, https://images-na.ssl-images-amazon.com/images/I/41X5Y1N6GWL.jpg]",5.0
9,B00005UKBD,Sony DSCF707 Cyber-shot 5MP Digital Still Camera w/ 5x Optical Zoom,Accurately realistic photos are captured using this digital camera that has a 5.0 effective CCD and 5.2 gross pixel count. The included 16MB Memory Stick media stores your shots that can be easily downloaded using the USB interface. A Carl ZeissM-^Y Vario Sonnar lens with 5x Optical/10x Digital zoom captures the essence of each shot with clarity and precision accuracy. For consistently great shots even in low or no light conditions try using the built-in NightFinderM-^Y system.,76.0,"[https://images-na.ssl-images-amazon.com/images/I/41V6SKW8A5L.jpg, https://images-na.ssl-images-amazon.com/images/I/51W0TG780BL.jpg, https://images-na.ssl-images-amazon.com/images/I/51D2KHXVPRL.jpg, https://images-na.ssl-images-amazon.com/images/I/410RPXECBFL.jpg]",5.0
5,B000051TOG,Olympus E-10 4MP Digital Camera w/4x Optical Zoom (Discontinued by Manufacturer),"The Camedia E-10 is a true SLR digital camera that features a 4-megapixel imager and new lens technology specifically designed to focus light evenly across the entire CCD surface. The all black aluminum body and fast f2.0 9-36mm (35-140mm in 35mm) zoom lens is designed to maximize image quality. Manufactured with Extra Dispersion (ED) glass, the lens features fully multicoated elements with dual aspherical glass elements to reduce chromatic aberrations and deliver the highest image quality of any lens built for a digital camera. A variety of matched add-on lenses deliver the flexibility digital photographers need to maximize creativity.\nThe Camedia E-10 has the features that professionals expect from an SLR, including Program Auto, Aperture Priority, Shutter Priority and Manual exposure modes, a manual zoom and focusing ring on the lens barrel and a real focusing screen. The E-10 uses an Olympus-patented IR-active focus system for initial focus and a TTL passive focus for fine, accurate focus. Professionals will also appreciate the hot-shoe and PC flash connectivity for creative lighting.\nExtremely easy to use, the Camedia E-10 offers one-touch buttons and dials as alternative means to change program modes. Rather than navigate through layers of LCD menu commands, the Camedia E-10 sports dedicated buttons to control shooting modes, flash, white balance and media card settings. Aperture and shutter controls are set using dials, enabling quick and easy access to a wide range of commonly used features and settings.",453.0,"[https://images-na.ssl-images-amazon.com/images/I/51KQJ5RFY3L.jpg, https://images-na.ssl-images-amazon.com/images/I/51T11BHE9PL.jpg, https://images-na.ssl-images-amazon.com/images/I/517W7WVY7ZL.jpg]",5.0
42,B0009KMS7Y,Kodak Easyshare C360 5 MP Digital Camera with 3xOptical Zoom,"Share all that makes you smile. Memories are meant to be shared. With the KODAK C360 Digital Camera, you can capture and share life's moments with remarkable ease. A 5.0 megapixel and 3X Optical Zoom Glass Aspheric Lens offer a crisp image without losing image quality when getting close to your subject. Unpack the camera from the box and you're ready to go. 14 shooting modes such as Portrait, Landscape, Close-up, Sport, Night Portrait, Snow, Beach, Self Portrait, Party, Fireworks, Backlight, Children, Burst and the more commonly known Automatic mode",31.44,"[https://images-na.ssl-images-amazon.com/images/I/519F62FBQ6L.jpg, https://images-na.ssl-images-amazon.com/images/I/51PWFJHBR6L.jpg, https://images-na.ssl-images-amazon.com/images/I/41XWVQCN9NL.jpg]",5.0
24,B0002A6YVC,"Apple iBook Laptop 12&quot; M9623LL/A (1.2 GHz PowerPC G4, 256MB RAM, 30GB Hard Drive, Combo Drive, Built-in AirPort Extreme)","iBook is the lightest all-in-one consumer notebook available on the market. iBook was designed to be small and light, yet incredibly durable. With models weighing 4.9 and 5.9 pounds, iBook is extremely lightweight and portable. Its' small form factor makes it easy to carry anywhere. Beyond its' impressive size and weight, iBook was engineered to withstand far more in terms of shock and extreme temperatures than your average laptop. Apple built iBook to go anywhere and handle anything.",99.98,"[https://images-na.ssl-images-amazon.com/images/I/31STQvGaLsL.jpg, https://images-na.ssl-images-amazon.com/images/I/411ApYlvW6L.jpg, https://images-na.ssl-images-amazon.com/images/I/413xjFDmiSL.jpg, https://images-na.ssl-images-amazon.com/images/I/21S9IPaKxKL.jpg]",5.0
