In [0]:
from pyspark.sql.functions import avg, col, desc, count, regexp_replace
from pyspark.sql.types import IntegerType, DecimalType

In [0]:
df1 = spark.read \
           .format("csv")\
            .option("header", "true")\
            .option("inferSchema","true")\
            .load("dbfs:/FileStore/shared_uploads/himanshikoelpur@gmail.com/amazon.csv")

In [0]:
# QUESTION 1 ----> To select the top rated products on amazon
# Using spark transformation

df1.groupBy("product_id", "product_name") \
   .agg(avg(col("rating").cast(DecimalType(10, 2))).alias("avg_rating")) \
   .orderBy(desc("avg_rating")) \
   .display()

product_id,product_name,avg_rating
B0BQRJ3C47,"REDTECH USB-C to Lightning Cable 3.3FT, [Apple MFi Certified] Lightning to Type C Fast Charging Cord Compatible with iPhone 14/13/13 pro/Max/12/11/X/XS/XR/8, Supports Power Delivery - White",5.0
B09ZHCJDP1,"Amazon Basics Wireless Mouse | 2.4 GHz Connection, 1600 DPI | Type - C Adapter | Upto 12 Months of Battery Life | Ambidextrous Design | Suitable for PC/Mac/Laptop",5.0
B0BP7XLX48,"Syncwire LTG to USB Cable for Fast Charging Compatible with Phone 5/ 5C/ 5S/ 6/ 6S/ 7/8/ X/XR/XS Max/ 11/12/ 13 Series and Pad Air/Mini, Pod & Other Devices (1.1 Meter, White)",5.0
B0BQ3K23Y1,"Oratech Coffee Frother electric, milk frother electric, coffee beater, cappuccino maker, Coffee Foamer, Mocktail Mixer, Coffee Foam Maker, coffee whisker electric, Froth Maker, coffee stirrers electric, coffee frothers, Coffee Blender, (6 Month Warranty) (Multicolour)",4.8
B0BR4F878Q,"Swiffer Instant Electric Water Heater Faucet Tap Home-Kitchen Instantaneous Water Heater Tank less for Tap, LED Electric Head Water Heaters Tail Gallon Comfort(3000W) ((Pack of 1))",4.8
B0B53DS4TF,"Instant Pot Air Fryer, Vortex 2QT, Touch Control Panel, 360° EvenCrisp™ Technology, Uses 95 % less Oil, 4-in-1 Appliance: Air Fry, Roast, Bake, Reheat (Vortex 1.97Litre, Black)",4.8
B0BLC2BYPX,"Zuvexa USB Rechargeable Electric Foam Maker - Handheld Milk Wand Mixer Frother for Hot Milk, Hand Blender Coffee, Egg Beater (Black)",4.7
B0B23LW7NV,Spigen EZ Fit Tempered Glass Screen Protector for iPhone 14 Pro Max - 2 Pack (Sensor Protection),4.7
B09WN3SRC7,Sony Bravia 164 cm (65 inches) 4K Ultra HD Smart LED Google TV KD-65X74K (Black),4.7
B0BM4KTNL1,"FIGMENT Handheld Milk Frother Rechargeable, 3-Speed Electric Frother for Coffee with 2 Whisks and Coffee Decoration Tool, Coffee Frother Mixer, CRESCENT ENTERPRISES VRW0.50BK (A1)",4.7


In [0]:
# QUESTION 1 ----> To select the top rated products on amazon
# Using spark SQL

df1.createOrReplaceTempView("df1_view")
spark.sql("""
                select product_id, product_name, avg(rating) as avg_rating
                from df1_view
                group by product_id, product_name
                order by avg_rating desc
                """).display()

product_id,product_name,avg_rating
B0BQRJ3C47,"REDTECH USB-C to Lightning Cable 3.3FT, [Apple MFi Certified] Lightning to Type C Fast Charging Cord Compatible with iPhone 14/13/13 pro/Max/12/11/X/XS/XR/8, Supports Power Delivery - White",5.0
B09ZHCJDP1,"Amazon Basics Wireless Mouse | 2.4 GHz Connection, 1600 DPI | Type - C Adapter | Upto 12 Months of Battery Life | Ambidextrous Design | Suitable for PC/Mac/Laptop",5.0
B0BP7XLX48,"Syncwire LTG to USB Cable for Fast Charging Compatible with Phone 5/ 5C/ 5S/ 6/ 6S/ 7/8/ X/XR/XS Max/ 11/12/ 13 Series and Pad Air/Mini, Pod & Other Devices (1.1 Meter, White)",5.0
B0BQ3K23Y1,"Oratech Coffee Frother electric, milk frother electric, coffee beater, cappuccino maker, Coffee Foamer, Mocktail Mixer, Coffee Foam Maker, coffee whisker electric, Froth Maker, coffee stirrers electric, coffee frothers, Coffee Blender, (6 Month Warranty) (Multicolour)",4.8
B0BR4F878Q,"Swiffer Instant Electric Water Heater Faucet Tap Home-Kitchen Instantaneous Water Heater Tank less for Tap, LED Electric Head Water Heaters Tail Gallon Comfort(3000W) ((Pack of 1))",4.8
B0B53DS4TF,"Instant Pot Air Fryer, Vortex 2QT, Touch Control Panel, 360° EvenCrisp™ Technology, Uses 95 % less Oil, 4-in-1 Appliance: Air Fry, Roast, Bake, Reheat (Vortex 1.97Litre, Black)",4.8
B0BLC2BYPX,"Zuvexa USB Rechargeable Electric Foam Maker - Handheld Milk Wand Mixer Frother for Hot Milk, Hand Blender Coffee, Egg Beater (Black)",4.7
B0B23LW7NV,Spigen EZ Fit Tempered Glass Screen Protector for iPhone 14 Pro Max - 2 Pack (Sensor Protection),4.7
B09WN3SRC7,Sony Bravia 164 cm (65 inches) 4K Ultra HD Smart LED Google TV KD-65X74K (Black),4.7
B0BM4KTNL1,"FIGMENT Handheld Milk Frother Rechargeable, 3-Speed Electric Frother for Coffee with 2 Whisks and Coffee Decoration Tool, Coffee Frother Mixer, CRESCENT ENTERPRISES VRW0.50BK (A1)",4.7


In [0]:
# QUESTION 2 ----> To select the most reviewed product on amazon
# Using spark transformation

df1.groupBy("product_id", "product_name").count().orderBy(desc("count")).display()

product_id,product_name,count
B08CF3B7N1,"Portronics Konnect L 1.2M Fast Charging 3A 8 Pin USB Cable with Charge & Sync Function for iPhone, iPad (Grey)",3
B09YLXYP7Y,"Ambrane 60W / 3A Fast Charging Output Cable with Type-C to USB for Mobile, Neckband, True Wireless Earphone Charging, 480mbps Data Sync Speed, 1m Length (ACT - AZ10, Black)",3
B085DTN6R2,"Portronics Konnect CL 20W POR-1067 Type-C to 8 Pin USB 1.2M Cable with Power Delivery & 3A Quick Charge Support, Nylon Braided for All Type-C and 8 Pin Devices, Green",3
B08HDJ86NZ,"boAt Deuce USB 300 2 in 1 Type-C & Micro USB Stress Resistant, Tangle-Free, Sturdy Cable with 3A Fast Charging & 480mbps Data Transmission, 10000+ Bends Lifespan and Extended 1.5m Length(Martian Red)",3
B08R69VDHT,"Pinnaclz Original Combo of 2 Micro USB Fast Charging Cable, USB Charging Cable for Data Transfer Perfect for Android Smart Phones White 1.2 Meter Made in India (Pack of 2)",3
B08CF3D7QR,Portronics Konnect L POR-1081 Fast Charging 3A Type-C Cable 1.2Meter with Charge & Sync Function for All Type-C Devices (Grey),3
B082T6V3DT,"AmazonBasics New Release Nylon USB-A to Lightning Cable Cord, Fast Charging MFi Certified Charger for Apple iPhone, iPad (6-Ft, Rose Gold)",3
B08WRWPM22,"boAt Micro USB 55 Tangle-free, Sturdy Micro USB Cable with 3A Fast Charging & 480mbps Data Transmission (Black)",3
B096MSW6CT,"Sounce Fast Phone Charging Cable & Data Sync USB Cable Compatible for iPhone 13, 12,11, X, 8, 7, 6, 5, iPad Air, Pro, Mini & iOS Devices",3
B08Y1TFSP6,"pTron Solero TB301 3A Type-C Data and Fast Charging Cable, Made in India, 480Mbps Data Sync, Strong and Durable 1.5-Meter Nylon Braided USB Cable for Type-C Devices for Charging Adapter (Black)",3


In [0]:
# QUESTION 2 ----> To select the most reviewed product on amazon
# Using spark SQL

spark.sql("""
                select product_id, product_name, count(*) as count
                from df1_view
                group by product_id, product_name
                order by count desc
                """).display()

product_id,product_name,count
B08CF3B7N1,"Portronics Konnect L 1.2M Fast Charging 3A 8 Pin USB Cable with Charge & Sync Function for iPhone, iPad (Grey)",3
B09YLXYP7Y,"Ambrane 60W / 3A Fast Charging Output Cable with Type-C to USB for Mobile, Neckband, True Wireless Earphone Charging, 480mbps Data Sync Speed, 1m Length (ACT - AZ10, Black)",3
B085DTN6R2,"Portronics Konnect CL 20W POR-1067 Type-C to 8 Pin USB 1.2M Cable with Power Delivery & 3A Quick Charge Support, Nylon Braided for All Type-C and 8 Pin Devices, Green",3
B08HDJ86NZ,"boAt Deuce USB 300 2 in 1 Type-C & Micro USB Stress Resistant, Tangle-Free, Sturdy Cable with 3A Fast Charging & 480mbps Data Transmission, 10000+ Bends Lifespan and Extended 1.5m Length(Martian Red)",3
B08R69VDHT,"Pinnaclz Original Combo of 2 Micro USB Fast Charging Cable, USB Charging Cable for Data Transfer Perfect for Android Smart Phones White 1.2 Meter Made in India (Pack of 2)",3
B08CF3D7QR,Portronics Konnect L POR-1081 Fast Charging 3A Type-C Cable 1.2Meter with Charge & Sync Function for All Type-C Devices (Grey),3
B082T6V3DT,"AmazonBasics New Release Nylon USB-A to Lightning Cable Cord, Fast Charging MFi Certified Charger for Apple iPhone, iPad (6-Ft, Rose Gold)",3
B08WRWPM22,"boAt Micro USB 55 Tangle-free, Sturdy Micro USB Cable with 3A Fast Charging & 480mbps Data Transmission (Black)",3
B096MSW6CT,"Sounce Fast Phone Charging Cable & Data Sync USB Cable Compatible for iPhone 13, 12,11, X, 8, 7, 6, 5, iPad Air, Pro, Mini & iOS Devices",3
B08Y1TFSP6,"pTron Solero TB301 3A Type-C Data and Fast Charging Cable, Made in India, 480Mbps Data Sync, Strong and Durable 1.5-Meter Nylon Braided USB Cable for Type-C Devices for Charging Adapter (Black)",3


In [0]:
# QUESTION 3 ----> Discount Analysis: To find the avg discount percentage category wise for products.
# Using spark transformation

#df1.groupBy("category").agg(avg("discount_percentage").alias("avg_discount")).orderBy(desc("avg_discount")).display()

df1_cleaned = df1.withColumn("cleaned_discount_percentage",regexp_replace(col("discount_percentage"), '%', '').cast('float'))
df1_cleaned.groupBy("category").agg(avg("cleaned_discount_percentage").alias("avg_discount")).orderBy(desc("avg_discount")).display()

category,avg_discount
Computers&Accessories|Accessories&Peripherals|Cables&Accessories|CableConnectionProtectors,90.0
Electronics|Mobiles&Accessories|MobileAccessories|Décor|PhoneCharms,90.0
"Electronics|Headphones,Earbuds&Accessories|Earpads",90.0
"Electronics|Headphones,Earbuds&Accessories|Adapters",88.0
"Computers&Accessories|Accessories&Peripherals|Keyboards,Mice&InputDevices|Keyboard&MiceAccessories|DustCovers",87.5
Electronics|Mobiles&Accessories|MobileAccessories|Mounts|Shower&WallMounts,82.0
Computers&Accessories|Components|InternalHardDrives,80.0
Computers&Accessories|Accessories&Peripherals|Adapters|USBtoUSBAdapters,78.5
"Computers&Accessories|Accessories&Peripherals|TabletAccessories|Bags,Cases&Sleeves|Cases",78.0
Electronics|Mobiles&Accessories|MobileAccessories|Stands,76.4


In [0]:
# QUESTION 3 ----> Discount Analysis: To find the avg discount percentage category wise for products.
# Using spark SQL

spark.sql("""
                select category, avg(CAST(REPLACE(discount_percentage, '%', '') AS float)) as avg_discount
                from df1_view
                group by category
                order by avg_discount desc
                """).display()

category,avg_discount
Computers&Accessories|Accessories&Peripherals|Cables&Accessories|CableConnectionProtectors,90.0
Electronics|Mobiles&Accessories|MobileAccessories|Décor|PhoneCharms,90.0
"Electronics|Headphones,Earbuds&Accessories|Earpads",90.0
"Electronics|Headphones,Earbuds&Accessories|Adapters",88.0
"Computers&Accessories|Accessories&Peripherals|Keyboards,Mice&InputDevices|Keyboard&MiceAccessories|DustCovers",87.5
Electronics|Mobiles&Accessories|MobileAccessories|Mounts|Shower&WallMounts,82.0
Computers&Accessories|Components|InternalHardDrives,80.0
Computers&Accessories|Accessories&Peripherals|Adapters|USBtoUSBAdapters,78.5
"Computers&Accessories|Accessories&Peripherals|TabletAccessories|Bags,Cases&Sleeves|Cases",78.0
Electronics|Mobiles&Accessories|MobileAccessories|Stands,76.4


In [0]:
# QUESTION 4 ----> User Engagement: To find the user engagement on the basis of rating and its count on every product.
# Using spark transformation

df1.groupBy("product_id","product_name").agg(avg("rating").alias("avg_rating"), count("rating").alias("rating_count")).display()

product_id,product_name,avg_rating,rating_count
B09F6D21BY,7SEVEN Compatible LG TV Remote Suitable for LG Non Magic Smart tv Remote Control (Mouse & Voice Non-Support) MR20GA Prime Video and Netflix Hotkeys,3.0,1
B09HN7LD5L,"PROLEGEND® PL-T002 Universal TV Stand Table Top for Most 22 to 65 inch LCD Flat Screen TV, VESA up to 800 by 400mm",4.0,1
B00P93X2H6,"Classmate Pulse Spiral Notebook - 240 mm x 180 mm, Soft Cover, 200 Pages, Unruled",4.1,1
B078V8R9BS,Butterfly EKN 1.5-Litre Electric Kettle (Silver with Black),4.2,1
B00E3DVQFS,"Duracell Rechargeable AA 2500mAh Batteries, 4 Pcs",4.4,1
B09P22HXH6,"Lenovo 300 FHD Webcam with Full Stereo Dual Built-in mics | FHD 1080P 2.1 Megapixel CMOS Camera |Privacy Shutter | Ultra-Wide 95 Lens | 360 Rotation | Flexible Mount, Plug-n-Play | Cloud Grey",4.1,1
B00TDD0YM4,"Philips GC026/30 Fabric Shaver, Lint Remover for Woolen Sweaters, Blankets, Jackets/Burr Remover Pill Remover from Carpets, Curtains (White)",4.4,1
B0B5CGTBKV,"boAt Wave Call Smart Watch, Smart Talk with Advanced Dedicated Bluetooth Calling Chip, 1.69” HD Display with 550 NITS & 70% Color Gamut, 150+ Watch Faces, Multi-Sport Modes,HR,SpO2(Caribbean Green)",3.8,1
B09BNXQ6BR,"""Noise ColorFit Ultra SE Smart Watch with 1.75""""(4.3cm) HD Display",,1
B083GQGT3Z,"Caprigo Heavy Duty TV Wall Mount Stand for 12 to 27 inches LED/LCD/Monitor Screen's, Full Motion Rotatable Universal TV & Monitor Wall Mount Bracket with Swivel & Tilt Adjustments (Single Arm - M416)",4.1,1


In [0]:
# QUESTION 4 ----> User Engagement: To find the user engagement on the basis of rating and its count on every product.
# Using spark SQL


spark.sql("""
                select product_id, product_name, avg(rating) as avg_rating, count(rating) as rating_count
                from df1_view
                group by product_id, product_name
                """).display()

product_id,product_name,avg_rating,rating_count
B09F6D21BY,7SEVEN Compatible LG TV Remote Suitable for LG Non Magic Smart tv Remote Control (Mouse & Voice Non-Support) MR20GA Prime Video and Netflix Hotkeys,3.0,1
B09HN7LD5L,"PROLEGEND® PL-T002 Universal TV Stand Table Top for Most 22 to 65 inch LCD Flat Screen TV, VESA up to 800 by 400mm",4.0,1
B00P93X2H6,"Classmate Pulse Spiral Notebook - 240 mm x 180 mm, Soft Cover, 200 Pages, Unruled",4.1,1
B078V8R9BS,Butterfly EKN 1.5-Litre Electric Kettle (Silver with Black),4.2,1
B00E3DVQFS,"Duracell Rechargeable AA 2500mAh Batteries, 4 Pcs",4.4,1
B09P22HXH6,"Lenovo 300 FHD Webcam with Full Stereo Dual Built-in mics | FHD 1080P 2.1 Megapixel CMOS Camera |Privacy Shutter | Ultra-Wide 95 Lens | 360 Rotation | Flexible Mount, Plug-n-Play | Cloud Grey",4.1,1
B00TDD0YM4,"Philips GC026/30 Fabric Shaver, Lint Remover for Woolen Sweaters, Blankets, Jackets/Burr Remover Pill Remover from Carpets, Curtains (White)",4.4,1
B0B5CGTBKV,"boAt Wave Call Smart Watch, Smart Talk with Advanced Dedicated Bluetooth Calling Chip, 1.69” HD Display with 550 NITS & 70% Color Gamut, 150+ Watch Faces, Multi-Sport Modes,HR,SpO2(Caribbean Green)",3.8,1
B09BNXQ6BR,"""Noise ColorFit Ultra SE Smart Watch with 1.75""""(4.3cm) HD Display",,1
B083GQGT3Z,"Caprigo Heavy Duty TV Wall Mount Stand for 12 to 27 inches LED/LCD/Monitor Screen's, Full Motion Rotatable Universal TV & Monitor Wall Mount Bracket with Swivel & Tilt Adjustments (Single Arm - M416)",4.1,1


In [0]:
# QUESTION 5 ----> Category-wise Analysis: To find the Category-wise Analysis by calculating avg_rating, rating_count, discount_percentage on every category of product.
# Using spark transformation

df1_cleaned.groupBy("category").agg(avg("rating").alias("avg_rating"), count("rating").alias("rating_count"), avg("cleaned_discount_percentage").alias("avg_discount")).display()

category,avg_rating,rating_count,avg_discount
reminders,,1,
Computers&Accessories|Accessories&Peripherals|HardDriveAccessories|Caddies,4.1,1,75.0
"OfficeProducts|OfficePaperProducts|Paper|Stationery|Notebooks,WritingPads&Diaries|WireboundNotebooks",4.4,4,5.75
"OfficeProducts|OfficePaperProducts|Paper|Stationery|Notebooks,WritingPads&Diaries|CompositionNotebooks",4.371428571428571,7,12.0
Electronics|Cameras&Photography|Accessories|Batteries&Chargers|BatteryChargers,3.8,1,25.0
Computers&Accessories|ExternalDevices&DataStorage|ExternalMemoryCardReaders,4.3,1,45.0
TWS Connection,,3,
123 Sports Mode,,1,
Computers&Accessories|Accessories&Peripherals|TabletAccessories|ScreenProtectors,4.18,5,63.8
Computers&Accessories|Accessories&Peripherals|Audio&VideoAccessories|PCSpeakers,4.05,2,46.5


In [0]:
# QUESTION 5 ----> Category-wise Analysis: To find the Category-wise Analysis by calculating avg_rating, rating_count, discount_percentage on every category of product.
# Using spark SQL

spark.sql("""
                select product_id, product_name, avg(rating) as avg_rating, count(rating) as rating_count, avg(CAST(REPLACE(discount_percentage, '%', '') AS float)) as avg_discount
                from df1_view
                group by product_id, product_name
                """).display()

product_id,product_name,avg_rating,rating_count,avg_discount
B09F6D21BY,7SEVEN Compatible LG TV Remote Suitable for LG Non Magic Smart tv Remote Control (Mouse & Voice Non-Support) MR20GA Prime Video and Netflix Hotkeys,3.0,1,60.0
B09HN7LD5L,"PROLEGEND® PL-T002 Universal TV Stand Table Top for Most 22 to 65 inch LCD Flat Screen TV, VESA up to 800 by 400mm",4.0,1,59.0
B00P93X2H6,"Classmate Pulse Spiral Notebook - 240 mm x 180 mm, Soft Cover, 200 Pages, Unruled",4.1,1,11.0
B078V8R9BS,Butterfly EKN 1.5-Litre Electric Kettle (Silver with Black),4.2,1,33.0
B00E3DVQFS,"Duracell Rechargeable AA 2500mAh Batteries, 4 Pcs",4.4,1,21.0
B09P22HXH6,"Lenovo 300 FHD Webcam with Full Stereo Dual Built-in mics | FHD 1080P 2.1 Megapixel CMOS Camera |Privacy Shutter | Ultra-Wide 95 Lens | 360 Rotation | Flexible Mount, Plug-n-Play | Cloud Grey",4.1,1,66.0
B00TDD0YM4,"Philips GC026/30 Fabric Shaver, Lint Remover for Woolen Sweaters, Blankets, Jackets/Burr Remover Pill Remover from Carpets, Curtains (White)",4.4,1,12.0
B0B5CGTBKV,"boAt Wave Call Smart Watch, Smart Talk with Advanced Dedicated Bluetooth Calling Chip, 1.69” HD Display with 550 NITS & 70% Color Gamut, 150+ Watch Faces, Multi-Sport Modes,HR,SpO2(Caribbean Green)",3.8,1,75.0
B09BNXQ6BR,"""Noise ColorFit Ultra SE Smart Watch with 1.75""""(4.3cm) HD Display",,1,
B083GQGT3Z,"Caprigo Heavy Duty TV Wall Mount Stand for 12 to 27 inches LED/LCD/Monitor Screen's, Full Motion Rotatable Universal TV & Monitor Wall Mount Bracket with Swivel & Tilt Adjustments (Single Arm - M416)",4.1,1,50.0
