In [0]:
# pyspark functions
from pyspark.sql.functions import *
# URL processing
import urllib
# PySpark
from pyspark.sql import SparkSession


In [0]:
# Define the path to the Delta table
delta_table_path = "dbfs:/user/hive/warehouse/authentication_credentials"

# Read the Delta table to a Spark DataFrame
aws_keys_df = spark.read.format("delta").load(delta_table_path)

# Get the AWS access key and secret key from the spark dataframe
ACCESS_KEY = aws_keys_df.select('Access key ID').collect()[0]['Access key ID']
SECRET_KEY = aws_keys_df.select('Secret access key').collect()[0]['Secret access key']
# Encode the secrete key
ENCODED_SECRET_KEY = urllib.parse.quote(string=SECRET_KEY, safe="")

# AWS S3 bucket name
AWS_S3_BUCKET = "user-1279c94681db-bucket"
# Mount name for the bucket
MOUNT_NAME = "/mnt/saiful_bucket"
# Source url
SOURCE_URL = "s3n://{0}:{1}@{2}".format(ACCESS_KEY, ENCODED_SECRET_KEY, AWS_S3_BUCKET)
# Mount the drive
dbutils.fs.mount(SOURCE_URL, MOUNT_NAME)


In [0]:
display(dbutils.fs.ls("/mnt/saiful_bucket"))

path,name,size,modificationTime
dbfs:/mnt/saiful_bucket/_delta_log/,_delta_log/,0,1711712744713
dbfs:/mnt/saiful_bucket/kafka-connect-s3/,kafka-connect-s3/,0,1711712744713
dbfs:/mnt/saiful_bucket/part-00000-0fcd962a-3424-43c8-84cb-2dd2a888283a-c000.snappy.parquet,part-00000-0fcd962a-3424-43c8-84cb-2dd2a888283a-c000.snappy.parquet,1559,1711541089000
dbfs:/mnt/saiful_bucket/part-00000-48aa6cb4-c2d5-4356-9ced-981a86e6a408-c000.snappy.parquet,part-00000-48aa6cb4-c2d5-4356-9ced-981a86e6a408-c000.snappy.parquet,6560,1711540935000
dbfs:/mnt/saiful_bucket/part-00000-c43cf717-590a-4842-bddd-b3ef74d359ba-c000.snappy.parquet,part-00000-c43cf717-590a-4842-bddd-b3ef74d359ba-c000.snappy.parquet,1538,1711541098000
dbfs:/mnt/saiful_bucket/part-00001-0ae11eeb-9bb1-4bf9-ae4a-9abb1c81052a-c000.snappy.parquet,part-00001-0ae11eeb-9bb1-4bf9-ae4a-9abb1c81052a-c000.snappy.parquet,1548,1711541098000
dbfs:/mnt/saiful_bucket/part-00001-52e3e07b-c330-4db5-aac3-c8d773f734e8-c000.snappy.parquet,part-00001-52e3e07b-c330-4db5-aac3-c8d773f734e8-c000.snappy.parquet,7052,1711540932000
dbfs:/mnt/saiful_bucket/part-00001-cf663b7b-914b-4f23-b118-83a194b66f8a-c000.snappy.parquet,part-00001-cf663b7b-914b-4f23-b118-83a194b66f8a-c000.snappy.parquet,1564,1711541092000
dbfs:/mnt/saiful_bucket/part-00002-1af5ecde-303c-4b09-9de0-3315cee5a22d-c000.snappy.parquet,part-00002-1af5ecde-303c-4b09-9de0-3315cee5a22d-c000.snappy.parquet,1536,1711541098000
dbfs:/mnt/saiful_bucket/part-00002-2c31c0cf-2904-4668-bc1a-ba1bcbf1ea2c-c000.snappy.parquet,part-00002-2c31c0cf-2904-4668-bc1a-ba1bcbf1ea2c-c000.snappy.parquet,6560,1711540934000


In [0]:
%sql
-- Disable format checks during reading of the Delta tables
SET spark.databricks.delta.formatCheck.enabled=false

key,value
spark.databricks.delta.formatCheck.enabled,False


In [0]:
# File location and type
# Asterisk(*) indicates reading all the content of the specified file that have .json extension
file_location_1 = "/mnt/saiful_bucket/topics/1279c94681db.pin/partition=0/*.json"
file_location_2 = "/mnt/saiful_bucket/topics/1279c94681db.geo/partition=0/*.json"
file_location_3 = "/mnt/saiful_bucket/topics/1279c94681db.user/partition=0/*.json"
file_type = "json"
# Ask Spark to infer the schema
infer_schema = "true"
# Read in JSONs from mounted S3 bucket
df_pin = spark.read.format(file_type) \
.option("inferSchema", infer_schema) \
.load(file_location_1)
df_geo = spark.read.format(file_type) \
.option("inferSchema", infer_schema) \
.load(file_location_2)
df_user = spark.read.format(file_type) \
.option("inferSchema", infer_schema) \
.load(file_location_3)
# Display Spark dataframe to check its content
display(df_pin)
display(df_geo)
display(df_user)

category,description,downloaded,follower_count,image_src,index,is_image_or_video,poster_name,save_location,tag_list,title,unique_id
christmas,"Features: Material:Lint Size:48ｘ18cm Quantity:1 pc Shape:Santa Claus, snowman. Elk Occasion:Christmas Description: 1. Fashion design, high quality 2. Santa Claus, snowman. Elk C…",1,5k,https://i.pinimg.com/originals/b5/7f/21/b57f219fa89c1165b57525b8eae711da.jpg,1706,image,Wear24-7,Local save in /data/christmas,"Merry Christmas To You,Christmas Toys,Great Christmas Gifts,Christmas Snowman,Christmas Ornaments,Holiday,Christmas Party Decorations,Christmas Themes,Decoration Party",Standing Figurine Toys Xmas Santa Claus Snowman Reindeer Figure Plush Dolls Christmas Decorations Ornaments Home Indoor Table Ornaments Christmas Party Tree Hanging Decor Toys Gifts for Kids Friends…,b5c8a1b5-9e90-4522-9bec-2477b698d5b7
christmas,"Christmas decorating ideas for porches. Beautiful holiday decor ideas for front porches both small and large. Outdoor decorations like sleds, lanterns, Christmas trees, wreaths,…",1,46k,https://i.pinimg.com/videos/thumbnails/originals/40/83/f5/4083f5b4971bf235f89a4784ab87271e.0000001.jpg,2482,video,"Life on Summerhill | Home, Holiday Decor & DIY Website",Local save in /data/christmas,"Diy Christmas Decorations For Home,Farmhouse Christmas Decor,Christmas Home,Christmas Holidays,Christmas Front Porches,How To Decorate For Christmas,Christmas Porch Ideas,Christmas Decorating Ideas,Large Outdoor Christmas Decorations",FORNT PORCH CHRISTMAS DECORATING IDEAS,08604f20-fa17-4b9a-9949-781717eca6cd
christmas,"Christmas decorating ideas for porches. Beautiful holiday decor ideas for front porches both small and large. Outdoor decorations like sleds, lanterns, Christmas trees, wreaths,…",1,46k,https://i.pinimg.com/videos/thumbnails/originals/40/83/f5/4083f5b4971bf235f89a4784ab87271e.0000001.jpg,2482,video,"Life on Summerhill | Home, Holiday Decor & DIY Website",Local save in /data/christmas,"Diy Christmas Decorations For Home,Farmhouse Christmas Decor,Christmas Home,Christmas Holidays,Christmas Front Porches,How To Decorate For Christmas,Christmas Porch Ideas,Christmas Decorating Ideas,Large Outdoor Christmas Decorations",FORNT PORCH CHRISTMAS DECORATING IDEAS,08604f20-fa17-4b9a-9949-781717eca6cd
christmas,15 unique Christmas porch ideas that will leave you feeling inspired and help you tackle decorating your own entryway for the holidays! It’s almost time to start decorating for…,1,19k,https://i.pinimg.com/originals/ff/f8/3b/fff83b02aeb29e2e9341a56fc5e63345.png,1967,image,Ashley - Modern Glam,Local save in /data/christmas,"Exterior Christmas Lights,Front Door Christmas Decorations,Christmas Lights Outside,Christmas House Lights,Decorating With Christmas Lights,Porch Decorating,Christmas Porch Decorations,Front Porch Ideas For Christmas,Christmas Lights Outdoor Trees",15 Fun & Festive Christmas Porch Ideas,0b9d5b95-51a6-465e-ae4a-2cb68ceada29
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,10k,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",Local save in /data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,10k,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",Local save in /data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,10k,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",Local save in /data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d
christmas,"My favorite 75+ Neutral Christmas Home Decor for decorating your house during the Holiday Season in earth tones and a farmhouse, rustic style all winter. I love this modern, sim…",1,31k,https://i.pinimg.com/originals/86/84/39/868439dd894969e3abd6a2a8a9fe1e9c.jpg,2604,image,Everyday Wholesome,Local save in /data/christmas,"Colorful Christmas Decorations,Colorful Christmas Tree,Christmas Centerpieces,Christmas Colors,Xmas Colors,Winter Decorations,Christmas Trends,Christmas Inspiration,Christmas Home",75+ Neutral Christmas Home Decor for the Holiday Season in Farmhouse Style using Earth Tones Modern,087b0fa9-f901-4262-aa0a-6caf234d1b35
christmas,"My favorite 75+ Neutral Christmas Home Decor for decorating your house during the Holiday Season in earth tones and a farmhouse, rustic style all winter. I love this modern, sim…",1,31k,https://i.pinimg.com/originals/86/84/39/868439dd894969e3abd6a2a8a9fe1e9c.jpg,2604,image,Everyday Wholesome,Local save in /data/christmas,"Colorful Christmas Decorations,Colorful Christmas Tree,Christmas Centerpieces,Christmas Colors,Xmas Colors,Winter Decorations,Christmas Trends,Christmas Inspiration,Christmas Home",75+ Neutral Christmas Home Decor for the Holiday Season in Farmhouse Style using Earth Tones Modern,087b0fa9-f901-4262-aa0a-6caf234d1b35
diy-and-crafts,"This post may contain affiliate links, read our Disclosure Policy for more information. As an Amazon Associate I earn from qualifying purchases, thank you! Make some cute handpr…",1,892k,https://i.pinimg.com/originals/ff/fe/38/fffe384f3ec18a0d87cb2d80cc8c1499.jpg,3156,image,Michelle {CraftyMorning.com},Local save in /data/diy-and-crafts,"Christmas Gifts For Parents,Christmas Decorations For Kids,Christmas Crafts For Toddlers,Preschool Christmas,Christmas Crafts For Gifts,Christmas Activities,Toddler Crafts,Kids Christmas,Christmas Feeling",Handprint Reindeer Ornaments - Crafty Morning,fa6e31a4-18c2-4eca-a6d8-e903eee2c2a4


country,ind,latitude,longitude,timestamp
Antarctica (the territory South of 60 deg S),2418,-88.4642,-171.061,2022-05-27T11:30:59
Antarctica (the territory South of 60 deg S),2418,-88.4642,-171.061,2022-05-27T11:30:59
Antarctica (the territory South of 60 deg S),5162,-71.6607,-149.206,2019-09-27T19:06:43
Antarctica (the territory South of 60 deg S),2418,-88.4642,-171.061,2022-05-27T11:30:59
Saint Vincent and the Grenadines,2301,13.4683,51.7244,2020-11-14T00:25:28
French Southern Territories,6014,-26.6026,155.206,2019-04-30T12:33:13
Cocos (Keeling) Islands,10794,-89.5236,-154.567,2022-01-01T02:26:50
Cocos (Keeling) Islands,10794,-89.5236,-154.567,2022-01-01T02:26:50
Cocos (Keeling) Islands,10794,-89.5236,-154.567,2022-01-01T02:26:50
Cocos (Keeling) Islands,10794,-89.5236,-154.567,2022-01-01T02:26:50


age,date_joined,first_name,ind,last_name
27,2016-03-08T13:38:37,Christopher,2015,Bradshaw
59,2017-05-12T21:22:17,Alexander,10673,Cervantes
27,2016-03-08T13:38:37,Christopher,2015,Bradshaw
59,2017-05-12T21:22:17,Alexander,10673,Cervantes
39,2016-06-29T20:43:59,Christina,6398,Davenport
20,2015-10-23T04:13:23,Alexandria,3599,Alvarado
39,2016-06-29T20:43:59,Christina,6398,Davenport
20,2015-10-23T04:13:23,Alexandria,3599,Alvarado
20,2015-12-01T15:08:31,Christopher,5076,Butler
39,2017-07-19T07:12:04,Michelle,7790,Gutierrez


In [0]:
df_pin.printSchema()

In [0]:
cleaned_df_pin = df_pin.replace({'User Info Error': None})
cleaned_df_pin = cleaned_df_pin.replace({'No description available Story format': None}, subset=['description'])

# Clean the data and convert to integer
cleaned_df_pin = cleaned_df_pin.withColumn("follower_count_numeric",
                   when(col("follower_count").rlike("\\d+M"), regexp_extract(col("follower_count"), r"(\d+)", 1).cast("int") * 1000000)
                   .when(col("follower_count").rlike("\\d+k"), regexp_extract(col("follower_count"), r"(\d+)", 1).cast("int") * 1000)
                   .when(col("follower_count").rlike("\\d+"), col("follower_count").cast("int"))
                   .otherwise(0)  # Set non-numeric values to 0 or any default value
                   )
cleaned_df_pin = cleaned_df_pin.drop("follower_count")
cleaned_df_pin = cleaned_df_pin.withColumnRenamed("follower_count_numeric", "follower_count")
# Display the transformed DataFrame
display(cleaned_df_pin)

category,description,downloaded,image_src,index,is_image_or_video,poster_name,save_location,tag_list,title,unique_id,follower_count
christmas,"Features: Material:Lint Size:48ｘ18cm Quantity:1 pc Shape:Santa Claus, snowman. Elk Occasion:Christmas Description: 1. Fashion design, high quality 2. Santa Claus, snowman. Elk C…",1,https://i.pinimg.com/originals/b5/7f/21/b57f219fa89c1165b57525b8eae711da.jpg,1706,image,Wear24-7,Local save in /data/christmas,"Merry Christmas To You,Christmas Toys,Great Christmas Gifts,Christmas Snowman,Christmas Ornaments,Holiday,Christmas Party Decorations,Christmas Themes,Decoration Party",Standing Figurine Toys Xmas Santa Claus Snowman Reindeer Figure Plush Dolls Christmas Decorations Ornaments Home Indoor Table Ornaments Christmas Party Tree Hanging Decor Toys Gifts for Kids Friends…,b5c8a1b5-9e90-4522-9bec-2477b698d5b7,5000
christmas,"Christmas decorating ideas for porches. Beautiful holiday decor ideas for front porches both small and large. Outdoor decorations like sleds, lanterns, Christmas trees, wreaths,…",1,https://i.pinimg.com/videos/thumbnails/originals/40/83/f5/4083f5b4971bf235f89a4784ab87271e.0000001.jpg,2482,video,"Life on Summerhill | Home, Holiday Decor & DIY Website",Local save in /data/christmas,"Diy Christmas Decorations For Home,Farmhouse Christmas Decor,Christmas Home,Christmas Holidays,Christmas Front Porches,How To Decorate For Christmas,Christmas Porch Ideas,Christmas Decorating Ideas,Large Outdoor Christmas Decorations",FORNT PORCH CHRISTMAS DECORATING IDEAS,08604f20-fa17-4b9a-9949-781717eca6cd,46000
christmas,"Christmas decorating ideas for porches. Beautiful holiday decor ideas for front porches both small and large. Outdoor decorations like sleds, lanterns, Christmas trees, wreaths,…",1,https://i.pinimg.com/videos/thumbnails/originals/40/83/f5/4083f5b4971bf235f89a4784ab87271e.0000001.jpg,2482,video,"Life on Summerhill | Home, Holiday Decor & DIY Website",Local save in /data/christmas,"Diy Christmas Decorations For Home,Farmhouse Christmas Decor,Christmas Home,Christmas Holidays,Christmas Front Porches,How To Decorate For Christmas,Christmas Porch Ideas,Christmas Decorating Ideas,Large Outdoor Christmas Decorations",FORNT PORCH CHRISTMAS DECORATING IDEAS,08604f20-fa17-4b9a-9949-781717eca6cd,46000
christmas,15 unique Christmas porch ideas that will leave you feeling inspired and help you tackle decorating your own entryway for the holidays! It’s almost time to start decorating for…,1,https://i.pinimg.com/originals/ff/f8/3b/fff83b02aeb29e2e9341a56fc5e63345.png,1967,image,Ashley - Modern Glam,Local save in /data/christmas,"Exterior Christmas Lights,Front Door Christmas Decorations,Christmas Lights Outside,Christmas House Lights,Decorating With Christmas Lights,Porch Decorating,Christmas Porch Decorations,Front Porch Ideas For Christmas,Christmas Lights Outdoor Trees",15 Fun & Festive Christmas Porch Ideas,0b9d5b95-51a6-465e-ae4a-2cb68ceada29,19000
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",Local save in /data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d,10000
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",Local save in /data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d,10000
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",Local save in /data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d,10000
christmas,"My favorite 75+ Neutral Christmas Home Decor for decorating your house during the Holiday Season in earth tones and a farmhouse, rustic style all winter. I love this modern, sim…",1,https://i.pinimg.com/originals/86/84/39/868439dd894969e3abd6a2a8a9fe1e9c.jpg,2604,image,Everyday Wholesome,Local save in /data/christmas,"Colorful Christmas Decorations,Colorful Christmas Tree,Christmas Centerpieces,Christmas Colors,Xmas Colors,Winter Decorations,Christmas Trends,Christmas Inspiration,Christmas Home",75+ Neutral Christmas Home Decor for the Holiday Season in Farmhouse Style using Earth Tones Modern,087b0fa9-f901-4262-aa0a-6caf234d1b35,31000
christmas,"My favorite 75+ Neutral Christmas Home Decor for decorating your house during the Holiday Season in earth tones and a farmhouse, rustic style all winter. I love this modern, sim…",1,https://i.pinimg.com/originals/86/84/39/868439dd894969e3abd6a2a8a9fe1e9c.jpg,2604,image,Everyday Wholesome,Local save in /data/christmas,"Colorful Christmas Decorations,Colorful Christmas Tree,Christmas Centerpieces,Christmas Colors,Xmas Colors,Winter Decorations,Christmas Trends,Christmas Inspiration,Christmas Home",75+ Neutral Christmas Home Decor for the Holiday Season in Farmhouse Style using Earth Tones Modern,087b0fa9-f901-4262-aa0a-6caf234d1b35,31000
diy-and-crafts,"This post may contain affiliate links, read our Disclosure Policy for more information. As an Amazon Associate I earn from qualifying purchases, thank you! Make some cute handpr…",1,https://i.pinimg.com/originals/ff/fe/38/fffe384f3ec18a0d87cb2d80cc8c1499.jpg,3156,image,Michelle {CraftyMorning.com},Local save in /data/diy-and-crafts,"Christmas Gifts For Parents,Christmas Decorations For Kids,Christmas Crafts For Toddlers,Preschool Christmas,Christmas Crafts For Gifts,Christmas Activities,Toddler Crafts,Kids Christmas,Christmas Feeling",Handprint Reindeer Ornaments - Crafty Morning,fa6e31a4-18c2-4eca-a6d8-e903eee2c2a4,892000


In [0]:
# Converting index and downloaded columns to integer data types
cleaned_df_pin = cleaned_df_pin.withColumn("index", cleaned_df_pin["index"].cast("integer"))
cleaned_df_pin = cleaned_df_pin.withColumn("downloaded", cleaned_df_pin["downloaded"].cast("integer"))

In [0]:
# Removing "Local save in" from save_location column to give the save path only
cleaned_df_pin = cleaned_df_pin.withColumn("save_location", regexp_replace(("save_location"), "Local save in", ""))
display(cleaned_df_pin)

category,description,downloaded,image_src,index,is_image_or_video,poster_name,save_location,tag_list,title,unique_id,follower_count
christmas,"Features: Material:Lint Size:48ｘ18cm Quantity:1 pc Shape:Santa Claus, snowman. Elk Occasion:Christmas Description: 1. Fashion design, high quality 2. Santa Claus, snowman. Elk C…",1,https://i.pinimg.com/originals/b5/7f/21/b57f219fa89c1165b57525b8eae711da.jpg,1706,image,Wear24-7,/data/christmas,"Merry Christmas To You,Christmas Toys,Great Christmas Gifts,Christmas Snowman,Christmas Ornaments,Holiday,Christmas Party Decorations,Christmas Themes,Decoration Party",Standing Figurine Toys Xmas Santa Claus Snowman Reindeer Figure Plush Dolls Christmas Decorations Ornaments Home Indoor Table Ornaments Christmas Party Tree Hanging Decor Toys Gifts for Kids Friends…,b5c8a1b5-9e90-4522-9bec-2477b698d5b7,5000
christmas,"Christmas decorating ideas for porches. Beautiful holiday decor ideas for front porches both small and large. Outdoor decorations like sleds, lanterns, Christmas trees, wreaths,…",1,https://i.pinimg.com/videos/thumbnails/originals/40/83/f5/4083f5b4971bf235f89a4784ab87271e.0000001.jpg,2482,video,"Life on Summerhill | Home, Holiday Decor & DIY Website",/data/christmas,"Diy Christmas Decorations For Home,Farmhouse Christmas Decor,Christmas Home,Christmas Holidays,Christmas Front Porches,How To Decorate For Christmas,Christmas Porch Ideas,Christmas Decorating Ideas,Large Outdoor Christmas Decorations",FORNT PORCH CHRISTMAS DECORATING IDEAS,08604f20-fa17-4b9a-9949-781717eca6cd,46000
christmas,"Christmas decorating ideas for porches. Beautiful holiday decor ideas for front porches both small and large. Outdoor decorations like sleds, lanterns, Christmas trees, wreaths,…",1,https://i.pinimg.com/videos/thumbnails/originals/40/83/f5/4083f5b4971bf235f89a4784ab87271e.0000001.jpg,2482,video,"Life on Summerhill | Home, Holiday Decor & DIY Website",/data/christmas,"Diy Christmas Decorations For Home,Farmhouse Christmas Decor,Christmas Home,Christmas Holidays,Christmas Front Porches,How To Decorate For Christmas,Christmas Porch Ideas,Christmas Decorating Ideas,Large Outdoor Christmas Decorations",FORNT PORCH CHRISTMAS DECORATING IDEAS,08604f20-fa17-4b9a-9949-781717eca6cd,46000
christmas,15 unique Christmas porch ideas that will leave you feeling inspired and help you tackle decorating your own entryway for the holidays! It’s almost time to start decorating for…,1,https://i.pinimg.com/originals/ff/f8/3b/fff83b02aeb29e2e9341a56fc5e63345.png,1967,image,Ashley - Modern Glam,/data/christmas,"Exterior Christmas Lights,Front Door Christmas Decorations,Christmas Lights Outside,Christmas House Lights,Decorating With Christmas Lights,Porch Decorating,Christmas Porch Decorations,Front Porch Ideas For Christmas,Christmas Lights Outdoor Trees",15 Fun & Festive Christmas Porch Ideas,0b9d5b95-51a6-465e-ae4a-2cb68ceada29,19000
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",/data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d,10000
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",/data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d,10000
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",/data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d,10000
christmas,"My favorite 75+ Neutral Christmas Home Decor for decorating your house during the Holiday Season in earth tones and a farmhouse, rustic style all winter. I love this modern, sim…",1,https://i.pinimg.com/originals/86/84/39/868439dd894969e3abd6a2a8a9fe1e9c.jpg,2604,image,Everyday Wholesome,/data/christmas,"Colorful Christmas Decorations,Colorful Christmas Tree,Christmas Centerpieces,Christmas Colors,Xmas Colors,Winter Decorations,Christmas Trends,Christmas Inspiration,Christmas Home",75+ Neutral Christmas Home Decor for the Holiday Season in Farmhouse Style using Earth Tones Modern,087b0fa9-f901-4262-aa0a-6caf234d1b35,31000
christmas,"My favorite 75+ Neutral Christmas Home Decor for decorating your house during the Holiday Season in earth tones and a farmhouse, rustic style all winter. I love this modern, sim…",1,https://i.pinimg.com/originals/86/84/39/868439dd894969e3abd6a2a8a9fe1e9c.jpg,2604,image,Everyday Wholesome,/data/christmas,"Colorful Christmas Decorations,Colorful Christmas Tree,Christmas Centerpieces,Christmas Colors,Xmas Colors,Winter Decorations,Christmas Trends,Christmas Inspiration,Christmas Home",75+ Neutral Christmas Home Decor for the Holiday Season in Farmhouse Style using Earth Tones Modern,087b0fa9-f901-4262-aa0a-6caf234d1b35,31000
diy-and-crafts,"This post may contain affiliate links, read our Disclosure Policy for more information. As an Amazon Associate I earn from qualifying purchases, thank you! Make some cute handpr…",1,https://i.pinimg.com/originals/ff/fe/38/fffe384f3ec18a0d87cb2d80cc8c1499.jpg,3156,image,Michelle {CraftyMorning.com},/data/diy-and-crafts,"Christmas Gifts For Parents,Christmas Decorations For Kids,Christmas Crafts For Toddlers,Preschool Christmas,Christmas Crafts For Gifts,Christmas Activities,Toddler Crafts,Kids Christmas,Christmas Feeling",Handprint Reindeer Ornaments - Crafty Morning,fa6e31a4-18c2-4eca-a6d8-e903eee2c2a4,892000


In [0]:
# Renaming index column to ind
cleaned_df_pin = cleaned_df_pin.withColumnRenamed("index", "ind")
display(cleaned_df_pin)

category,description,downloaded,image_src,ind,is_image_or_video,poster_name,save_location,tag_list,title,unique_id,follower_count
christmas,"Features: Material:Lint Size:48ｘ18cm Quantity:1 pc Shape:Santa Claus, snowman. Elk Occasion:Christmas Description: 1. Fashion design, high quality 2. Santa Claus, snowman. Elk C…",1,https://i.pinimg.com/originals/b5/7f/21/b57f219fa89c1165b57525b8eae711da.jpg,1706,image,Wear24-7,/data/christmas,"Merry Christmas To You,Christmas Toys,Great Christmas Gifts,Christmas Snowman,Christmas Ornaments,Holiday,Christmas Party Decorations,Christmas Themes,Decoration Party",Standing Figurine Toys Xmas Santa Claus Snowman Reindeer Figure Plush Dolls Christmas Decorations Ornaments Home Indoor Table Ornaments Christmas Party Tree Hanging Decor Toys Gifts for Kids Friends…,b5c8a1b5-9e90-4522-9bec-2477b698d5b7,5000
christmas,"Christmas decorating ideas for porches. Beautiful holiday decor ideas for front porches both small and large. Outdoor decorations like sleds, lanterns, Christmas trees, wreaths,…",1,https://i.pinimg.com/videos/thumbnails/originals/40/83/f5/4083f5b4971bf235f89a4784ab87271e.0000001.jpg,2482,video,"Life on Summerhill | Home, Holiday Decor & DIY Website",/data/christmas,"Diy Christmas Decorations For Home,Farmhouse Christmas Decor,Christmas Home,Christmas Holidays,Christmas Front Porches,How To Decorate For Christmas,Christmas Porch Ideas,Christmas Decorating Ideas,Large Outdoor Christmas Decorations",FORNT PORCH CHRISTMAS DECORATING IDEAS,08604f20-fa17-4b9a-9949-781717eca6cd,46000
christmas,"Christmas decorating ideas for porches. Beautiful holiday decor ideas for front porches both small and large. Outdoor decorations like sleds, lanterns, Christmas trees, wreaths,…",1,https://i.pinimg.com/videos/thumbnails/originals/40/83/f5/4083f5b4971bf235f89a4784ab87271e.0000001.jpg,2482,video,"Life on Summerhill | Home, Holiday Decor & DIY Website",/data/christmas,"Diy Christmas Decorations For Home,Farmhouse Christmas Decor,Christmas Home,Christmas Holidays,Christmas Front Porches,How To Decorate For Christmas,Christmas Porch Ideas,Christmas Decorating Ideas,Large Outdoor Christmas Decorations",FORNT PORCH CHRISTMAS DECORATING IDEAS,08604f20-fa17-4b9a-9949-781717eca6cd,46000
christmas,15 unique Christmas porch ideas that will leave you feeling inspired and help you tackle decorating your own entryway for the holidays! It’s almost time to start decorating for…,1,https://i.pinimg.com/originals/ff/f8/3b/fff83b02aeb29e2e9341a56fc5e63345.png,1967,image,Ashley - Modern Glam,/data/christmas,"Exterior Christmas Lights,Front Door Christmas Decorations,Christmas Lights Outside,Christmas House Lights,Decorating With Christmas Lights,Porch Decorating,Christmas Porch Decorations,Front Porch Ideas For Christmas,Christmas Lights Outdoor Trees",15 Fun & Festive Christmas Porch Ideas,0b9d5b95-51a6-465e-ae4a-2cb68ceada29,19000
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",/data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d,10000
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",/data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d,10000
travel,"This Costa Rica itinerary is the ultimate guide to spending two weeks in Costa Rica. Find out about visiting La Fortuna, Arenal, Monteverde, Naranjo, Corcovado National Park, Or…",1,https://i.pinimg.com/originals/30/93/cb/3093cb01d9de2d125fda8ba5e3e41946.jpg,10138,image,"Wanderlust Chloe ✈️ Travel guides, inspo and adventure travel ✈️",/data/travel,"Costa Rica Travel,Rio Celeste Costa Rica,Dream Vacations,Vacation Spots,Vacation Travel,Travel Pictures,Travel Photos,Fortuna Costa Rica,Costa Rica Pictures","14 Amazing Things To Do In Costa Rica | Volcanoes, Waterfalls, Wildlife And More",927c4658-cc3f-4b92-9b5c-70743d0c238d,10000
christmas,"My favorite 75+ Neutral Christmas Home Decor for decorating your house during the Holiday Season in earth tones and a farmhouse, rustic style all winter. I love this modern, sim…",1,https://i.pinimg.com/originals/86/84/39/868439dd894969e3abd6a2a8a9fe1e9c.jpg,2604,image,Everyday Wholesome,/data/christmas,"Colorful Christmas Decorations,Colorful Christmas Tree,Christmas Centerpieces,Christmas Colors,Xmas Colors,Winter Decorations,Christmas Trends,Christmas Inspiration,Christmas Home",75+ Neutral Christmas Home Decor for the Holiday Season in Farmhouse Style using Earth Tones Modern,087b0fa9-f901-4262-aa0a-6caf234d1b35,31000
christmas,"My favorite 75+ Neutral Christmas Home Decor for decorating your house during the Holiday Season in earth tones and a farmhouse, rustic style all winter. I love this modern, sim…",1,https://i.pinimg.com/originals/86/84/39/868439dd894969e3abd6a2a8a9fe1e9c.jpg,2604,image,Everyday Wholesome,/data/christmas,"Colorful Christmas Decorations,Colorful Christmas Tree,Christmas Centerpieces,Christmas Colors,Xmas Colors,Winter Decorations,Christmas Trends,Christmas Inspiration,Christmas Home",75+ Neutral Christmas Home Decor for the Holiday Season in Farmhouse Style using Earth Tones Modern,087b0fa9-f901-4262-aa0a-6caf234d1b35,31000
diy-and-crafts,"This post may contain affiliate links, read our Disclosure Policy for more information. As an Amazon Associate I earn from qualifying purchases, thank you! Make some cute handpr…",1,https://i.pinimg.com/originals/ff/fe/38/fffe384f3ec18a0d87cb2d80cc8c1499.jpg,3156,image,Michelle {CraftyMorning.com},/data/diy-and-crafts,"Christmas Gifts For Parents,Christmas Decorations For Kids,Christmas Crafts For Toddlers,Preschool Christmas,Christmas Crafts For Gifts,Christmas Activities,Toddler Crafts,Kids Christmas,Christmas Feeling",Handprint Reindeer Ornaments - Crafty Morning,fa6e31a4-18c2-4eca-a6d8-e903eee2c2a4,892000


In [0]:
# Reordering the table columns
cleaned_df_pin = cleaned_df_pin.select("ind", "unique_id", "title", "description", "follower_count", "poster_name", "tag_list", "is_image_or_video", "image_src", "save_location", "category")

In [0]:
# Adding a new column "coordinates" by array of latitude and longitude columns
cleaned_df_geo = df_geo.withColumn("coordinates", array("latitude", "longitude"))
# Removing latitude and longitude columns
cleaned_df_geo = cleaned_df_geo.drop("longitude", "latitude")

In [0]:
# Converts timestamp column from sting to timestamp data type
cleaned_df_geo = cleaned_df_geo.withColumn("timestamp", to_timestamp("timestamp"))
cleaned_df_geo.printSchema()

In [0]:
# Reorders columns
cleaned_df_geo = cleaned_df_geo.select("ind", "country", "coordinates", "timestamp")
display(cleaned_df_geo)

ind,country,coordinates,timestamp
2418,Antarctica (the territory South of 60 deg S),"List(-88.4642, -171.061)",2022-05-27T11:30:59.000+0000
2418,Antarctica (the territory South of 60 deg S),"List(-88.4642, -171.061)",2022-05-27T11:30:59.000+0000
5162,Antarctica (the territory South of 60 deg S),"List(-71.6607, -149.206)",2019-09-27T19:06:43.000+0000
2418,Antarctica (the territory South of 60 deg S),"List(-88.4642, -171.061)",2022-05-27T11:30:59.000+0000
2301,Saint Vincent and the Grenadines,"List(13.4683, 51.7244)",2020-11-14T00:25:28.000+0000
6014,French Southern Territories,"List(-26.6026, 155.206)",2019-04-30T12:33:13.000+0000
10794,Cocos (Keeling) Islands,"List(-89.5236, -154.567)",2022-01-01T02:26:50.000+0000
10794,Cocos (Keeling) Islands,"List(-89.5236, -154.567)",2022-01-01T02:26:50.000+0000
10794,Cocos (Keeling) Islands,"List(-89.5236, -154.567)",2022-01-01T02:26:50.000+0000
10794,Cocos (Keeling) Islands,"List(-89.5236, -154.567)",2022-01-01T02:26:50.000+0000


In [0]:
# Create a new column called "user_name" adding "first_name" and "last_name"
cleaned_df_user = df_user.withColumn("user_name", array("first_name", "last_name"))
# Delete columns first_name and last_name
cleaned_df_user = cleaned_df_user.drop("first_name", "last_name")

In [0]:
# Convert date_joined column from string to timestamp
cleaned_df_user = cleaned_df_user.withColumn("date_joined", to_timestamp("date_joined"))
cleaned_df_user = cleaned_df_user.withColumn("ind", cleaned_df_user["ind"].cast("integer"))
cleaned_df_user = cleaned_df_user.withColumn("age", cleaned_df_user["age"].cast("integer"))
cleaned_df_user = cleaned_df_user.select("ind", "user_name", "age", "date_joined")
cleaned_df_user.printSchema()

In [0]:
cleaned_df_user.printSchema()

In [0]:
# Drop the existing table if it exists
spark.sql("DROP TABLE IF EXISTS cleaned_df_pin")



In [0]:
cleaned_df_pin.write.format("parquet").mode("overwrite").saveAsTable("1279c94681db_pin")
pin_clean = spark.read.parquet("dbfs:/user/hive/warehouse/1279c94681db_pin")
pin_clean.createOrReplaceTempView("pin")

In [0]:
cleaned_df_geo.write.format("parquet").mode("overwrite").saveAsTable("1279c94681db_geo")
geo_clean = spark.read.parquet("dbfs:/user/hive/warehouse/1279c94681db_geo")
geo_clean.createOrReplaceTempView("geo")

In [0]:
cleaned_df_user.write.format("parquet").mode("overwrite").saveAsTable("1279c94681db_user")
user_clean = spark.read.parquet("dbfs:/user/hive/warehouse/1279c94681db_user")
user_clean.createOrReplaceTempView("user")

In [0]:
%sql
-- Milestone 7 task 4
WITH country_category_counts AS (
    SELECT
        geo.country,
        pin.category,
        COUNT(*) AS category_count,
        RANK() OVER (PARTITION BY geo.country ORDER BY COUNT(*) DESC) AS category_rank
    FROM geo
    JOIN pin ON geo.ind = pin.ind
    GROUP BY geo.country, pin.category
)

SELECT 
    country,
    category,
    category_count
FROM country_category_counts
WHERE category_rank = 1

country,category,category_count
Afghanistan,art,4
Afghanistan,education,4
Albania,mens-fashion,30
Algeria,quotes,9
American Samoa,beauty,8
Andorra,art,4
Andorra,beauty,4
Andorra,tattoos,4
Angola,diy-and-crafts,9
Anguilla,home-decor,9


In [0]:
%sql

SELECT  date_part('year', geo.timestamp) AS post_year,
        category,
        COUNT(*) AS category_count
FROM geo
INNER JOIN pin ON geo.ind = pin.ind
WHERE geo.timestamp >= '2018-01-01' AND geo.timestamp < '2023-01-01'
GROUP BY category, post_year
ORDER BY post_year DESC, category_count DESC

post_year,category,category_count
2022,vehicles,30
2022,christmas,15
2022,beauty,15
2022,art,12
2022,tattoos,9
2022,quotes,6
2022,diy-and-crafts,5
2022,mens-fashion,4
2022,education,1
2021,finance,61


In [0]:
%sql
WITH user_followers AS (
  SELECT  pin.poster_name AS poster_name,
          pin.follower_count AS follower_count,
          geo.country AS country
  FROM pin
  INNER JOIN geo ON pin.ind = geo.ind
)
SELECT  country,
        follower_count
FROM followers_table
ORDER BY follower_count DESC
LIMIT 1;

country,follower_count
Azerbaijan,6000000


In [0]:
%sql
WITH age_group AS (
    SELECT  
        pin.category,
        COUNT(*) AS category_count,
        CASE
            WHEN u.age >= 18 AND u.age <= 24 THEN '18-24'
            WHEN u.age >= 25 AND u.age <= 35 THEN '25-35'
            WHEN u.age >= 36 AND u.age <= 50 THEN '36-50'
            ELSE '+50' 
        END AS age_group
    FROM user u
    INNER JOIN pin ON u.ind = pin.ind
    GROUP BY age_group, pin.category
)

SELECT age_group, category, category_count
FROM (
    SELECT age_group, category, category_count,
           ROW_NUMBER() OVER (PARTITION BY age_group ORDER BY category_count DESC) AS rn
    FROM age_group
) tmp
WHERE rn = 1

age_group,category,category_count
+50,beauty,12
18-24,mens-fashion,69
25-35,diy-and-crafts,59
36-50,finance,31


In [0]:
%sql

WITH age_groups AS (
    SELECT
        CASE
            WHEN user.age BETWEEN 18 AND 24 THEN '18-24'
            WHEN user.age BETWEEN 25 AND 35 THEN '25-35'
            WHEN user.age BETWEEN 36 AND 50 THEN '36-50'
            ELSE '+50'
        END AS age_group,
        pin.follower_count
    FROM user
    JOIN pin ON user.ind = pin.ind
)

SELECT
    age_group,
    PERCENTILE_CONT(0.5) WITHIN GROUP (ORDER BY follower_count) AS median_follower_count
FROM age_groups
GROUP BY age_group

age_group,median_follower_count
36-50,6000.0
+50,7000.0
18-24,108000.0
25-35,43000.0


In [0]:
%sql

WITH user_join_years AS (
    SELECT  
        YEAR(date_joined) AS join_year
    FROM user
    WHERE YEAR(date_joined) BETWEEN 2015 AND 2020
)

SELECT join_year AS post_year, COUNT(*) AS number_users_joined
FROM user_join_years
GROUP BY join_year

post_year,number_users_joined
2015,127
2016,138
2017,42


In [0]:
%sql

WITH user_join_years AS (
    SELECT  
        YEAR(user.date_joined) AS join_year,
        pin.follower_count
    FROM user
    JOIN pin ON user.ind = pin.ind
    WHERE YEAR(user.date_joined) BETWEEN 2015 AND 2020
)

SELECT join_year AS post_year, 
       PERCENTILE_CONT(0.5) WITHIN GROUP (ORDER BY follower_count) AS median_follower_count
FROM user_join_years
GROUP BY join_year

post_year,median_follower_count
2015,51000.0
2016,43000.0
2017,6000.0


In [0]:
%sql

WITH user_age_groups AS (
    SELECT
        CASE
            WHEN age BETWEEN 18 AND 24 THEN '18-24'
            WHEN age BETWEEN 25 AND 35 THEN '25-35'
            WHEN age BETWEEN 36 AND 50 THEN '36-50'
            ELSE '+50'
        END AS age_group,
        YEAR(date_joined) AS post_year,
        pin.follower_count
    FROM user
    JOIN pin ON user.ind = pin.ind
    WHERE YEAR(date_joined) BETWEEN 2015 AND 2020
)

SELECT age_group, post_year,
       PERCENTILE_CONT(0.5) WITHIN GROUP (ORDER BY follower_count) AS median_follower_count
FROM user_age_groups
GROUP BY age_group, post_year

age_group,post_year,median_follower_count
+50,2016,1000.0
25-35,2017,8000.0
18-24,2016,46000.0
18-24,2015,190000.0
25-35,2016,43000.0
36-50,2017,3000.0
36-50,2015,13000.0
18-24,2017,940.0
25-35,2015,51000.0
36-50,2016,9000.0


In [0]:
dbutils.fs.unmount("/mnt/saiful_bucket")