In [0]:
# URL processing (standard library)
import urllib
import urllib.parse

# pyspark functions
from pyspark.sql.functions import *

# Location of the Delta table that stores the AWS credentials
delta_table_path = "dbfs:/user/hive/warehouse/authentication_credentials"

# Read the Delta table to a Spark DataFrame
aws_keys_df = spark.read.format("delta").load(delta_table_path)

# Pull both credential columns from the SAME row with a single Spark job.
# Two independent collect() calls would run two jobs and, on a table with
# more than one row, are not guaranteed to return values from matching rows.
credentials_row = aws_keys_df.select('Access key ID', 'Secret access key').first()
if credentials_row is None:
    # Fail with a clear message instead of an IndexError on an empty table
    raise ValueError(
        "No AWS credentials found in Delta table {0}".format(delta_table_path)
    )
ACCESS_KEY = credentials_row['Access key ID']
SECRET_KEY = credentials_row['Secret access key']

# Percent-encode the secret key; safe="" also escapes "/" so the key can be
# embedded in the userinfo part of the source URL below
ENCODED_SECRET_KEY = urllib.parse.quote(string=SECRET_KEY, safe="")

# AWS S3 bucket name
AWS_S3_BUCKET = "user-0eaa2e755d1f-bucket"
# Mount name for the bucket
MOUNT_NAME = "/mnt/pinterest"  # Use an absolute path for the mount point
# Source url (credentials are embedded in the URL, so never print or log it)
# NOTE(review): the s3n:// scheme is kept as in the original; confirm whether
# s3a:// should be used on this runtime.
SOURCE_URL = "s3n://{0}:{1}@{2}".format(ACCESS_KEY, ENCODED_SECRET_KEY, AWS_S3_BUCKET)

# Always start from a fresh mount: drop an existing mount at MOUNT_NAME first
# so re-running this cell does not fail on an already-mounted directory.
mounted_points = {mount.mountPoint for mount in dbutils.fs.mounts()}
if MOUNT_NAME in mounted_points:
    dbutils.fs.unmount(MOUNT_NAME)

# Mount the bucket
dbutils.fs.mount(SOURCE_URL, MOUNT_NAME)

# Display the contents of the mounted directory
display(dbutils.fs.ls(MOUNT_NAME))

path,name,size,modificationTime
dbfs:/mnt/pinterest/kafka-connect-s3/,kafka-connect-s3/,0,1724849885218
dbfs:/mnt/pinterest/topics/,topics/,0,1724849885218


In [0]:
# pyspark functions
from pyspark.sql.functions import *
# URL processing
import urllib

# Switch off the Databricks Delta format check before reading the files
spark.conf.set("spark.databricks.delta.formatCheck.enabled", "false")

# Reader settings: source format and schema-inference flag
file_type = "json"
infer_schema = "true"
# Glob matching every JSON file written for the pin topic (partition 0)
file_location = "/mnt/pinterest/topics/0eaa2e755d1f.pin/partition=0/*.json"

# Load the pin JSON files from the mounted S3 bucket into a Spark DataFrame
# NOTE(review): "inferSchema" is documented as a CSV reader option; confirm
# it has any effect for the JSON source.
df_pin = (
    spark.read.format(file_type)
    .option("inferSchema", infer_schema)
    .load(file_location)
)

# Show the DataFrame to inspect its content
# NOTE(review): in the saved output the sampled rows are populated only in
# _corrupt_record (the payload looks like a JSON-encoded string wrapping
# {"records": [...]}) - confirm the upstream file format.
display(df_pin)
|


_corrupt_record,category,description,downloaded,follower_count,image_src,index,is_image_or_video,poster_name,save_location,tag_list,title,unique_id
"""{\""records\"": [{\""value\"": {\""index\"": 4387, \""unique_id\"": \""ae5e7377-f1bd-4ac5-94de-bee317f51a43\"", \""title\"": \""\\u0392\\u03ac\\u03c0\\u03c4\\u03b9\\u03c3\\u03b7: H \\u03c0\\u03b1\\u03c1\\u03b1\\u03bc\\u03c5\\u03b8\\u03ad\\u03bd\\u03b9\\u03b1 \\u03b2\\u03ac\\u03c0\\u03c4\\u03b9\\u03c3\\u03b7 \\u03c4\\u03b7\\u03c2 \\u03a4\\u03b9\\u03c4\\u03af\\u03ba\\u03b1\\u03c2 \\u03bc\\u03b5 \\u03b8\\u03ad\\u03bc\\u03b1 \\u03c4\\u03bf \\u03bc\\u03bf\\u03bd\\u03cc\\u03ba\\u03b5\\u03c1\\u03bf \\u03b1\\u03c0\\u03cc \\u03c4\\u03b7\\u03bd e.m. for you\"", \""description\"": \""\\u03a4\\u03bf \\u03cc\\u03bd\\u03bf\\u03bc\\u03b1 \\u03c0\\u03bf\\u03c5 \\u03b5\\u03c0\\u03ad\\u03bb\\u03b5\\u03be\\u03b5 \\u03b7 \\u03bc\\u03b1\\u03bc\\u03ac \\u0391\\u03bd\\u03b4\\u03c1\\u03b9\\u03b1\\u03bd\\u03ae \\u03b3\\u03b9\\u03b1 \\u03c4\\u03b7 \\u03b3\\u03bb\\u03c5\\u03ba\\u03b9\\u03ac \\u03a4\\u03b9\\u03c4\\u03af\\u03ba\\u03b1 \\u03b4\\u03b5\\u03bd \\u03b5\\u03af\\u03bd\\u03b1\\u03b9 \\u03ba\\u03b1\\u03b8\\u03cc\\u03bb\\u03bf\\u03c5 \\u03c4\\u03c5\\u03c7\\u03b1\\u03af\\u03bf. \\u039a\\u03b1\\u03b9 \\u03c6\\u03c5\\u03c3\\u03b9\\u03ba\\u03ac \\u03b4\\u03b5\\u03bd \\u03ac\\u03c6\\u03b7\\u03c3\\u03b5 \\u03c4\\u03af\\u03c0\\u03bf\\u03c4\\u03b1 \\u03c3\\u03c4\\u03b7\\u03bd \\u03c4\\u03cd\\u03c7\\u03b7 \\u03bf\\u03cd\\u03c4\\u03b5 \\u03c4\\u03b7\\u03bd \\u03b7\\u03bc\\u03ad\\u03c1\\u03b1 \\u03c4\\u03b7\\u03c2 \\u03b2\\u03ac\\u03c0\\u03c4\\u03b9\\u03c3\\u03b7\\u03c2. 
\\u0391\\u03bd\\u03ad\\u03b8\\u03b5\\u03c3\\u03b5 \\u03c4\\u03b7\\u03bd \\u03bf\\u03c1\\u03b3\\u03ac\\u03bd\\u03c9\\u03c3\\u03b7 \\u03c3\\u03c4\\u03b7\\u03bd\\u2026\\u00a0\"", \""poster_name\"": \""Manosbojana Katsareas\"", \""follower_count\"": \""4\"", \""tag_list\"": \""Diy Flowers,Flower Diy,Baptism Decorations,Christening,Event Planning,Wedding Planner,Baptism Ideas,Birthday,Party\"", \""is_image_or_video\"": \""image\"", \""image_src\"": \""https://i.pinimg.com/originals/db/aa/d2/dbaad28fa85012a4ea6958540d98a8e5.jpg\"", \""downloaded\"": 1, \""save_location\"": \""Local save in /data/event-planning\"", \""category\"": \""event-planning\""}}]}""",,,,,,,,,,,,
"""{\""records\"": [{\""value\"": {\""index\"": 4387, \""unique_id\"": \""ae5e7377-f1bd-4ac5-94de-bee317f51a43\"", \""title\"": \""\\u0392\\u03ac\\u03c0\\u03c4\\u03b9\\u03c3\\u03b7: H \\u03c0\\u03b1\\u03c1\\u03b1\\u03bc\\u03c5\\u03b8\\u03ad\\u03bd\\u03b9\\u03b1 \\u03b2\\u03ac\\u03c0\\u03c4\\u03b9\\u03c3\\u03b7 \\u03c4\\u03b7\\u03c2 \\u03a4\\u03b9\\u03c4\\u03af\\u03ba\\u03b1\\u03c2 \\u03bc\\u03b5 \\u03b8\\u03ad\\u03bc\\u03b1 \\u03c4\\u03bf \\u03bc\\u03bf\\u03bd\\u03cc\\u03ba\\u03b5\\u03c1\\u03bf \\u03b1\\u03c0\\u03cc \\u03c4\\u03b7\\u03bd e.m. for you\"", \""description\"": \""\\u03a4\\u03bf \\u03cc\\u03bd\\u03bf\\u03bc\\u03b1 \\u03c0\\u03bf\\u03c5 \\u03b5\\u03c0\\u03ad\\u03bb\\u03b5\\u03be\\u03b5 \\u03b7 \\u03bc\\u03b1\\u03bc\\u03ac \\u0391\\u03bd\\u03b4\\u03c1\\u03b9\\u03b1\\u03bd\\u03ae \\u03b3\\u03b9\\u03b1 \\u03c4\\u03b7 \\u03b3\\u03bb\\u03c5\\u03ba\\u03b9\\u03ac \\u03a4\\u03b9\\u03c4\\u03af\\u03ba\\u03b1 \\u03b4\\u03b5\\u03bd \\u03b5\\u03af\\u03bd\\u03b1\\u03b9 \\u03ba\\u03b1\\u03b8\\u03cc\\u03bb\\u03bf\\u03c5 \\u03c4\\u03c5\\u03c7\\u03b1\\u03af\\u03bf. \\u039a\\u03b1\\u03b9 \\u03c6\\u03c5\\u03c3\\u03b9\\u03ba\\u03ac \\u03b4\\u03b5\\u03bd \\u03ac\\u03c6\\u03b7\\u03c3\\u03b5 \\u03c4\\u03af\\u03c0\\u03bf\\u03c4\\u03b1 \\u03c3\\u03c4\\u03b7\\u03bd \\u03c4\\u03cd\\u03c7\\u03b7 \\u03bf\\u03cd\\u03c4\\u03b5 \\u03c4\\u03b7\\u03bd \\u03b7\\u03bc\\u03ad\\u03c1\\u03b1 \\u03c4\\u03b7\\u03c2 \\u03b2\\u03ac\\u03c0\\u03c4\\u03b9\\u03c3\\u03b7\\u03c2. 
\\u0391\\u03bd\\u03ad\\u03b8\\u03b5\\u03c3\\u03b5 \\u03c4\\u03b7\\u03bd \\u03bf\\u03c1\\u03b3\\u03ac\\u03bd\\u03c9\\u03c3\\u03b7 \\u03c3\\u03c4\\u03b7\\u03bd\\u2026\\u00a0\"", \""poster_name\"": \""Manosbojana Katsareas\"", \""follower_count\"": \""4\"", \""tag_list\"": \""Diy Flowers,Flower Diy,Baptism Decorations,Christening,Event Planning,Wedding Planner,Baptism Ideas,Birthday,Party\"", \""is_image_or_video\"": \""image\"", \""image_src\"": \""https://i.pinimg.com/originals/db/aa/d2/dbaad28fa85012a4ea6958540d98a8e5.jpg\"", \""downloaded\"": 1, \""save_location\"": \""Local save in /data/event-planning\"", \""category\"": \""event-planning\""}}]}""",,,,,,,,,,,,
"""{\""records\"": [{\""value\"": {\""index\"": 6717, \""unique_id\"": \""bc5ab9ee-505e-44f6-92ba-677fe4fdf3e3\"", \""title\"": \""\\u301a \\u0423\\u044e\\u0442\\u043d\\u044b\\u0435 \\u0448\\u0432\\u0435\\u0434\\u0441\\u043a\\u0438\\u0435 \\u043a\\u043e\\u0442\\u0442\\u0435\\u0434\\u0436\\u0438 \\u043e\\u0442 Carina Olander \\u301b \\u25fe \\u0424\\u043e\\u0442\\u043e \\u25fe \\u0418\\u0434\\u0435\\u0438 \\u25fe \\u0414\\u0438\\u0437\\u0430\\u0439\\u043d\"", \""description\"": \""\\u0422\\u0440\\u0430\\u0434\\u0438\\u0446\\u0438\\u043e\\u043d\\u043d\\u044b\\u0435 \\u0448\\u0432\\u0435\\u0434\\u0441\\u043a\\u0438\\u0435 \\u043a\\u043e\\u0442\\u0442\\u0435\\u0434\\u0436\\u0438, \\u043e\\u0431\\u044b\\u0447\\u043d\\u043e \\u0441 \\u043a\\u0440\\u0430\\u0441\\u043d\\u044b\\u043c \\u0444\\u0430\\u0441\\u0430\\u0434\\u043e\\u043c \\u2014 \\u044d\\u0442\\u043e \\u043d\\u0430\\u0441\\u0442\\u043e\\u044f\\u0449\\u0435\\u0435 \\u0432\\u043e\\u043f\\u043b\\u043e\\u0449\\u0435\\u043d\\u0438\\u0435\\u043c \\u0438\\u0434\\u0435\\u0430\\u043b\\u044c\\u043d\\u043e\\u0433\\u043e \\u0437\\u0438\\u043c\\u043d\\u0435\\u0433\\u043e \\u0443\\u044e\\u0442\\u0430. \\u041e\\u043d\\u0438 \\u043e\\u0431\\u044b\\u0447\\u043d\\u043e \\u043e\\u0444\\u043e\\u0440\\u043c\\u043b\\u0435\\u043d\\u044b \\u043e\\u0447\\u0435\\u043d\\u044c \\u043f\\u0440\\u043e\\u0441\\u0442\\u043e \\u0438 \\u270cPUFIK. Beautiful Interiors. On\\u2026\\u00a0\"", \""poster_name\"": \""PUFIK Interiors & Inspirations\"", \""follower_count\"": \""136k\"", \""tag_list\"": \""Scandinavian Cottage,Swedish Cottage,Swedish Home Decor,Swedish Farmhouse,Swedish Style,Swedish Kitchen,Kitchen Black,Swedish House,Cozy Cottage\"", \""is_image_or_video\"": \""image\"", \""image_src\"": \""https://i.pinimg.com/originals/32/eb/72/32eb72e4fd8654c115a64528bd1f34b4.png\"", \""downloaded\"": 1, \""save_location\"": \""Local save in /data/home-decor\"", \""category\"": \""home-decor\""}}]}""",,,,,,,,,,,,
"""{\""records\"": [{\""value\"": {\""index\"": 6717, \""unique_id\"": \""bc5ab9ee-505e-44f6-92ba-677fe4fdf3e3\"", \""title\"": \""\\u301a \\u0423\\u044e\\u0442\\u043d\\u044b\\u0435 \\u0448\\u0432\\u0435\\u0434\\u0441\\u043a\\u0438\\u0435 \\u043a\\u043e\\u0442\\u0442\\u0435\\u0434\\u0436\\u0438 \\u043e\\u0442 Carina Olander \\u301b \\u25fe \\u0424\\u043e\\u0442\\u043e \\u25fe \\u0418\\u0434\\u0435\\u0438 \\u25fe \\u0414\\u0438\\u0437\\u0430\\u0439\\u043d\"", \""description\"": \""\\u0422\\u0440\\u0430\\u0434\\u0438\\u0446\\u0438\\u043e\\u043d\\u043d\\u044b\\u0435 \\u0448\\u0432\\u0435\\u0434\\u0441\\u043a\\u0438\\u0435 \\u043a\\u043e\\u0442\\u0442\\u0435\\u0434\\u0436\\u0438, \\u043e\\u0431\\u044b\\u0447\\u043d\\u043e \\u0441 \\u043a\\u0440\\u0430\\u0441\\u043d\\u044b\\u043c \\u0444\\u0430\\u0441\\u0430\\u0434\\u043e\\u043c \\u2014 \\u044d\\u0442\\u043e \\u043d\\u0430\\u0441\\u0442\\u043e\\u044f\\u0449\\u0435\\u0435 \\u0432\\u043e\\u043f\\u043b\\u043e\\u0449\\u0435\\u043d\\u0438\\u0435\\u043c \\u0438\\u0434\\u0435\\u0430\\u043b\\u044c\\u043d\\u043e\\u0433\\u043e \\u0437\\u0438\\u043c\\u043d\\u0435\\u0433\\u043e \\u0443\\u044e\\u0442\\u0430. \\u041e\\u043d\\u0438 \\u043e\\u0431\\u044b\\u0447\\u043d\\u043e \\u043e\\u0444\\u043e\\u0440\\u043c\\u043b\\u0435\\u043d\\u044b \\u043e\\u0447\\u0435\\u043d\\u044c \\u043f\\u0440\\u043e\\u0441\\u0442\\u043e \\u0438 \\u270cPUFIK. Beautiful Interiors. On\\u2026\\u00a0\"", \""poster_name\"": \""PUFIK Interiors & Inspirations\"", \""follower_count\"": \""136k\"", \""tag_list\"": \""Scandinavian Cottage,Swedish Cottage,Swedish Home Decor,Swedish Farmhouse,Swedish Style,Swedish Kitchen,Kitchen Black,Swedish House,Cozy Cottage\"", \""is_image_or_video\"": \""image\"", \""image_src\"": \""https://i.pinimg.com/originals/32/eb/72/32eb72e4fd8654c115a64528bd1f34b4.png\"", \""downloaded\"": 1, \""save_location\"": \""Local save in /data/home-decor\"", \""category\"": \""home-decor\""}}]}""",,,,,,,,,,,,
"""{\""records\"": [{\""value\"": {\""index\"": 6717, \""unique_id\"": \""bc5ab9ee-505e-44f6-92ba-677fe4fdf3e3\"", \""title\"": \""\\u301a \\u0423\\u044e\\u0442\\u043d\\u044b\\u0435 \\u0448\\u0432\\u0435\\u0434\\u0441\\u043a\\u0438\\u0435 \\u043a\\u043e\\u0442\\u0442\\u0435\\u0434\\u0436\\u0438 \\u043e\\u0442 Carina Olander \\u301b \\u25fe \\u0424\\u043e\\u0442\\u043e \\u25fe \\u0418\\u0434\\u0435\\u0438 \\u25fe \\u0414\\u0438\\u0437\\u0430\\u0439\\u043d\"", \""description\"": \""\\u0422\\u0440\\u0430\\u0434\\u0438\\u0446\\u0438\\u043e\\u043d\\u043d\\u044b\\u0435 \\u0448\\u0432\\u0435\\u0434\\u0441\\u043a\\u0438\\u0435 \\u043a\\u043e\\u0442\\u0442\\u0435\\u0434\\u0436\\u0438, \\u043e\\u0431\\u044b\\u0447\\u043d\\u043e \\u0441 \\u043a\\u0440\\u0430\\u0441\\u043d\\u044b\\u043c \\u0444\\u0430\\u0441\\u0430\\u0434\\u043e\\u043c \\u2014 \\u044d\\u0442\\u043e \\u043d\\u0430\\u0441\\u0442\\u043e\\u044f\\u0449\\u0435\\u0435 \\u0432\\u043e\\u043f\\u043b\\u043e\\u0449\\u0435\\u043d\\u0438\\u0435\\u043c \\u0438\\u0434\\u0435\\u0430\\u043b\\u044c\\u043d\\u043e\\u0433\\u043e \\u0437\\u0438\\u043c\\u043d\\u0435\\u0433\\u043e \\u0443\\u044e\\u0442\\u0430. \\u041e\\u043d\\u0438 \\u043e\\u0431\\u044b\\u0447\\u043d\\u043e \\u043e\\u0444\\u043e\\u0440\\u043c\\u043b\\u0435\\u043d\\u044b \\u043e\\u0447\\u0435\\u043d\\u044c \\u043f\\u0440\\u043e\\u0441\\u0442\\u043e \\u0438 \\u270cPUFIK. Beautiful Interiors. On\\u2026\\u00a0\"", \""poster_name\"": \""PUFIK Interiors & Inspirations\"", \""follower_count\"": \""136k\"", \""tag_list\"": \""Scandinavian Cottage,Swedish Cottage,Swedish Home Decor,Swedish Farmhouse,Swedish Style,Swedish Kitchen,Kitchen Black,Swedish House,Cozy Cottage\"", \""is_image_or_video\"": \""image\"", \""image_src\"": \""https://i.pinimg.com/originals/32/eb/72/32eb72e4fd8654c115a64528bd1f34b4.png\"", \""downloaded\"": 1, \""save_location\"": \""Local save in /data/home-decor\"", \""category\"": \""home-decor\""}}]}""",,,,,,,,,,,,
"""{\""records\"": [{\""value\"": {\""index\"": 6717, \""unique_id\"": \""bc5ab9ee-505e-44f6-92ba-677fe4fdf3e3\"", \""title\"": \""\\u301a \\u0423\\u044e\\u0442\\u043d\\u044b\\u0435 \\u0448\\u0432\\u0435\\u0434\\u0441\\u043a\\u0438\\u0435 \\u043a\\u043e\\u0442\\u0442\\u0435\\u0434\\u0436\\u0438 \\u043e\\u0442 Carina Olander \\u301b \\u25fe \\u0424\\u043e\\u0442\\u043e \\u25fe \\u0418\\u0434\\u0435\\u0438 \\u25fe \\u0414\\u0438\\u0437\\u0430\\u0439\\u043d\"", \""description\"": \""\\u0422\\u0440\\u0430\\u0434\\u0438\\u0446\\u0438\\u043e\\u043d\\u043d\\u044b\\u0435 \\u0448\\u0432\\u0435\\u0434\\u0441\\u043a\\u0438\\u0435 \\u043a\\u043e\\u0442\\u0442\\u0435\\u0434\\u0436\\u0438, \\u043e\\u0431\\u044b\\u0447\\u043d\\u043e \\u0441 \\u043a\\u0440\\u0430\\u0441\\u043d\\u044b\\u043c \\u0444\\u0430\\u0441\\u0430\\u0434\\u043e\\u043c \\u2014 \\u044d\\u0442\\u043e \\u043d\\u0430\\u0441\\u0442\\u043e\\u044f\\u0449\\u0435\\u0435 \\u0432\\u043e\\u043f\\u043b\\u043e\\u0449\\u0435\\u043d\\u0438\\u0435\\u043c \\u0438\\u0434\\u0435\\u0430\\u043b\\u044c\\u043d\\u043e\\u0433\\u043e \\u0437\\u0438\\u043c\\u043d\\u0435\\u0433\\u043e \\u0443\\u044e\\u0442\\u0430. \\u041e\\u043d\\u0438 \\u043e\\u0431\\u044b\\u0447\\u043d\\u043e \\u043e\\u0444\\u043e\\u0440\\u043c\\u043b\\u0435\\u043d\\u044b \\u043e\\u0447\\u0435\\u043d\\u044c \\u043f\\u0440\\u043e\\u0441\\u0442\\u043e \\u0438 \\u270cPUFIK. Beautiful Interiors. On\\u2026\\u00a0\"", \""poster_name\"": \""PUFIK Interiors & Inspirations\"", \""follower_count\"": \""136k\"", \""tag_list\"": \""Scandinavian Cottage,Swedish Cottage,Swedish Home Decor,Swedish Farmhouse,Swedish Style,Swedish Kitchen,Kitchen Black,Swedish House,Cozy Cottage\"", \""is_image_or_video\"": \""image\"", \""image_src\"": \""https://i.pinimg.com/originals/32/eb/72/32eb72e4fd8654c115a64528bd1f34b4.png\"", \""downloaded\"": 1, \""save_location\"": \""Local save in /data/home-decor\"", \""category\"": \""home-decor\""}}]}""",,,,,,,,,,,,
"""{\""records\"": [{\""value\"": {\""index\"": 10379, \""unique_id\"": \""9d48e180-aa78-48e9-9b2e-4c7ee6960c0e\"", \""title\"": \""\\u041d\\u043e\\u0432\\u0430\\u044f \\u043b\\u0435\\u0433\\u043a\\u0430\\u044f \\u0431\\u0440\\u043e\\u043d\\u0438\\u0440\\u043e\\u0432\\u0430\\u043d\\u043d\\u0430\\u044f \\u043c\\u0430\\u0448\\u0438\\u043d\\u0430 Scarabee \\u043e\\u0442 Arquus\"", \""description\"": \""\\u041d\\u0430 \\u043f\\u0440\\u043e\\u0445\\u043e\\u0434\\u044f\\u0449\\u0435\\u0439 \\u0432 \\u041f\\u0430\\u0440\\u0438\\u0436\\u0435 \\u0441 11 \\u043f\\u043e 14 \\u0438\\u044e\\u043d\\u044f 2018 \\u0433\\u043e\\u0434\\u0430 \\u043c\\u0435\\u0436\\u0434\\u0443\\u043d\\u0430\\u0440\\u043e\\u0434\\u043d\\u043e\\u0439 \\u043e\\u0431\\u043e\\u0440\\u043e\\u043d\\u043d\\u043e\\u0439 \\u0432\\u044b\\u0441\\u0442\\u0430\\u0432\\u043a\\u0435 Eurosatory 2018 \\u0444\\u0440\\u0430\\u043d\\u0446\\u0443\\u0437\\u0441\\u043a\\u0430\\u044f \\u043e\\u0431\\u043e\\u0440\\u043e\\u043d\\u043d\\u0430\\u044f \\u043a\\u043e\\u043c\\u043f\\u0430\\u043d\\u0438\\u044f Arquus ( \\u0431\\u044b\\u0432\\u0448\\u0430\\u044f Renault Truck Defense; \\u0432\\u0445\\u043e\\u0434\\u0438\\u0442 \\u0432\\u2026\\u00a0\"", \""poster_name\"": \""Dominic Shoblo\"", \""follower_count\"": \""336\"", \""tag_list\"": \""Lifted Ford Trucks,Jeep Truck,Big Trucks,Army Vehicles,Armored Vehicles,Offroad,Armored Truck,Bug Out Vehicle,Terrain Vehicle\"", \""is_image_or_video\"": \""image\"", \""image_src\"": \""https://i.pinimg.com/originals/7a/3f/1f/7a3f1fc6ed2bdc6e503b4e4d92c1dbe9.jpg\"", \""downloaded\"": 1, \""save_location\"": \""Local save in /data/vehicles\"", \""category\"": \""vehicles\""}}]}""",,,,,,,,,,,,
"""{\""records\"": [{\""value\"": {\""index\"": 10379, \""unique_id\"": \""9d48e180-aa78-48e9-9b2e-4c7ee6960c0e\"", \""title\"": \""\\u041d\\u043e\\u0432\\u0430\\u044f \\u043b\\u0435\\u0433\\u043a\\u0430\\u044f \\u0431\\u0440\\u043e\\u043d\\u0438\\u0440\\u043e\\u0432\\u0430\\u043d\\u043d\\u0430\\u044f \\u043c\\u0430\\u0448\\u0438\\u043d\\u0430 Scarabee \\u043e\\u0442 Arquus\"", \""description\"": \""\\u041d\\u0430 \\u043f\\u0440\\u043e\\u0445\\u043e\\u0434\\u044f\\u0449\\u0435\\u0439 \\u0432 \\u041f\\u0430\\u0440\\u0438\\u0436\\u0435 \\u0441 11 \\u043f\\u043e 14 \\u0438\\u044e\\u043d\\u044f 2018 \\u0433\\u043e\\u0434\\u0430 \\u043c\\u0435\\u0436\\u0434\\u0443\\u043d\\u0430\\u0440\\u043e\\u0434\\u043d\\u043e\\u0439 \\u043e\\u0431\\u043e\\u0440\\u043e\\u043d\\u043d\\u043e\\u0439 \\u0432\\u044b\\u0441\\u0442\\u0430\\u0432\\u043a\\u0435 Eurosatory 2018 \\u0444\\u0440\\u0430\\u043d\\u0446\\u0443\\u0437\\u0441\\u043a\\u0430\\u044f \\u043e\\u0431\\u043e\\u0440\\u043e\\u043d\\u043d\\u0430\\u044f \\u043a\\u043e\\u043c\\u043f\\u0430\\u043d\\u0438\\u044f Arquus ( \\u0431\\u044b\\u0432\\u0448\\u0430\\u044f Renault Truck Defense; \\u0432\\u0445\\u043e\\u0434\\u0438\\u0442 \\u0432\\u2026\\u00a0\"", \""poster_name\"": \""Dominic Shoblo\"", \""follower_count\"": \""336\"", \""tag_list\"": \""Lifted Ford Trucks,Jeep Truck,Big Trucks,Army Vehicles,Armored Vehicles,Offroad,Armored Truck,Bug Out Vehicle,Terrain Vehicle\"", \""is_image_or_video\"": \""image\"", \""image_src\"": \""https://i.pinimg.com/originals/7a/3f/1f/7a3f1fc6ed2bdc6e503b4e4d92c1dbe9.jpg\"", \""downloaded\"": 1, \""save_location\"": \""Local save in /data/vehicles\"", \""category\"": \""vehicles\""}}]}""",,,,,,,,,,,,
"""{\""records\"": [{\""value\"": {\""index\"": 4820, \""unique_id\"": \""ff50bb42-c7b5-41b8-bbd2-ae5761f4b1c0\"", \""title\"": \""\\u0416\\u0443\\u0440\\u043d\\u0430\\u043b \\u00abQuilt is LOVE\\u00bb. \\u0418\\u043d\\u0441\\u0442\\u0440\\u0443\\u043a\\u0446\\u0438\\u0438 \\u0438 \\u0448\\u0430\\u0431\\u043b\\u043e\\u043d\\u044b\"", \""description\"": \""\\u0416\\u0443\\u0440\\u043d\\u0430\\u043b \\u00abQuilt is LOVE\\u00bb. \\u0418\\u043d\\u0441\\u0442\\u0440\\u0443\\u043a\\u0446\\u0438\\u0438 \\u0438 \\u0448\\u0430\\u0431\\u043b\\u043e\\u043d\\u044b \\u043a \\u043f\\u0440\\u0435\\u0434\\u044b\\u0434\\u0443\\u0449\\u0435\\u0439 \\u043f\\u0443\\u0431\\u043b\\u0438\\u043a\\u0430\\u0446\\u0438\\u0438, \\u043e\\u0441\\u043d\\u043e\\u0432\\u043d\\u043e\\u0439 \\u0447\\u0430\\u0441\\u0442\\u0438 \\u0443\\u043d\\u0438\\u043a\\u0430\\u043b\\u044c\\u043d\\u043e\\u0433\\u043e \\u0436\\u0443\\u0440\\u043d\\u0430\\u043b\\u0430 \\u0434\\u043b\\u044f \\u043b\\u044e\\u0431\\u0438\\u0442\\u0435\\u043b\\u044c\\u043d\\u0438\\u0446 \\u043b\\u043e\\u0441\\u043a\\u0443\\u0442\\u043d\\u043e\\u0433\\u043e \\u0448\\u0438\\u0442\\u044c\\u044f.\"", \""poster_name\"": \""oliveira paulo sergio\"", \""follower_count\"": \""491\"", \""tag_list\"": \""Table Seating Chart,Seating Cards,Seating Chart Wedding,Wedding Table,Wedding Reception,Reception Seating,Wedding Decor,Wedding 2015,Our Wedding\"", \""is_image_or_video\"": \""image\"", \""image_src\"": \""https://i.pinimg.com/originals/bb/a7/d7/bba7d736a82a4f670b0218f2bc35472e.jpg\"", \""downloaded\"": 1, \""save_location\"": \""Local save in /data/event-planning\"", \""category\"": \""event-planning\""}}]}""",,,,,,,,,,,,
"""{\""records\"": [{\""value\"": {\""index\"": 10943, \""unique_id\"": \""c8f5619c-c267-4d50-8231-3994d32fc0de\"", \""title\"": \""\\u041f\\u043e\\u043b\\u0438\\u0446\\u0435\\u0439\\u0441\\u043a\\u0430\\u044f \\u043f\\u043e\\u0433\\u043e\\u043d\\u044f #1. \\u041d\\u0435 \\u0440\\u0430\\u0437\\u043c\\u0438\\u043d\\u0443\\u043b\\u0438\\u0441\\u044c \\u0441\\u043e \\u0432\\u0441\\u0442\\u0440\\u0435\\u0447\\u043a\\u043e\\u0439.\"", \""description\"": \""\\u0411\\u0438\\u0442\\u043a\\u043e\\u0438\\u043d \\u043a\\u043e\\u043b\\u0435\\u0431\\u043b\\u0435\\u0442\\u0441\\u044f \\u043a\\u0430\\u0436\\u0434\\u044b\\u0439 \\u0434\\u0435\\u043d\\u044c \\u043e\\u0442 60000 \\u0434\\u043e 65000$, \\u043d\\u0430\\u0447\\u0438\\u043d\\u0430\\u0439 \\u0437\\u0430\\u0440\\u0430\\u0431\\u0430\\u0442\\u044b\\u0432\\u0430\\u0442\\u044c: https://bit.ly/36J0qVC\\u2605\\u2605\\u2605 \\u041f\\u043e\\u0434\\u043f\\u0438\\u0441\\u0430\\u0442\\u044c\\u0441\\u044f \\u043d\\u0430 \\u043a\\u0430\\u043d\\u0430\\u043b: https://bit.ly/343C0Sr \\u2605\\u2605\\u2605 \\u041f\\u043e\\u043b\\u0438\\u0446\\u0435\\u0439\\u0441\\u043a...\"", \""poster_name\"": \""Masfa Dkxmrvd\"", \""follower_count\"": \""41\"", \""tag_list\"": \""Lamborghini Veneno,Lamborghini Logo,Carros Lamborghini,Ferrari Laferrari,Luxury Sports Cars,Best Luxury Cars,Sport Cars,Exotic Sports Cars,Dream Cars\"", \""is_image_or_video\"": \""image\"", \""image_src\"": \""https://i.pinimg.com/originals/2c/2f/67/2c2f67f988c76514ecf611f6c725c304.jpg\"", \""downloaded\"": 1, \""save_location\"": \""Local save in /data/vehicles\"", \""category\"": \""vehicles\""}}]}""",,,,,,,,,,,,


In [0]:
# pyspark functions
from pyspark.sql.functions import *
# URL processing
import urllib

# Switch off the Databricks Delta format check before reading the files
spark.conf.set("spark.databricks.delta.formatCheck.enabled", "false")

# Reader settings: source format and schema-inference flag
file_type = "json"
infer_schema = "true"
# Glob matching every JSON file written for the geo topic (partition 0)
file_location = "/mnt/pinterest/topics/0eaa2e755d1f.geo/partition=0/*.json"

# Load the geo JSON files from the mounted S3 bucket into a Spark DataFrame
# NOTE(review): "inferSchema" is documented as a CSV reader option; confirm
# it has any effect for the JSON source.
df_geo = (
    spark.read.format(file_type)
    .option("inferSchema", infer_schema)
    .load(file_location)
)

# Show the DataFrame to inspect its content
# NOTE(review): in the saved output the sampled rows are populated only in
# _corrupt_record (the payload looks like a JSON-encoded string wrapping
# {"records": [...]}) - confirm the upstream file format.
display(df_geo)

_corrupt_record,country,ind,latitude,longitude,timestamp
"""{\""records\"": [{\""value\"": {\""ind\"": 5395, \""timestamp\"": \""2020-08-15 19:30:19\"", \""latitude\"": -6.93422, \""longitude\"": -24.9989, \""country\"": \""British Virgin Islands\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 1170, \""timestamp\"": \""2019-08-07 22:17:07\"", \""latitude\"": 56.1198, \""longitude\"": 20.2963, \""country\"": \""Libyan Arab Jamahiriya\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 9550, \""timestamp\"": \""2022-03-23 00:25:45\"", \""latitude\"": -84.918, \""longitude\"": 7.23235, \""country\"": \""British Virgin Islands\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 6575, \""timestamp\"": \""2020-12-29 22:59:37\"", \""latitude\"": 81.7192, \""longitude\"": 61.5152, \""country\"": \""Dominican Republic\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 3032, \""timestamp\"": \""2018-04-14 09:28:18\"", \""latitude\"": -66.7253, \""longitude\"": -122.489, \""country\"": \""American Samoa\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 2759, \""timestamp\"": \""2022-02-20 11:53:20\"", \""latitude\"": -66.7253, \""longitude\"": -122.489, \""country\"": \""American Samoa\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 10321, \""timestamp\"": \""2022-10-09 08:06:50\"", \""latitude\"": -89.1005, \""longitude\"": -151.255, \""country\"": \""Burkina Faso\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 6809, \""timestamp\"": \""2020-04-17 13:20:43\"", \""latitude\"": -89.4254, \""longitude\"": -161.818, \""country\"": \""Bangladesh\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 1667, \""timestamp\"": \""2022-02-23 16:10:08\"", \""latitude\"": -83.448, \""longitude\"": -147.771, \""country\"": \""Bangladesh\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 9146, \""timestamp\"": \""2018-08-08 16:20:34\"", \""latitude\"": -89.4739, \""longitude\"": -176.154, \""country\"": \""Argentina\""}}]}""",,,,,


In [0]:
# pyspark functions
from pyspark.sql.functions import *
# URL processing
import urllib

# Switch off the Databricks Delta format check before reading the files
spark.conf.set("spark.databricks.delta.formatCheck.enabled", "false")

# Reader settings: source format and schema-inference flag
file_type = "json"
infer_schema = "true"
# Glob matching every JSON file written for the user topic (partition 0)
file_location = "/mnt/pinterest/topics/0eaa2e755d1f.user/partition=0/*.json"

# Load the user JSON files from the mounted S3 bucket into a Spark DataFrame
# NOTE(review): "inferSchema" is documented as a CSV reader option; confirm
# it has any effect for the JSON source.
df_user = (
    spark.read.format(file_type)
    .option("inferSchema", infer_schema)
    .load(file_location)
)

# Show the DataFrame to inspect its content
# NOTE(review): in the saved output the sampled rows are populated only in
# _corrupt_record (the payload looks like a JSON-encoded string wrapping
# {"records": [...]}) - confirm the upstream file format.
display(df_user)

_corrupt_record,age,date_joined,first_name,ind,last_name
"""{\""records\"": [{\""value\"": {\""ind\"": 10137, \""first_name\"": \""Daniel\"", \""last_name\"": \""Matthews\"", \""age\"": 34, \""date_joined\"": \""2016-01-23 03:59:37\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 9146, \""first_name\"": \""Andrew\"", \""last_name\"": \""Anderson\"", \""age\"": 23, \""date_joined\"": \""2015-11-28 11:52:37\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 1667, \""first_name\"": \""Bernard\"", \""last_name\"": \""Arnold\"", \""age\"": 21, \""date_joined\"": \""2015-12-12 01:39:29\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 6809, \""first_name\"": \""Andrea\"", \""last_name\"": \""Carroll\"", \""age\"": 20, \""date_joined\"": \""2016-01-21 03:54:20\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 1170, \""first_name\"": \""Stacey\"", \""last_name\"": \""Stewart\"", \""age\"": 24, \""date_joined\"": \""2017-03-24 10:12:14\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 1643, \""first_name\"": \""Claire\"", \""last_name\"": \""Leonard\"", \""age\"": 45, \""date_joined\"": \""2016-03-18 23:34:56\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 10883, \""first_name\"": \""Carl\"", \""last_name\"": \""Hampton\"", \""age\"": 25, \""date_joined\"": \""2015-11-26 03:43:03\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 5091, \""first_name\"": \""Samantha\"", \""last_name\"": \""Hall\"", \""age\"": 27, \""date_joined\"": \""2017-04-27 09:48:22\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 10321, \""first_name\"": \""Andrea\"", \""last_name\"": \""Burke\"", \""age\"": 20, \""date_joined\"": \""2015-12-12 11:20:08\""}}]}""",,,,,
"""{\""records\"": [{\""value\"": {\""ind\"": 1611, \""first_name\"": \""Erik\"", \""last_name\"": \""Martinez\"", \""age\"": 40, \""date_joined\"": \""2017-03-08 06:03:20\""}}]}""",,,,,
