## Sample: reading a Delta table on MinIO

In [1]:
from pyspark import SparkContext, SparkConf
from pyspark.sql import SparkSession
from pyspark.sql.functions import *
from pyspark.sql.types import *
from dotenv import load_dotenv
import os

In [2]:
# Build the SparkSession used by the rest of the notebook: S3A access to the
# MinIO endpoint, Delta Lake SQL support and the Hive metastore.

# Pull settings from a .env file (when present) into the process environment.
load_dotenv()

HOST_ADDRESS = os.getenv("HOST_ADDRESS")
MINIO_ACCESS_KEY = os.getenv("MINIO_ACCESS_KEY")
MINIO_SECRET_KEY = os.getenv("MINIO_SECRET_KEY")

# Fail fast when a setting is missing or empty. SparkConf.set() stringifies
# its value, so an unset variable would otherwise be configured as the literal
# text "None" (e.g. endpoint "http://None:9000") and only surface later as an
# obscure connection/authentication error.
_missing_settings = [
    name
    for name, value in (
        ("HOST_ADDRESS", HOST_ADDRESS),
        ("MINIO_ACCESS_KEY", MINIO_ACCESS_KEY),
        ("MINIO_SECRET_KEY", MINIO_SECRET_KEY),
    )
    if not value
]
if _missing_settings:
    raise RuntimeError(
        "Missing required environment variable(s): "
        + ", ".join(_missing_settings)
    )

conf = SparkConf()

conf.setAppName("Sample read Delta table")

# S3A filesystem pointed at the MinIO endpoint with static credentials.
conf.set("spark.hadoop.fs.s3a.endpoint", f"http://{HOST_ADDRESS}:9000")
conf.set("spark.hadoop.fs.s3a.access.key", MINIO_ACCESS_KEY)
conf.set("spark.hadoop.fs.s3a.secret.key", MINIO_SECRET_KEY)
# Address buckets as <endpoint>/<bucket>/... rather than via bucket hostnames.
# Passed as the string "true" because configuration values are stored as text.
conf.set("spark.hadoop.fs.s3a.path.style.access", "true")
conf.set("spark.hadoop.fs.s3a.impl", "org.apache.hadoop.fs.s3a.S3AFileSystem")
conf.set('spark.hadoop.fs.s3a.aws.credentials.provider', 'org.apache.hadoop.fs.s3a.SimpleAWSCredentialsProvider')

# Delta Lake SQL extension and catalog implementation.
conf.set("spark.sql.extensions", "io.delta.sql.DeltaSparkSessionExtension")
conf.set("spark.sql.catalog.spark_catalog", "org.apache.spark.sql.delta.catalog.DeltaCatalog")

# Thrift URI of the Hive metastore service.
conf.set("hive.metastore.uris", "thrift://metastore:9083")

# Reuses an already-running session if one exists, otherwise creates one.
spark = SparkSession.builder.config(conf=conf).enableHiveSupport().getOrCreate()

In [3]:
# Read the Parquet files from the landing area, keep only the rows that have
# an id, and cap the result at 100 rows.
df_parquet = (
    spark.read
    .format("parquet")
    .load('s3a://landing/isp_performance/landing_ordem_servico_aberto')
    .where("id IS NOT NULL")
    .limit(100)
)

# Print the first rows of the sample as a text table.
df_parquet.show()

+----------------+-------------------+-------------------+-------------------+-------------------+-------------+-------+-------------------+------+----+--------+-----------+---------+-------------------+-------------------+--------+------+---------+---------+-----+--------+---------+----------+--------------------+------------+--------------------+--------------------+------------+--------------+-----------+-------------------+--------------------+-------------------+--------------------+--------+-------------------+-------------------+-------------------+-------------------+------------+------------------+----------+-------------------+----+---------------+------------+-----------+-------+-----------------+-------------------+-------------+--------+--------------+------------------------+-----------------------+-------------------+-------------------+--------------+-------------------+--------------------+---------+
|mensagemResposta|    dataHoraAnalise|dataHoraEncaminhado|   dataHora