In [1]:
# Importando as bibliotecas utilizadas
from pyspark.sql import SparkSession
import pyspark.sql.functions as F

In [3]:
# Build the Spark session (or reuse an existing one): set the application name
# and enable eager evaluation so DataFrames are displayed as pandas-like tables.
spark = SparkSession.builder \
    .appName('PySpark - Consultas SQL') \
    .config('spark.sql.repl.eagerEval.enabled', True) \
    .getOrCreate()

In [5]:
# Load the Parquet file into a DataFrame
df = spark.read.format('parquet').load('./DATASETS/LOGINS.parquet')

In [11]:
# Run a SQL statement directly: the {logins} and {uf} placeholders in the query
# are filled from the keyword arguments (the DataFrame `df` and the tuple
# ('SP', 'PR')).
spark.sql(
    """
    SELECT * 
    FROM {logins}
    WHERE estado IN {uf}
""",
    logins=df,
    uf=('SP', 'PR'),
)

cpf,email,senha,data_de_nascimento,estado,data_cadastro,ipv4,cor_favorita,profissao,telefone
573.619.804-57,hnogueira@ig.com.br,&9Ejtll$PF,1949-03-06,SP,2023-01-27,168.162.247.252,Cinza,Instalador De Lin...,(031) 9148 3933
734.801.926-96,pedro-miguel43@bo...,*72CCJdxX0,1965-09-14,SP,2023-02-22,222.145.189.67,Roxo,Coach,51 9026 3441
524.789.301-88,diogosales@yahoo....,*yWPtYdi71,1931-01-17,PR,2023-01-14,149.106.171.164,Marrom,Turismólogo,+55 (041) 6393-0208
869.072.315-30,luiz-gustavorocha...,$62UN05c(9,1980-10-19,SP,2023-01-04,53.167.75.100,Verde Claro,Lactarista Hospit...,+55 31 1296 8466
291.358.407-14,lavinia54@ig.com.br,NyI@+8Kd!1,1982-01-28,SP,2023-02-26,79.132.46.55,Preto,Profissional De R...,+55 51 5526 8284
460.125.983-51,lazevedo@gmail.com,uC0O7QdE&B,1972-07-14,SP,2023-01-24,221.155.104.128,Preto,Atleta De Arremes...,+55 71 9251-1645
837.410.256-07,martinsmaysa@bol....,(Z8RNs%un6,1972-08-21,SP,2023-02-24,157.119.230.252,Cinza,Laboratorista,+55 (084) 4945-6200
730.184.526-07,fviana@ig.com.br,1(3oLDln$8,1938-10-23,SP,2023-03-02,99.31.171.138,Verde Escuro,Profissional De I...,0900-429-5628
874.092.613-31,bruno71@yahoo.com.br,HF1FfNe5&H,1946-11-25,SP,2023-03-03,14.80.253.67,Violeta,Confeiteiro,(084) 0687-3775
465.092.837-00,stellacastro@uol....,t@3Fyqzr&#,2005-12-03,PR,2023-01-04,105.93.60.18,Laranja,Piloto Automobilí...,0500 746 4091


In [14]:
# Same result using the PySpark DataFrame API instead of SQL.
# No explicit .select('*') is needed: all columns are kept implicitly.
df.filter(F.col('estado').isin(['SP', 'PR']))

cpf,email,senha,data_de_nascimento,estado,data_cadastro,ipv4,cor_favorita,profissao,telefone
573.619.804-57,hnogueira@ig.com.br,&9Ejtll$PF,1949-03-06,SP,2023-01-27,168.162.247.252,Cinza,Instalador De Lin...,(031) 9148 3933
734.801.926-96,pedro-miguel43@bo...,*72CCJdxX0,1965-09-14,SP,2023-02-22,222.145.189.67,Roxo,Coach,51 9026 3441
524.789.301-88,diogosales@yahoo....,*yWPtYdi71,1931-01-17,PR,2023-01-14,149.106.171.164,Marrom,Turismólogo,+55 (041) 6393-0208
869.072.315-30,luiz-gustavorocha...,$62UN05c(9,1980-10-19,SP,2023-01-04,53.167.75.100,Verde Claro,Lactarista Hospit...,+55 31 1296 8466
291.358.407-14,lavinia54@ig.com.br,NyI@+8Kd!1,1982-01-28,SP,2023-02-26,79.132.46.55,Preto,Profissional De R...,+55 51 5526 8284
460.125.983-51,lazevedo@gmail.com,uC0O7QdE&B,1972-07-14,SP,2023-01-24,221.155.104.128,Preto,Atleta De Arremes...,+55 71 9251-1645
837.410.256-07,martinsmaysa@bol....,(Z8RNs%un6,1972-08-21,SP,2023-02-24,157.119.230.252,Cinza,Laboratorista,+55 (084) 4945-6200
730.184.526-07,fviana@ig.com.br,1(3oLDln$8,1938-10-23,SP,2023-03-02,99.31.171.138,Verde Escuro,Profissional De I...,0900-429-5628
874.092.613-31,bruno71@yahoo.com.br,HF1FfNe5&H,1946-11-25,SP,2023-03-03,14.80.253.67,Violeta,Confeiteiro,(084) 0687-3775
465.092.837-00,stellacastro@uol....,t@3Fyqzr&#,2005-12-03,PR,2023-01-04,105.93.60.18,Laranja,Piloto Automobilí...,0500 746 4091


In [20]:
# DataFrames can be registered as temporary views and then queried by name.
# (registerTempTable is deprecated, so createOrReplaceTempView is used.)
df.createOrReplaceTempView('logins')

spark.sql(
    """
    SELECT * 
    FROM logins
    WHERE estado IN ('SP', 'PR')
"""
)

cpf,email,senha,data_de_nascimento,estado,data_cadastro,ipv4,cor_favorita,profissao,telefone
573.619.804-57,hnogueira@ig.com.br,&9Ejtll$PF,1949-03-06,SP,2023-01-27,168.162.247.252,Cinza,Instalador De Lin...,(031) 9148 3933
734.801.926-96,pedro-miguel43@bo...,*72CCJdxX0,1965-09-14,SP,2023-02-22,222.145.189.67,Roxo,Coach,51 9026 3441
524.789.301-88,diogosales@yahoo....,*yWPtYdi71,1931-01-17,PR,2023-01-14,149.106.171.164,Marrom,Turismólogo,+55 (041) 6393-0208
869.072.315-30,luiz-gustavorocha...,$62UN05c(9,1980-10-19,SP,2023-01-04,53.167.75.100,Verde Claro,Lactarista Hospit...,+55 31 1296 8466
291.358.407-14,lavinia54@ig.com.br,NyI@+8Kd!1,1982-01-28,SP,2023-02-26,79.132.46.55,Preto,Profissional De R...,+55 51 5526 8284
460.125.983-51,lazevedo@gmail.com,uC0O7QdE&B,1972-07-14,SP,2023-01-24,221.155.104.128,Preto,Atleta De Arremes...,+55 71 9251-1645
837.410.256-07,martinsmaysa@bol....,(Z8RNs%un6,1972-08-21,SP,2023-02-24,157.119.230.252,Cinza,Laboratorista,+55 (084) 4945-6200
730.184.526-07,fviana@ig.com.br,1(3oLDln$8,1938-10-23,SP,2023-03-02,99.31.171.138,Verde Escuro,Profissional De I...,0900-429-5628
874.092.613-31,bruno71@yahoo.com.br,HF1FfNe5&H,1946-11-25,SP,2023-03-03,14.80.253.67,Violeta,Confeiteiro,(084) 0687-3775
465.092.837-00,stellacastro@uol....,t@3Fyqzr&#,2005-12-03,PR,2023-01-04,105.93.60.18,Laranja,Piloto Automobilí...,0500 746 4091
