> Create a virtual environment.
> Example:
>
> 1. Create a new virtual environment
>
>    ```
>    pyenv virtualenv 3.10.6 .envPyspark
>    pyenv activate .envPyspark
>    ```
>
> 2. Install the requirements
>    ```
>    pip install --upgrade pip 
>
>    pip install ipykernel pyspark==3.4.0
>    ```
>
> 3. Select this environment as the kernel for your notebook

# Create the Spark session

In [4]:
from pyspark.sql import SparkSession
from pyspark.sql.dataframe import DataFrame

# Reuse the active Spark session if one exists; otherwise start a new one
# registered under the application name 'Visualizations'.
spark: SparkSession = SparkSession.builder.appName('Visualizations').getOrCreate()

# One-row, one-column DataFrame used as sample data by the cells below.
df: DataFrame = spark.createDataFrame([{'name': 'josh'}])

# Basic visualization

In [5]:
# Print the DataFrame to stdout as a plain-text (ASCII) table.
df.show()

                                                                                

+----+
|name|
+----+
|josh|
+----+



# Improve the visualization in notebooks

In [28]:
# Turn on eager evaluation so that a DataFrame left as the last expression
# of a cell is rendered as a table without an explicit .show() call.
spark.conf.set('spark.sql.repl.eagerEval.enabled', True)

In [29]:
# Bare expression: with 'spark.sql.repl.eagerEval.enabled' set, the notebook
# renders the DataFrame contents instead of only its schema repr.
df

name
josh


# Show your data vertically

In [30]:
# Print a single row in vertical layout: one "column | value" line per field,
# which is easier to read than a wide horizontal table.
df.show(n=1, vertical=True)

-RECORD 0----
 name | josh 



## See a summary of your data

In [31]:
# Build the summary statistics (count, mean, stddev, min, quartiles, max)
# as their own DataFrame, then print them as a table.
summary_df = df.summary()
summary_df.show()

[Stage 33:>                                                         (0 + 8) / 8]

+-------+----+
|summary|name|
+-------+----+
|  count|   1|
|   mean|null|
| stddev|null|
|    min|josh|
|    25%|null|
|    50%|null|
|    75%|null|
|    max|josh|
+-------+----+



                                                                                

# References

1. https://spark.apache.org/docs/3.4.0/api/python/reference/index.html