In [0]:
from pyspark.sql.functions import lit

In [0]:
# lit() wraps a plain Python literal in a Column expression; printing it shows
# the Column's repr rather than the raw string.
value = lit('abcd')
print(value)

Column<'abcd'>


In [0]:
# Build a small two-row DataFrame from in-memory tuples. Only column names are
# supplied, so Spark infers the column types (salary comes out as long).
data = [
    ('wafa', 'male', 2000),
    ('maheer', 'male', 4000),
]
schema = ('name', 'gender', 'salary')

df = spark.createDataFrame(data, schema)

# Show the rows first, then the inferred schema.
df.show()
df.printSchema()

+------+------+------+
|  name|gender|salary|
+------+------+------+
|  wafa|  male|  2000|
|maheer|  male|  4000|
+------+------+------+

root
 |-- name: string (nullable = true)
 |-- gender: string (nullable = true)
 |-- salary: long (nullable = true)



In [0]:
# Add a constant-valued column: lit() turns the Python string into a Column
# that carries the same value on every row. The schema printed below reports
# the literal column as non-nullable.
df = df.withColumn(
    'newCol',
    lit('newVal'),
)

df.show()
df.printSchema()

+------+------+------+------+
|  name|gender|salary|newCol|
+------+------+------+------+
|  wafa|  male|  2000|newVal|
|maheer|  male|  4000|newVal|
+------+------+------+------+

root
 |-- name: string (nullable = true)
 |-- gender: string (nullable = true)
 |-- salary: long (nullable = true)
 |-- newCol: string (nullable = false)



In [0]:
# Column selection, form 1: attribute access on the DataFrame (df.name).
# NOTE(review): display() is not defined in the visible cells — presumably the
# notebook environment's built-in table renderer; confirm before running this
# outside that environment.
df1 = df.select(df.name)
display(df1)

name
wafa
maheer


In [0]:
# Column selection, form 2: bracket indexing on the DataFrame (df['name']).
# show() only prints and returns None, so it is called as a separate statement;
# chaining it onto the assignment would leave df2 bound to None instead of the
# selected DataFrame.
df2 = df.select(df['name'])
df2.show()

+------+
|  name|
+------+
|  wafa|
|maheer|
+------+



In [0]:
from pyspark.sql.functions import col

In [0]:
# Column selection, form 3: the col() function, which refers to a column by
# name without going through the DataFrame object.
# show() only prints and returns None, so it is called as a separate statement;
# chaining it onto the assignment would leave df3 bound to None instead of the
# selected DataFrame.
df3 = df.select(col('name'))
df3.show()

+------+
|  name|
+------+
|  wafa|
|maheer|
+------+



In [0]:
from pyspark.sql.types import StructType,StructField,StringType

In [0]:
# Nested example: the third element of each row is a tuple that maps onto the
# 'props' struct column defined below.
data = [
    ('wafa', 'male', ('blue', 'brown')),
    ('maheer', 'male', ('black', 'blue')),
]

# Schema of the nested struct (two string fields).
props = StructType([
    StructField('hairColor', StringType()),
    StructField('EyeColor', StringType()),
])

# Top-level schema: two plain string columns plus the nested struct.
schema = StructType([
    StructField('name', StringType()),
    StructField('gender', StringType()),
    StructField('props', props),
])

df = spark.createDataFrame(data, schema)

df.show()
df.printSchema()

+------+------+-------------+
|  name|gender|        props|
+------+------+-------------+
|  wafa|  male|{blue, brown}|
|maheer|  male|{black, blue}|
+------+------+-------------+

root
 |-- name: string (nullable = true)
 |-- gender: string (nullable = true)
 |-- props: struct (nullable = true)
 |    |-- hairColor: string (nullable = true)
 |    |-- EyeColor: string (nullable = true)



In [0]:
# Struct field access, form 1: chained attribute access (df.props.<field>).
# NOTE(review): the field is declared as 'hairColor' in the schema, but the
# lowercase 'haircolor' used here still resolves (see the output) — presumably
# because Spark resolves names case-insensitively by default; confirm against
# spark.sql.caseSensitive before relying on it.
(
    df
    .select(df.props.haircolor)
    .show()
)

+---------------+
|props.haircolor|
+---------------+
|           blue|
|          black|
+---------------+



In [0]:
from pyspark.sql.functions import col

In [0]:
# Struct field access, form 2: col() with a dotted 'struct.field' path.
# The resulting column is labelled with the field name only.
(
    df
    .select(col('props.EyeColor'))
    .show()
)

+--------+
|EyeColor|
+--------+
|   brown|
|    blue|
+--------+



In [0]:
# Struct field access, form 3: bracket indexing on the DataFrame with a dotted
# 'struct.field' path.
(
    df
    .select(df['props.hairColor'])
    .show()
)

+---------+
|hairColor|
+---------+
|     blue|
|    black|
+---------+

