In [0]:
# Display the signature and docstring of SparkSession.createDataFrame
# (exploratory lookup; not needed for the cells that follow to run).
help(spark.createDataFrame)

Help on method createDataFrame in module pyspark.sql.session:

createDataFrame(data: Union[pyspark.rdd.RDD[Any], Iterable[Any], ForwardRef('PandasDataFrameLike'), ForwardRef('ArrayLike')], schema: Union[pyspark.sql.types.AtomicType, pyspark.sql.types.StructType, str, NoneType] = None, samplingRatio: Optional[float] = None, verifySchema: bool = True) -> pyspark.sql.dataframe.DataFrame method of pyspark.sql.session.SparkSession instance
    Creates a :class:`DataFrame` from an :class:`RDD`, a list, a :class:`pandas.DataFrame`
    or a :class:`numpy.ndarray`.
    
    .. versionadded:: 2.0.0
    
    .. versionchanged:: 3.4.0
        Support Spark Connect.
    
    Parameters
    ----------
    data : :class:`RDD` or iterable
        an RDD of any kind of SQL data representation (:class:`Row`,
        :class:`tuple`, ``int``, ``boolean``, etc.), or :class:`list`,
        :class:`pandas.DataFrame` or :class:`numpy.ndarray`.
    schema : :class:`pyspark.sql.types.DataType`, str or list, opt

In [0]:
# Each tuple is one row. No schema is supplied, so Spark auto-names the
# columns (`_1`, `_2`) as shown in the output below.
data = [
    (1, 'Athiya'),
    (2, 'studies'),
]
df = spark.createDataFrame(data)
df.show()

+---+-------+
| _1|     _2|
+---+-------+
|  1| Athiya|
|  2|studies|
+---+-------+



In [0]:
# Same rows as before, but a list of column names is passed as the schema so
# the columns are labelled `Id` and `Name`.
data = [
    (1, 'Athiya'),
    (2, 'studies'),
]
schema = ['Id', 'Name']
df = spark.createDataFrame(data, schema)
df.show()

+---+-------+
| Id|   Name|
+---+-------+
|  1| Athiya|
|  2|studies|
+---+-------+



In [0]:
# Import only the class being inspected; a wildcard import would pull every
# public name of pyspark.sql.types into the notebook namespace and hide where
# each name comes from.
from pyspark.sql.types import StructType

# Display the class documentation for StructType (exploratory lookup).
help(StructType)

Help on class StructType in module pyspark.sql.types:

class StructType(DataType)
 |  StructType(fields: Optional[List[pyspark.sql.types.StructField]] = None)
 |  
 |  Struct type, consisting of a list of :class:`StructField`.
 |  
 |  This is the data type representing a :class:`Row`.
 |  
 |  Iterating a :class:`StructType` will iterate over its :class:`StructField`\s.
 |  A contained :class:`StructField` can be accessed by its name or position.
 |  
 |  Examples
 |  --------
 |  >>> from pyspark.sql.types import *
 |  >>> struct1 = StructType([StructField("f1", StringType(), True)])
 |  >>> struct1["f1"]
 |  StructField('f1', StringType(), True)
 |  >>> struct1[0]
 |  StructField('f1', StringType(), True)
 |  
 |  >>> struct1 = StructType([StructField("f1", StringType(), True)])
 |  >>> struct2 = StructType([StructField("f1", StringType(), True)])
 |  >>> struct1 == struct2
 |  True
 |  >>> struct1 = StructType([StructField("f1", CharType(10), True)])
 |  >>> struct2 = StructType([S

In [0]:
# Import exactly the type classes this cell uses rather than `import *`, so the
# origin of every name is explicit and the notebook namespace stays clean.
from pyspark.sql.types import IntegerType, StringType, StructField, StructType

# Each tuple is one row: (Id, Name).
data = [
    (1, 'Athiya'),
    (2, 'studies'),
]

# Explicit schema: column names and Spark data types are declared up front
# instead of being inferred from the data. `nullable` is left at its default.
schema = StructType([
    StructField(name='Id', dataType=IntegerType()),
    StructField(name='Name', dataType=StringType()),
])

df = spark.createDataFrame(data=data, schema=schema)
df.show()

+---+-------+
| Id|   Name|
+---+-------+
|  1| Athiya|
|  2|studies|
+---+-------+



In [0]:
# Print the schema of the current `df` as a tree: column name, data type and
# nullability for each field.
df.printSchema()

root
 |-- Id: integer (nullable = true)
 |-- Name: string (nullable = true)



In [0]:
# Each dict is one row; the dict keys become the column names and the column
# types are inferred from the values (see the printed schema below).
data = [
    {'id': 1, 'name': 'Athiya'},
    {'id': 2, 'name': 'studies'},
]
df = spark.createDataFrame(data)

# Show the rows first, then the inferred schema.
df.show()
df.printSchema()

+---+-------+
| id|   name|
+---+-------+
|  1| Athiya|
|  2|studies|
+---+-------+

root
 |-- id: long (nullable = true)
 |-- name: string (nullable = true)

