import pyspark
from pyspark.sql import SparkSession

# Obtain a SparkSession for this script, registered under the app name
# 'sparkdf'. getOrCreate() hands back an already-active session when there
# is one instead of starting a second.
spark = SparkSession.builder.appName('sparkdf').getOrCreate()

# Sample rows, each laid out in the same order as `columns` below.
# Note that the last two rows are exact repeats of the first and fourth rows.
data = [
    [1, "sravan", "company 1"],
    [2, "ojaswi", "company 1"],
    [3, "rohith", "company 2"],
    [4, "sridevi", "company 1"],
    [1, "sravan", "company 1"],
    [4, "sridevi", "company 1"],
]

# Column names applied positionally to every row in `data`.
columns = ['ID', 'NAME', 'Company']

# Build the DataFrame from the in-memory rows; only names are supplied, so
# the column types are left for Spark to infer from the values.
dataframe = spark.createDataFrame(data, columns)

# Print the DataFrame contents as a text table.
dataframe.show()