Demonstrate explode() in PySpark
from pyspark.sql import SparkSession
from pyspark.sql.functions import explode
# Obtain the Spark session for this demo (getOrCreate reuses an active one).
spark = (
    SparkSession.builder
    .appName("StreamingExample")
    .getOrCreate()
)

# Sample rows: an integer id paired with an array of fruit names.
# The last row deliberately carries an empty array.
data = [
    (1, ["apple", "banana", "cherry"]),
    (2, ["orange", "cherry"]),
    (3, []),
]
df = spark.createDataFrame(data, ["id", "fruit"])

# explode() emits one output row per array element, so a row whose array is
# empty (id 3 here) contributes no rows to the result.
exploded = df.select("id", explode("fruit").alias("fruits"))
exploded.show()
Comments
Post a Comment