Demonstrate explode() in PySpark

from pyspark.sql import SparkSession
from pyspark.sql.functions import explode

# Reuse the active session if one exists; otherwise start a new one.
spark = SparkSession.builder.appName("StreamingExample").getOrCreate()

# Each row pairs an id with an array of fruit names; id 3 has an empty array.
data = [
    (1, ["apple", "banana", "cherry"]),
    (2, ["orange", "cherry"]),
    (3, []),
]

df = spark.createDataFrame(data, ["id", "fruit"])

# explode() emits one output row per array element, so id 3 (empty array)
# contributes no rows to the result. Use explode_outer() instead if such
# rows should be kept with a null value.
df.select("id", explode("fruit").alias("fruits")).show()

Comments

Popular posts from this blog

sql question set 1

SCD Type 2 in MySQL/ coforge

3 days running average / capco