# --- Snippet: column to Python list via collect_list ---
from pyspark.sql import SparkSession
from pyspark.sql.functions import collect_list
# Reuse the active SparkSession, or start one if none is running
spark = SparkSession.builder.getOrCreate()

# Small two-column demo DataFrame
columns = ["Name", "Age"]
data = [("Alice", 25), ("Bob", 30), ("Charlie", 35)]
df = spark.createDataFrame(data, columns)

# Aggregate every "Name" value into one array column. The aggregation
# yields a single row, which first() brings back to the driver.
names_row = df.select(collect_list("Name").alias("NameList")).first()
name_list = names_row["NameList"]

# Show the resulting Python list
print(name_list)
# --- Snippet: column to Python list via rdd.flatMap ---
# Turn the 'student Name' column into a flat Python list.
# Each Row is iterable, so flatMap with an identity function unwraps the
# one-field rows into their bare values before collect().
name_rows = dataframe.select('student Name').rdd
student_names = name_rows.flatMap(lambda row: row).collect()
print(student_names)

# Same approach for the 'student ID' column.
id_rows = dataframe.select('student ID').rdd
student_ids = id_rows.flatMap(lambda row: row).collect()
print(student_ids)
# --- Snippet: collect() returns Row objects, not bare values ---
>>> mvv_list = mvv_count_df.select('mvv').collect()
>>> mvv_list[0]
Row(mvv=1)