# RDD and DataFrame
#
# Small PySpark example: start a Spark session, build a DataFrame from
# in-memory rows, and print it.
from pyspark.sql import SparkSession

# Session is created against the "local[2]" master under the app name
# "TextFileApp"; getOrCreate() reuses an already-active session if one exists.
spark = (
    SparkSession.builder
    .master("local[2]")
    .appName("TextFileApp")
    .getOrCreate()
)

# Five rows with columns ID / time / Consumer. The first three rows are
# intentional duplicates of each other.
data = spark.createDataFrame(
    [
        [1, 12, 100],
        [1, 12, 100],
        [1, 12, 100],
        [2, 12, 200],
        [3, 13, 100],
    ],
    ['ID', 'time', 'Consumer'],
)
data.show()

# NOTE(review): the next statement is cut off in the source (it ends inside an
# unterminated string literal), so its remaining grouping columns and the
# aggregation applied to the groups are unknown. It is preserved verbatim
# below; complete it before re-enabling.
# data.groupby('ID','...