# coding:utf8
"""Average the ``amount`` column per ``book`` using the Spark DataFrame API.

Run as a script: starts a local Spark session, builds a four-row in-memory
DataFrame, groups it by ``book``, prints the per-book average, then stops
the session.
"""
from pyspark.sql import SparkSession
from pyspark.sql.functions import avg


def main():
    """Build the sample DataFrame, aggregate it, and print the result.

    The session is stopped in a ``finally`` clause so it is released even
    when DataFrame creation, aggregation, or ``show()`` raises.
    """
    spark = (
        SparkSession.builder
        .master("local[*]")
        .appName("Simple Application")
        .getOrCreate()
    )
    try:
        # createDataFrame on bare tuples yields default column names;
        # toDF renames them to "book" and "amount".
        book_df = spark.createDataFrame(
            [("spark", 2), ("hadoop", 6), ("hadoop", 4), ("spark", 6)]
        ).toDF("book", "amount")

        # One output row per distinct book, holding the mean of its amounts.
        avg_df = book_df.groupBy("book").agg(avg("amount"))
        avg_df.show()
    finally:
        spark.stop()


if __name__ == '__main__':
    main()

# 视频信息 (video information)