PySpark 时间聚合（滚动窗口：按 date 列每 5 秒划分一个窗口，对 val 求和）
# Tumbling-window aggregation: rows are bucketed by 5-second windows computed
# from the "date" column, and "val" is totalled per bucket under the name "sum".
# NOTE(review): `sum` is presumably pyspark.sql.functions.sum (import not
# visible here) -- the builtin sum() cannot take a column name; confirm.
five_second_window = window("date", "5 seconds")
val_total = sum("val").alias("sum")
w = df.groupBy(five_second_window).agg(val_total)
滑动窗口（移动窗口）：窗口长度 3 天，每 1 天滑动一次，按窗口、column2、column3 分组计数
# Sliding-window count: windows are 3 days long and a new one starts every
# 1 day (third argument to window()), so consecutive windows overlap.
# Rows are counted per (window, column2, column3) combination.
sliding_window = window(data.date, "3 days", "1 days")
group_keys = (sliding_window, data.column2, data.column3)
data1 = data.groupBy(*group_keys).count()
# Tumbling-window aggregation: rows are bucketed by 5-second windows computed
# from the "date" column, and "val" is totalled per bucket under the name "sum".
# NOTE(review): this statement repeats an identical one earlier in the file;
# consider keeping only one copy.
# NOTE(review): `sum` is presumably pyspark.sql.functions.sum (import not
# visible here) -- the builtin sum() cannot take a column name; confirm.
five_second_window = window("date", "5 seconds")
val_total = sum("val").alias("sum")
w = df.groupBy(five_second_window).agg(val_total)
滑动窗口（移动窗口）：窗口长度 3 天，每 1 天滑动一次，按窗口、column2、column3 分组计数
# Sliding-window count: windows are 3 days long and a new one starts every
# 1 day (third argument to window()), so consecutive windows overlap.
# Rows are counted per (window, column2, column3) combination.
# NOTE(review): this statement repeats an identical one earlier in the file;
# consider keeping only one copy.
sliding_window = window(data.date, "3 days", "1 days")
group_keys = (sliding_window, data.column2, data.column3)
data1 = data.groupBy(*group_keys).count()