spark
Dataset.groupByKey + reduceGroups
wefree
2025. 1. 6. 10:47
// Typed row shape used to view `df` as a Dataset[Foo].
case class Foo(x: String, y: String, z: Int)

// `df` is defined elsewhere; converting it needs an implicit Encoder[Foo] in scope
// (presumably via `import spark.implicits._` -- confirm against the surrounding code).
val ds = df.as[Foo]

// Group the rows by `x`, collapse each group into a single Foo whose `z` is the sum
// of the group's `z` values, and print the resulting query plan.
// `x` and `y` of the collapsed row come from whichever row is the left operand of
// the reduce function, since `copy` only replaces `z`.
ds
  .groupByKey(row => row.x)
  .reduceGroups { (left, right) =>
    val summedZ = left.z + right.z
    left.copy(z = summedZ)
  }
  .explain()