Skip to content

Commit

Permalink
Don't import spark session implicits (#25)
Browse files Browse the repository at this point in the history
  • Loading branch information
cwienberg committed Aug 26, 2022
1 parent 2e530b4 commit b3dd37d
Showing 1 changed file with 2 additions and 3 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -110,22 +110,21 @@ final class SecondarySortGroupByKeyDatasetFunctions[K, V](
keyOrdering: Ordering[K],
kaEncoder: Encoder[(K, A)]
): Dataset[(K, A)] = {
import dataset.sparkSession.implicits._
val repartitionedStartValues = SecondarySortGroupByKeyDatasetFunctions
.repartitionAndSort(startValues, numPartitions)
.rdd
val repartitionedValues = SecondarySortGroupByKeyDatasetFunctions
.repartitionAndSort(dataset, numPartitions, orderExprs)
.rdd
repartitionedStartValues
val kaRDD = repartitionedStartValues
.zipPartitions(
repartitionedValues.mapPartitions(
new GroupByKeyIterator(_),
preservesPartitioning = true
),
preservesPartitioning = true
)(joinAndFold(op))
.toDS()
dataset.sparkSession.createDataset(kaRDD)
}

/** Groups by key and applies a binary operation using foldLeft
Expand Down

0 comments on commit b3dd37d

Please sign in to comment.