
// com.github.panhongan.util.spark.RDDUtil.scala (Maven / Gradle / Ivy)
// The newest version!
package com.github.panhongan.util.spark
import org.apache.spark.rdd.RDD
import com.github.panhongan.util.collection.CollectionUtil
/**
 * Helpers that operate on Spark RDDs.
 */
object RDDUtil {

  /**
   * Returns the distinct elements of an RDD of strings.
   *
   * Works in two stages: each partition is first passed through
   * `CollectionUtil.distinct`, and `RDD.distinct()` is then called on the
   * resulting RDD.
   *
   * NOTE(review): `CollectionUtil.distinct` is defined outside this file;
   * presumably it drops duplicates inside a single partition so fewer
   * records reach the RDD-wide pass — confirm against its implementation.
   *
   * @param rdd the input RDD of strings
   * @return the RDD produced by calling `distinct()` on the per-partition result
   */
  def distinct(rdd : RDD[String]) : RDD[String] = {
    // Stage 1: run the per-partition helper over every partition.
    val perPartition = rdd.mapPartitions(partition => CollectionUtil.distinct(partition))

    // Stage 2: RDD-wide distinct over the output of stage 1.
    perPartition.distinct()
  }
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy