
geotrellis.spark.io.hadoop.SaveBytesToHadoopMethods.scala Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of geotrellis-spark_2.11 Show documentation
Show all versions of geotrellis-spark_2.11 Show documentation
GeoTrellis is an open source geographic data processing engine for high performance applications.
The newest version!
package geotrellis.spark.io.hadoop
import geotrellis.spark.render._
import geotrellis.spark.{LayerId, SpatialKey}
import java.net.URI
import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{FileSystem, Path}
import org.apache.spark.rdd.RDD
/** Wraps an RDD of (key, bytes) pairs and forwards save requests to [[SaveToHadoop]].
  *
  * @tparam K   the key type of the wrapped RDD
  * @param  rdd the (key, byte array) records handed to SaveToHadoop
  */
class SaveBytesToHadoopMethods[K](rdd: RDD[(K, Array[Byte])]) {

  /** Saves the wrapped records to a Hadoop FileSystem by delegating to
    * `SaveToHadoop.apply`.
    *
    * @param keyToUri A function from K (a key) to a Hadoop URI
    * @return a count of records saved, as reported by SaveToHadoop
    */
  def saveToHadoop(keyToUri: K => String): Long = {
    SaveToHadoop.apply(rdd, keyToUri)
  }

  /** Sets up saving to Hadoop by delegating to `SaveToHadoop.setup`, handing
    * back an RDD instead of a count so that further writes can be chained.
    *
    * @param keyToUri A function from K (a key) to a Hadoop URI
    * @return the RDD produced by `SaveToHadoop.setup`
    */
  def setupSaveToHadoop(keyToUri: K => String): RDD[(K, Array[Byte])] = {
    SaveToHadoop.setup(rdd, keyToUri)
  }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy