geotrellis.spark.io.s3.S3LayerWriter.scala Maven / Gradle / Ivy
package geotrellis.spark.io.s3
import geotrellis.raster.{MultibandTile, Tile}
import geotrellis.spark._
import geotrellis.spark.io._
import geotrellis.spark.io.avro._
import geotrellis.spark.io.avro.codecs._
import geotrellis.spark.io.index._
import geotrellis.util._
import com.amazonaws.services.s3.model.PutObjectRequest
import com.typesafe.scalalogging.slf4j._
import org.apache.spark.rdd.RDD
import spray.json._
import scala.reflect._
/**
* Handles writing Raster RDDs and their metadata to S3.
*
* @param bucket S3 bucket to be written to
* @param keyPrefix S3 prefix to write the raster to
* @param keyIndexMethod Method used to convert RDD keys to SFC indexes
* @param attributeStore AttributeStore to be used for storing raster metadata
* @param putObjectModifier Function that will be applied ot S3 PutObjectRequests, so that they can be modified (e.g. to change the ACL settings)
* @tparam K Type of RDD Key (ex: SpatialKey)
* @tparam V Type of RDD Value (ex: Tile or MultibandTile )
* @tparam M Type of Metadata associated with the RDD[(K,V)]
*/
class S3LayerWriter(
val attributeStore: AttributeStore,
bucket: String,
keyPrefix: String,
putObjectModifier: PutObjectRequest => PutObjectRequest = { p => p }
) extends LayerWriter[LayerId] with LazyLogging {
def rddWriter: S3RDDWriter = S3RDDWriter
protected def _write[
K: AvroRecordCodec: JsonFormat: ClassTag,
V: AvroRecordCodec: ClassTag,
M: JsonFormat: GetComponent[?, Bounds[K]]
](id: LayerId, rdd: RDD[(K, V)] with Metadata[M], keyIndex: KeyIndex[K]): Unit = {
require(!attributeStore.layerExists(id), s"$id already exists")
implicit val sc = rdd.sparkContext
val prefix = makePath(keyPrefix, s"${id.name}/${id.zoom}")
val metadata = rdd.metadata
val header = S3LayerHeader(
keyClass = classTag[K].toString(),
valueClass = classTag[V].toString(),
bucket = bucket,
key = prefix)
val maxWidth = Index.digits(keyIndex.toIndex(keyIndex.keyBounds.maxKey))
val keyPath = (key: K) => makePath(prefix, Index.encode(keyIndex.toIndex(key), maxWidth))
val schema = KeyValueRecordCodec[K, V].schema
try {
attributeStore.writeLayerAttributes(id, header, metadata, keyIndex, schema)
logger.info(s"Saving RDD ${id.name} to $bucket $prefix")
rddWriter.write(rdd, bucket, keyPath, putObjectModifier)
} catch {
case e: Exception => throw new LayerWriteError(id).initCause(e)
}
}
}
object S3LayerWriter {
def apply(attributeStore: AttributeStore, bucket: String, prefix: String, putObjectModifier: PutObjectRequest => PutObjectRequest): S3LayerWriter =
new S3LayerWriter(attributeStore, bucket, prefix, putObjectModifier)
def apply(attributeStore: AttributeStore, bucket: String, prefix: String): S3LayerWriter =
new S3LayerWriter(attributeStore, bucket, prefix)
def apply(attributeStore: S3AttributeStore): S3LayerWriter =
apply(attributeStore, attributeStore.bucket, attributeStore.prefix)
def apply(attributeStore: S3AttributeStore, putObjectModifier: PutObjectRequest => PutObjectRequest): S3LayerWriter =
apply(attributeStore, attributeStore.bucket, attributeStore.prefix, putObjectModifier)
def apply(bucket: String, prefix: String): S3LayerWriter =
apply(S3AttributeStore(bucket, prefix))
def apply(bucket: String, prefix: String, putObjectModifier: PutObjectRequest => PutObjectRequest): S3LayerWriter =
apply(S3AttributeStore(bucket, prefix), putObjectModifier)
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy