com.intel.analytics.bigdl.nn.quantized.SpatialDilatedConvolution.scala Maven / Gradle / Ivy
The newest version!
/*
* Copyright 2016 The BigDL Authors.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.intel.analytics.bigdl.nn.quantized
import com.intel.analytics.bigdl.nn.abstractnn.DataFormat
import com.intel.analytics.bigdl.tensor.TensorNumericMath.TensorNumeric
import com.intel.analytics.bigdl.tensor.{FloatType, QuantizedTensor, Tensor}
import com.intel.analytics.bigdl.utils.serializer.converters.DataConverter
import com.intel.analytics.bigdl.utils.serializer.{DeserializeContext, ModuleData, SerializeContext}
import com.intel.analytics.bigdl.serialization.Bigdl.{AttrValue, BigDLModule}
import scala.reflect.ClassTag
import scala.reflect.runtime.universe
/**
 * Quantized convolution layer that also carries a dilation factor for each spatial axis.
 *
 * Every geometry argument except the dilation pair is handed to the parent
 * `SpatialConvolution` constructor unchanged; the dilation pair is surfaced by overriding
 * the parent's `dilationWidth` and `dilationHeight` members.
 *
 * @param nInputPlane  number of expected input planes in the image given into forward()
 * @param nOutputPlane number of output planes the convolution layer will produce
 * @param kernelW      kernel width of the convolution
 * @param kernelH      kernel height of the convolution
 * @param strideW      step of the convolution in the width dimension
 * @param strideH      step of the convolution in the height dimension
 * @param padW         additional zeros added per width to the input planes
 * @param padH         additional zeros added per height to the input planes
 * @param dilationW    value exposed as `dilationWidth`
 * @param dilationH    value exposed as `dilationHeight`
 * @param format       data layout forwarded to the parent; defaults to `DataFormat.NCHW`
 */
@SerialVersionUID(-8572055756810843156L)
private[bigdl] class SpatialDilatedConvolution[T: ClassTag](
  nInputPlane: Int,
  nOutputPlane: Int,
  kernelW: Int,
  kernelH: Int,
  strideW: Int = 1,
  strideH: Int = 1,
  padW: Int = 0,
  padH: Int = 0,
  val dilationW: Int = 1,
  val dilationH: Int = 1,
  format: DataFormat = DataFormat.NCHW
)(implicit ev: TensorNumeric[T]) extends SpatialConvolution[T](
  nInputPlane, nOutputPlane,
  kernelW, kernelH,
  strideW, strideH,
  padW, padH,
  format = format
) {

  // Replace the parent's dilation members with the values supplied to this constructor.
  override val dilationWidth: Int = dilationW
  override val dilationHeight: Int = dilationH

  /** Renders the layer name followed by its plane counts, kernel size and geometry values. */
  override def toString(): String = {
    val planes = s"$nInputPlane -> $nOutputPlane"
    val kernel = s"$kernelW x $kernelH"
    val geometry = Seq(strideW, strideH, padW, padH, dilationW, dilationH).mkString(", ")
    s"quantized.SpatialDilatedConvolution($planes, $kernel, $geometry)"
  }
}
/**
 * Companion of the quantized `SpatialDilatedConvolution`: provides the factory method and
 * the weight (de)serialization hooks declared by `QuantSerializer`.
 */
object SpatialDilatedConvolution extends QuantSerializer {

  /**
   * Constructs a quantized dilated convolution and passes the optional initial tensors to
   * its `initWeightAndBias` method.
   *
   * @param nInputPlane  number of input planes
   * @param nOutputPlane number of output planes
   * @param kW           kernel width
   * @param kH           kernel height
   * @param dW           stride along the width (default 1)
   * @param dH           stride along the height (default 1)
   * @param padW         padding along the width (default 0)
   * @param padH         padding along the height (default 0)
   * @param dilationW    dilation along the width (default 1)
   * @param dilationH    dilation along the height (default 1)
   * @param initWeight   forwarded as-is to `initWeightAndBias`; defaults to null
   * @param initBias     forwarded as-is to `initWeightAndBias`; defaults to null
   * @param format       data layout, defaults to `DataFormat.NCHW`
   * @return the result of `initWeightAndBias` on the newly built layer
   */
  def apply[T: ClassTag](
    nInputPlane: Int,
    nOutputPlane: Int,
    kW: Int,
    kH: Int,
    dW: Int = 1,
    dH: Int = 1,
    padW: Int = 0,
    padH: Int = 0,
    dilationW: Int = 1,
    dilationH: Int = 1,
    initWeight: Tensor[T] = null,
    initBias: Tensor[T] = null,
    format: DataFormat = DataFormat.NCHW
  )(implicit ev: TensorNumeric[T]): SpatialDilatedConvolution[T] = {
    val conv = new SpatialDilatedConvolution[T](nInputPlane, nOutputPlane, kW, kH, dW, dH,
      padW, padH, dilationW, dilationH, format = format)
    conv.initWeightAndBias(initWeight, initBias)
  }

  /**
   * Stores the layer's weight array in the module builder under the "weights" attribute.
   *
   * @param context      serialization context whose module must be a SpatialDilatedConvolution
   * @param modelBuilder builder that receives the "weights" attribute
   * @throws UnsupportedOperationException when the numeric type is anything other than Float
   */
  override def serializeWeight[T: ClassTag](context: SerializeContext[T],
    modelBuilder: BigDLModule.Builder)(implicit ev: TensorNumeric[T]): Unit = {
    val conv = context.moduleData.module.asInstanceOf[SpatialDilatedConvolution[T]]
    val weightBuilder = AttrValue.newBuilder
    ev.getType() match {
      case FloatType =>
        DataConverter.setAttributeValue(context, weightBuilder, conv.weight,
          universe.typeOf[Array[Tensor[Float]]])
      case _ =>
        throw new UnsupportedOperationException("Only support Float for quantized model")
    }
    modelBuilder.putAttr("weights", weightBuilder.build)
  }

  /**
   * Replaces every weight slot of the layer with the tensor read from the "weights"
   * attribute of the serialized module.
   *
   * The serialized data is validated before any slot is modified: each slot is released
   * before it is overwritten, so failing part-way through would leave the earlier slots
   * released and replaced while the remaining ones still hold their old content.
   *
   * @param context    deserialization context holding the serialized module
   * @param moduleData wrapper whose module must be a SpatialDilatedConvolution
   * @throws IllegalArgumentException when the "weights" attribute is absent or holds fewer
   *                                  tensors than the layer has weight slots
   */
  override def loadWeight[T: ClassTag](context: DeserializeContext,
    moduleData: ModuleData[T])(implicit ev: TensorNumeric[T]): Unit = {
    val conv = moduleData.module.asInstanceOf[SpatialDilatedConvolution[T]]
    val weightAttr = context.bigdlModule.getAttrMap.get("weights")
    require(weightAttr != null,
      "quantized.SpatialDilatedConvolution: serialized module has no \"weights\" attribute")

    val weights = DataConverter.getAttributeValue(context, weightAttr)
      .asInstanceOf[Array[Tensor[T]]]
    require(weights != null,
      "quantized.SpatialDilatedConvolution: \"weights\" attribute holds no tensor array")
    // Surplus serialized tensors are tolerated (they were ignored before); too few are not.
    require(weights.length >= conv.weight.length,
      s"quantized.SpatialDilatedConvolution: expected at least ${conv.weight.length} " +
        s"weight tensors but found ${weights.length}")

    for (i <- conv.weight.indices) {
      // Release the current quantized tensor before pointing the slot at the loaded one.
      conv.weight(i).asInstanceOf[QuantizedTensor[T]].release()
      conv.weight(i).set(weights(i))
    }
  }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy