com.intel.analytics.bigdl.nn.LocallyConnected2D.scala Maven / Gradle / Ivy
/*
* Copyright 2016 The BigDL Authors.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.intel.analytics.bigdl.nn
import com.intel.analytics.bigdl.nn.abstractnn.{DataFormat, Initializable, TensorModule}
import com.intel.analytics.bigdl.optim.Regularizer
import com.intel.analytics.bigdl.tensor.TensorNumericMath.TensorNumeric
import com.intel.analytics.bigdl.tensor.{DoubleType, FloatType, Tensor}
import com.intel.analytics.bigdl.utils.{Engine, Shape, T, Table}
import scala.concurrent.Future
import scala.reflect.ClassTag
/**
* The LocallyConnected2D layer works similarly to the [[SpatialConvolution]] layer,
* except that weights are unshared, that is, a different set of filters
* is applied at each different patch of the input.
*
* @param nInputPlane The number of expected input planes
* in the image given into forward()
* @param inputWidth The input width
* @param inputHeight The input height
* @param nOutputPlane The number of output planes the convolution layer will produce.
* @param kernelW The kernel width of the convolution
* @param kernelH The kernel height of the convolution
* @param strideW The step of the convolution in the width dimension
* @param strideH The step of the convolution in the height dimension
* @param padW The additional zeros added per width to the input planes
* @param padH The additional zeros added per height to the input planes
* @param propagateBack propagate gradient back
* @param wRegularizer weight regularizer
* @param bRegularizer bias regularizer
* @param initWeight initial weight
* @param initBias initial bias
* @param initGradWeight initial gradient weight
* @param initGradBias initial gradient bias
* @param withBias if has bias
* @param format data format NCHW, NHWC
* @tparam T The numeric type in the criterion, usually which are [[Float]] or [[Double]]
*/
class LocallyConnected2D[T: ClassTag](
val nInputPlane: Int,
val inputWidth: Int,
val inputHeight: Int,
val nOutputPlane: Int,
val kernelW: Int,
val kernelH: Int,
val strideW: Int = 1,
val strideH: Int = 1,
val padW: Int = 0,
val padH: Int = 0,
val propagateBack: Boolean = true,
var wRegularizer: Regularizer[T] = null,
var bRegularizer: Regularizer[T] = null,
val initWeight: Tensor[T] = null,
val initBias: Tensor[T] = null,
val initGradWeight: Tensor[T] = null,
val initGradBias: Tensor[T] = null,
val withBias: Boolean = true,
val format: DataFormat = DataFormat.NCHW
)(implicit ev: TensorNumeric[T]) extends TensorModule[T] with Initializable {
require((padW >= 0 && padH >= 0) || (padW == -1 && padH == -1),
s"Illegal padding configuration (padW: $padW, padH: $padH)")
val sizes =
if (padW == -1 && padH == -1) {
Utils.getSAMEOutSizeAndPadding(inputHeight, inputWidth, strideH, strideW, kernelH, kernelW)
} else {
Utils.getOutSizeAndPadding(inputHeight, inputWidth, strideH, strideW,
kernelH, kernelW, padH, padW, ceilMode = false)
}
val padTop = sizes(0)
val padBottom = sizes(1)
val padLeft = sizes(2)
val padRight = sizes(3)
val outputHeight = sizes(4)
val outputWidth = sizes(5)
private val weightShape = Array(
outputHeight * outputWidth,
nOutputPlane,
nInputPlane * kernelH * kernelW
)
private val weightFormat = format match {
case DataFormat.NCHW =>
VariableFormat.GP_OUT_IN_KW_KH
case DataFormat.NHWC =>
VariableFormat.GP_KH_KW_IN_OUT
}
val weight: Tensor[T] = if (initWeight != null) {
initWeight
} else {
Tensor[T](weightShape)
}
val bias: Tensor[T] = if (!withBias) null
else if (initBias != null) initBias else Tensor[T](outputHeight * outputWidth, nOutputPlane)
val gradWeight: Tensor[T] = if (initGradWeight != null) {
initGradWeight
} else {
Tensor[T](weightShape)
}
val gradBias: Tensor[T] = if (!withBias) null
else if (initGradBias != null) initGradBias
else Tensor[T](outputHeight * outputWidth, nOutputPlane)
var fInput = Tensor[T]()
var fGradInput = Tensor[T]()
protected val ones = Tensor[T]()
protected val onesBatch = Tensor[T]()
protected val onesBias = if (withBias) Tensor[T]() else null
protected val gradientBiasMT: Tensor[T] = if (withBias) Tensor[T]() else null
protected var gradWeightMM: Tensor[T] = null
@transient
protected var gradWeightMMInBatch: Tensor[T] = null
@transient protected var gradBiasWindow: Tensor[T] = _
protected val _1x1 = if (kernelH == 1 && kernelW == 1 && strideW == 1 && strideH == 1
&& padH == 0 && padW == 0) {
true
} else {
false
}
{
val stdv = 1.0 / math.sqrt(kernelW * kernelH * nInputPlane)
val wInit: InitializationMethod = RandomUniform(-stdv, stdv)
val bInit: InitializationMethod = if (withBias) RandomUniform(-stdv, stdv)
else null
setInitMethod(wInit, bInit)
}
protected var im2colTime = 0L
protected var col2imTime = 0L
def getIm2ColTime(): Double = im2colTime
def getCol2ImgTime(): Double = col2imTime
@transient
protected var results: Array[Future[Unit]] = null
override def reset(): Unit = {
if (initWeight == null) {
weightInitMethod.init(weight, weightFormat)
}
if (withBias && initBias == null) {
biasInitMethod.init(bias, VariableFormat.ONE_D)
}
zeroGradParameters()
}
private def getOutputShape(oh: Int, ow: Int, batchSize: Int = -1): Array[Int] = {
format match {
case DataFormat.NCHW =>
if (batchSize == -1) {
Array(nOutputPlane, oh, ow)
} else {
Array(batchSize, nOutputPlane, oh, ow)
}
case DataFormat.NHWC =>
if (batchSize == -1) {
Array(oh, ow, nOutputPlane)
} else {
Array(batchSize, oh, ow, nOutputPlane)
}
}
}
private def getFInputShape(oh: Int, ow: Int, batchSize: Int = -1): Array[Int] = {
format match {
case DataFormat.NCHW =>
if (batchSize == -1) {
Array(kernelW * kernelH * nInputPlane, oh * ow)
} else {
Array(batchSize, kernelW * kernelH * nInputPlane, oh * ow)
}
case DataFormat.NHWC =>
if (batchSize == -1) {
Array(oh * ow, kernelW * kernelH * nInputPlane)
} else {
Array(batchSize, oh * ow, kernelW * kernelH * nInputPlane)
}
}
}
// return (padTop, padDown, padLeft, padRight)
protected def getPadding(inputHeight: Int, inputWidth: Int): (Int, Int, Int, Int) = {
if (padW == -1 && padH == -1) {
// deal with SAME padding
val oW = Math.ceil(inputWidth.toFloat / strideW.toFloat).toInt
val oH = Math.ceil(inputHeight.toFloat / strideH.toFloat).toInt
val padAlongWidth = Math.max(0, (oW -1) * strideW + kernelW - inputWidth)
val padAlongHeight = Math.max(0, (oH - 1) * strideH + kernelH - inputHeight)
(padAlongHeight/2, padAlongHeight - padAlongHeight/2,
padAlongWidth/2, padAlongWidth - padAlongWidth/2)
} else {
(padH, padH, padW, padW)
}
}
override def computeOutputShape(inputShape: Shape): Shape = {
val input = inputShape.toSingle().toArray
require(input.length == 4,
s"LocallyConnected2D requires 4D input, but got input dim ${input.length}")
val (dimHeight, dimWidth, channelDim) = format.getHWCDims(input.length)
require(input(channelDim -1) == nInputPlane, s"input channel size " +
s"${input(channelDim -1)} is not the same as nInputPlane $nInputPlane")
require(outputWidth >= 1 && outputHeight >= 1,
s"output size is too small. outputWidth: $outputWidth, outputHeight: $outputHeight")
val outputShape = getOutputShape(outputHeight, outputWidth)
Shape(Array(input(0)) ++ outputShape)
}
override def updateOutput(input: Tensor[T]): Tensor[T] = {
require(input.dim() == 3 || input.dim() == 4,
"LocallyConnected2D: " + ErrorInfo.constrainInputAs3DOrBatch)
require(input.isContiguous())
val (dimHeight, dimWidth, channelDim) = format.getHWCDims(input.dim())
require(input.size(channelDim) == nInputPlane, s"input channel size " +
s"${input.size(channelDim)} is not the same as nInputPlane $nInputPlane")
require(outputWidth >= 1 && outputHeight >= 1,
s"output size is too small. outputWidth: $outputWidth, outputHeight: $outputHeight")
if (withBias && (onesBias.dim() != 1 || onesBias.size(1) != outputHeight * outputWidth)) {
onesBias.resize(Array(outputHeight * outputWidth)).fill(ev.fromType(1.0))
}
if (input.dim() == 3) {
require(input.isContiguous())
output.resize(getOutputShape(outputHeight, outputWidth))
if (_1x1) {
fInput.set(input)
fInput.resize(getFInputShape(outputHeight, outputWidth))
} else {
fInput.resize(getFInputShape(outputHeight, outputWidth))
}
val biasUse = if (withBias) {
bias
} else null
updateOutputFrame(
input,
output,
weight,
biasUse,
fInput,
kernelW, kernelH, strideW, strideH,
padLeft, padTop, padRight, padBottom,
nInputPlane, inputWidth, inputHeight,
nOutputPlane, outputWidth, outputHeight)
} else {
val batchSize = input.size(1)
output.resize(getOutputShape(outputHeight, outputWidth, batchSize))
if (_1x1) {
fInput.set(input)
fInput.resize(getFInputShape(outputHeight, outputWidth, batchSize))
} else {
fInput.resize(getFInputShape(outputHeight, outputWidth, batchSize))
}
if (results == null || results.length != batchSize) {
results = new Array[Future[Unit]](batchSize)
}
var i = 0
while (i < batchSize) {
val _i = i + 1
results(i) = Engine.model.invoke(() => {
val inputT = input.select(1, _i)
require(inputT.isContiguous())
val outputT = output.select(1, _i)
val fInputT = fInput.select(1, _i)
val biasUse = if (withBias) {
bias
} else null
updateOutputFrame(
inputT,
outputT,
weight,
biasUse,
fInputT,
kernelW, kernelH, strideW, strideH,
padLeft, padTop, padRight, padBottom,
nInputPlane, inputWidth, inputHeight,
nOutputPlane, outputWidth, outputHeight)
})
i += 1
}
Engine.model.sync(results)
}
output
}
override def updateGradInput(input: Tensor[T], gradOutput: Tensor[T]): Tensor[T] = {
if (!propagateBack) {
return gradInput
}
val (ohDim, owDim, cDim) = format.getHWCDims(input.dim())
val oh = gradOutput.size(ohDim)
val ow = gradOutput.size(owDim)
val inputWidth = input.size(owDim)
val inputHeight = input.size(ohDim)
val (padTop, padBottom, padLeft, padRight) = getPadding(inputHeight, inputWidth)
require(input.nDimension() == 3 || input.nDimension() == 4, "Only support 3D or 4D input")
gradInput.resizeAs(input)
if (_1x1) {
fGradInput.set(gradInput)
fGradInput.resizeAs(fInput)
} else {
fGradInput.resizeAs(fInput)
}
if (input.nDimension() == 3) {
require(gradOutput.isContiguous())
updateGradInputFrame(
gradInput,
gradOutput,
weight.transpose(2, 3),
fGradInput,
kernelW, kernelH, strideW, strideH, padLeft, padTop, padRight, padBottom)
} else {
val batchSize = input.size(1)
var i = 0
while (i < batchSize) {
val _i = i + 1
results(i) = Engine.model.invoke(() => {
val gradInputT = gradInput.select(1, _i)
val gradOutputT = gradOutput.select(1, _i)
require(gradOutputT.isContiguous())
val fgradInputT = fGradInput.select(1, _i)
updateGradInputFrame(
gradInputT,
gradOutputT,
weight.transpose(2, 3),
fgradInputT,
kernelW, kernelH, strideW, strideH, padLeft, padTop, padRight, padBottom)
})
i += 1
}
Engine.model.sync(results)
}
gradInput
}
private def getGradWeightMMInBatchShape(batchSize: Int) =
Array(batchSize, outputHeight * outputWidth,
nOutputPlane, nInputPlane * kernelH * kernelW)
override def accGradParameters(input: Tensor[T], gradOutput: Tensor[T]): Unit = {
require(input.nDimension() == 3 || input.nDimension() == 4,
"Only support 3D or 4D input," +
s"but input has ${input.nDimension()} dimensions")
require(gradOutput.isContiguous())
val (ohDim, owDim, cDim) = format.getHWCDims(input.dim())
val oh = gradOutput.size(ohDim)
val ow = gradOutput.size(owDim)
if (input.nDimension() == 3) {
if (gradWeightMM == null) {
gradWeightMM = gradWeight.view(weightShape)
}
val gradBiasUse = if (withBias) {
gradBias
} else null
accGradParametersFrame(
gradOutput,
gradWeightMM,
gradBiasUse,
fInput,
ev.fromType[Double](scaleW),
ev.fromType[Double](scaleB))
} else {
val batchSize = input.size(1)
if (gradWeightMMInBatch == null) {
gradWeightMMInBatch = Tensor[T]().resize(getGradWeightMMInBatchShape(batchSize))
}
if(withBias && gradientBiasMT.nElement() == 0) {
gradientBiasMT.resize(Array(batchSize, outputWidth * outputHeight, nOutputPlane))
}
if (ones.dim() != 1 || ones.size(1) != oh * ow) {
ones.resize(Array(oh * ow)).fill(ev.fromType(1.0))
}
if (onesBatch.dim() != 1 || onesBatch.size(1) != batchSize) {
onesBatch.resize(Array(batchSize)).fill(ev.fromType(1.0))
}
var i = 0
while (i < batchSize) {
val _i = i + 1
results(i) = Engine.model.invoke(() => {
val gradOutputT = gradOutput.select(1, _i)
val fInputT = fInput.select(1, _i)
val gradientBiasMTUse = if (withBias) {
gradientBiasMT.select(1, _i)
} else null
calcGradParametersFrame(
gradOutputT,
gradWeightMMInBatch.select(1, _i),
gradientBiasMTUse,
fInputT,
ev.fromType[Double](scaleW),
ev.fromType[Double](scaleB))
})
i += 1
}
Engine.model.sync(results)
val gradView = gradWeightMMInBatch.view(batchSize,
outputHeight * outputWidth * nOutputPlane *
nInputPlane * kernelH * kernelW).t
val grad = gradWeight.view(outputHeight * outputWidth *
nOutputPlane * nInputPlane * kernelH * kernelW)
grad.addmv(ev.fromType(1.0), ev.fromType(1.0), gradView, onesBatch)
if (withBias) {
gradBias.sum(gradientBiasMT, 1)
}
}
if (null != wRegularizer) {
wRegularizer.accRegularization(weight, gradWeight, scaleW)
}
if (withBias && null != bRegularizer) {
bRegularizer.accRegularization(bias, gradBias, scaleB)
}
}
override def parameters(): (Array[Tensor[T]], Array[Tensor[T]]) = {
if (withBias) {
(Array(this.weight, this.bias), Array(this.gradWeight, this.gradBias))
} else {
(Array(this.weight), Array(this.gradWeight))
}
}
override def equals(obj: Any): Boolean = {
if (!super.equals(obj)) {
return false
}
if (!obj.isInstanceOf[SpatialConvolution[T]]) {
return false
}
val other = obj.asInstanceOf[SpatialConvolution[T]]
if (this.eq(other)) {
return true
}
nInputPlane == other.nInputPlane &&
nOutputPlane == other.nOutputPlane &&
kernelW == other.kernelW &&
kernelH == other.kernelH &&
strideW == other.strideW &&
strideH == other.strideH &&
padW == other.padW &&
padH == other.padH &&
propagateBack == other.propagateBack &&
weight == other.weight &&
bias == other.bias &&
gradWeight == other.gradWeight &&
gradBias == other.gradBias
}
override def hashCode(): Int = {
val seed = 37
var hash = super.hashCode()
hash = hash * seed + nInputPlane.hashCode()
hash = hash * seed + nOutputPlane.hashCode()
hash = hash * seed + kernelW.hashCode()
hash = hash * seed + kernelH.hashCode()
hash = hash * seed + strideW.hashCode()
hash = hash * seed + strideH.hashCode()
hash = hash * seed + padW.hashCode()
hash = hash * seed + padH.hashCode()
hash = hash * seed + weight.hashCode()
if (withBias) hash = hash * seed + bias.hashCode()
hash = hash * seed + gradWeight.hashCode()
if (withBias) hash = hash * seed + gradBias.hashCode()
hash
}
override def clearState() : this.type = {
super.clearState()
fInput.set()
fGradInput.set()
ones.set()
onesBatch.set()
if (withBias) {
onesBias.set()
gradientBiasMT.set()
}
this
}
override def toString(): String = {
s"${getPrintName}($nInputPlane -> $nOutputPlane, $kernelW x" +
s" $kernelH, $strideW, $strideH, $padW, $padH)"
}
protected def updateOutputFrame(
input: Tensor[T], output: Tensor[T], weight: Tensor[T],
bias: Tensor[T], fInput: Tensor[T],
kW: Int, kH: Int, dW: Int, dH: Int, padLeft: Int, padTop: Int, padRight: Int, padBottom: Int,
nInputPlane: Int, inputWidth: Int, inputHeight: Int,
nOutputPlane: Int, outputWidth: Int, outputHeight: Int)(
implicit ev: TensorNumeric[T]): Unit = {
format match {
case DataFormat.NCHW =>
val output2d = output.view(nOutputPlane, outputHeight * outputWidth)
if (!_1x1) {
ev.getType() match {
case DoubleType =>
val before = System.nanoTime()
NNPrimitive.im2colDouble(fInput.asInstanceOf[Tensor[Double]],
input.asInstanceOf[Tensor[Double]], kW, kH, dW, dH,
padLeft, padTop, padRight, padBottom,
outputWidth, outputHeight)
im2colTime += System.nanoTime() - before
case FloatType =>
val before = System.nanoTime()
NNPrimitive.im2colFloat(fInput.asInstanceOf[Tensor[Float]],
input.asInstanceOf[Tensor[Float]], kW, kH, dW, dH,
padLeft, padTop, padRight, padBottom,
outputWidth, outputHeight)
im2colTime += System.nanoTime() - before
case _ => throw new UnsupportedOperationException(s"Only Float/Double supported")
}
}
var j = 1
while (j <= weight.size(1)) {
val outputWindow = output2d.select(2, j)
outputWindow.addmv(ev.fromType[Int](0), outputWindow,
ev.fromType[Int](1), weight.select(1, j), fInput.select(2, j))
j += 1
}
if (withBias) output2d.add(ev.fromType(1), bias)
case DataFormat.NHWC =>
val output2d = output.view(outputHeight * outputWidth, nOutputPlane)
if (!_1x1) {
ev.getType() match {
case DoubleType =>
val before = System.nanoTime()
NNPrimitive.im2colDoubleNHWC(fInput.asInstanceOf[Tensor[Double]],
input.asInstanceOf[Tensor[Double]], kW, kH, dW, dH,
padLeft, padTop, padRight, padBottom,
outputWidth, outputHeight)
im2colTime += System.nanoTime() - before
case FloatType =>
val before = System.nanoTime()
NNPrimitive.im2colFloatNHWC(fInput.asInstanceOf[Tensor[Float]],
input.asInstanceOf[Tensor[Float]], kW, kH, dW, dH,
padLeft, padTop, padRight, padBottom,
outputWidth, outputHeight)
im2colTime += System.nanoTime() - before
case _ => throw new UnsupportedOperationException(s"Only Float/Double supported")
}
}
var j = 1
while (j <= weight.size(1)) {
val outputWindow = output2d.select(1, j)
outputWindow.addmv(ev.fromType[Int](0), outputWindow,
ev.fromType[Int](1), weight.select(1, j), fInput.select(1, j))
j += 1
}
if (withBias) output2d.add(ev.fromType(1), bias)
}
}
protected def updateGradInputFrame(
gradInput: Tensor[T], gradOutput: Tensor[T],
weight: Tensor[T], fgradInput: Tensor[T], kW: Int, kH: Int, dW: Int, dH: Int,
padLeft: Int, padTop: Int, padRight: Int, padBottom: Int)
(implicit ev: TensorNumeric[T]): Unit = {
ev.getType() match {
case DoubleType =>
val gradOutDouble = gradOutput.asInstanceOf[Tensor[Double]]
val fGradInDouble = fgradInput.asInstanceOf[Tensor[Double]]
val weightDouble = weight.asInstanceOf[Tensor[Double]]
val gradInputDouble = gradInput.asInstanceOf[Tensor[Double]]
format match {
case DataFormat.NCHW =>
val channel = gradOutDouble.size(1)
val oh = gradOutDouble.size(2)
val ow = gradOutDouble.size(3)
val gradOutput2d = gradOutDouble.view(Array(channel, oh * ow))
var j = 1
while (j <= weight.size(1)) {
val fGradInWindow = fGradInDouble.select(2, j)
fGradInWindow.addmv(0.0f, fGradInWindow,
1.0f, weightDouble.select(1, j), gradOutput2d.select(2, j))
j += 1
}
if (!_1x1) {
gradInputDouble.zero()
val before = System.nanoTime()
NNPrimitive.col2imDouble(fGradInDouble,
gradInputDouble, kW, kH, dW, dH,
padLeft, padTop, padRight, padBottom,
gradOutput.size(3), gradOutput.size(2))
col2imTime += System.nanoTime() - before
}
case DataFormat.NHWC =>
val channel = gradOutDouble.size(3)
val oh = gradOutDouble.size(1)
val ow = gradOutDouble.size(2)
val gradOutput2d = gradOutDouble.view(Array(oh * ow, channel))
var j = 1
while (j <= weight.size(1)) {
val fGradInWindow = fGradInDouble.select(1, j)
fGradInWindow.addmv(0.0f, fGradInWindow,
1.0f, weightDouble.select(1, j), gradOutput2d.select(1, j))
j += 1
}
if (!_1x1) {
gradInputDouble.zero()
val before = System.nanoTime()
NNPrimitive.col2imDoubleNHWC(fGradInDouble,
gradInputDouble, kW, kH, dW, dH,
padLeft, padTop, padRight, padBottom,
gradOutput.size(2), gradOutput.size(1))
col2imTime += System.nanoTime() - before
}
}
case FloatType =>
val gradOutFloat = gradOutput.asInstanceOf[Tensor[Float]]
val fGradInFloat = fgradInput.asInstanceOf[Tensor[Float]]
val weightFloat = weight.asInstanceOf[Tensor[Float]]
val gradInputFloat = gradInput.asInstanceOf[Tensor[Float]]
format match {
case DataFormat.NCHW =>
val channel = gradOutFloat.size(1)
val oh = gradOutFloat.size(2)
val ow = gradOutFloat.size(3)
val gradOutput2d = gradOutFloat.view(Array(channel, oh * ow))
var j = 1
while (j <= weight.size(1)) {
val fGradInWindow = fGradInFloat.select(2, j)
fGradInWindow.addmv(0.0f, fGradInWindow,
1.0f, weightFloat.select(1, j), gradOutput2d.select(2, j))
j += 1
}
if (!_1x1) {
gradInputFloat.zero()
val before = System.nanoTime()
NNPrimitive.col2imFloat(fGradInFloat,
gradInputFloat, kW, kH, dW, dH, padLeft, padTop, padRight, padBottom,
gradOutput.size(3), gradOutput.size(2))
col2imTime += System.nanoTime() - before
}
case DataFormat.NHWC =>
val channel = gradOutFloat.size(3)
val oh = gradOutFloat.size(1)
val ow = gradOutFloat.size(2)
val gradOutput2d = gradOutFloat.view(Array(oh * ow, channel))
var j = 1
while (j <= weight.size(1)) {
val fGradInWindow = fGradInFloat.select(1, j)
fGradInWindow.addmv(0.0f, fGradInWindow,
1.0f, weightFloat.select(1, j), gradOutput2d.select(1, j))
j += 1
}
if (!_1x1) {
gradInputFloat.zero()
val before = System.nanoTime()
NNPrimitive.col2imFloatNHWC(fGradInFloat,
gradInputFloat, kW, kH, dW, dH, padLeft, padTop, padRight, padBottom,
gradOutput.size(2), gradOutput.size(1))
col2imTime += System.nanoTime() - before
}
}
case _ => throw new UnsupportedOperationException(s"Only Float/Double supported")
}
}
protected def accGradParametersFrame(gradOutput: Tensor[T], gradWeight: Tensor[T],
gradBias: Tensor[T], fInput: Tensor[T],
scaleW: T, scaleB: T)(implicit ev: TensorNumeric[T]): Unit = {
if (gradBiasWindow == null) gradBiasWindow = Tensor[T]()
ev.getType() match {
case DoubleType =>
val gradODouble = gradOutput.asInstanceOf[Tensor[Double]]
val gradWDouble = gradWeight.asInstanceOf[Tensor[Double]]
val fIDouble = fInput.asInstanceOf[Tensor[Double]]
val sWDouble = ev.toType[Double](scaleW)
val sBDouble = ev.toType[Double](scaleB)
val gradBDouble = gradBias.asInstanceOf[Tensor[Double]]
val gradBiasWindowDouble = gradBiasWindow.asInstanceOf[Tensor[Double]]
format match {
case DataFormat.NCHW =>
val outChannel = gradOutput.size(1)
val outSize = gradOutput.size(2) * gradOutput.size(3)
val gradOutput2d = gradODouble.view(Array(outChannel, outSize))
if (sWDouble != 0) {
gradWDouble.addmm(1.0, gradWDouble, sWDouble, gradOutput2d, fIDouble.t)
}
if ( withBias && sBDouble != 0) {
var i = 0
while (i < gradBias.size(1)) {
var sum = 0.0
val data = gradOutput2d.storage().array()
val offset = gradOutput2d.storageOffset() - 1 + i * gradOutput2d.stride(1)
gradBiasWindowDouble.set(gradBDouble.storage(), gradBDouble.storageOffset() + i,
Array(gradOutput2d.size(2)), Array(1))
i += 1
}
}
case DataFormat.NHWC =>
val outChannel = gradOutput.size(3)
val outSize = gradOutput.size(1) * gradOutput.size(2)
val gradOutput2d = gradODouble.view(Array(outSize, outChannel))
if (sWDouble != 0) {
gradWDouble.addmm(1.0, gradWDouble, sWDouble, fIDouble.t, gradOutput2d)
}
if (withBias && sBDouble != 0) {
var i = 0
val gradData = gradOutput2d.storage().array()
val biasData = gradBDouble.storage().array()
val biasOffset = gradBDouble.storageOffset() - 1
while (i < gradODouble.size(1)) {
val gradOffset = gradOutput2d.storageOffset() - 1 + i * gradOutput2d.stride(1)
gradBiasWindowDouble.set(gradBDouble.storage(), gradBDouble.storageOffset() + i,
Array(gradOutput2d.size(2)), Array(1))
i = i + 1
}
}
}
case FloatType =>
val gradOFloat = gradOutput.asInstanceOf[Tensor[Float]]
val gradWFloat = gradWeight.asInstanceOf[Tensor[Float]]
val fIFloat = fInput.asInstanceOf[Tensor[Float]]
val sWFloat = ev.toType[Float](scaleW)
val sBFloat = ev.toType[Float](scaleB)
val gradBFloat = gradBias.asInstanceOf[Tensor[Float]]
val gradBiasWindowFloat = gradBiasWindow.asInstanceOf[Tensor[Float]]
format match {
case DataFormat.NCHW =>
val outChannel = gradOutput.size(1)
val outSize = gradOutput.size(2) * gradOutput.size(3)
val gradOutput2d = gradOFloat.view(Array(outChannel, outSize))
if (sWFloat != 0) {
gradWFloat.addmm(1.0f, gradWFloat, sWFloat, gradOutput2d, fIFloat.t)
}
if (withBias && sBFloat != 0) {
var i = 0
while (i < gradBias.size(1)) {
var sum = 0.0f
val data = gradOutput2d.storage().array()
val offset = gradOutput2d.storageOffset() - 1 + i * gradOutput2d.stride(1)
gradBiasWindowFloat.set(gradBFloat.storage(), gradBFloat.storageOffset() + i,
Array(gradOutput2d.size(2)), Array(1))
i += 1
}
}
case DataFormat.NHWC =>
val outChannel = gradOutput.size(3)
val outSize = gradOutput.size(1) * gradOutput.size(2)
val gradOutput2d = gradOFloat.view(Array(outSize, outChannel))
if (sWFloat != 0) {
gradWFloat.addmm(1.0f, gradWFloat, sWFloat, fIFloat.t, gradOutput2d)
}
if (withBias && sBFloat != 0) {
var i = 0
val gradData = gradOutput2d.storage().array()
val biasData = gradBFloat.storage().array()
val biasOffset = gradBFloat.storageOffset() - 1
while (i < gradOFloat.size(1)) {
val gradOffset = gradOutput2d.storageOffset() - 1 + i * gradOutput2d.stride(1)
gradBiasWindowFloat.set(gradBFloat.storage(), gradBFloat.storageOffset() + i,
Array(gradOutput2d.size(2)), Array(1))
i = i + 1
}
}
}
case _ => throw new UnsupportedOperationException(s"Only Float/Double supported")
}
}
protected def calcGradParametersFrame(gradOutput: Tensor[T], gradWeight: Tensor[T],
gradBias: Tensor[T],
fInput: Tensor[T], scaleW: T, scaleB: T)(implicit ev: TensorNumeric[T]): Unit = {
ev.getType() match {
case DoubleType =>
val gradODouble = gradOutput.asInstanceOf[Tensor[Double]]
val gradWDouble = gradWeight.asInstanceOf[Tensor[Double]]
val sWDouble = ev.toType[Double](scaleW)
val sBDouble = ev.toType[Double](scaleB)
val fIDouble = fInput.asInstanceOf[Tensor[Double]]
val gradBDouble = gradBias.asInstanceOf[Tensor[Double]]
val onesDouble = ones.asInstanceOf[Tensor[Double]]
format match {
case DataFormat.NCHW =>
val channel = gradODouble.size(1)
val oh = gradODouble.size(2)
val ow = gradODouble.size(3)
val gradOutput2d = gradODouble.view(Array(channel, oh * ow))
var j = 1
while (j <= weight.size(1)) {
val gradWDoubleWindow = gradWDouble.select(1, j)
gradWDoubleWindow.addr(0.0f, gradWDoubleWindow,
sWDouble, gradOutput2d.select(2, j), fIDouble.select(2, j))
j += 1
}
if (withBias && scaleB != 0) {
gradBDouble.add(sBDouble, gradOutput2d)
}
case DataFormat.NHWC =>
val channel = gradODouble.size(3)
val oh = gradODouble.size(1)
val ow = gradODouble.size(2)
val gradOutput2d = gradODouble.view(Array(oh * ow, channel))
var j = 1
while (j <= weight.size(1)) {
val gradWDoubleWindow = gradWDouble.select(1, j)
gradWDoubleWindow.addr(0.0f, gradWDoubleWindow,
sWDouble, gradOutput2d.select(1, j), fIDouble.select(1, j))
j += 1
}
if (withBias && scaleB != 0) {
gradBDouble.add(sBDouble, gradOutput2d)
}
}
case FloatType =>
val gradOFloat = gradOutput.asInstanceOf[Tensor[Float]]
val gradWFloat = gradWeight.asInstanceOf[Tensor[Float]]
val sWFloat = ev.toType[Float](scaleW)
val sBFloat = ev.toType[Float](scaleB)
val fIFloat = fInput.asInstanceOf[Tensor[Float]]
val gradBFloat = gradBias.asInstanceOf[Tensor[Float]]
val onesFloat = ones.asInstanceOf[Tensor[Float]]
format match {
case DataFormat.NCHW =>
val channel = gradOFloat.size(1)
val oh = gradOFloat.size(2)
val ow = gradOFloat.size(3)
val gradOutput2d = gradOFloat.view(Array(channel, oh * ow))
var j = 1
while (j <= weight.size(1)) {
val gradWFloatWindow = gradWFloat.select(1, j)
gradWFloatWindow.addr(0.0f, gradWFloatWindow,
sWFloat, gradOutput2d.select(2, j), fIFloat.select(2, j))
j += 1
}
if (withBias && scaleB != 0) {
gradBFloat.add(sBFloat, gradOutput2d)
}
case DataFormat.NHWC =>
val channel = gradOFloat.size(3)
val oh = gradOFloat.size(1)
val ow = gradOFloat.size(2)
val gradOutput2d = gradOFloat.view(Array(oh * ow, channel))
var j = 1
while (j <= weight.size(1)) {
val gradWFloatWindow = gradWFloat.select(1, j)
gradWFloatWindow.addr(0.0f, gradWFloatWindow,
sWFloat, gradOutput2d.select(1, j), fIFloat.select(1, j))
j += 1
}
if (withBias && scaleB != 0) {
gradBFloat.add(sBFloat, gradOutput2d)
}
}
case _ => throw new UnsupportedOperationException(s"Only Float/Double supported")
}
}
}
object LocallyConnected2D {
def apply[@specialized(Float, Double) T: ClassTag](
nInputPlane: Int,
inputWidth: Int,
inputHeight: Int,
nOutputPlane: Int,
kernelW: Int,
kernelH: Int,
strideW: Int = 1,
strideH: Int = 1,
padW: Int = 0,
padH: Int = 0,
propagateBack: Boolean = true,
wRegularizer: Regularizer[T] = null,
bRegularizer: Regularizer[T] = null,
initWeight: Tensor[T] = null,
initBias: Tensor[T] = null,
initGradWeight: Tensor[T] = null,
initGradBias: Tensor[T] = null,
withBias: Boolean = true,
format: DataFormat = DataFormat.NCHW
)(implicit ev: TensorNumeric[T]): LocallyConnected2D[T] = {
new LocallyConnected2D[T](nInputPlane, inputWidth, inputHeight, nOutputPlane, kernelW, kernelH,
strideW, strideH, padW, padH, propagateBack, wRegularizer,
bRegularizer, initWeight, initBias, initGradWeight, initGradBias, withBias, format)
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy