blob: b56331ebb4b0970856266d2e736ed9da422d87b9 [file] [log] [blame]
#-------------------------------------------------------------
#
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
#
#-------------------------------------------------------------
args <- commandArgs(TRUE)
library("Matrix")
library("matrixStats")
imgSize=as.integer(args[1])
numImg=as.integer(args[2])
numChannels=as.integer(args[3])
poolSize1=as.integer(args[4])
poolSize2=as.integer(args[5])
stride=as.integer(args[6])
pad=as.integer(args[7])
P=as.integer(args[8])
Q=as.integer(args[9])
# Assumption: NCHW image format
x=matrix(seq(1, numImg*numChannels*imgSize*imgSize), numImg, numChannels*imgSize*imgSize, byrow=TRUE)
dout=matrix(seq(1, numImg*numChannels*P*Q), numImg, numChannels*P*Q, byrow=TRUE)
if(as.logical(args[11])) {
zero_mask = (x - mean(x)*1.5) > 0
x = x * zero_mask
} else {
x = x - mean(x)
}
if(as.logical(args[12])) {
zero_mask = (dout - mean(dout)*1.5) > 0
dout = dout * zero_mask
} else {
dout = dout - mean(dout)
}
max_pool_backward <- function(dout, Hout, Wout, X, C,
Hin, Win, Hf, Wf, strideh, stridew)
{
N = nrow(X)
# Create gradient volume
dX = matrix(0, N, C*Hin*Win, byrow=TRUE)
# Gradient of max pooling
for (n in 1:N) { # all examples
img = matrix(X[n,], C, Hin*Win, byrow=TRUE)
dimg = matrix(0, C, Hin*Win, byrow=TRUE)
for (c in 1:C) { # all channels
img_slice = matrix(img[c,], Hin, Win, byrow=TRUE)
dimg_slice = matrix(0, Hin, Win, byrow=TRUE)
for (hout in 1:Hout) { # all output rows
hin = (hout-1) * strideh + 1
for (wout in 1:Wout) { # all output columns
win = (wout-1) * stridew + 1
img_slice_patch = img_slice[hin:(hin+Hf-1), win:(win+Wf-1)]
max_val = max(img_slice_patch)
max_val_ind = matrix(0, nrow(img_slice_patch), ncol(img_slice_patch))
max_val_ind[which.max(img_slice_patch)] = 1 # first max value indicator
# gradient passes through only for the max value in this patch
dimg_slice_patch = max_val_ind * dout[n, (c-1)*Hout*Wout + (hout-1)*Wout + wout]
dimg_slice[hin:(hin+Hf-1), win:(win+Wf-1)] =
dimg_slice[hin:(hin+Hf-1), win:(win+Wf-1)] + dimg_slice_patch
}
}
dimg[c,] = matrix(t(dimg_slice), 1, Hin*Win)
}
dX[n,] = matrix(t(dimg), 1, C*Hin*Win)
}
dX
}
output = max_pool_backward(dout, P, Q, x, numChannels, imgSize, imgSize, poolSize1, poolSize2, stride, stride)
writeMM(as(output,"CsparseMatrix"), paste(args[10], "B", sep=""))