src/operator/nn/dropout.cc - mxnet - Git at Google

 /*
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  *   http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing,
  * software distributed under the License is distributed on an
  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
  * KIND, either express or implied.  See the License for the
  * specific language governing permissions and limitations
  * under the License.
  */

 /*!
  * Copyright (c) 2015 by Contributors
  * \file dropout.cc
  * \brief
  * \author Bing Xu, Da Zheng, Hang Zhang
 */

 #include "./dropout-inl.h"
 #include "../operator_common.h"

 namespace mxnet {
 namespace op {

 struct DropoutGrad {
   const char *op_name;
   std::vector<nnvm::NodeEntry> operator()(const nnvm::NodePtr& n,
                                           const std::vector<nnvm::NodeEntry>& ograds) const {
     std::vector<nnvm::NodeEntry> heads;
     heads.push_back(ograds[0]);
     heads.emplace_back(nnvm::NodeEntry{n, dropout::kMask, 0});
     return MakeGradNode(op_name, n, heads, n->attrs.dict);
   }
 };

 DMLC_REGISTER_PARAMETER(DropoutParam);

 NNVM_REGISTER_OP(Dropout)
 .describe(R"(Applies dropout operation to input array.

 - During training, each element of the input is set to zero with probability p.
   The whole array is rescaled by :math:`1/(1-p)` to keep the expected
   sum of the input unchanged.

 - During testing, this operator does not change the input if mode is 'training'.
   If mode is 'always', the same computaion as during training will be applied.

 Example::

   random.seed(998)
   input_array = array([[3., 0.5,  -0.5,  2., 7.],
                       [2., -0.4,   7.,  3., 0.2]])
   a = symbol.Variable('a')
   dropout = symbol.Dropout(a, p = 0.2)
   executor = dropout.simple_bind(a = input_array.shape)

   ## If training
   executor.forward(is_train = True, a = input_array)
   executor.outputs
   [[ 3.75   0.625 -0.     2.5    8.75 ]
    [ 2.5   -0.5    8.75   3.75   0.   ]]

   ## If testing
   executor.forward(is_train = False, a = input_array)
   executor.outputs
   [[ 3.     0.5   -0.5    2.     7.   ]
    [ 2.    -0.4    7.     3.     0.2  ]]
 )" ADD_FILELINE)
 .set_num_inputs(1)
 .set_num_outputs(2)
 .set_attr_parser(ParamParser<DropoutParam>)
 .set_attr<nnvm::FListInputNames>("FListInputNames",
     [](const NodeAttrs& attrs) {
   return std::vector<std::string>{"data"};
 })
 .set_attr<nnvm::FListOutputNames>("FListOutputNames",
     [](const NodeAttrs& attrs) {
   return std::vector<std::string>{"output", "mask"};
 })
 .set_attr<nnvm::FNumVisibleOutputs>("FNumVisibleOutputs",
     [](const NodeAttrs& attrs) {
   return 1;
 })
 .set_attr<nnvm::FInferShape>("FInferShape", [](const nnvm::NodeAttrs& attrs,
       std::vector<TShape> *in_shape, std::vector<TShape> *out_shape){
   using namespace mshadow;
   CHECK_EQ(in_shape->size(), 1U);
   const DropoutParam& param = nnvm::get<DropoutParam>(attrs.parsed);
   TShape dshape(in_shape->at(0));
   if (dshape.ndim() == 0) return false;
   out_shape->clear();
   out_shape->push_back(dshape);
   for (index_t i = 0; i < param.axes.ndim(); ++i) {
     dshape[param.axes[i]] = 1;
   }
   out_shape->push_back(dshape);
   return true;
 })
 .set_attr<nnvm::FInferType>("FInferType", [](const nnvm::NodeAttrs& attrs,
       std::vector<int> *in_type, std::vector<int> *out_type) {
   CHECK_EQ(in_type->size(), 1U);
   int dtype = in_type->at(0);

   if (dtype == -1) {
     LOG(FATAL) << "input type to dropout is not specified.";
     return false;
   }

   size_t nout = 2;
   out_type->clear();
   for (size_t i = 0; i < nout; ++i) out_type->push_back(dtype);
   return true;
 })
 .set_attr<FCompute>("FCompute<cpu>", DropoutCompute<cpu>)
 .set_attr<nnvm::FGradient>("FGradient", DropoutGrad{"_backward_Dropout"})
 .set_attr<nnvm::FInplaceOption>("FInplaceOption", [](const NodeAttrs& attrs){
   return std::vector<std::pair<int, int> >{{0, 0}};
 })
 .set_attr<FResourceRequest>("FResourceRequest", [](const NodeAttrs& n) {
   return std::vector<ResourceRequest>{ ResourceRequest::kParallelRandom };
 })
 .add_argument("data", "NDArray-or-Symbol", "Input array to which dropout will be applied.")
 .add_arguments(DropoutParam::__FIELDS__());

 NNVM_REGISTER_OP(_backward_Dropout)
 .set_num_outputs(1)
 .set_attr<nnvm::TIsBackward>("TIsBackward", true)
 .set_attr_parser(ParamParser<DropoutParam>)
 .set_attr<nnvm::FInplaceOption>("FInplaceOption", [](const NodeAttrs& attrs){
   return std::vector<std::pair<int, int> >{{0, 0}};
 })
 .set_attr<FCompute>("FCompute<cpu>", DropoutGradCompute<cpu>);

 }  // namespace op
 }  // namespace mxnet
	/*
	* Licensed to the Apache Software Foundation (ASF) under one
	* or more contributor license agreements. See the NOTICE file
	* distributed with this work for additional information
	* regarding copyright ownership. The ASF licenses this file
	* to you under the Apache License, Version 2.0 (the
	* "License"); you may not use this file except in compliance
	* with the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing,
	* software distributed under the License is distributed on an
	* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
	* KIND, either express or implied. See the License for the
	* specific language governing permissions and limitations
	* under the License.
	*/

	/*!
	* Copyright (c) 2015 by Contributors
	* \file dropout.cc
	* \brief
	* \author Bing Xu, Da Zheng, Hang Zhang
	*/

	#include "./dropout-inl.h"
	#include "../operator_common.h"

	namespace mxnet {
	namespace op {

	struct DropoutGrad {
	const char *op_name;
	std::vector<nnvm::NodeEntry> operator()(const nnvm::NodePtr& n,
	const std::vector<nnvm::NodeEntry>& ograds) const {
	std::vector<nnvm::NodeEntry> heads;
	heads.push_back(ograds[0]);
	heads.emplace_back(nnvm::NodeEntry{n, dropout::kMask, 0});
	return MakeGradNode(op_name, n, heads, n->attrs.dict);
	}
	};

	DMLC_REGISTER_PARAMETER(DropoutParam);

	NNVM_REGISTER_OP(Dropout)
	.describe(R"(Applies dropout operation to input array.

	- During training, each element of the input is set to zero with probability p.
	The whole array is rescaled by :math:`1/(1-p)` to keep the expected
	sum of the input unchanged.

	- During testing, this operator does not change the input if mode is 'training'.
	If mode is 'always', the same computaion as during training will be applied.

	Example::

	random.seed(998)
	input_array = array([[3., 0.5, -0.5, 2., 7.],
	[2., -0.4, 7., 3., 0.2]])
	a = symbol.Variable('a')
	dropout = symbol.Dropout(a, p = 0.2)
	executor = dropout.simple_bind(a = input_array.shape)

	## If training
	executor.forward(is_train = True, a = input_array)
	executor.outputs
	[[ 3.75 0.625 -0. 2.5 8.75 ]
	[ 2.5 -0.5 8.75 3.75 0. ]]

	## If testing
	executor.forward(is_train = False, a = input_array)
	executor.outputs
	[[ 3. 0.5 -0.5 2. 7. ]
	[ 2. -0.4 7. 3. 0.2 ]]
	)" ADD_FILELINE)
	.set_num_inputs(1)
	.set_num_outputs(2)
	.set_attr_parser(ParamParser<DropoutParam>)
	.set_attr<nnvm::FListInputNames>("FListInputNames",
	[](const NodeAttrs& attrs) {
	return std::vector<std::string>{"data"};
	})
	.set_attr<nnvm::FListOutputNames>("FListOutputNames",
	[](const NodeAttrs& attrs) {
	return std::vector<std::string>{"output", "mask"};
	})
	.set_attr<nnvm::FNumVisibleOutputs>("FNumVisibleOutputs",
	[](const NodeAttrs& attrs) {
	return 1;
	})
	.set_attr<nnvm::FInferShape>("FInferShape", [](const nnvm::NodeAttrs& attrs,
	std::vector<TShape> in_shape, std::vector<TShape> out_shape){
	using namespace mshadow;
	CHECK_EQ(in_shape->size(), 1U);
	const DropoutParam& param = nnvm::get<DropoutParam>(attrs.parsed);
	TShape dshape(in_shape->at(0));
	if (dshape.ndim() == 0) return false;
	out_shape->clear();
	out_shape->push_back(dshape);
	for (index_t i = 0; i < param.axes.ndim(); ++i) {
	dshape[param.axes[i]] = 1;
	}
	out_shape->push_back(dshape);
	return true;
	})
	.set_attr<nnvm::FInferType>("FInferType", [](const nnvm::NodeAttrs& attrs,
	std::vector<int> in_type, std::vector<int> out_type) {
	CHECK_EQ(in_type->size(), 1U);
	int dtype = in_type->at(0);

	if (dtype == -1) {
	LOG(FATAL) << "input type to dropout is not specified.";
	return false;
	}

	size_t nout = 2;
	out_type->clear();
	for (size_t i = 0; i < nout; ++i) out_type->push_back(dtype);
	return true;
	})
	.set_attr<FCompute>("FCompute<cpu>", DropoutCompute<cpu>)
	.set_attr<nnvm::FGradient>("FGradient", DropoutGrad{"_backward_Dropout"})
	.set_attr<nnvm::FInplaceOption>("FInplaceOption", [](const NodeAttrs& attrs){
	return std::vector<std::pair<int, int> >{{0, 0}};
	})
	.set_attr<FResourceRequest>("FResourceRequest", [](const NodeAttrs& n) {
	return std::vector<ResourceRequest>{ ResourceRequest::kParallelRandom };
	})
	.add_argument("data", "NDArray-or-Symbol", "Input array to which dropout will be applied.")
	.add_arguments(DropoutParam::__FIELDS__());

	NNVM_REGISTER_OP(_backward_Dropout)
	.set_num_outputs(1)
	.set_attr<nnvm::TIsBackward>("TIsBackward", true)
	.set_attr_parser(ParamParser<DropoutParam>)
	.set_attr<nnvm::FInplaceOption>("FInplaceOption", [](const NodeAttrs& attrs){
	return std::vector<std::pair<int, int> >{{0, 0}};
	})
	.set_attr<FCompute>("FCompute<cpu>", DropoutGradCompute<cpu>);

	} // namespace op
	} // namespace mxnet