src/model/layer/cudnn_rnn.h - singa - Git at Google

 /**
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 #ifndef SRC_MODEL_LAYER_CUDNN_RNN_H_
 #define SRC_MODEL_LAYER_CUDNN_RNN_H_
 #include "singa/singa_config.h"
 #ifdef USE_CUDNN
 #include <cudnn.h>
 #if CUDNN_VERSION >= 5005
 #include <string>
 #include <utility>
 #include <vector>
 #include "./rnn.h"
 #include "singa/core/common.h"
 #include "singa/model/layer.h"
 #include "singa/proto/core.pb.h"
 #include "singa/utils/string.h"
 #include <cudnn.h>
 #include <chrono>
 #include "./cudnn_utils.h"
 #include "singa/utils/logging.h"

 namespace singa {
 class CudnnRNN : public RNN {
  public:
   ~CudnnRNN();
   /// \copydoc Layer::layer_type()
   // const std::string layer_type() const override { return "CudnnRNN"; }

   const vector<Tensor> Forward(int flag, const vector<Tensor>& inputs) override;
   const std::pair<vector<Tensor>, vector<Tensor>> Backward(
       int flag, const vector<Tensor>& grads) override;

   void ToDevice(std::shared_ptr<Device> device) override;

   void SetRNNDescriptor(shared_ptr<Device> dev);
   void ResetHiddenAndCellDescriptors(size_t batch_size);
   void DestroyIODescriptors();
   void UpdateIODescriptors(size_t num, const vector<Tensor>& inputs);
   void UpdateSpaces(size_t num, shared_ptr<Device> dev);
   void UpdateStates(size_t num, const vector<Tensor>& inputs);
   Tensor MergeInputs(size_t num, const vector<Tensor>& in);
   vector<Tensor> SplitOutput(size_t num, size_t dim, const vector<Tensor>& in,
                              const Tensor output);

  protected:
   cudnnTensorDescriptor_t* x_descs_ = nullptr;
   cudnnTensorDescriptor_t* dx_descs_ = nullptr;
   cudnnTensorDescriptor_t* y_descs_ = nullptr;
   cudnnTensorDescriptor_t* dy_descs_ = nullptr;
   cudnnTensorDescriptor_t hx_desc_ = nullptr;
   cudnnTensorDescriptor_t dhx_desc_ = nullptr;
   cudnnTensorDescriptor_t cx_desc_ = nullptr;
   cudnnTensorDescriptor_t dcx_desc_ = nullptr;
   cudnnTensorDescriptor_t hy_desc_ = nullptr;
   cudnnTensorDescriptor_t dhy_desc_ = nullptr;
   cudnnTensorDescriptor_t cy_desc_ = nullptr;
   cudnnTensorDescriptor_t dcy_desc_ = nullptr;
   cudnnFilterDescriptor_t weight_desc_ = nullptr;
   cudnnFilterDescriptor_t dweight_desc_ = nullptr;
   cudnnRNNDescriptor_t rnn_desc_ = nullptr;
   cudnnDropoutDescriptor_t dropout_desc_ = nullptr;
   cudnnDataType_t dtype_ = CUDNN_DATA_FLOAT;
   Tensor workspace_;
   Tensor reserve_space_;
   Tensor dropout_state_;
 };

 }  // namespace singa

 #endif  // CUDNN_VERSION >= 5005
 #endif  // USE_CUDNN
 #endif  // SRC_MODEL_LAYER_CUDNN_RNN_H_
	/**
	* Licensed to the Apache Software Foundation (ASF) under one
	* or more contributor license agreements. See the NOTICE file
	* distributed with this work for additional information
	* regarding copyright ownership. The ASF licenses this file
	* to you under the Apache License, Version 2.0 (the
	* "License"); you may not use this file except in compliance
	* with the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	#ifndef SRC_MODEL_LAYER_CUDNN_RNN_H_
	#define SRC_MODEL_LAYER_CUDNN_RNN_H_
	#include "singa/singa_config.h"
	#ifdef USE_CUDNN
	#include <cudnn.h>
	#if CUDNN_VERSION >= 5005
	#include <string>
	#include <utility>
	#include <vector>
	#include "./rnn.h"
	#include "singa/core/common.h"
	#include "singa/model/layer.h"
	#include "singa/proto/core.pb.h"
	#include "singa/utils/string.h"
	#include <cudnn.h>
	#include <chrono>
	#include "./cudnn_utils.h"
	#include "singa/utils/logging.h"

	namespace singa {
	class CudnnRNN : public RNN {
	public:
	~CudnnRNN();
	/// \copydoc Layer::layer_type()
	// const std::string layer_type() const override { return "CudnnRNN"; }

	const vector<Tensor> Forward(int flag, const vector<Tensor>& inputs) override;
	const std::pair<vector<Tensor>, vector<Tensor>> Backward(
	int flag, const vector<Tensor>& grads) override;

	void ToDevice(std::shared_ptr<Device> device) override;

	void SetRNNDescriptor(shared_ptr<Device> dev);
	void ResetHiddenAndCellDescriptors(size_t batch_size);
	void DestroyIODescriptors();
	void UpdateIODescriptors(size_t num, const vector<Tensor>& inputs);
	void UpdateSpaces(size_t num, shared_ptr<Device> dev);
	void UpdateStates(size_t num, const vector<Tensor>& inputs);
	Tensor MergeInputs(size_t num, const vector<Tensor>& in);
	vector<Tensor> SplitOutput(size_t num, size_t dim, const vector<Tensor>& in,
	const Tensor output);

	protected:
	cudnnTensorDescriptor_t* x_descs_ = nullptr;
	cudnnTensorDescriptor_t* dx_descs_ = nullptr;
	cudnnTensorDescriptor_t* y_descs_ = nullptr;
	cudnnTensorDescriptor_t* dy_descs_ = nullptr;
	cudnnTensorDescriptor_t hx_desc_ = nullptr;
	cudnnTensorDescriptor_t dhx_desc_ = nullptr;
	cudnnTensorDescriptor_t cx_desc_ = nullptr;
	cudnnTensorDescriptor_t dcx_desc_ = nullptr;
	cudnnTensorDescriptor_t hy_desc_ = nullptr;
	cudnnTensorDescriptor_t dhy_desc_ = nullptr;
	cudnnTensorDescriptor_t cy_desc_ = nullptr;
	cudnnTensorDescriptor_t dcy_desc_ = nullptr;
	cudnnFilterDescriptor_t weight_desc_ = nullptr;
	cudnnFilterDescriptor_t dweight_desc_ = nullptr;
	cudnnRNNDescriptor_t rnn_desc_ = nullptr;
	cudnnDropoutDescriptor_t dropout_desc_ = nullptr;
	cudnnDataType_t dtype_ = CUDNN_DATA_FLOAT;
	Tensor workspace_;
	Tensor reserve_space_;
	Tensor dropout_state_;
	};

	} // namespace singa

	#endif // CUDNN_VERSION >= 5005
	#endif // USE_CUDNN
	#endif // SRC_MODEL_LAYER_CUDNN_RNN_H_