blob: 5e642e0c4888f62bf38f11c64bdd127e5d73e3f3 [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef SRC_MODEL_LAYER_CUDNN_RNN_H_
#define SRC_MODEL_LAYER_CUDNN_RNN_H_
#include "singa/singa_config.h"
#ifdef USE_CUDNN
#include <cudnn.h>
#if CUDNN_VERSION >= 5005
#include <string>
#include <utility>
#include <vector>
#include "./rnn.h"
#include "singa/core/common.h"
#include "singa/model/layer.h"
#include "singa/proto/core.pb.h"
#include "singa/utils/string.h"
#include <cudnn.h>
#include <chrono>
#include "./cudnn_utils.h"
#include "singa/utils/logging.h"
namespace singa {
class CudnnRNN : public RNN {
public:
~CudnnRNN();
/// \copydoc Layer::layer_type()
// const std::string layer_type() const override { return "CudnnRNN"; }
const vector<Tensor> Forward(int flag, const vector<Tensor>& inputs) override;
const std::pair<vector<Tensor>, vector<Tensor>> Backward(
int flag, const vector<Tensor>& grads) override;
void ToDevice(std::shared_ptr<Device> device) override;
void SetRNNDescriptor(shared_ptr<Device> dev);
void ResetHiddenAndCellDescriptors(size_t batch_size);
void DestroyIODescriptors();
void UpdateIODescriptors(size_t num, const vector<Tensor>& inputs);
void UpdateSpaces(size_t num, shared_ptr<Device> dev);
void UpdateStates(size_t num, const vector<Tensor>& inputs);
Tensor MergeInputs(size_t num, const vector<Tensor>& in);
vector<Tensor> SplitOutput(size_t num, size_t dim, const vector<Tensor>& in,
const Tensor output);
protected:
cudnnTensorDescriptor_t* x_descs_ = nullptr;
cudnnTensorDescriptor_t* dx_descs_ = nullptr;
cudnnTensorDescriptor_t* y_descs_ = nullptr;
cudnnTensorDescriptor_t* dy_descs_ = nullptr;
cudnnTensorDescriptor_t hx_desc_ = nullptr;
cudnnTensorDescriptor_t dhx_desc_ = nullptr;
cudnnTensorDescriptor_t cx_desc_ = nullptr;
cudnnTensorDescriptor_t dcx_desc_ = nullptr;
cudnnTensorDescriptor_t hy_desc_ = nullptr;
cudnnTensorDescriptor_t dhy_desc_ = nullptr;
cudnnTensorDescriptor_t cy_desc_ = nullptr;
cudnnTensorDescriptor_t dcy_desc_ = nullptr;
cudnnFilterDescriptor_t weight_desc_ = nullptr;
cudnnFilterDescriptor_t dweight_desc_ = nullptr;
cudnnRNNDescriptor_t rnn_desc_ = nullptr;
cudnnDropoutDescriptor_t dropout_desc_ = nullptr;
cudnnDataType_t dtype_ = CUDNN_DATA_FLOAT;
Tensor workspace_;
Tensor reserve_space_;
Tensor dropout_state_;
};
} // namespace singa
#endif // CUDNN_VERSION >= 5005
#endif // USE_CUDNN
#endif // SRC_MODEL_LAYER_CUDNN_RNN_H_