54 lines
2.5 KiB
C++
54 lines
2.5 KiB
C++
#pragma once
|
|
|
|
#include <ATen/core/Tensor.h>
|
|
#include <ATen/native/DispatchStub.h>
|
|
|
|
namespace at::native {
|
|
|
|
using lstm_fn = void(*)(Tensor&, Tensor&, Tensor&, const Tensor&, TensorList, TensorList, bool, int64_t, double, bool, bool, bool);
|
|
using rnn_fn = void(*)(Tensor&, Tensor&, const Tensor&, const Tensor&, TensorList, bool, int64_t, double, bool, bool, bool);
|
|
using lstm_packed_fn = void(*)(Tensor&, Tensor&, Tensor&, const Tensor&, const Tensor&, TensorList, TensorList, bool, int64_t, double, bool, bool);
|
|
using rnn_packed_fn = void(*)(Tensor&, Tensor&, const Tensor&, const Tensor&, const Tensor&, TensorList, bool, int64_t, double, bool, bool);
|
|
|
|
DECLARE_DISPATCH(lstm_fn, lstm_cudnn_stub);
|
|
DECLARE_DISPATCH(lstm_fn, lstm_miopen_stub);
|
|
DECLARE_DISPATCH(lstm_fn, lstm_mkldnn_stub);
|
|
DECLARE_DISPATCH(rnn_fn, gru_cudnn_stub);
|
|
DECLARE_DISPATCH(rnn_fn, gru_miopen_stub);
|
|
DECLARE_DISPATCH(rnn_fn, rnn_tanh_cudnn_stub);
|
|
DECLARE_DISPATCH(rnn_fn, rnn_tanh_miopen_stub);
|
|
DECLARE_DISPATCH(rnn_fn, rnn_relu_cudnn_stub);
|
|
DECLARE_DISPATCH(rnn_fn, rnn_relu_miopen_stub);
|
|
DECLARE_DISPATCH(lstm_packed_fn, lstm_packed_cudnn_stub);
|
|
DECLARE_DISPATCH(lstm_packed_fn, lstm_packed_miopen_stub);
|
|
DECLARE_DISPATCH(rnn_packed_fn, gru_packed_cudnn_stub);
|
|
DECLARE_DISPATCH(rnn_packed_fn, gru_packed_miopen_stub);
|
|
DECLARE_DISPATCH(rnn_packed_fn, rnn_tanh_packed_cudnn_stub);
|
|
DECLARE_DISPATCH(rnn_packed_fn, rnn_tanh_packed_miopen_stub);
|
|
DECLARE_DISPATCH(rnn_packed_fn, rnn_relu_packed_cudnn_stub);
|
|
DECLARE_DISPATCH(rnn_packed_fn, rnn_relu_packed_miopen_stub);
|
|
|
|
inline void check_attributes(const Tensor& input, const TensorList& params, const TensorList& hiddens, bool check_dtype=false) {
|
|
auto input_device = input.device();
|
|
auto input_dtype = input.scalar_type();
|
|
|
|
auto check_tensors = [&](const std::string& name, const Tensor& t) {
|
|
if (!t.defined()) return;
|
|
auto t_device = t.device();
|
|
TORCH_CHECK(input_device == t_device,
|
|
"Input and ", name, " tensors are not at the same device, found input tensor at ",
|
|
input_device, " and ", name, " tensor at ", t_device);
|
|
if (check_dtype) {
|
|
auto t_dtype = t.scalar_type();
|
|
TORCH_CHECK(input_dtype == t_dtype,
|
|
"Input and ", name, " tensors are not the same dtype, found input tensor with ",
|
|
input_dtype, " and ", name, " tensor with ", t_dtype);
|
|
}
|
|
};
|
|
|
|
for (const auto& h : hiddens) check_tensors("hidden", h);
|
|
for (const auto& p : params) check_tensors("parameter", p);
|
|
}
|
|
|
|
} // namespace at::native
|