#include "src/naive/rnn/funcs.h"
namespace megdnn {
namespace naive {
namespace rnn {
template <>
void cell_opr_exec<LSTMCellForward>(
_megdnn_tensor_in input, _megdnn_tensor_in weight_ih,
_megdnn_tensor_in weight_hh, _megdnn_tensor_in bias_ih,
_megdnn_tensor_in bias_hh, const TensorNDArray& states,
TensorNDArray& states_new, _megdnn_workspace workspace,
param::RNNCell::NonlineMode , Handle* handle) {
auto opr = handle->create_operator<LSTMCellForward>();
TensorLayout gates, h_new, c_new;
opr->deduce_layout(
input.layout, weight_ih.layout, bias_ih.layout, states[0].layout,
weight_hh.layout, bias_hh.layout, states[1].layout, h_new, c_new, gates);
TensorND gates_tensor{workspace.raw_ptr, gates};
_megdnn_workspace new_workspace = {
workspace.raw_ptr + gates.span().dist_byte(),
workspace.size - gates.span().dist_byte()};
opr->exec(
input, weight_ih, bias_ih, states[0], weight_hh, bias_hh, states[1],
states_new[0], states_new[1], gates_tensor, new_workspace);
}
template <>
size_t cell_opr_get_workspace_in_bytes<LSTMCellForward>(
const TensorLayout& input, const TensorLayout& weight_ih,
const TensorLayout& weight_hh, const TensorLayout& bias_ih,
const TensorLayout& bias_hh, const TensorLayout& hx, Handle* handle) {
TensorLayout cx = hx;
TensorLayout h_new, c_new, gates;
auto cell_opr = handle->create_operator<LSTMCellForward>();
cell_opr->deduce_layout(
input, weight_ih, bias_ih, hx, weight_hh, bias_hh, cx, h_new, c_new, gates);
return cell_opr->get_workspace_in_bytes(
input, weight_ih, bias_ih, hx, weight_hh, bias_hh, cx, h_new, c_new,
gates) +
gates.span().dist_byte();
}
} } }