#pragma once
#include "megdnn/oprs.h"
#include "megdnn/handle.h"
namespace megdnn {
namespace cuda {
class TileForwardImpl : public TileForward {
public:
using TileForward::TileForward;
void exec(
_megdnn_tensor_in src, _megdnn_tensor_out dst,
_megdnn_workspace workspace) override;
size_t get_workspace_in_bytes(const TensorLayout&, const TensorLayout&) override {
return 0;
}
};
class TileBackwardImpl : public TileBackward {
public:
TileBackwardImpl(Handle* handle);
void exec(
_megdnn_tensor_in diff, _megdnn_tensor_out grad,
_megdnn_workspace workspace) override;
size_t get_workspace_in_bytes(const TensorLayout&, const TensorLayout&) override;
private:
std::unique_ptr<Reduce> m_opr;
template <typename T>
void exec_internal(
_megdnn_tensor_in diff, _megdnn_tensor_out grad,
_megdnn_workspace workspace);
};
} }