#pragma once
#include "megdnn/oprs.h"
#include "src/cuda/utils.h"
namespace megdnn {
namespace cuda {
class SVDForwardImpl : public SVDForward {
public:
using SVDForward::SVDForward;
size_t get_workspace_in_bytes(
size_t block_cnt, size_t m, size_t n, size_t dtype_size) override;
void exec(
_megdnn_tensor_in src, _megdnn_tensor_out u, _megdnn_tensor_out s,
_megdnn_tensor_out vt, _megdnn_workspace workspace) override;
private:
size_t get_cusolver_buffer_size(size_t m, size_t n);
WorkspaceBundle get_workspace_bundle(
size_t block_cnt, size_t m, size_t n, size_t dtype_size,
void* raw_ptr = nullptr);
};
} }