// File: MNN/source/backend/cuda/execution/ConvWinogradExecution.hpp
//
// ConvWinogradExecution.hpp
// MNN
//
// Created by MNN on 2022/05/11.
// Copyright © 2018, Alibaba Group Holding Limited
//
#ifndef ConvWinogradExecution_hpp_
#define ConvWinogradExecution_hpp_
#include "ConvSingleInputExecution.hpp"
// (blame: 2022-11-08 17:05:14 +08:00)
#include "CutlassGemmBatchedParam.hpp"
// (blame: 2022-09-30 10:02:52 +08:00)
#include "MNNCUDADefine.hpp"
#include "MNNCUDAFunction.cuh"
// (blame: 2022-08-12 10:30:48 +08:00)
namespace MNN {
namespace CUDA {
class ConvWinogradExecution : public Execution {
public:
struct Resource;
2022-09-30 10:02:52 +08:00
static bool isValid(const Convolution2D* conv);
2022-08-12 10:30:48 +08:00
ConvWinogradExecution(Backend* backend, const MNN::Op* op, std::shared_ptr<Resource> res);
virtual ~ConvWinogradExecution();
struct Resource {
Resource(Backend* backend, const MNN::Op* op);
~ Resource();
void* mFilter;
void* mBias;
std::shared_ptr<Tensor> weightTensor;
std::shared_ptr<Tensor> biasTensor;
KernelInfo mKernelInfo;
Backend* mBackend = nullptr;
bool mUseHPack = false;
};
virtual ErrorCode onResize(const std::vector<Tensor*> &inputs, const std::vector<Tensor*> &outputs) override;
virtual ErrorCode onExecute(const std::vector<Tensor*> &inputs, const std::vector<Tensor*> &outputs) override;
virtual bool onClone(Backend* bn, const Op* op, Execution** dst) override;
private:
std::shared_ptr<Resource> mResource;
const Op* mOp = nullptr;
__half* mBtdB_Buffer;
void* mMatmul_Buffer;
2022-11-08 17:05:14 +08:00
GemmBatchedTensor_F16_F16_Linear_AlignTensor_Row_Column_Sm75 mGemmBatchedF16LnSm75;
GemmBatchedTensor_F16_F32_Linear_AlignTensor_Row_Column_Sm75 mGemmBatchedF32LnSm75;
GemmBatchedCuda_F16_F16_Linear_AlignCuda_Row_Column mGemmBatchedCudaF16Ln;
GemmBatchedCuda_F16_F32_Linear_AlignCuda_Row_Column mGemmBatchedCudaF32Ln;
2022-09-30 10:02:52 +08:00
std::shared_ptr<Tensor> workspaceTensor;
uint8_t* mWorkspace;
CutlassGemmInfo mGemmInfo;
2022-08-12 10:30:48 +08:00
int mPadX;
int mPadY;
int mBlock2;
2022-11-08 17:05:14 +08:00
int mGpuComputeCap;
int mActivationType;
2022-08-12 10:30:48 +08:00
};
} // namespace CUDA
} // namespace MNN
#endif /* ConvWinogradExecution_hpp_ */