2019-04-17 10:49:11 +08:00
|
|
|
//
|
2021-03-12 18:41:50 +08:00
|
|
|
// ConvBufExecution.hpp
|
2019-04-17 10:49:11 +08:00
|
|
|
// MNN
|
|
|
|
//
|
|
|
|
// Created by MNN on 2019/01/31.
|
|
|
|
// Copyright © 2018, Alibaba Group Holding Limited
|
|
|
|
//
|
|
|
|
|
2021-03-12 18:41:50 +08:00
|
|
|
#ifndef MNN_OPENCL_BUFFER_CLOSED
|
|
|
|
|
|
|
|
#ifndef ConvBufExecution_hpp
|
|
|
|
#define ConvBufExecution_hpp
|
2019-04-17 10:49:11 +08:00
|
|
|
|
2024-04-19 11:58:21 +08:00
|
|
|
#include "backend/opencl/execution/image/CommonExecution.hpp"
|
2019-04-17 10:49:11 +08:00
|
|
|
namespace MNN {
|
|
|
|
namespace OpenCL {
|
|
|
|
|
2024-04-19 11:58:21 +08:00
|
|
|
struct ConvBufResource {
|
|
|
|
const Convolution2DCommon *mConv2dCommonParams;
|
|
|
|
const Convolution2D *mConv2dParams;
|
|
|
|
std::shared_ptr<cl::Buffer> mKernelBuffer;
|
2024-05-11 19:17:02 +08:00
|
|
|
std::shared_ptr<cl::Image2D> mKernelImage;
|
2024-04-19 11:58:21 +08:00
|
|
|
std::shared_ptr<Tensor> dequantScale;
|
|
|
|
std::shared_ptr<Tensor> dequantOffset;
|
|
|
|
std::shared_ptr<Tensor> mFilter;
|
|
|
|
std::shared_ptr<Tensor> mBias;
|
|
|
|
int mKernelWidth;
|
|
|
|
int mKernelHeight;
|
|
|
|
int mOutputChannel;
|
|
|
|
int mInputChannel;
|
|
|
|
std::vector<int> mStrides{1, 1};
|
|
|
|
std::vector<int> mDilations{1, 1};
|
|
|
|
std::set<std::string> mBuildOptions;
|
|
|
|
bool mConv1x1Opt = false;
|
|
|
|
bool mConv1x1C8Opt = false;
|
2024-06-03 20:09:34 +08:00
|
|
|
/*
|
|
|
|
0 -> not use
|
|
|
|
1 -> use small tile
|
|
|
|
2 -> use quieter large tile
|
|
|
|
*/
|
|
|
|
int mConvGemmOptLevel = 0;
|
2024-04-19 11:58:21 +08:00
|
|
|
std::shared_ptr<Execution> mRasterExe;
|
2024-05-11 19:17:02 +08:00
|
|
|
bool mUseImage = false;
|
2024-04-19 11:58:21 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
class ConvBufCommonExecution {
|
2019-04-17 10:49:11 +08:00
|
|
|
public:
|
2023-12-27 17:26:44 +08:00
|
|
|
ConvBufCommonExecution(Backend *backend);
|
2021-03-12 18:41:50 +08:00
|
|
|
ConvBufCommonExecution(const Convolution2D *op, Backend *backend);
|
|
|
|
virtual ~ConvBufCommonExecution();
|
2019-04-17 10:49:11 +08:00
|
|
|
|
2024-04-19 11:58:21 +08:00
|
|
|
std::pair<std::vector<uint32_t>, uint32_t> gws2dLwsTune(const std::shared_ptr<KernelWrap> &kernel, const std::vector<uint32_t> &gws, const std::string &kernelName, const uint32_t maxWorkGroupSize);
|
2019-04-17 10:49:11 +08:00
|
|
|
protected:
|
2024-04-19 11:58:21 +08:00
|
|
|
std::shared_ptr<ConvBufResource> mResource;
|
2021-03-12 18:41:50 +08:00
|
|
|
OpenCLBackend *mOpenCLBackend;
|
2019-04-17 10:49:11 +08:00
|
|
|
};
|
|
|
|
|
2024-04-19 11:58:21 +08:00
|
|
|
class ConvBufExecution : public ConvBufCommonExecution, public CommonExecution {
|
2019-04-17 10:49:11 +08:00
|
|
|
public:
|
2021-03-12 18:41:50 +08:00
|
|
|
ConvBufExecution(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs, const MNN::Op *op, Backend *backend);
|
2024-04-19 11:58:21 +08:00
|
|
|
ConvBufExecution(std::shared_ptr<ConvBufResource> resource, const MNN::Op* op, Backend* backend);
|
2021-03-12 18:41:50 +08:00
|
|
|
virtual ~ConvBufExecution();
|
2019-04-17 10:49:11 +08:00
|
|
|
|
|
|
|
virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
|
|
|
|
virtual ErrorCode onExecute(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
|
2024-04-19 11:58:21 +08:00
|
|
|
virtual bool onClone(Backend* bn, const Op* op, Execution** dst) override;
|
2019-04-17 10:49:11 +08:00
|
|
|
|
2021-03-12 18:41:50 +08:00
|
|
|
void setConv1x1WeightBuffer(int packCout, int packCin, const float* filterDataPtr);
|
2019-04-17 10:49:11 +08:00
|
|
|
private:
|
2023-04-27 15:11:05 +08:00
|
|
|
void _generateFilterConvertRegion(Tensor *virtualFilter, Tensor *originBuffer) const;
|
2021-06-11 17:17:13 +08:00
|
|
|
|
2019-04-17 10:49:11 +08:00
|
|
|
std::vector<int> mPaddings{0, 0};
|
|
|
|
std::vector<uint32_t> mGlobalWorkSize{1, 1, 1};
|
|
|
|
std::vector<uint32_t> mLocalWorkSize{1, 1, 1, 1};
|
2024-04-19 11:58:21 +08:00
|
|
|
std::shared_ptr<KernelWrap> mKernel;
|
2024-06-03 20:09:34 +08:00
|
|
|
std::shared_ptr<Tensor> mConvGemmInpTensor;
|
|
|
|
std::shared_ptr<Tensor> mConvGemmOutTensor;
|
|
|
|
std::shared_ptr<KernelWrap> mPreKernel = nullptr;
|
|
|
|
std::vector<uint32_t> mPreGlobalWorkSize{1, 1, 1};
|
|
|
|
std::vector<uint32_t> mPreLocalWorkSize{1, 1, 1, 1};
|
|
|
|
std::shared_ptr<KernelWrap> mPostKernel = nullptr;
|
|
|
|
std::vector<uint32_t> mPostGlobalWorkSize{1, 1, 1};
|
|
|
|
std::vector<uint32_t> mPostLocalWorkSize{1, 1, 1, 1};
|
2021-03-12 18:41:50 +08:00
|
|
|
const float* mFilterDataPtr = nullptr;
|
2019-04-17 10:49:11 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
} // namespace OpenCL
|
|
|
|
} // namespace MNN
|
2021-03-12 18:41:50 +08:00
|
|
|
#endif /* ConvBufExecution_hpp */
|
|
|
|
#endif /* MNN_OPENCL_BUFFER_CLOSED */
|