MNN/source/backend/cpu/CPUConvolutionDepthwise.hpp

76 lines
3.3 KiB
C++

//
// CPUConvolutionDepthwise.hpp
// MNN
//
// Created by MNN on 2018/07/20.
// Copyright © 2018, Alibaba Group Holding Limited
//
#ifndef CPUConvolutionDepthwise_hpp
#define CPUConvolutionDepthwise_hpp
#include "core/AutoStorage.h"
#include "backend/cpu/CPUConvolution.hpp"
#include "backend/cpu/compute/ConvolutionIntFactory.hpp"
namespace MNN {
class CPUConvolutionDepthwise {
public:
class BasicFloatExecution : public CPUConvolution {
public:
BasicFloatExecution(const Convolution2DCommon *common, Backend *b) : CPUConvolution(common, b) {
}
virtual ~BasicFloatExecution() = default;
virtual ErrorCode onExecute(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
private:
std::function<void(const uint8_t *, uint8_t *, int)> mExecutor;
std::function<void(float* dst, const float* src, const float* weight, size_t width, size_t src_w_setup,
size_t fw, size_t fh, size_t dilateX_step, size_t dilateY_step, size_t height,
size_t srcHStep, size_t dstHStep)> mFastKernel;
int mNumber = 1;
std::shared_ptr<Tensor> mInputPad;
bool mFastKernelApply = false;
};
class MultiInputFloatExecution : public BasicFloatExecution {
public:
MultiInputFloatExecution(const Convolution2DCommon *common, Backend *b) : BasicFloatExecution(common, b) {
}
virtual ~MultiInputFloatExecution() = default;
virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
virtual ErrorCode onExecute(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
private:
std::unique_ptr<Tensor> mWeight;
std::unique_ptr<Tensor> mBias;
std::vector<Tensor *> mTempInputs;
};
class FloatExecution : public CPUConvolution {
public:
FloatExecution(const Convolution2DCommon *common, Backend *b, const float *originWeight,
size_t originWeightSize, const float *bias, size_t biasSize);
virtual ~FloatExecution();
virtual ErrorCode onExecute(const std::vector<Tensor *> &inputs,
const std::vector<Tensor *> &outputs) override {
return mOrigin->onExecute(mTempInputs, outputs);
}
virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override {
mTempInputs = {inputs[0], mResource->mWeight.get(), mResource->mBias.get()};
return mOrigin->onResize(mTempInputs, outputs);
}
virtual bool onClone(Backend* bn, const Op* op, Execution** dst) override;
private:
FloatExecution(std::shared_ptr<Resource> resource, const Convolution2DCommon* common, Backend* b) : CPUConvolution(common, b) {
mResource = resource;
mOrigin.reset(new BasicFloatExecution(common, b));
}
std::shared_ptr<CPUConvolution::Resource> mResource;
std::vector<Tensor *> mTempInputs;
std::unique_ptr<BasicFloatExecution> mOrigin;
};
};
} // namespace MNN
#endif /* CPUConvolutionDepthwise_hpp */