MNN/source/backend/cpu/OneDNNConvInt8.hpp

//
//  OneDNNConvInt8.hpp
//
//

#ifndef OneDNNConvInt8_hpp
#define OneDNNConvInt8_hpp

#include "backend/cpu/CPUConvolution.hpp"
#include "dnnl.hpp"

using namespace dnnl;
namespace MNN {

class OneDNNConvInt8 : public CPUConvolution {
public:
    struct Resource : public CPUConvolution::Resource {
        memory conv_weights;
        memory conv_bias;
        primitive_attr conv_attr;
        engine eng;
    };
    static Execution* create(Backend *backend, const MNN::Op* op, const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs);
    OneDNNConvInt8(std::shared_ptr<OneDNNConvInt8::Resource> resource, const MNN::Convolution2DCommon* common, Backend* bn);
    virtual ~OneDNNConvInt8();
    virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
    virtual ErrorCode onExecute(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
    virtual bool onClone(Backend* bn, const Op* op, Execution** dst) override;

private:
    std::shared_ptr<OneDNNConvInt8::Resource> mResource;
    stream stm;
    convolution_forward conv;
    std::shared_ptr<Tensor> mSrcTemp;
    std::shared_ptr<Tensor> mDstTemp;
    memory user_src;
    memory user_dst;
    memory conv_src;
    memory conv_dst;
};
} // namespace MNN
#endif /* OneDNNConvInt8_hpp */
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`//`
			`// OneDNNConvInt8.hpp`
			`//`
			`//`

			`#ifndef OneDNNConvInt8_hpp`
			`#define OneDNNConvInt8_hpp`

			`#include "backend/cpu/CPUConvolution.hpp"`
			`#include "dnnl.hpp"`

			`using namespace dnnl;`
			`namespace MNN {`

			`class OneDNNConvInt8 : public CPUConvolution {`
			`public:`
			`struct Resource : public CPUConvolution::Resource {`
			`memory conv_weights;`
			`memory conv_bias;`
			`primitive_attr conv_attr;`
			`engine eng;`
			`};`
align OneDNNConvInt8 with updated function signature 2025-06-24 09:43:53 +08:00			`static Execution* create(Backend *backend, const MNN::Op* op, const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs);`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`OneDNNConvInt8(std::shared_ptr<OneDNNConvInt8::Resource> resource, const MNN::Convolution2DCommon* common, Backend* bn);`
			`virtual ~OneDNNConvInt8();`
			`virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;`
			`virtual ErrorCode onExecute(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;`
			`virtual bool onClone(Backend* bn, const Op* op, Execution** dst) override;`

			`private:`
			`std::shared_ptr<OneDNNConvInt8::Resource> mResource;`
			`stream stm;`
			`convolution_forward conv;`
			`std::shared_ptr<Tensor> mSrcTemp;`
			`std::shared_ptr<Tensor> mDstTemp;`
			`memory user_src;`
			`memory user_dst;`
			`memory conv_src;`
			`memory conv_dst;`
			`};`
			`} // namespace MNN`
			`#endif /* OneDNNConvInt8_hpp */`