MNN/source/backend/cpu/compute/ConvInt8TiledExecutor.hpp

//
//  ConvInt8TiledExecutor.hpp
//  MNN
//
//  Created by MNN on 2019/5/17.
//  Copyright © 2018, Alibaba Group Holding Limited
//

#ifndef ConvInt8TiledExecutor_hpp
#define ConvInt8TiledExecutor_hpp

#include "backend/cpu/CPUConvolution.hpp"
#include "ConvInt8Winograd.hpp"
#include "Int8FunctionsOpt.h"

namespace MNN {

class ConvInt8TiledExecutor : public CPUConvolution {
public:
    // given weight+bias+scale, do post process
    ConvInt8TiledExecutor(Backend* backend, const Convolution2D* convOp, std::shared_ptr<ResourceInt8> res);
    // only given weight, not do post process
    ConvInt8TiledExecutor(Backend* backend, const Convolution2DCommon* common, std::shared_ptr<Tensor> weight, bool fastgemm);
    virtual ~ConvInt8TiledExecutor();
    virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
    virtual ErrorCode onExecute(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
    virtual bool onClone(Backend* bn, const Op* op, Execution** dst) override;
private:
    ConvInt8TiledExecutor(Backend* backend, const Convolution2DCommon* common, const ConvInt8TiledExecutor& exe);
    ConvolutionCommon::Im2ColParameter mIm2ColParamter;
    int mTileCount;
    int mThreadNums;
    std::shared_ptr<Tensor> mTempIm2ColBuffer;
    decltype(CoreInt8Functions::Int8GemmKernel) mGemmKernel;
    bool mDoPostProcess = true; //whether quan post process (add bias, min/max then scale to int8)
    std::shared_ptr<CPUConvolution::ResourceInt8> mResource;
    
    friend class ConvInt8Winograd;
};

} // namespace MNN

#endif /* ConvInt8TiledExecutor_hpp */
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`//`
			`// ConvInt8TiledExecutor.hpp`
			`// MNN`
			`//`
			`// Created by MNN on 2019/5/17.`
			`// Copyright © 2018, Alibaba Group Holding Limited`
			`//`

			`#ifndef ConvInt8TiledExecutor_hpp`
			`#define ConvInt8TiledExecutor_hpp`

			`#include "backend/cpu/CPUConvolution.hpp"`
			`#include "ConvInt8Winograd.hpp"`
			`#include "Int8FunctionsOpt.h"`

			`namespace MNN {`

			`class ConvInt8TiledExecutor : public CPUConvolution {`
			`public:`
			`// given weight+bias+scale, do post process`
			`ConvInt8TiledExecutor(Backend* backend, const Convolution2D* convOp, std::shared_ptr<ResourceInt8> res);`
			`// only given weight, not do post process`
			`ConvInt8TiledExecutor(Backend* backend, const Convolution2DCommon* common, std::shared_ptr<Tensor> weight, bool fastgemm);`
			`virtual ~ConvInt8TiledExecutor();`
			`virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;`
			`virtual ErrorCode onExecute(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;`
			`virtual bool onClone(Backend* bn, const Op* op, Execution** dst) override;`
			`private:`
			`ConvInt8TiledExecutor(Backend* backend, const Convolution2DCommon* common, const ConvInt8TiledExecutor& exe);`
			`ConvolutionCommon::Im2ColParameter mIm2ColParamter;`
			`int mTileCount;`
			`int mThreadNums;`
			`std::shared_ptr<Tensor> mTempIm2ColBuffer;`
			`decltype(CoreInt8Functions::Int8GemmKernel) mGemmKernel;`
			`bool mDoPostProcess = true; //whether quan post process (add bias, min/max then scale to int8)`
			`std::shared_ptr<CPUConvolution::ResourceInt8> mResource;`

			`friend class ConvInt8Winograd;`
			`};`

			`} // namespace MNN`

			`#endif /* ConvInt8TiledExecutor_hpp */`