MNN/source/core/ConvolutionCommon.hpp

//
//  ConvolutionCommon.hpp
//  MNN
//
//  Created by MNN on 2020/03/02.
//  Copyright © 2018, Alibaba Group Holding Limited
//

#ifndef ConvolutionCommon_hpp
#define ConvolutionCommon_hpp
#include "AutoStorage.h"
#include "Execution.hpp"
#include "MNN_generated.h"
namespace MNN {
/**
 * Shared declarations used by convolution executions: loading of (quantized)
 * weights, padding computation and the parameter block consumed by im2col.
 * Only declarations live in this header; the definitions are elsewhere.
 */
class MNN_PUBLIC ConvolutionCommon : public Execution {
public:
    /**
     * Weight bundle handed back by load().
     * Every scalar member carries a default initializer so that a freshly
     * constructed instance never exposes indeterminate values, regardless of
     * how it is allocated (e.g. `new Int8Common` vs. value-initialization).
     */
    struct Int8Common {
        AutoStorage<int8_t> weight;      // presumably the quantized weight values — confirm against load()
        AutoStorage<float> alpha;        // presumably the dequantization coefficients — confirm against load()
        AutoStorage<float> weightFloat;  // presumably the float form of the weights — confirm against load()
        const IDSTQuan* quan = nullptr;  // non-owning pointer into the flatbuffer description; null until set
        bool asymmetric = false;
        std::vector<int8_t> weightMap;
        bool canUseInt4 = false;
        Backend* backend = nullptr;
        int originBits = 8;
        int alphaSize = 0;               // NOTE(review): looks like the element count of `alpha` — confirm
    };

    /**
     * Load the weight bundle described by `op`.
     * @param op          operator whose weights are loaded.
     * @param backend     optional backend, defaults to nullptr.
     * @param forceFloat  defaults to false.
     * @param forceInt8   defaults to false.
     * @param weightPtr   optional caller-provided weight pointer, defaults to nullptr.
     * @return shared pointer to the resulting Int8Common.
     */
    static std::shared_ptr<Int8Common> load(const Op* op, Backend* backend = nullptr, bool forceFloat = false, bool forceInt8 = false, void* weightPtr = nullptr);

    /** Query the quant bit width from the external file; returns 0 when it cannot be obtained. */
    static int getQuantBitFromExternalFile(const Op* op);

    /**
     * Fetch the convolution weight for `op`.
     * `quanCommon`, `originWeight` and `originWeightSize` are pointer parameters,
     * presumably written by the callee as outputs — confirm against the definition.
     */
    static void getConvParameters(std::shared_ptr<ConvolutionCommon::Int8Common> *quanCommon, Backend* backend, const MNN::Op *op, const float** originWeight, int* originWeightSize);

    /**
     * Int8 counterpart of getConvParameters().
     * `quanCommon`, `weight` and `weightSize` are taken by non-const reference;
     * `scale` and `bias` are caller-provided buffers.
     * NOTE(review): the meaning of the bool result and the required buffer
     * sizes (likely related to `ocUp4`) are not visible here — confirm.
     */
    static bool getConvInt8Parameters(const MNN::Op* op, std::shared_ptr<Int8Common>& quanCommon, Backend* backend,
                                      const int8_t*& weight, int& weightSize, float* scale, int32_t* bias, int ocUp4);

    /** @return {padX, padY} for a convolution. */
    static std::pair<int, int> convolutionPad(const Tensor* input, const Tensor* output,
                                              const Convolution2DCommon* common);

    /** @return {padLeft, padTop, padRight, padBottom} for a convolution. */
    static std::tuple<int, int, int, int> convolutionPadFull(const Tensor* input, const Tensor* output,
                                              const Convolution2DCommon* common);

    /** Pad computation for transposed convolution; returns a pair like convolutionPad(). */
    static std::pair<int, int> convolutionTransposePad(const Tensor* input, const Tensor* output,
                                                       const Convolution2DCommon* common);

    /**
     * Flat parameter block for im2col.
     * Intentionally left without default member initializers so the struct's
     * aggregate status and layout are unchanged; whoever creates one is
     * responsible for filling every field.
     */
    struct Im2ColParameter {
        int32_t padX;
        int32_t padY;
        int32_t dilateX;
        int32_t dilateY;
        int32_t strideX;
        int32_t strideY;
        int32_t kernelX;
        int32_t kernelY;
        int32_t icDiv4;
        int32_t kernelCountUnit;
        int32_t iw;
        int32_t ih;
        int32_t ow;
        int32_t oh;
        int32_t srcZStep;
        int32_t srcYStep;
        int32_t packCUnit;
        int32_t destICStride;
        int32_t ic; // ic packed by LP, used by im2col dst data.
        int32_t icup4; // ic packed by LP, used by im2col src data.
    };
};
} // namespace MNN
#endif
[PATCH 070/160] [MNN:Refract] Seperate the load of quan and half to ConvolutionCommon 2020-03-02 22:13:38 +08:00			`//`
			`// ConvolutionCommon.hpp`
			`// MNN`
			`//`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`// Created by MNN on 2020/03/02.`
[PATCH 070/160] [MNN:Refract] Seperate the load of quan and half to ConvolutionCommon 2020-03-02 22:13:38 +08:00			`// Copyright © 2018, Alibaba Group Holding Limited`
			`//`
Github release 1.1.0 2020-11-05 16:41:56 +08:00
[PATCH 070/160] [MNN:Refract] Seperate the load of quan and half to ConvolutionCommon 2020-03-02 22:13:38 +08:00			`#ifndef ConvolutionCommon_hpp`
			`#define ConvolutionCommon_hpp`
			`#include "AutoStorage.h"`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`#include "Execution.hpp"`
			`#include "MNN_generated.h"`
[PATCH 070/160] [MNN:Refract] Seperate the load of quan and half to ConvolutionCommon 2020-03-02 22:13:38 +08:00			`namespace MNN {`
			`class MNN_PUBLIC ConvolutionCommon : public Execution {`
			`public:`
			`struct Int8Common {`
			`AutoStorage<int8_t> weight;`
			`AutoStorage<float> alpha;`
			`AutoStorage<float> weightFloat;`
			`const IDSTQuan* quan;`
[MNN:Sync] Sync Internal Gitlab: 2.5.1 2023-05-18 19:11:50 +08:00			`bool asymmetric;`
			`std::vector<int8_t> weightMap;`
			`bool canUseInt4 = false;`
[MNN:Sync] Sync Internal 2.7.1 2023-09-20 20:16:25 +08:00			`Backend* backend = nullptr;`
MNN:Sync: Sync Internal 3.0.0 2024-11-18 14:37:45 +08:00			`int originBits = 8;`
MNN:Sync: Sync Internal 3.1.1 2025-03-12 11:35:16 +08:00			`int alphaSize;`
[PATCH 070/160] [MNN:Refract] Seperate the load of quan and half to ConvolutionCommon 2020-03-02 22:13:38 +08:00			`};`
MNN:Sync: Sync Internal 3.1.3 2025-04-28 11:38:44 +08:00			`static std::shared_ptr<Int8Common> load(const Op* op, Backend* backend = nullptr, bool forceFloat = false, bool forceInt8 = false, void* weightPtr = nullptr);`
			`// if can not get quant bits, return 0`
			`static int getQuantBitFromExternalFile(const Op* op);`
MNN:Sync: Sync Internal 2.9.4 2024-08-24 15:46:21 +08:00			`static void getConvParameters(std::shared_ptr<ConvolutionCommon::Int8Common> *quanCommon, Backend* backend, const MNN::Op *op, const float** originWeight, int* originWeightSize);`
			`static bool getConvInt8Parameters(const MNN::Op* op, std::shared_ptr<Int8Common>& quanCommon, Backend* backend,`
[MNN:Sync] Sync Internal 3.1.4. 2025-05-08 12:39:44 +08:00			`const int8_t*& weight, int& weightSize, float* scale, int32_t* bias, int ocUp4);`
Github release 1.1.0 2020-11-05 16:41:56 +08:00
[PATCH 114/160] [MNN:Refractor] Seperate the pad compute for convolution and deconvolution 2020-03-12 20:29:43 +08:00			`// Return padX, padY`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`static std::pair<int, int> convolutionPad(const Tensor* input, const Tensor* output,`
			`const Convolution2DCommon* common);`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`// Return padLeft, padTop, padRight, padBottom`
			`static std::tuple<int, int, int, int> convolutionPadFull(const Tensor* input, const Tensor* output,`
			`const Convolution2DCommon* common);`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`static std::pair<int, int> convolutionTransposePad(const Tensor* input, const Tensor* output,`
			`const Convolution2DCommon* common);`
			`struct Im2ColParameter {`
			`int32_t padX;`
			`int32_t padY;`
			`int32_t dilateX;`
			`int32_t dilateY;`
			`int32_t strideX;`
			`int32_t strideY;`
			`int32_t kernelX;`
			`int32_t kernelY;`
			`int32_t icDiv4;`
			`int32_t kernelCountUnit;`
			`int32_t iw;`
			`int32_t ih;`
			`int32_t ow;`
			`int32_t oh;`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`int32_t srcZStep;`
			`int32_t srcYStep;`
[MNN:Sync] Sync internal Gitlab 2021-09-18 15:52:30 +08:00			`int32_t packCUnit;`
			`int32_t destICStride;`
MNN:Sync: Sync Internal 3.0.4 2025-01-22 14:47:50 +08:00			`int32_t ic; // ic packed by LP, used by im2col dst data.`
			`int32_t icup4; // ic packed by LP, used by im2col src data.`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`};`
[PATCH 070/160] [MNN:Refract] Seperate the load of quan and half to ConvolutionCommon 2020-03-02 22:13:38 +08:00			`};`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`} // namespace MNN`
[PATCH 114/160] [MNN:Refractor] Seperate the pad compute for convolution and deconvolution 2020-03-12 20:29:43 +08:00			`#endif`