MNN/source/backend/cpu/compute/SparseConvolutionTiledExecu...

//
//  SparseConvolutionTiledExecutor
//  MNN
//
//  Created by MNN on 2021/04/06.
//  Copyright © 2018-2021 Alibaba Group Holding Limited.
//

#ifndef SparseConvolutionTiledExecutor_hpp
#define SparseConvolutionTiledExecutor_hpp

#include <functional>
#include "backend/cpu/CPUConvolution.hpp"
#include "ConvolutionTiledExecutor.hpp"
// Tiled Slide Window or Im2Col + GEMM
// Sparsity threshold used by SparseConvolutionTiledExecutor: the fraction of
// the original weights that must be zero (i.e. not counted in "NNZElement")
// for shouldUseSparseConvolution() to return true. The macro is private to
// this header and is #undef'd before the include guard closes.
#define SPARSITY_THRESHOLD (0.3f)
namespace MNN {

// Pointer-to-function type for a packed sparse matmul kernel. The kernel
// receives the output buffer C, the operands A and B, an element count,
// two parameter arrays, a bias array, and the two sparse index buffers
// (NNZMap and dataOffsetMap).
using MNNPackedSparseMatMul = void (*)(float* C,
                                       const float* A,
                                       const float* B,
                                       size_t eSize,
                                       const size_t* parameter,
                                       const float* postParameters,
                                       const float* bias,
                                       unsigned int* NNZMap,
                                       int* dataOffsetMap);

/**
 * Sparse specialisation of ConvolutionTiledImpl.
 *
 * In addition to the base-class state it stores the packed sparse matmul
 * kernel pointer and the sparse block size handed in at construction.
 */
class SparseConvolutionTiledImpl : public ConvolutionTiledImpl {
public:
    /**
     * @param common              convolution description, forwarded to the base class.
     * @param packedSparseMatmul  kernel pointer stored in mPackedSparseMatmul.
     * @param sparseBlockOC       value stored in mSparseBlockOC (presumably the sparse
     *                            block size along output channels -- confirm in the .cpp).
     * @param b                   backend, forwarded to the base class.
     */
    SparseConvolutionTiledImpl(const Convolution2DCommon *common, MNNPackedSparseMatMul packedSparseMatmul,
                               int sparseBlockOC, Backend *b)
        // The base sub-object is always constructed before any member, so it is
        // listed first: the written order now matches the real order (no -Wreorder).
        : ConvolutionTiledImpl(common, b),
          mPackedSparseMatmul{packedSparseMatmul},
          mSparseBlockOC{sparseBlockOC} {
    }
    virtual ~SparseConvolutionTiledImpl() = default;

    /**
     * Resize entry point that additionally receives the two sparse index tensors.
     * SparseConvolutionTiledExecutor::onResize calls this with its NNZ map and
     * data-offset map. Defined out of line.
     */
    virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs, Tensor* NNZMap, Tensor* dataOffsetMap);

    /** Overrides the base-class query; writes results through eP, lP and hP. Defined out of line. */
    void getPackParameter(int* eP, int* lP, int* hP, const CoreFunctions* core) override;
public:
    MNNPackedSparseMatMul mPackedSparseMatmul; // kernel pointer supplied to the constructor
    int mSparseBlockOC;                        // sparseBlockOC value supplied to the constructor
};

/**
 * Execution wrapper for sparse tiled convolution.
 *
 * onResize / onExecute are forwarded to a SparseConvolutionTiledImpl proxy;
 * this class holds the proxy together with the NNZ map and data-offset map
 * tensors that are handed to the proxy on resize.
 */
class SparseConvolutionTiledExecutor : public ConvolutionTiledExecutor {
public:
    /**
     * Construct from the original weight and bias arrays plus the sparse
     * description. Defined out of line.
     */
    SparseConvolutionTiledExecutor(const Convolution2DCommon *common, Backend *b, const float *originWeight,
                                   size_t originWeightSize, const SparseCommon* sparseCommon, const float *bias, size_t biasSize);

    /**
     * Construct from an existing resource and existing sparse index tensors
     * (presumably the path used by onClone -- confirm in the .cpp). Defined out of line.
     */
    SparseConvolutionTiledExecutor(std::shared_ptr<CPUConvolution::Resource> res, std::shared_ptr<Tensor> NNZMapSharePtr, std::shared_ptr<Tensor> dataOffsetMapSharePtr,
                                  const Convolution2DCommon *common, MNNPackedSparseMatMul packedSparseMatmul, int sparseBlockOC, Backend *b);
    virtual ~SparseConvolutionTiledExecutor();

    /** Forwards execution to the proxy implementation. */
    virtual ErrorCode onExecute(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override {
        return mProxy->onExecute(inputs, outputs);
    }

    /**
     * Rebuilds mInputs as {first input, weight tensor, bias tensor} and forwards
     * to the proxy together with the NNZ map and data-offset map tensors.
     */
    virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override {
        mInputs = {inputs[0], mResource->mWeight.get(), mResource->mBias.get()};
        return mProxy->onResize(mInputs, outputs, mNNZMap.get(), mDataOffsetMap.get());
    }
    virtual bool onClone(Backend *bn, const Op *op, Execution **dst) override;

    /** Fills dest, NNZMap and dataOffsetMap from source. Defined out of line. */
    void initWeight(float *dest, unsigned int *NNZMap, int *dataOffsetMap, int sparseBlockOC, const float *source,
                    float *cache, int depth, int outputCount, int kernelSize, int eP, size_t weightNNZElement,
                    size_t weightBlockNumber, const CoreFunctions *function);

    /**
     * Decide whether the sparse path should be used.
     *
     * Returns true when the number of zero weights
     * (originWeightSize minus the "NNZElement" argument of sparseCommon) is at
     * least originWeightSize * SPARSITY_THRESHOLD.
     *
     * Returns false instead of crashing or wrapping around when the sparse
     * description is missing, lacks the "NNZElement" entry, or reports a count
     * that is negative or larger than originWeightSize.
     */
    static bool shouldUseSparseConvolution(size_t originWeightSize, const SparseCommon* sparseCommon) {
        if (sparseCommon == nullptr) {
            return false;
        }
        const auto* sparseArgs = sparseCommon->args();
        if (sparseArgs == nullptr) {
            return false;
        }
        const auto* nnzAttr = sparseArgs->LookupByKey("NNZElement");
        if (nnzAttr == nullptr) {
            return false;
        }
        const auto nnzElement = nnzAttr->i();
        // The subtraction below is unsigned: a negative or oversized count would
        // wrap to a huge "zero count" and wrongly select the sparse path.
        if (nnzElement < 0 || static_cast<size_t>(nnzElement) > originWeightSize) {
            return false;
        }
        const size_t zeroElement = originWeightSize - static_cast<size_t>(nnzElement);
        return zeroElement >= originWeightSize * SPARSITY_THRESHOLD;
    }

    /** Returns the sparsity threshold used by shouldUseSparseConvolution(). */
    static float getSparsityThreshold() {
        return SPARSITY_THRESHOLD;
    }
protected:
    std::shared_ptr<SparseConvolutionTiledImpl> mProxy; // implementation that onResize/onExecute forward to
    std::shared_ptr<Tensor> mNNZMap;                    // passed to the proxy as NNZMap on resize
    std::shared_ptr<Tensor> mDataOffsetMap;             // passed to the proxy as dataOffsetMap on resize
};
} // namespace MNN

#undef SPARSITY_THRESHOLD

#endif /* SparseConvolutionTiledExecutor_hpp */
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`//`
			`// SparseConvolutionTiledExecutor`
			`// MNN`
			`//`
			`// Created by MNN on 2021/04/06.`
			`// Copyright © 2018-2021 Alibaba Group Holding Limited.`
			`//`

			`#ifndef SparseConvolutionTiledExecutor_hpp`
			`#define SparseConvolutionTiledExecutor_hpp`

			`#include <functional>`
			`#include "backend/cpu/CPUConvolution.hpp"`
			`#include "ConvolutionTiledExecutor.hpp"`
			`// Tiled Slide Window or Im2Col + GEMM`
			`#define SPARSITY_THRESHOLD (0.3f)`
			`namespace MNN {`

[MNN:Sync] Sync internal gitlab Main Feature: 1. Add OpenCV API and Numpy API Support 2. Protobuf move into MNN 3. Add more op for torchscript convert 4. Add recompute to speed up geometry compute 5. Add ModuleBasic Test 2021-11-30 10:10:53 +08:00			`typedef void(MNNPackedSparseMatMul)(float C, const float* A, const float* B, size_t eSize, const size_t* parameter, const float* postParameters, const float* bias, unsigned int* NNZMap, int* dataOffsetMap);`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00
			`class SparseConvolutionTiledImpl : public ConvolutionTiledImpl {`
			`public:`
[MNN:Sync] Sync internal gitlab Main Feature: 1. Add OpenCV API and Numpy API Support 2. Protobuf move into MNN 3. Add more op for torchscript convert 4. Add recompute to speed up geometry compute 5. Add ModuleBasic Test 2021-11-30 10:10:53 +08:00			`SparseConvolutionTiledImpl(const Convolution2DCommon common, MNNPackedSparseMatMul packedSparseMatmul, int sparseBlockOC, Backend b) : mPackedSparseMatmul{packedSparseMatmul}, mSparseBlockOC{sparseBlockOC}, ConvolutionTiledImpl(common, b) {`

Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`}`
			`virtual ~SparseConvolutionTiledImpl() = default;`
			`virtual ErrorCode onResize(const std::vector<Tensor > &inputs, const std::vector<Tensor > &outputs, Tensor* NNZMap, Tensor* dataOffsetMap);`
			`void getPackParameter(int* eP, int* lP, int* hP, const CoreFunctions* core) override;`
			`public:`
[MNN:Sync] Sync internal gitlab Main Feature: 1. Add OpenCV API and Numpy API Support 2. Protobuf move into MNN 3. Add more op for torchscript convert 4. Add recompute to speed up geometry compute 5. Add ModuleBasic Test 2021-11-30 10:10:53 +08:00			`MNNPackedSparseMatMul mPackedSparseMatmul;`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`int mSparseBlockOC;`
			`};`

			`class SparseConvolutionTiledExecutor : public ConvolutionTiledExecutor {`
			`public:`
			`SparseConvolutionTiledExecutor(const Convolution2DCommon common, Backend b, const float *originWeight,`
			`size_t originWeightSize, const SparseCommon* sparseCommon, const float *bias, size_t biasSize);`

			`SparseConvolutionTiledExecutor(std::shared_ptr<CPUConvolution::Resource> res, std::shared_ptr<Tensor> NNZMapSharePtr, std::shared_ptr<Tensor> dataOffsetMapSharePtr,`
[MNN:Sync] Sync internal gitlab Main Feature: 1. Add OpenCV API and Numpy API Support 2. Protobuf move into MNN 3. Add more op for torchscript convert 4. Add recompute to speed up geometry compute 5. Add ModuleBasic Test 2021-11-30 10:10:53 +08:00			`const Convolution2DCommon common, MNNPackedSparseMatMul packedSparseMatmul, int sparseBlockOC, Backend b);`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`virtual ~SparseConvolutionTiledExecutor();`

			`virtual ErrorCode onExecute(const std::vector<Tensor > &inputs, const std::vector<Tensor > &outputs) override {`
			`return mProxy->onExecute(inputs, outputs);`
			`}`
			`virtual ErrorCode onResize(const std::vector<Tensor > &inputs, const std::vector<Tensor > &outputs) override {`
			`mInputs = {inputs[0], mResource->mWeight.get(), mResource->mBias.get()};`
			`return mProxy->onResize(mInputs, outputs, mNNZMap.get(), mDataOffsetMap.get());`
			`}`
			`virtual bool onClone(Backend bn, const Op op, Execution **dst) override;`

			`void initWeight(float dest, unsigned int NNZMap, int dataOffsetMap, int sparseBlockOC, const float source,`
			`float *cache, int depth, int outputCount, int kernelSize, int eP, size_t weightNNZElement,`
			`size_t weightBlockNumber, const CoreFunctions *function);`

[MNN:Sync] Sync internal Gitlab 2021-09-18 15:52:30 +08:00			`static bool shouldUseSparseConvolution(size_t originWeightSize, const SparseCommon* sparseCommon) {`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`return originWeightSize - sparseCommon->args()->LookupByKey("NNZElement")->i() >= originWeightSize * SPARSITY_THRESHOLD;`
			`}`
[MNN:Sync] Sync internal Gitlab 2021-09-18 15:52:30 +08:00			`static float getSparsityThreshold() {`
			`return SPARSITY_THRESHOLD;`
			`}`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`protected:`
			`std::shared_ptr<SparseConvolutionTiledImpl> mProxy;`
			`std::shared_ptr<Tensor> mNNZMap;`
			`std::shared_ptr<Tensor> mDataOffsetMap;`
			`};`
			`} // namespace MNN`

[MNN:Sync] Sync internal Gitlab 2021-09-18 15:52:30 +08:00			`#undef SPARSITY_THRESHOLD`

Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`#endif /* SparseConvolutionTiledExecutor_hpp */`