//
// CPUConvolution.hpp
// MNN
//
// Created by MNN on 2018/07/15.
// Copyright © 2018, Alibaba Group Holding Limited
//
#ifndef CPUConvolution_hpp
#define CPUConvolution_hpp
#include "CPUBackend.hpp"
#include "core/ConvolutionCommon.hpp"
namespace MNN {
// Base Execution for CPU convolution operators. Holds the shared convolution
// parameters (Convolution2DCommon), resolves per-resize padding, and exposes
// weight-reordering helpers used by concrete convolution implementations.
class CPUConvolution : public Execution {
public:
    // convOp: shared convolution parameters (kernel, stride, pad mode, ...);
    //         not owned — must outlive this Execution.
    // b: backend this execution runs on.
    CPUConvolution(const Convolution2DCommon *convOp, Backend *b);
    virtual ~CPUConvolution() = default;
    // Recomputes mPadX / mPadY from the current input/output shapes.
    virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;

    // Post-process callback applied to the convolution output
    // (presumably bias-add and/or activation — defined by the concrete kernel).
    // dst: output data, bias: per-channel values, planeNumber: elements per
    // plane, biasNumber: number of channels.
    typedef void (*POSTFUNCTION)(float *dst, const float *bias, size_t planeNumber, size_t biasNumber);
    POSTFUNCTION getPostFunction() const;

    // Element count needed to store a depth x outputCount x kernelSize weight
    // tensor once reordered into (unitDepth, unitOC) tiles
    // (i.e. with both axes rounded up to their unit size — TODO confirm).
    static int reorderWeightSize(int depth, int outputCount, int kernelSize, int unitDepth, int unitOC);
    // Inefficient but need not cache, use it when speed insensitive (init, onResize)
    template<typename T> static void reorderWeightSlow(T* dest, const T* source, size_t depth, size_t outputCount, size_t kernelSize,
                                                       size_t unitDepth, size_t unitOC, bool transpose = false);
    /* Inefficient because of not use memcpy to support different type copy (T -> U), use it when speed insensitive (init, onResize)
     return: False if acquire failed
     */
    template<typename T, typename U> static bool acquireMemoryAndCopy(std::shared_ptr<Tensor> dest, const T* source, size_t count, Backend*);

    // Post-processing parameters for the current op (semantics defined by the
    // concrete implementation — e.g. activation bounds; verify against callers).
    std::vector<float> getPostParameters() const;

protected:
    // Shared convolution description; not owned.
    const Convolution2DCommon *mCommon;
    // In execute, use pad from mPadX and mPadY, don't use mCommon's pad
    // (mutable: refreshed in onResize even through const access paths).
    mutable int mPadX;
    mutable int mPadY;
    CPUConvolution::POSTFUNCTION mPostFunction;
};
} // namespace MNN
#endif /* CPUConvolution_hpp */