MNN/source/core/Pipeline.hpp

//
// Pipeline.hpp
// MNN
//
// Created by MNN on 2019/01/14.
// Copyright © 2018, Alibaba Group Holding Limited
//
#ifndef Pipeline_hpp
#define Pipeline_hpp
#include "Schedule.hpp"
#include "core/Execution.hpp"
#include "geometry/GeometryComputer.hpp"
namespace MNN {
struct OperatorInfo::Info {
    std::string name;
    std::string type;
    float flops = 0.0f;
};
class SizeComputer;
/** Pipeline. One session may contain multiple pipelines, and one pipeline may contain more than one unit. */
class Pipeline : public NonCopyable {
public:
    struct TuningAttr {
        bool autoSetOpType;
        int maxTuningNumber;
    };
    Pipeline(const std::string& externalFile, Schedule::PipelineInfo&& info, bool allocInput, bool outputStatic, const TuningAttr& tune, const Runtime* rt, const Runtime* cpuRt);
    ~Pipeline();
    ErrorCode fixResizeCache();
    void openResizeCheck();
    class UnitInfo : public OperatorInfo {
    public:
        UnitInfo() = default;
        virtual ~UnitInfo() = default;
        // Presumably fills name / type / flops (see OperatorInfo::Info above) from the origin op.
        void setUp(const Command& cmd, int index, const Op* originOp, int totalIndex);
    };
public:
    /** encode:
        1. compute shapes for every op's inputs and outputs;
        2. apply geometry transforms;
        3. copy the op and its input/output tensor info to mBuffer
        static model: step 3 only; dynamic model: steps 1, 2, 3
     */
    ErrorCode encode(bool supportDebug = false, bool permitCodegen = false);
    /** allocMemory: create an Execution and allocate memory for every op */
    ErrorCode allocMemory(bool firstMalloc, bool permitCodegen);
    /** execute this pipeline */
    ErrorCode execute();
    ErrorCode executeCallBack(const TensorCallBackWithInfo& before, const TensorCallBackWithInfo& after);
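    /* A minimal lifecycle sketch, inferred from the declarations above (Session
       normally drives these calls internally; the flag values here are assumptions):

           Pipeline pipeline(externalFile, std::move(info), true, false, tune, rt, cpuRt);
           pipeline.encode();                  // 1. shape inference + geometry transform
           pipeline.allocMemory(true, false);  // 2. create Executions, allocate tensors
           pipeline.execute();                 // 3. run every op in schedule order

       Or with per-op callbacks (TensorCallBackWithInfo is declared in Interpreter.hpp
       as std::function<bool(const std::vector<Tensor*>&, const OperatorInfo*)>):

           TensorCallBackWithInfo before = [](const std::vector<Tensor*>&, const OperatorInfo* info) {
               MNN_PRINT("running %s\n", info->name().c_str());
               return true; // the return value controls whether execution continues
           };
           pipeline.executeCallBack(before, before);
     */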
    Schedule::PipelineInfo& getPipelineInfo() {
        return mInfo;
    }
    float flops() const {
        return mFlops;
    }
    friend class Session;
    MNNForwardType getMainForwardType() const {
        return mInfo.first.cache.first->type();
    }
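    // Hedged note (the typedef below is undocumented): it appears to key a cached,
    // wrapped tensor on the (tensor description, backend) pair, so wrap tensors
    // created for cross-backend use can be reused rather than recreated.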
    typedef std::map<std::pair<Tensor::InsideDescribe::NativeInsideDescribe*, Backend*>, std::pair<std::weak_ptr<Tensor::InsideDescribe::NativeInsideDescribe>, std::shared_ptr<Tensor>>> WrapTensorCache;
private:
    ErrorCode _allocForTensor(int index, bool allocInput);
    void _copyInputs();
    void _pushTuningTask(std::vector<Schedule::OpCacheInfo>&& initInfos);
    void _recycleDynamicMemory(Command* command);
    Schedule::PipelineInfo mInfo;
    bool mAllocInput;
    bool mOutputStatic;
    TuningAttr mTuneAttr;
    float mFlops = 0.0f;
    bool mIsQuantModel = false;
    // For GPU or other backends
    std::map<Tensor*, std::shared_ptr<Tensor>> mCacheConstTensors;
    WrapTensorCache mWrapTensors;
#ifndef MNN_BUILD_MINI
    GeometryComputer::Context mContext;
    Runtime::CompilerType mUseGeometry;
#endif
    const Runtime* mRuntime;
    const Runtime* mCpuRuntime;
    std::string mExternalFile;
    std::vector<std::shared_ptr<BufferStorage>> mExternalStorage;
};
} // namespace MNN
#endif /* Pipeline_hpp */