//
// Session.cpp
// MNN
//
// Created by MNN on 2018/07/30.
// Copyright © 2018, Alibaba Group Holding Limited
//

#include "core/Session.hpp"
#include <string.h>
#include <MNN/AutoTime.hpp>
#include <map>
#include <set>
#include "MNN_generated.h"
#include "core/AutoStorage.h"
#include "core/RuntimeFactory.hpp"
#include "core/TensorUtils.hpp"
#include "core/WrapExecution.hpp"

using namespace std;
namespace MNN {
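// Build a session from a schedule: one Pipeline per scheduled unit. Each
// pipeline gets a primary backend created by the runtime chosen for its
// forward type, plus a CPU backend used as a fallback for ops the primary
// backend cannot execute (when the primary backend is already CPU, the two
// are shared).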
Session::Session(Schedule::ScheduleInfo&& info, Interpreter::SessionMode callBackMode,
                 Interpreter::SessionMode inputMode, RuntimeInfo&& runtime) {
    mRuntime = std::move(runtime);
    if (info.pipelineInfo.empty()) {
        mValid = false;
        return;
    }
    Backend::Info defaultInfo;
    defaultInfo.type      = MNN_FORWARD_CPU;
    defaultInfo.numThread = 1;
    mTensors = std::move(info.allTensors);
    for (auto& iter : info.pipelineInfo) {
        auto rt         = mRuntime.first.find(iter.first.type)->second.get();
        auto cpuRuntime = mRuntime.second;
        std::shared_ptr<Backend> first(rt->onCreate());
        std::shared_ptr<Backend> second;
        if (first->type() == MNN_FORWARD_CPU) {
            second = first;
        } else {
            second.reset(cpuRuntime->onCreate());
        }
        std::shared_ptr<Pipeline> newPipeline(new Pipeline(std::move(iter.second), first, second,
                                                           inputMode == Interpreter::Session_Input_Inside,
                                                           rt->onGetCompilerType() == Runtime::Compiler_Geometry));
        mPipelines.emplace_back(std::move(newPipeline));
    }
    mInputs       = std::move(info.inputTensors);
    mOutputs      = std::move(info.outputTensor);
    mCallBackMode = callBackMode;
}
Session::~Session() {
    for (auto& t : mTensors) {
        TensorUtils::clearHandleData(t.second.get());
    }
    mPipelines.clear();
    mRuntime.first.clear();
    mTensors.clear();
    mRuntime.second = nullptr;
}
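// Cache load/store is delegated to the runtimes: the first runtime that
// accepts the buffer (or reports a non-empty cache) wins, so with a single
// scheduled runtime this behaves as a plain pass-through.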
bool Session::loadCache(const void* buffer, size_t size) {
    for (auto iter : mRuntime.first) {
        auto res = iter.second->onSetCache(buffer, size);
        if (res) {
            return true;
        }
    }
    return false;
}
std::pair<const void*, size_t> Session::getCache() {
    for (auto iter : mRuntime.first) {
        auto res = iter.second->onGetCache();
        if (res.first != nullptr) {
            return res;
        }
    }
    return std::make_pair(nullptr, 0);
}
void Session::cloneExecution(const std::map<const Op*, std::shared_ptr<Execution>>& cache, int pipelineIndex) {
    mPipelines[pipelineIndex]->cloneExecution(cache);
}
const std::map<const Op*, std::shared_ptr<Execution>>& Session::getExecution(int pipelineIndex) {
    return mPipelines[pipelineIndex]->getCache();
}
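// Both run paths refuse to execute while mNeedResize is set: tensor shapes
// and memory are only valid after resize() has completed. A minimal usage
// sketch, assuming the usual Interpreter-driven flow (error handling omitted):
//
//   interpreter->resizeSession(session);              // encode + allocate
//   ErrorCode code = interpreter->runSession(session);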
ErrorCode Session::run() const {
    if (mNeedResize) {
        MNN_ERROR("Can't run session because it hasn't been resized\n");
        return COMPUTE_SIZE_ERROR;
    }
    for (auto& iter : mPipelines) {
        auto error = iter->execute();
        if (NO_ERROR != error) {
            return error;
        }
    }
    return NO_ERROR;
}
ErrorCode Session::runWithCallBack(const TensorCallBackWithInfo& before, const TensorCallBackWithInfo& end,
                                   bool sync) const {
    if (mNeedResize) {
        MNN_ERROR("Can't run session because it hasn't been resized\n");
        return COMPUTE_SIZE_ERROR;
    }
    for (auto& iter : mPipelines) {
        auto error = iter->executeCallBack(before, end);
        if (NO_ERROR != error) {
            return error;
        }
    }
    return NO_ERROR;
}
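// Reset the per-tensor descriptors (use counts, backend ownership, and
// geometry regions) so a dynamic resize can re-plan memory from scratch.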
void Session::_clearCache() {
    for (auto& t : mTensors) {
        auto describe = TensorUtils::getDescribe(t.second.get());
        TensorUtils::clearHandleData(t.second.get());
        describe->useCount = 0;
        describe->backend  = nullptr;
        describe->regions.clear();
    }
}
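// resize() re-encodes every pipeline and (re)allocates memory. The runtimes
// are asked to collect garbage at a high level (100) before planning and at
// a low level (0) afterwards. (onGabageCollect is the runtime API's own
// spelling.)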
ErrorCode Session::resize(bool isStatic) {
    for (auto& iter : mRuntime.first) {
        iter.second->onGabageCollect(100);
    }
    if (!isStatic) {
        _clearCache();
    }
    bool debug = mCallBackMode == Interpreter::Session_Debug;
    // Turn each pipeline into a command buffer and allocate its resources.
    // TODO: Separate schedule and malloc
    for (auto& iter : mPipelines) {
        auto error = iter->encode(isStatic);
        if (NO_ERROR != error) {
            return error;
        }
        error = iter->allocMemory(debug);
        if (NO_ERROR != error) {
            return error;
        }
    }
    mNeedResize = false;
    for (auto& iter : mRuntime.first) {
        iter.second->onGabageCollect(0);
    }
    return NO_ERROR;
}
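// Usage sketch for the MEMORY query, assuming the public
// Interpreter::getSessionInfo entry point forwards here (the float receives
// the summed footprint in MB across all runtimes):
//
//   float memoryMB = 0.0f;
//   interpreter->getSessionInfo(session, MNN::Interpreter::MEMORY, &memoryMB);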
bool Session::getInfo(Interpreter::SessionInfoCode code, void* ptr) const {
    switch (code) {
        case Interpreter::MEMORY: {
            auto dst     = (float*)ptr;
            float summer = mRuntime.second->onGetMemoryInMB();
            for (auto& r : mRuntime.first) {
                summer += r.second->onGetMemoryInMB();
            }
            *dst = summer;
            return true;
        } break;
        // TODO: Support other debug info
        default:
            break;
    }
    return false;
}
const Backend* Session::getBackEnd(const Tensor* tensor) const {
    return TensorUtils::getDescribe(tensor)->backend;
}
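// Lookup helpers for named I/O tensors. With a null name they fall back to
// the first entry, which is convenient for single-input/single-output models.
// A usage sketch via the public API ("prob" is a hypothetical output name):
//
//   MNN::Tensor* input  = interpreter->getSessionInput(session, nullptr);
//   MNN::Tensor* output = interpreter->getSessionOutput(session, "prob");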
Tensor* Session::getInput(const char* name) const {
    MNN_ASSERT(!mInputs.empty());
    if (nullptr == name) {
        return mInputs.begin()->second;
    }
    auto iter = mInputs.find(name);
    if (iter == mInputs.end()) {
        MNN_PRINT("Error: can't find input: %s\n", name);
        return nullptr;
    }
    return iter->second;
}
Tensor* Session::getOutput(const char* name) const {
    MNN_ASSERT(!mOutputs.empty());
    if (nullptr == name) {
        return mOutputs.begin()->second;
    }
    auto iter = mOutputs.find(name);
    if (iter == mOutputs.end()) {
        MNN_PRINT("Error: can't find output: %s\n", name);
        return nullptr;
    }
    return iter->second;
}
const std::map<std::string, Tensor*>& Session::getInputAll() const {
    return mInputs;
}
const std::map<std::string, Tensor*>& Session::getOutputAll() const {
    return mOutputs;
}
ErrorCode Session::releaseCache() {
    return NO_ERROR;
}
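// Write trained parameters back into the flatbuffer Net: for TRAIN usage this
// targets TrainableParam ops, for inference usage Const ops. Only ops with a
// single float output blob are updated, and device-resident tensors are
// copied back to host before the memcpy below.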
ErrorCode Session::updateToModel(Net* net) const {
    int opSize = net->oplists()->size();
    for (int i = 0; i < opSize; ++i) {
        auto op = net->oplists()->GetAs<Op>(i);
        if ((net->usage() == Usage_INFERENCE || net->usage() == Usage_INFERENCE_STATIC) && op->type() != OpType_Const) {
            continue;
        }
        if (net->usage() == Usage_TRAIN && op->type() != OpType_TrainableParam) {
            continue;
        }
        if (!op->outputIndexes() || op->outputIndexes()->size() != 1) {
            continue;
        }
        auto index = op->outputIndexes()->data()[0];
        auto blob  = op->main_as_Blob();
        if (blob->dataType() != DataType_DT_FLOAT) {
            continue;
        }
        std::shared_ptr<Tensor> tensor = mTensors[index].second;
        if (tensor->host<void>() == nullptr && tensor->deviceId() != 0) {
            // The tensor lives on a device backend; copy it back to host first.
            tensor.reset(Tensor::createHostTensorFromDevice(tensor.get(), true));
            if (tensor.get() == nullptr) {
                MNN_ERROR("failed to copy trained param from device to host\n");
                return INVALID_VALUE;
            }
        }
        ::memcpy((void*)blob->float32s()->data(), tensor->host<float>(), tensor->size());
    }
    return NO_ERROR;
}
} // namespace MNN