MNN/express/module/StaticModule.cpp

//
//  StaticModule.cpp
//  MNN
//
//  Created by MNN on b'2020/09/10'.
//  Copyright © 2018, Alibaba Group Holding Limited
//

#include "StaticModule.hpp"
#include <MNN/expr/ExprCreator.hpp>
#include <MNN/AutoTime.hpp>
#include "core/TensorUtils.hpp"
#include "core/Session.hpp"
#include <MNN/expr/Executor.hpp>
#include <MNN/AutoTime.hpp>
#include <MNN/expr/ExecutorScope.hpp>
#include "core/MNNMemoryUtils.h"
#include "core/Schedule.hpp"
#include "Utils.hpp"

namespace MNN {
namespace Express {

struct NetStorage {
    size_t size() const {
        return allocated_size - offset;
    }

    const uint8_t* buffer() const {
        return storage.get() + offset;
    }
    size_t allocated_size;
    size_t offset;
    std::unique_ptr<uint8_t> storage;
};
static std::shared_ptr<NetStorage> preRearrangeWeights(  // NOLINT
    const MNN::Net* net, std::map<const Op*, std::shared_ptr<Execution>>& cache, Backend* backend) {
    std::unique_ptr<MNN::NetT> net_table(net->UnPack());
    std::map<int, std::shared_ptr<Execution>> exeCache;
    for (int i = 0; i < net->oplists()->size(); ++i) {
        auto op = net->oplists()->Get(i);
        auto op_table = net_table->oplists[i].get();
        switch (op->type()) {
            case MNN::OpType_DepthwiseConvInt8:
            case MNN::OpType_ConvInt8:
            case MNN::OpType_ConvolutionDepthwise:
            case MNN::OpType_Convolution: {
                std::shared_ptr<Execution> exe(backend->onCreate({}, {}, op));
                if (nullptr == exe) {
                    break;
                }
                if (!exe->onClone(nullptr, op, nullptr)) {
                    break;
                }
                exeCache.insert(std::make_pair(i, exe));
                if (OpParameter_Convolution2D == op_table->main.type) {
                    op_table->main.AsConvolution2D()->bias.clear();
                    op_table->main.AsConvolution2D()->weight.clear();
                    if (nullptr != op_table->main.AsConvolution2D()->symmetricQuan) {
                        op_table->main.AsConvolution2D()->symmetricQuan->bias.clear();
                        op_table->main.AsConvolution2D()->symmetricQuan->weight.clear();
                    }
                    if (nullptr != op_table->main.AsConvolution2D()->quanParameter) {
                        op_table->main.AsConvolution2D()->quanParameter->alpha.clear();
                        op_table->main.AsConvolution2D()->quanParameter->buffer.clear();
                    }
                }
                break;
            }
            default: {
                break;
            }
        }
    }
    flatbuffers::FlatBufferBuilder builder(1024);
    builder.Finish(MNN::Net::Pack(builder, net_table.get()));
    // Swap the raw buffer ownership.
    std::shared_ptr<NetStorage> net_storage(new NetStorage);
    net_storage->storage.reset(builder.ReleaseRaw(net_storage->allocated_size,  // NOLINT
                                                  net_storage->offset));
    net = GetNet(net_storage->buffer());
    for (auto& iter : exeCache) {
        auto op = net->oplists()->Get(iter.first);
        cache.insert(std::make_pair(op, iter.second));
    }
    for (int i = 0; i < net->oplists()->size(); ++i) {
        auto op = net->oplists()->Get(i);
    }
    return net_storage;
}

StaticModule::StaticModule(const void* buffer, size_t length, const std::vector<std::string>& inputs, const std::vector<std::string>& outputs, const Module::Config& moduleconfig) : mInputs(inputs), mOutputs(outputs) {
    setType("StaticModule");
    std::shared_ptr<NetStorage> net_storage;
    std::map<const Op*, std::shared_ptr<Execution>> exeCache;
    if (moduleconfig.rearrange) {
        auto rt = Express::ExecutorScope::Current()->getRuntime();
        MNN_CHECK(rt.first.size() == 1, "The number of formal backends should be 1.");
        mResourceBackend.reset(rt.first.begin()->second->onCreate());
        net_storage = preRearrangeWeights(GetNet(buffer), exeCache, mResourceBackend.get());
        buffer = net_storage->buffer();
        length = net_storage->size();
    } else {
        net_storage.reset(new NetStorage);
        net_storage->storage.reset((uint8_t*)malloc(length));
        if (nullptr == net_storage->storage.get()) {
            MNN_ERROR("Allock Error in StaticModule's net\n");
            return;
        }
        net_storage->allocated_size = length;
        net_storage->offset = 0;
        ::memcpy(net_storage->storage.get(), buffer, length);
        buffer = net_storage->storage.get();
    }
    mNetStorage = std::move(net_storage);
    mShapeFix = !moduleconfig.shapeMutable;
    mOutputNumbers = (int)outputs.size();
    /** Compute:
     std::vector<int, int> mOutputFromTensor;
     std::vector<int, int> mOutputFromInput;
     */
    for (int i=0; i<outputs.size(); ++i) {
        auto& t = outputs[i];
        bool fromInput = false;
        for (int j=0; j<inputs.size(); ++j) {
            if (inputs[j] == t) {
                fromInput = true;
                mOutputFromInput.emplace_back(std::make_pair(i, j));
                break;
            }
        }
        if (fromInput) {
            continue;
        }
        mOutputFromTensor.emplace_back(i);
    }
    if (mOutputFromTensor.empty()) {
        return;
    }
    auto rt = Express::ExecutorScope::Current()->getRuntime();
    // TODO: Add Config
    ScheduleConfig config;
    config.numThread = 1;
    config.type = rt.first.begin()->first;
    config.saveTensors = outputs;
    auto scheduleInfo = Schedule::schedule(GetNet(buffer), {config});
#ifdef MNN_EXPR_ENABLE_PROFILER
    Interpreter::SessionMode callBackMode = Interpreter::Session_Debug;
#else
    Interpreter::SessionMode callBackMode = Interpreter::Session_Release;
#endif
    Interpreter::SessionMode inputMode = mShapeFix ? Interpreter::Session_Input_Inside : Interpreter::Session_Input_User;
    mSession.reset(new Session(std::move(scheduleInfo), callBackMode, inputMode, std::move(rt)));
    mSession->cloneExecution(exeCache, 0);
    if (scheduleInfo.validForResize && inputMode == Interpreter::Session_Input_Inside) {
        mSession->resize(false);
    }
    mInputTensors.resize(inputs.size());
    for (int i=0; i<inputs.size(); ++i) {
        mInputTensors[i] = mSession->getInput(inputs[i].c_str());
    }
    mOutputTensors.resize(mOutputFromTensor.size());
    for (int i=0; i<mOutputFromTensor.size(); ++i) {
        mOutputTensors[i] = mSession->getOutput(outputs[mOutputFromTensor[i]].c_str());
    }
}
StaticModule:: ~ StaticModule() {
    mSession = nullptr;
    mResourceBackend = nullptr;
}
std::vector<Express::VARP> StaticModule::onForward(const std::vector<Express::VARP>& inputs) {
    AUTOTIME;
    std::vector<Express::VARP> outputs(mOutputNumbers);
    for (auto& iter : mOutputFromInput) {
        outputs[iter.first] = inputs[iter.second];
    }
    if (mOutputFromTensor.empty()) {
        return outputs;
    }
    Variable::compute(inputs);

    MNN_ASSERT(inputs.size() == mInputTensors.size());
    for (int i=0; i<inputs.size(); ++i) {
        auto info = inputs[i]->getInfo();
        mInputTensors[i]->buffer().type = info->type;
        auto des = TensorUtils::getDescribe(mInputTensors[i]);
        if (info->order == Express::NCHW) {
            des->dimensionFormat = MNN_DATA_FORMAT_NCHW;
        }
        if (info->order == Express::NHWC) {
            des->dimensionFormat = MNN_DATA_FORMAT_NHWC;
        }
        if (info->order == Express::NC4HW4) {
            des->dimensionFormat = MNN_DATA_FORMAT_NC4HW4;
        }
        if (info->tensorArrayAttr != nullptr) {
            des->tensorArrayAttr = info->tensorArrayAttr;
        }
        resizeTensor(mInputTensors[i], info->dim);
    }
    if (!mShapeFix) {
        for (int i=0; i<inputs.size(); ++i) {
            auto srcPtr = (uint8_t*)inputs[i]->readMap<void>();
            if (srcPtr != mInputTensors[i]->buffer().host) {
                mInputTensors[i]->buffer().host = srcPtr;
                mSession->setNeedResize();
            }
        }
    }
    if (mSession->getNeedResize()) {
        mSession->resize();
    }
    if (mShapeFix) {
        for (int i=0; i<inputs.size(); ++i) {
            auto exprInfo = inputs[i]->expr();
            auto inside = exprInfo.first->inside();
            auto inputTensor = inside->mOutputTensors[exprInfo.second];
            if (nullptr != inside->mCache) {
                inputTensor = Executor::getOutput(inside->mCache.get(), inside->mCacheOffset);
            }
            auto backend = TensorUtils::getDescribe(mInputTensors[i])->backend;
            if (nullptr != backend) {
                // For zero shape, backend is null
                backend->onCopyBuffer(inputTensor, mInputTensors[i]);
            }
        }
    }
#ifdef MNN_EXPR_ENABLE_PROFILER
    auto globalExecutor = ExecutorScope::Current();
    Timer cost;
    TensorCallBackWithInfo beforeCallBack = [&cost] (const std::vector<Tensor*>&, const OperatorInfo* info) {
        cost.reset();
        return true;
    };
    TensorCallBackWithInfo afterCallBack = [&cost, globalExecutor] (const std::vector<Tensor*>&, const OperatorInfo* info) {
        auto costTimes = (float)cost.durationInUs() / 1000.0f;
        globalExecutor->addOpCostTime(info->type(), costTimes);
        globalExecutor->addOpFlops(info->type(), info->flops());
        return true;
    };
    mSession->runWithCallBack(beforeCallBack, afterCallBack);
#else
    mSession->run();
#endif
    for (int i=0; i<mOutputTensors.size(); ++i) {
	    auto currentTensor = mOutputTensors[i];	
        // copy the data when reused as input tensor with data;		
        if (currentTensor->elementSize() != 0 && mReusedTensors.find(mOutputFromTensor[i]) != mReusedTensors.end()) {		
            std::shared_ptr<Tensor> tmpTensor(new Tensor(currentTensor, currentTensor->getDimensionType(), false));		
            tmpTensor->buffer().host = (uint8_t*)MNNMemoryAllocAlign(currentTensor->size(), MNN_MEMORY_ALIGN_DEFAULT);		
            currentTensor->copyToHostTensor(tmpTensor.get());	

            Express::Variable::Info info;		
            info.dim = currentTensor->shape();		
            info.type = currentTensor->getType();		
            auto des = TensorUtils::getDescribe(mOutputTensors[i]);		
            auto format = des->dimensionFormat;		
            info.order = Express::NHWC;		
            if (format == MNN_DATA_FORMAT_NCHW) {		
                info.order = Express::NCHW;		
            } else if (format == MNN_DATA_FORMAT_NC4HW4) {		
                info.order = Express::NC4HW4;		
            }		
            // if this output tensor is TensorArray, copy attr		
            if (des->tensorArrayAttr != nullptr) {		
                info.tensorArrayAttr = des->tensorArrayAttr;		
            }	

            outputs[mOutputFromTensor[i]] = Express::Variable::create(Express::Expr::create(std::move(info), tmpTensor->host<void>(), Express::VARP::CONSTANT, Expr::MemoryType::MOVE), 0);		
        } else {
            outputs[mOutputFromTensor[i]] = Express::Variable::create(Express::Expr::create(mOutputTensors[i]));
        }
    }
    return outputs;
}

void StaticModule::setReusedTensors(std::set<int> reused) {
    mReusedTensors = std::move(reused);
}

Module* StaticModule::clone(CloneContext* ctx) const {
    StaticModule* module(new StaticModule);
    module->mInputs = mInputs;
    module->mOutputs = mOutputs;

    module->mShapeFix = mShapeFix;
    module->mOutputNumbers = mOutputNumbers;
    module->mOutputFromInput = mOutputFromInput;
    module->mOutputFromTensor = mOutputFromTensor;
    if (mOutputFromTensor.empty()) {
        return this->cloneBaseTo(ctx, module);
    }
    module->mNetStorage = mNetStorage;
    auto rt = Express::ExecutorScope::Current()->getRuntime();
    ScheduleConfig config;
    config.numThread = 1;
    config.type = rt.first.begin()->first;
    config.saveTensors = mOutputs;
    auto scheduleInfo = Schedule::schedule(GetNet(module->mNetStorage->buffer()), {config});
#ifdef MNN_EXPR_ENABLE_PROFILER
    Interpreter::SessionMode callBackMode = Interpreter::Session_Debug;
#else
    Interpreter::SessionMode callBackMode = Interpreter::Session_Release;
#endif
    Interpreter::SessionMode inputMode = mShapeFix ? Interpreter::Session_Input_Inside : Interpreter::Session_Input_User;
    module->mSession.reset(new Session(std::move(scheduleInfo), callBackMode, inputMode, std::move(rt)));
    module->mSession->cloneExecution(mSession->getExecution(0), 0);
    if (scheduleInfo.validForResize && inputMode == Interpreter::Session_Input_Inside) {
        module->mSession->resize(false);
    }
    module->mResourceBackend = mResourceBackend;
    module->mInputTensors.resize(mInputs.size());
    module->mOutputTensors.resize(mOutputFromTensor.size());
    for (int i=0; i<mInputs.size(); ++i) {
        module->mInputTensors[i] =
            module->mSession->getInput(mInputs[i].c_str());
    }
    for (int i=0; i<mOutputFromTensor.size(); ++i) {
        module->mOutputTensors[i] = module->mSession->getOutput(mOutputs[mOutputFromTensor[i]].c_str());
    }
    return this->cloneBaseTo(ctx, module);
}

void StaticModule::resizeTensor(Tensor* tensor, const std::vector<int>& dims) {
    MNN_ASSERT(nullptr != tensor);
    bool dirty = false;
    if (tensor->buffer().dimensions != dims.size()) {
        dirty = true;
    } else {
        for (int i = 0; i < dims.size(); ++i) {
            if (tensor->buffer().dim[i].extent != dims[i]) {
                dirty = true;
                break;
            }
        }
    }

    if (!dirty) {
        return;
    }

    tensor->buffer().dimensions = (int)dims.size();
    for (int i = 0; i < dims.size(); ++i) {
        tensor->buffer().dim[i].extent = dims[i];
    }

    MNN_ASSERT(nullptr != mSession);
    mSession->setNeedResize();
}

}
}
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`//`
			`// StaticModule.cpp`
			`// MNN`
			`//`
			`// Created by MNN on b'2020/09/10'.`
			`// Copyright © 2018, Alibaba Group Holding Limited`
			`//`

			`#include "StaticModule.hpp"`
			`#include <MNN/expr/ExprCreator.hpp>`
			`#include <MNN/AutoTime.hpp>`
			`#include "core/TensorUtils.hpp"`
			`#include "core/Session.hpp"`
			`#include <MNN/expr/Executor.hpp>`
			`#include <MNN/AutoTime.hpp>`
			`#include <MNN/expr/ExecutorScope.hpp>`
Synchronize internal master to Github 2020-12-15 14:12:35 +08:00			`#include "core/MNNMemoryUtils.h"`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`#include "core/Schedule.hpp"`
Synchronize internal master to Github 2020-12-15 14:12:35 +08:00			`#include "Utils.hpp"`

Github release 1.1.0 2020-11-05 16:41:56 +08:00			`namespace MNN {`
			`namespace Express {`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00
			`struct NetStorage {`
			`size_t size() const {`
			`return allocated_size - offset;`
			`}`

			`const uint8_t* buffer() const {`
			`return storage.get() + offset;`
			`}`
			`size_t allocated_size;`
			`size_t offset;`
			`std::unique_ptr<uint8_t> storage;`
			`};`
			`static std::shared_ptr<NetStorage> preRearrangeWeights( // NOLINT`
			`const MNN::Net* net, std::map<const Op, std::shared_ptr<Execution>>& cache, Backend backend) {`
			`std::unique_ptr<MNN::NetT> net_table(net->UnPack());`
			`std::map<int, std::shared_ptr<Execution>> exeCache;`
			`for (int i = 0; i < net->oplists()->size(); ++i) {`
			`auto op = net->oplists()->Get(i);`
			`auto op_table = net_table->oplists[i].get();`
			`switch (op->type()) {`
			`case MNN::OpType_DepthwiseConvInt8:`
			`case MNN::OpType_ConvInt8:`
			`case MNN::OpType_ConvolutionDepthwise:`
			`case MNN::OpType_Convolution: {`
			`std::shared_ptr<Execution> exe(backend->onCreate({}, {}, op));`
			`if (nullptr == exe) {`
			`break;`
			`}`
			`if (!exe->onClone(nullptr, op, nullptr)) {`
			`break;`
			`}`
			`exeCache.insert(std::make_pair(i, exe));`
			`if (OpParameter_Convolution2D == op_table->main.type) {`
			`op_table->main.AsConvolution2D()->bias.clear();`
			`op_table->main.AsConvolution2D()->weight.clear();`
			`if (nullptr != op_table->main.AsConvolution2D()->symmetricQuan) {`
			`op_table->main.AsConvolution2D()->symmetricQuan->bias.clear();`
			`op_table->main.AsConvolution2D()->symmetricQuan->weight.clear();`
			`}`
			`if (nullptr != op_table->main.AsConvolution2D()->quanParameter) {`
			`op_table->main.AsConvolution2D()->quanParameter->alpha.clear();`
			`op_table->main.AsConvolution2D()->quanParameter->buffer.clear();`
			`}`
			`}`
			`break;`
			`}`
			`default: {`
			`break;`
			`}`
			`}`
			`}`
			`flatbuffers::FlatBufferBuilder builder(1024);`
			`builder.Finish(MNN::Net::Pack(builder, net_table.get()));`
			`// Swap the raw buffer ownership.`
			`std::shared_ptr<NetStorage> net_storage(new NetStorage);`
			`net_storage->storage.reset(builder.ReleaseRaw(net_storage->allocated_size, // NOLINT`
			`net_storage->offset));`
			`net = GetNet(net_storage->buffer());`
			`for (auto& iter : exeCache) {`
			`auto op = net->oplists()->Get(iter.first);`
			`cache.insert(std::make_pair(op, iter.second));`
			`}`
			`for (int i = 0; i < net->oplists()->size(); ++i) {`
			`auto op = net->oplists()->Get(i);`
			`}`
			`return net_storage;`
			`}`

			`StaticModule::StaticModule(const void* buffer, size_t length, const std::vector<std::string>& inputs, const std::vector<std::string>& outputs, const Module::Config& moduleconfig) : mInputs(inputs), mOutputs(outputs) {`
			`setType("StaticModule");`
			`std::shared_ptr<NetStorage> net_storage;`
			`std::map<const Op*, std::shared_ptr<Execution>> exeCache;`
			`if (moduleconfig.rearrange) {`
			`auto rt = Express::ExecutorScope::Current()->getRuntime();`
			`MNN_CHECK(rt.first.size() == 1, "The number of formal backends should be 1.");`
			`mResourceBackend.reset(rt.first.begin()->second->onCreate());`
			`net_storage = preRearrangeWeights(GetNet(buffer), exeCache, mResourceBackend.get());`
			`buffer = net_storage->buffer();`
			`length = net_storage->size();`
			`} else {`
			`net_storage.reset(new NetStorage);`
			`net_storage->storage.reset((uint8_t*)malloc(length));`
			`if (nullptr == net_storage->storage.get()) {`
			`MNN_ERROR("Allock Error in StaticModule's net\n");`
			`return;`
			`}`
			`net_storage->allocated_size = length;`
			`net_storage->offset = 0;`
			`::memcpy(net_storage->storage.get(), buffer, length);`
			`buffer = net_storage->storage.get();`
			`}`
			`mNetStorage = std::move(net_storage);`
			`mShapeFix = !moduleconfig.shapeMutable;`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`mOutputNumbers = (int)outputs.size();`
			`/** Compute:`
			`std::vector<int, int> mOutputFromTensor;`
			`std::vector<int, int> mOutputFromInput;`
			`*/`
			`for (int i=0; i<outputs.size(); ++i) {`
			`auto& t = outputs[i];`
			`bool fromInput = false;`
			`for (int j=0; j<inputs.size(); ++j) {`
			`if (inputs[j] == t) {`
			`fromInput = true;`
			`mOutputFromInput.emplace_back(std::make_pair(i, j));`
			`break;`
			`}`
			`}`
			`if (fromInput) {`
			`continue;`
			`}`
			`mOutputFromTensor.emplace_back(i);`
			`}`
			`if (mOutputFromTensor.empty()) {`
			`return;`
			`}`
			`auto rt = Express::ExecutorScope::Current()->getRuntime();`
			`// TODO: Add Config`
			`ScheduleConfig config;`
			`config.numThread = 1;`
			`config.type = rt.first.begin()->first;`
			`config.saveTensors = outputs;`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`auto scheduleInfo = Schedule::schedule(GetNet(buffer), {config});`
			`#ifdef MNN_EXPR_ENABLE_PROFILER`
			`Interpreter::SessionMode callBackMode = Interpreter::Session_Debug;`
			`#else`
			`Interpreter::SessionMode callBackMode = Interpreter::Session_Release;`
			`#endif`
			`Interpreter::SessionMode inputMode = mShapeFix ? Interpreter::Session_Input_Inside : Interpreter::Session_Input_User;`
			`mSession.reset(new Session(std::move(scheduleInfo), callBackMode, inputMode, std::move(rt)));`
			`mSession->cloneExecution(exeCache, 0);`
			`if (scheduleInfo.validForResize && inputMode == Interpreter::Session_Input_Inside) {`
			`mSession->resize(false);`
			`}`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`mInputTensors.resize(inputs.size());`
			`for (int i=0; i<inputs.size(); ++i) {`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`mInputTensors[i] = mSession->getInput(inputs[i].c_str());`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`}`
			`mOutputTensors.resize(mOutputFromTensor.size());`
			`for (int i=0; i<mOutputFromTensor.size(); ++i) {`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`mOutputTensors[i] = mSession->getOutput(outputs[mOutputFromTensor[i]].c_str());`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`}`
			`}`
			`StaticModule:: ~ StaticModule() {`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`mSession = nullptr;`
			`mResourceBackend = nullptr;`
[PATCH 233/350] Apply patch for Remove lock in StaticModule::onForward and implement EXPRP/VARP clone. The original code review is https://code.aone.alibaba-inc.com/AliNN/MNN/codereview/4328129 2020-12-17 16:14:25 +08:00			`}`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`std::vector<Express::VARP> StaticModule::onForward(const std::vector<Express::VARP>& inputs) {`
			`AUTOTIME;`
			`std::vector<Express::VARP> outputs(mOutputNumbers);`
			`for (auto& iter : mOutputFromInput) {`
			`outputs[iter.first] = inputs[iter.second];`
			`}`
			`if (mOutputFromTensor.empty()) {`
			`return outputs;`
			`}`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`Variable::compute(inputs);`

Github release 1.1.0 2020-11-05 16:41:56 +08:00			`MNN_ASSERT(inputs.size() == mInputTensors.size());`
			`for (int i=0; i<inputs.size(); ++i) {`
			`auto info = inputs[i]->getInfo();`
			`mInputTensors[i]->buffer().type = info->type;`
			`auto des = TensorUtils::getDescribe(mInputTensors[i]);`
			`if (info->order == Express::NCHW) {`
			`des->dimensionFormat = MNN_DATA_FORMAT_NCHW;`
			`}`
			`if (info->order == Express::NHWC) {`
			`des->dimensionFormat = MNN_DATA_FORMAT_NHWC;`
			`}`
			`if (info->order == Express::NC4HW4) {`
			`des->dimensionFormat = MNN_DATA_FORMAT_NC4HW4;`
			`}`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`if (info->tensorArrayAttr != nullptr) {`
			`des->tensorArrayAttr = info->tensorArrayAttr;`
			`}`
[PATCH 233/350] Apply patch for Remove lock in StaticModule::onForward and implement EXPRP/VARP clone. The original code review is https://code.aone.alibaba-inc.com/AliNN/MNN/codereview/4328129 2020-12-17 16:14:25 +08:00			`resizeTensor(mInputTensors[i], info->dim);`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`}`
			`if (!mShapeFix) {`
			`for (int i=0; i<inputs.size(); ++i) {`
[PATCH 200/350] Don't resize when ptr is the same 2020-12-14 15:38:24 +08:00			`auto srcPtr = (uint8_t*)inputs[i]->readMap<void>();`
			`if (srcPtr != mInputTensors[i]->buffer().host) {`
			`mInputTensors[i]->buffer().host = srcPtr;`
			`mSession->setNeedResize();`
			`}`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`}`
			`}`
[PATCH 235/350] merge conflict fix 2020-12-17 16:24:28 +08:00			`if (mSession->getNeedResize()) {`
			`mSession->resize();`
			`}`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`if (mShapeFix) {`
			`for (int i=0; i<inputs.size(); ++i) {`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`auto exprInfo = inputs[i]->expr();`
			`auto inside = exprInfo.first->inside();`
			`auto inputTensor = inside->mOutputTensors[exprInfo.second];`
			`if (nullptr != inside->mCache) {`
			`inputTensor = Executor::getOutput(inside->mCache.get(), inside->mCacheOffset);`
			`}`
			`auto backend = TensorUtils::getDescribe(mInputTensors[i])->backend;`
			`if (nullptr != backend) {`
			`// For zero shape, backend is null`
			`backend->onCopyBuffer(inputTensor, mInputTensors[i]);`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`}`
			`}`
			`}`
			`#ifdef MNN_EXPR_ENABLE_PROFILER`
			`auto globalExecutor = ExecutorScope::Current();`
			`Timer cost;`
			`TensorCallBackWithInfo beforeCallBack = [&cost] (const std::vector<Tensor>&, const OperatorInfo info) {`
			`cost.reset();`
			`return true;`
			`};`
			`TensorCallBackWithInfo afterCallBack = [&cost, globalExecutor] (const std::vector<Tensor>&, const OperatorInfo info) {`
			`auto costTimes = (float)cost.durationInUs() / 1000.0f;`
			`globalExecutor->addOpCostTime(info->type(), costTimes);`
			`globalExecutor->addOpFlops(info->type(), info->flops());`
			`return true;`
			`};`
[PATCH 233/350] Apply patch for Remove lock in StaticModule::onForward and implement EXPRP/VARP clone. The original code review is https://code.aone.alibaba-inc.com/AliNN/MNN/codereview/4328129 2020-12-17 16:14:25 +08:00			`mSession->runWithCallBack(beforeCallBack, afterCallBack);`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`#else`
[PATCH 233/350] Apply patch for Remove lock in StaticModule::onForward and implement EXPRP/VARP clone. The original code review is https://code.aone.alibaba-inc.com/AliNN/MNN/codereview/4328129 2020-12-17 16:14:25 +08:00			`mSession->run();`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`#endif`
			`for (int i=0; i<mOutputTensors.size(); ++i) {`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`auto currentTensor = mOutputTensors[i];`
			`// copy the data when reused as input tensor with data;`
			`if (currentTensor->elementSize() != 0 && mReusedTensors.find(mOutputFromTensor[i]) != mReusedTensors.end()) {`
			`std::shared_ptr<Tensor> tmpTensor(new Tensor(currentTensor, currentTensor->getDimensionType(), false));`
			`tmpTensor->buffer().host = (uint8_t*)MNNMemoryAllocAlign(currentTensor->size(), MNN_MEMORY_ALIGN_DEFAULT);`
			`currentTensor->copyToHostTensor(tmpTensor.get());`

			`Express::Variable::Info info;`
			`info.dim = currentTensor->shape();`
			`info.type = currentTensor->getType();`
			`auto des = TensorUtils::getDescribe(mOutputTensors[i]);`
			`auto format = des->dimensionFormat;`
			`info.order = Express::NHWC;`
			`if (format == MNN_DATA_FORMAT_NCHW) {`
			`info.order = Express::NCHW;`
			`} else if (format == MNN_DATA_FORMAT_NC4HW4) {`
			`info.order = Express::NC4HW4;`
			`}`
			`// if this output tensor is TensorArray, copy attr`
			`if (des->tensorArrayAttr != nullptr) {`
			`info.tensorArrayAttr = des->tensorArrayAttr;`
			`}`

			`outputs[mOutputFromTensor[i]] = Express::Variable::create(Express::Expr::create(std::move(info), tmpTensor->host<void>(), Express::VARP::CONSTANT, Expr::MemoryType::MOVE), 0);`
Synchronize internal master to Github 2020-12-15 14:12:35 +08:00			`} else {`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`outputs[mOutputFromTensor[i]] = Express::Variable::create(Express::Expr::create(mOutputTensors[i]));`
Synchronize internal master to Github 2020-12-15 14:12:35 +08:00			`}`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`}`
			`return outputs;`
			`}`

[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`void StaticModule::setReusedTensors(std::set<int> reused) {`
			`mReusedTensors = std::move(reused);`
			`}`

Github release 1.1.0 2020-11-05 16:41:56 +08:00			`Module* StaticModule::clone(CloneContext* ctx) const {`
			`StaticModule* module(new StaticModule);`
			`module->mInputs = mInputs;`
			`module->mOutputs = mOutputs;`

			`module->mShapeFix = mShapeFix;`
			`module->mOutputNumbers = mOutputNumbers;`
			`module->mOutputFromInput = mOutputFromInput;`
			`module->mOutputFromTensor = mOutputFromTensor;`
			`if (mOutputFromTensor.empty()) {`
			`return this->cloneBaseTo(ctx, module);`
			`}`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`module->mNetStorage = mNetStorage;`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`auto rt = Express::ExecutorScope::Current()->getRuntime();`
			`ScheduleConfig config;`
			`config.numThread = 1;`
			`config.type = rt.first.begin()->first;`
			`config.saveTensors = mOutputs;`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`auto scheduleInfo = Schedule::schedule(GetNet(module->mNetStorage->buffer()), {config});`
			`#ifdef MNN_EXPR_ENABLE_PROFILER`
			`Interpreter::SessionMode callBackMode = Interpreter::Session_Debug;`
			`#else`
			`Interpreter::SessionMode callBackMode = Interpreter::Session_Release;`
			`#endif`
			`Interpreter::SessionMode inputMode = mShapeFix ? Interpreter::Session_Input_Inside : Interpreter::Session_Input_User;`
			`module->mSession.reset(new Session(std::move(scheduleInfo), callBackMode, inputMode, std::move(rt)));`
			`module->mSession->cloneExecution(mSession->getExecution(0), 0);`
			`if (scheduleInfo.validForResize && inputMode == Interpreter::Session_Input_Inside) {`
			`module->mSession->resize(false);`
			`}`
			`module->mResourceBackend = mResourceBackend;`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`module->mInputTensors.resize(mInputs.size());`
			`module->mOutputTensors.resize(mOutputFromTensor.size());`
			`for (int i=0; i<mInputs.size(); ++i) {`
			`module->mInputTensors[i] =`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`module->mSession->getInput(mInputs[i].c_str());`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`}`
			`for (int i=0; i<mOutputFromTensor.size(); ++i) {`
[MNN:Sync] Sync internal git 2021-01-06 16:29:37 +08:00			`module->mOutputTensors[i] = module->mSession->getOutput(mOutputs[mOutputFromTensor[i]].c_str());`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`}`
			`return this->cloneBaseTo(ctx, module);`
			`}`

[PATCH 233/350] Apply patch for Remove lock in StaticModule::onForward and implement EXPRP/VARP clone. The original code review is https://code.aone.alibaba-inc.com/AliNN/MNN/codereview/4328129 2020-12-17 16:14:25 +08:00			`void StaticModule::resizeTensor(Tensor* tensor, const std::vector<int>& dims) {`
			`MNN_ASSERT(nullptr != tensor);`
			`bool dirty = false;`
			`if (tensor->buffer().dimensions != dims.size()) {`
			`dirty = true;`
			`} else {`
			`for (int i = 0; i < dims.size(); ++i) {`
			`if (tensor->buffer().dim[i].extent != dims[i]) {`
			`dirty = true;`
			`break;`
			`}`
			`}`
			`}`

			`if (!dirty) {`
			`return;`
			`}`

			`tensor->buffer().dimensions = (int)dims.size();`
			`for (int i = 0; i < dims.size(); ++i) {`
			`tensor->buffer().dim[i].extent = dims[i];`
			`}`

			`MNN_ASSERT(nullptr != mSession);`
			`mSession->setNeedResize();`
			`}`

Github release 1.1.0 2020-11-05 16:41:56 +08:00			`}`
			`}`