2020-11-05 16:41:56 +08:00
|
|
|
//
|
|
|
|
// StaticModule.cpp
|
|
|
|
// MNN
|
|
|
|
//
|
|
|
|
// Created by MNN on b'2020/09/10'.
|
|
|
|
// Copyright © 2018, Alibaba Group Holding Limited
|
|
|
|
//
|
|
|
|
|
|
|
|
#include "StaticModule.hpp"
|
|
|
|
#include <MNN/expr/ExprCreator.hpp>
|
|
|
|
#include <MNN/AutoTime.hpp>
|
|
|
|
#include "core/TensorUtils.hpp"
|
|
|
|
#include "core/Session.hpp"
|
|
|
|
#include <MNN/expr/Executor.hpp>
|
|
|
|
#include <MNN/AutoTime.hpp>
|
|
|
|
#include <MNN/expr/ExecutorScope.hpp>
|
2020-12-15 14:12:35 +08:00
|
|
|
#include "core/MNNMemoryUtils.h"
|
2021-01-06 16:29:37 +08:00
|
|
|
#include "core/Schedule.hpp"
|
2020-12-15 14:12:35 +08:00
|
|
|
#include "Utils.hpp"
|
|
|
|
|
2020-11-05 16:41:56 +08:00
|
|
|
namespace MNN {
|
|
|
|
namespace Express {
|
2021-01-06 16:29:37 +08:00
|
|
|
|
|
|
|
struct NetStorage {
|
|
|
|
size_t size() const {
|
|
|
|
return allocated_size - offset;
|
|
|
|
}
|
|
|
|
|
|
|
|
const uint8_t* buffer() const {
|
|
|
|
return storage.get() + offset;
|
|
|
|
}
|
|
|
|
size_t allocated_size;
|
|
|
|
size_t offset;
|
|
|
|
std::unique_ptr<uint8_t> storage;
|
|
|
|
};
|
|
|
|
static std::shared_ptr<NetStorage> preRearrangeWeights( // NOLINT
|
|
|
|
const MNN::Net* net, std::map<const Op*, std::shared_ptr<Execution>>& cache, Backend* backend) {
|
|
|
|
std::unique_ptr<MNN::NetT> net_table(net->UnPack());
|
|
|
|
std::map<int, std::shared_ptr<Execution>> exeCache;
|
|
|
|
for (int i = 0; i < net->oplists()->size(); ++i) {
|
|
|
|
auto op = net->oplists()->Get(i);
|
|
|
|
auto op_table = net_table->oplists[i].get();
|
|
|
|
switch (op->type()) {
|
|
|
|
case MNN::OpType_DepthwiseConvInt8:
|
|
|
|
case MNN::OpType_ConvInt8:
|
|
|
|
case MNN::OpType_ConvolutionDepthwise:
|
|
|
|
case MNN::OpType_Convolution: {
|
|
|
|
std::shared_ptr<Execution> exe(backend->onCreate({}, {}, op));
|
|
|
|
if (nullptr == exe) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
if (!exe->onClone(nullptr, op, nullptr)) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
exeCache.insert(std::make_pair(i, exe));
|
|
|
|
if (OpParameter_Convolution2D == op_table->main.type) {
|
|
|
|
op_table->main.AsConvolution2D()->bias.clear();
|
|
|
|
op_table->main.AsConvolution2D()->weight.clear();
|
|
|
|
if (nullptr != op_table->main.AsConvolution2D()->symmetricQuan) {
|
|
|
|
op_table->main.AsConvolution2D()->symmetricQuan->bias.clear();
|
|
|
|
op_table->main.AsConvolution2D()->symmetricQuan->weight.clear();
|
|
|
|
}
|
|
|
|
if (nullptr != op_table->main.AsConvolution2D()->quanParameter) {
|
|
|
|
op_table->main.AsConvolution2D()->quanParameter->alpha.clear();
|
|
|
|
op_table->main.AsConvolution2D()->quanParameter->buffer.clear();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
default: {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
flatbuffers::FlatBufferBuilder builder(1024);
|
|
|
|
builder.Finish(MNN::Net::Pack(builder, net_table.get()));
|
|
|
|
// Swap the raw buffer ownership.
|
|
|
|
std::shared_ptr<NetStorage> net_storage(new NetStorage);
|
|
|
|
net_storage->storage.reset(builder.ReleaseRaw(net_storage->allocated_size, // NOLINT
|
|
|
|
net_storage->offset));
|
|
|
|
net = GetNet(net_storage->buffer());
|
|
|
|
for (auto& iter : exeCache) {
|
|
|
|
auto op = net->oplists()->Get(iter.first);
|
|
|
|
cache.insert(std::make_pair(op, iter.second));
|
|
|
|
}
|
|
|
|
for (int i = 0; i < net->oplists()->size(); ++i) {
|
|
|
|
auto op = net->oplists()->Get(i);
|
|
|
|
}
|
|
|
|
return net_storage;
|
|
|
|
}
|
|
|
|
|
|
|
|
StaticModule::StaticModule(const void* buffer, size_t length, const std::vector<std::string>& inputs, const std::vector<std::string>& outputs, const Module::Config& moduleconfig) : mInputs(inputs), mOutputs(outputs) {
|
|
|
|
setType("StaticModule");
|
|
|
|
std::shared_ptr<NetStorage> net_storage;
|
|
|
|
std::map<const Op*, std::shared_ptr<Execution>> exeCache;
|
|
|
|
if (moduleconfig.rearrange) {
|
|
|
|
auto rt = Express::ExecutorScope::Current()->getRuntime();
|
|
|
|
MNN_CHECK(rt.first.size() == 1, "The number of formal backends should be 1.");
|
|
|
|
mResourceBackend.reset(rt.first.begin()->second->onCreate());
|
|
|
|
net_storage = preRearrangeWeights(GetNet(buffer), exeCache, mResourceBackend.get());
|
|
|
|
buffer = net_storage->buffer();
|
|
|
|
length = net_storage->size();
|
|
|
|
} else {
|
|
|
|
net_storage.reset(new NetStorage);
|
|
|
|
net_storage->storage.reset((uint8_t*)malloc(length));
|
|
|
|
if (nullptr == net_storage->storage.get()) {
|
|
|
|
MNN_ERROR("Allock Error in StaticModule's net\n");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
net_storage->allocated_size = length;
|
|
|
|
net_storage->offset = 0;
|
|
|
|
::memcpy(net_storage->storage.get(), buffer, length);
|
|
|
|
buffer = net_storage->storage.get();
|
|
|
|
}
|
|
|
|
mNetStorage = std::move(net_storage);
|
|
|
|
mShapeFix = !moduleconfig.shapeMutable;
|
2020-11-05 16:41:56 +08:00
|
|
|
mOutputNumbers = (int)outputs.size();
|
|
|
|
/** Compute:
|
|
|
|
std::vector<int, int> mOutputFromTensor;
|
|
|
|
std::vector<int, int> mOutputFromInput;
|
|
|
|
*/
|
|
|
|
for (int i=0; i<outputs.size(); ++i) {
|
|
|
|
auto& t = outputs[i];
|
|
|
|
bool fromInput = false;
|
|
|
|
for (int j=0; j<inputs.size(); ++j) {
|
|
|
|
if (inputs[j] == t) {
|
|
|
|
fromInput = true;
|
|
|
|
mOutputFromInput.emplace_back(std::make_pair(i, j));
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (fromInput) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
mOutputFromTensor.emplace_back(i);
|
|
|
|
}
|
|
|
|
if (mOutputFromTensor.empty()) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
auto rt = Express::ExecutorScope::Current()->getRuntime();
|
|
|
|
// TODO: Add Config
|
|
|
|
ScheduleConfig config;
|
|
|
|
config.numThread = 1;
|
|
|
|
config.type = rt.first.begin()->first;
|
|
|
|
config.saveTensors = outputs;
|
2021-01-06 16:29:37 +08:00
|
|
|
auto scheduleInfo = Schedule::schedule(GetNet(buffer), {config});
|
|
|
|
#ifdef MNN_EXPR_ENABLE_PROFILER
|
|
|
|
Interpreter::SessionMode callBackMode = Interpreter::Session_Debug;
|
|
|
|
#else
|
|
|
|
Interpreter::SessionMode callBackMode = Interpreter::Session_Release;
|
|
|
|
#endif
|
|
|
|
Interpreter::SessionMode inputMode = mShapeFix ? Interpreter::Session_Input_Inside : Interpreter::Session_Input_User;
|
|
|
|
mSession.reset(new Session(std::move(scheduleInfo), callBackMode, inputMode, std::move(rt)));
|
|
|
|
mSession->cloneExecution(exeCache, 0);
|
|
|
|
if (scheduleInfo.validForResize && inputMode == Interpreter::Session_Input_Inside) {
|
|
|
|
mSession->resize(false);
|
|
|
|
}
|
2020-11-05 16:41:56 +08:00
|
|
|
mInputTensors.resize(inputs.size());
|
|
|
|
for (int i=0; i<inputs.size(); ++i) {
|
2021-01-06 16:29:37 +08:00
|
|
|
mInputTensors[i] = mSession->getInput(inputs[i].c_str());
|
2020-11-05 16:41:56 +08:00
|
|
|
}
|
|
|
|
mOutputTensors.resize(mOutputFromTensor.size());
|
|
|
|
for (int i=0; i<mOutputFromTensor.size(); ++i) {
|
2021-01-06 16:29:37 +08:00
|
|
|
mOutputTensors[i] = mSession->getOutput(outputs[mOutputFromTensor[i]].c_str());
|
2020-11-05 16:41:56 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
StaticModule:: ~ StaticModule() {
|
2021-01-06 16:29:37 +08:00
|
|
|
mSession = nullptr;
|
|
|
|
mResourceBackend = nullptr;
|
2020-12-17 16:14:25 +08:00
|
|
|
}
|
2020-11-05 16:41:56 +08:00
|
|
|
std::vector<Express::VARP> StaticModule::onForward(const std::vector<Express::VARP>& inputs) {
|
|
|
|
AUTOTIME;
|
|
|
|
std::vector<Express::VARP> outputs(mOutputNumbers);
|
|
|
|
for (auto& iter : mOutputFromInput) {
|
|
|
|
outputs[iter.first] = inputs[iter.second];
|
|
|
|
}
|
|
|
|
if (mOutputFromTensor.empty()) {
|
|
|
|
return outputs;
|
|
|
|
}
|
2021-01-06 16:29:37 +08:00
|
|
|
Variable::compute(inputs);
|
|
|
|
|
2020-11-05 16:41:56 +08:00
|
|
|
MNN_ASSERT(inputs.size() == mInputTensors.size());
|
|
|
|
for (int i=0; i<inputs.size(); ++i) {
|
|
|
|
auto info = inputs[i]->getInfo();
|
|
|
|
mInputTensors[i]->buffer().type = info->type;
|
|
|
|
auto des = TensorUtils::getDescribe(mInputTensors[i]);
|
|
|
|
if (info->order == Express::NCHW) {
|
|
|
|
des->dimensionFormat = MNN_DATA_FORMAT_NCHW;
|
|
|
|
}
|
|
|
|
if (info->order == Express::NHWC) {
|
|
|
|
des->dimensionFormat = MNN_DATA_FORMAT_NHWC;
|
|
|
|
}
|
|
|
|
if (info->order == Express::NC4HW4) {
|
|
|
|
des->dimensionFormat = MNN_DATA_FORMAT_NC4HW4;
|
|
|
|
}
|
2021-01-06 16:29:37 +08:00
|
|
|
if (info->tensorArrayAttr != nullptr) {
|
|
|
|
des->tensorArrayAttr = info->tensorArrayAttr;
|
|
|
|
}
|
2020-12-17 16:14:25 +08:00
|
|
|
resizeTensor(mInputTensors[i], info->dim);
|
2020-11-05 16:41:56 +08:00
|
|
|
}
|
|
|
|
if (!mShapeFix) {
|
|
|
|
for (int i=0; i<inputs.size(); ++i) {
|
2020-12-14 15:38:24 +08:00
|
|
|
auto srcPtr = (uint8_t*)inputs[i]->readMap<void>();
|
|
|
|
if (srcPtr != mInputTensors[i]->buffer().host) {
|
|
|
|
mInputTensors[i]->buffer().host = srcPtr;
|
|
|
|
mSession->setNeedResize();
|
|
|
|
}
|
2020-11-05 16:41:56 +08:00
|
|
|
}
|
|
|
|
}
|
2020-12-17 16:24:28 +08:00
|
|
|
if (mSession->getNeedResize()) {
|
|
|
|
mSession->resize();
|
|
|
|
}
|
2020-11-05 16:41:56 +08:00
|
|
|
if (mShapeFix) {
|
|
|
|
for (int i=0; i<inputs.size(); ++i) {
|
2021-01-06 16:29:37 +08:00
|
|
|
auto exprInfo = inputs[i]->expr();
|
|
|
|
auto inside = exprInfo.first->inside();
|
|
|
|
auto inputTensor = inside->mOutputTensors[exprInfo.second];
|
|
|
|
if (nullptr != inside->mCache) {
|
|
|
|
inputTensor = Executor::getOutput(inside->mCache.get(), inside->mCacheOffset);
|
|
|
|
}
|
|
|
|
auto backend = TensorUtils::getDescribe(mInputTensors[i])->backend;
|
|
|
|
if (nullptr != backend) {
|
|
|
|
// For zero shape, backend is null
|
|
|
|
backend->onCopyBuffer(inputTensor, mInputTensors[i]);
|
2020-11-05 16:41:56 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
#ifdef MNN_EXPR_ENABLE_PROFILER
|
|
|
|
auto globalExecutor = ExecutorScope::Current();
|
|
|
|
Timer cost;
|
|
|
|
TensorCallBackWithInfo beforeCallBack = [&cost] (const std::vector<Tensor*>&, const OperatorInfo* info) {
|
|
|
|
cost.reset();
|
|
|
|
return true;
|
|
|
|
};
|
|
|
|
TensorCallBackWithInfo afterCallBack = [&cost, globalExecutor] (const std::vector<Tensor*>&, const OperatorInfo* info) {
|
|
|
|
auto costTimes = (float)cost.durationInUs() / 1000.0f;
|
|
|
|
globalExecutor->addOpCostTime(info->type(), costTimes);
|
|
|
|
globalExecutor->addOpFlops(info->type(), info->flops());
|
|
|
|
return true;
|
|
|
|
};
|
2020-12-17 16:14:25 +08:00
|
|
|
mSession->runWithCallBack(beforeCallBack, afterCallBack);
|
2020-11-05 16:41:56 +08:00
|
|
|
#else
|
2020-12-17 16:14:25 +08:00
|
|
|
mSession->run();
|
2020-11-05 16:41:56 +08:00
|
|
|
#endif
|
|
|
|
for (int i=0; i<mOutputTensors.size(); ++i) {
|
2021-01-06 16:29:37 +08:00
|
|
|
auto currentTensor = mOutputTensors[i];
|
|
|
|
// copy the data when reused as input tensor with data;
|
|
|
|
if (currentTensor->elementSize() != 0 && mReusedTensors.find(mOutputFromTensor[i]) != mReusedTensors.end()) {
|
|
|
|
std::shared_ptr<Tensor> tmpTensor(new Tensor(currentTensor, currentTensor->getDimensionType(), false));
|
|
|
|
tmpTensor->buffer().host = (uint8_t*)MNNMemoryAllocAlign(currentTensor->size(), MNN_MEMORY_ALIGN_DEFAULT);
|
|
|
|
currentTensor->copyToHostTensor(tmpTensor.get());
|
|
|
|
|
|
|
|
Express::Variable::Info info;
|
|
|
|
info.dim = currentTensor->shape();
|
|
|
|
info.type = currentTensor->getType();
|
|
|
|
auto des = TensorUtils::getDescribe(mOutputTensors[i]);
|
|
|
|
auto format = des->dimensionFormat;
|
|
|
|
info.order = Express::NHWC;
|
|
|
|
if (format == MNN_DATA_FORMAT_NCHW) {
|
|
|
|
info.order = Express::NCHW;
|
|
|
|
} else if (format == MNN_DATA_FORMAT_NC4HW4) {
|
|
|
|
info.order = Express::NC4HW4;
|
|
|
|
}
|
|
|
|
// if this output tensor is TensorArray, copy attr
|
|
|
|
if (des->tensorArrayAttr != nullptr) {
|
|
|
|
info.tensorArrayAttr = des->tensorArrayAttr;
|
|
|
|
}
|
|
|
|
|
|
|
|
outputs[mOutputFromTensor[i]] = Express::Variable::create(Express::Expr::create(std::move(info), tmpTensor->host<void>(), Express::VARP::CONSTANT, Expr::MemoryType::MOVE), 0);
|
2020-12-15 14:12:35 +08:00
|
|
|
} else {
|
2021-01-06 16:29:37 +08:00
|
|
|
outputs[mOutputFromTensor[i]] = Express::Variable::create(Express::Expr::create(mOutputTensors[i]));
|
2020-12-15 14:12:35 +08:00
|
|
|
}
|
2020-11-05 16:41:56 +08:00
|
|
|
}
|
|
|
|
return outputs;
|
|
|
|
}
|
|
|
|
|
2021-01-06 16:29:37 +08:00
|
|
|
void StaticModule::setReusedTensors(std::set<int> reused) {
|
|
|
|
mReusedTensors = std::move(reused);
|
|
|
|
}
|
|
|
|
|
2020-11-05 16:41:56 +08:00
|
|
|
Module* StaticModule::clone(CloneContext* ctx) const {
|
|
|
|
StaticModule* module(new StaticModule);
|
|
|
|
module->mInputs = mInputs;
|
|
|
|
module->mOutputs = mOutputs;
|
|
|
|
|
|
|
|
module->mShapeFix = mShapeFix;
|
|
|
|
module->mOutputNumbers = mOutputNumbers;
|
|
|
|
module->mOutputFromInput = mOutputFromInput;
|
|
|
|
module->mOutputFromTensor = mOutputFromTensor;
|
|
|
|
if (mOutputFromTensor.empty()) {
|
|
|
|
return this->cloneBaseTo(ctx, module);
|
|
|
|
}
|
2021-01-06 16:29:37 +08:00
|
|
|
module->mNetStorage = mNetStorage;
|
2020-11-05 16:41:56 +08:00
|
|
|
auto rt = Express::ExecutorScope::Current()->getRuntime();
|
|
|
|
ScheduleConfig config;
|
|
|
|
config.numThread = 1;
|
|
|
|
config.type = rt.first.begin()->first;
|
|
|
|
config.saveTensors = mOutputs;
|
2021-01-06 16:29:37 +08:00
|
|
|
auto scheduleInfo = Schedule::schedule(GetNet(module->mNetStorage->buffer()), {config});
|
|
|
|
#ifdef MNN_EXPR_ENABLE_PROFILER
|
|
|
|
Interpreter::SessionMode callBackMode = Interpreter::Session_Debug;
|
|
|
|
#else
|
|
|
|
Interpreter::SessionMode callBackMode = Interpreter::Session_Release;
|
|
|
|
#endif
|
|
|
|
Interpreter::SessionMode inputMode = mShapeFix ? Interpreter::Session_Input_Inside : Interpreter::Session_Input_User;
|
|
|
|
module->mSession.reset(new Session(std::move(scheduleInfo), callBackMode, inputMode, std::move(rt)));
|
|
|
|
module->mSession->cloneExecution(mSession->getExecution(0), 0);
|
|
|
|
if (scheduleInfo.validForResize && inputMode == Interpreter::Session_Input_Inside) {
|
|
|
|
module->mSession->resize(false);
|
|
|
|
}
|
|
|
|
module->mResourceBackend = mResourceBackend;
|
2020-11-05 16:41:56 +08:00
|
|
|
module->mInputTensors.resize(mInputs.size());
|
|
|
|
module->mOutputTensors.resize(mOutputFromTensor.size());
|
|
|
|
for (int i=0; i<mInputs.size(); ++i) {
|
|
|
|
module->mInputTensors[i] =
|
2021-01-06 16:29:37 +08:00
|
|
|
module->mSession->getInput(mInputs[i].c_str());
|
2020-11-05 16:41:56 +08:00
|
|
|
}
|
|
|
|
for (int i=0; i<mOutputFromTensor.size(); ++i) {
|
2021-01-06 16:29:37 +08:00
|
|
|
module->mOutputTensors[i] = module->mSession->getOutput(mOutputs[mOutputFromTensor[i]].c_str());
|
2020-11-05 16:41:56 +08:00
|
|
|
}
|
|
|
|
return this->cloneBaseTo(ctx, module);
|
|
|
|
}
|
|
|
|
|
2020-12-17 16:14:25 +08:00
|
|
|
void StaticModule::resizeTensor(Tensor* tensor, const std::vector<int>& dims) {
|
|
|
|
MNN_ASSERT(nullptr != tensor);
|
|
|
|
bool dirty = false;
|
|
|
|
if (tensor->buffer().dimensions != dims.size()) {
|
|
|
|
dirty = true;
|
|
|
|
} else {
|
|
|
|
for (int i = 0; i < dims.size(); ++i) {
|
|
|
|
if (tensor->buffer().dim[i].extent != dims[i]) {
|
|
|
|
dirty = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!dirty) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
tensor->buffer().dimensions = (int)dims.size();
|
|
|
|
for (int i = 0; i < dims.size(); ++i) {
|
|
|
|
tensor->buffer().dim[i].extent = dims[i];
|
|
|
|
}
|
|
|
|
|
|
|
|
MNN_ASSERT(nullptr != mSession);
|
|
|
|
mSession->setNeedResize();
|
|
|
|
}
|
|
|
|
|
2020-11-05 16:41:56 +08:00
|
|
|
}
|
|
|
|
}
|