//
//  WrapExecution.cpp
//  MNN
//
//  Created by MNN on 2018/09/03.
//  Copyright © 2018, Alibaba Group Holding Limited
//

#include "core/WrapExecution.hpp"
#include "core/TensorUtils.hpp"
#include "backend/cpu/CPUBackend.hpp"
#include "backend/cpu/compute/CommonOptFunction.h"

namespace MNN {
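
// Decide whether `input` must be copied before `curBackend` can read it. No wrap is needed when
// the tensor already lives on a backend of the same type, or when source and destination are both
// CPU-style backends whose element size matches and whose NC4HW4 pack factor is compatible.
// Inputs are never wrapped for the MNN_FORWARD_NN backend.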
bool WrapExecution::needWrap(const Tensor* input, Backend* curBackend) {
    if (curBackend->type() == MNN_FORWARD_NN) {
        return false;
    }
    auto des = TensorUtils::getDescribe(input);
    auto bn = des->backend;
    MNNForwardType type = MNN_FORWARD_CPU;
    int pack = 4;
    int bytes = 4;
    if (nullptr != bn) {
        type = bn->type();
        if (type == MNN_FORWARD_CPU_EXTENSION) {
            auto core = static_cast<CPUBackend*>(bn)->functions();
            pack = core->pack;
            bytes = core->bytes;
        }
    }
    if (type == curBackend->type()) {
        return false;
    }
    bool srcCpu = (type == MNN_FORWARD_CPU_EXTENSION || type == MNN_FORWARD_CPU);
    bool dstCpu = ((curBackend->type() == MNN_FORWARD_CPU_EXTENSION) || (curBackend->type() == MNN_FORWARD_CPU));
    if (srcCpu && dstCpu) {
        auto dstCore = static_cast<CPUBackend*>(curBackend)->functions();
        if (dstCore->bytes == bytes) {
            if (dstCore->pack == pack || des->dimensionFormat != MNN_DATA_FORMAT_NC4HW4) {
                return false;
            }
        }
    }
    return true;
}

WrapExecution::WrapExecution(Backend* CPUBackend, std::shared_ptr<Execution> execution, bool isStatic)
    : Execution(execution->backend()), mCPUBackend(CPUBackend), mExecution(execution) {
    mValid  = execution->valid();
    mStatic = isStatic;
}
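
// Return a tensor that mExecution's backend can read directly. Tensors already on a backend of
// the same type are returned unchanged; otherwise a copy tensor (plus, for device-to-device
// transfers, an intermediate host tensor) is created and recorded in mInputMaps as a tuple of
// (backend that allocates the copy, backend that performs the copy, copy tensor).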
Tensor* WrapExecution::_getCopyTensor(Tensor* inputTensor) {
    auto dstBackend = mExecution->backend();
    auto inputDes   = TensorUtils::getDescribe(inputTensor);
    auto srcBackend = inputDes->backend;
    if (nullptr == srcBackend) {
        srcBackend = mCPUBackend;
    }
    // CPU -> CPU or XPU -> XPU
    //if (srcBackend == dstBackend) {
    if (srcBackend->type() == dstBackend->type()) {
        return inputTensor;
    }
    auto iter = mInputMaps.find(inputTensor);
    if (iter != mInputMaps.end()) {
        return std::get<2>(iter->second).get();
    }
    // CPU -> XPU
    if (srcBackend->type() == mCPUBackend->type()) {
        std::shared_ptr<Tensor> wrapTensor(new Tensor);
        TensorUtils::copyShape(inputTensor, wrapTensor.get(), true);
        TensorUtils::adjustTensorForCompability(wrapTensor.get());
        wrapTensor->buffer().type = inputTensor->buffer().type;
        TensorUtils::getDescribe(wrapTensor.get())->quantAttr = TensorUtils::getDescribe(inputTensor)->quantAttr;
        mInputMaps.insert(std::make_pair(inputTensor, std::make_tuple(dstBackend, dstBackend, wrapTensor)));
        return wrapTensor.get();
    }
    // XPU -> CPU
    if (dstBackend->type() == mCPUBackend->type()) {
        std::shared_ptr<Tensor> wrapTensor(new Tensor);
        TensorUtils::copyShape(inputTensor, wrapTensor.get(), true);
        wrapTensor->buffer().type = inputTensor->buffer().type;
        TensorUtils::adjustTensorForCompability(wrapTensor.get());
        TensorUtils::getDescribe(wrapTensor.get())->quantAttr = TensorUtils::getDescribe(inputTensor)->quantAttr;
        mInputMaps.insert(std::make_pair(inputTensor, std::make_tuple(mCPUBackend, srcBackend, wrapTensor)));
        return wrapTensor.get();
    }
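
    // Neither source nor destination is a CPU-type backend: stage the transfer through an
    // intermediate host tensor, registering two map entries so the data moves device -> CPU -> device.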
    // XPU -> CPU -> XPU'
    std::shared_ptr<Tensor> midTensor(new Tensor);
    std::shared_ptr<Tensor> wrapTensor(new Tensor);
    TensorUtils::copyShape(inputTensor, midTensor.get(), true);
    TensorUtils::copyShape(inputTensor, wrapTensor.get(), true);
    TensorUtils::adjustTensorForCompability(wrapTensor.get());
    TensorUtils::adjustTensorForCompability(midTensor.get());
    TensorUtils::getDescribe(midTensor.get())->usage = TensorUtils::getDescribe(inputTensor)->usage;
    TensorUtils::getDescribe(midTensor.get())->quantAttr = TensorUtils::getDescribe(inputTensor)->quantAttr;
    midTensor->buffer().type  = inputTensor->buffer().type;
    wrapTensor->buffer().type = inputTensor->buffer().type;
    mInputMaps.insert(std::make_pair(inputTensor, std::make_tuple(mCPUBackend, srcBackend, midTensor)));
    mInputMaps.insert(std::make_pair(midTensor.get(), std::make_tuple(dstBackend, dstBackend, wrapTensor)));
    return wrapTensor.get();
}

ErrorCode WrapExecution::onResize(const std::vector<Tensor*>& inputs, const std::vector<Tensor*>& outputs) {
    mWrapInputTensors.resize(inputs.size());
    mInputMaps.clear();

    auto dstBackend = mExecution->backend();
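    // Redirect every input to a tensor the destination backend can read. A MEMORY_VIRTUAL input is
    // a raster descriptor: it is shallow-copied and each region's origin tensor is redirected to a
    // copy instead of the raster tensor itself.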
    for (int i = 0; i < inputs.size(); ++i) {
        auto inputTensor = inputs[i];
        auto des = TensorUtils::getDescribe(inputTensor);
        if (des->memoryType == Tensor::InsideDescribe::MEMORY_VIRTUAL) {
            MNN_ASSERT(inputs.size() == 1);
            mWrapForRaster.reset(new Tensor);
            TensorUtils::copyShape(inputTensor, mWrapForRaster.get(), true);
            mWrapForRaster->buffer().type = inputTensor->buffer().type;
            auto wrapDes = TensorUtils::getDescribe(mWrapForRaster.get());
            wrapDes->memoryType = Tensor::InsideDescribe::MEMORY_VIRTUAL;
            wrapDes->regions = des->regions;
            for (auto& r : wrapDes->regions) {
                r.origin = _getCopyTensor(r.origin);
            }
            mWrapInputTensors[i] = mWrapForRaster.get();
        } else {
            mWrapInputTensors[i] = _getCopyTensor(inputTensor);
        }
    }

    for (int i = 0; i < outputs.size(); ++i) {
        MNN_ASSERT(TensorUtils::getDescribe(outputs[i])->backend == dstBackend);
    }
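
    // Inputs marked CONSTANT are allocated with DYNAMIC_SEPERATE and copied once here when the
    // execution is static; all other copies use DYNAMIC memory and are refreshed in onExecute.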
    bool memoryAllocSuccess = true;
    // acquire memory, copy const tensors
    for (auto& iter : mInputMaps) {
        auto backend   = std::get<0>(iter.second);
        auto converter = std::get<1>(iter.second);
        auto src       = iter.first;
        auto dst       = std::get<2>(iter.second).get();

        if (TensorUtils::getDescribe(src)->usage == TensorUsage::CONSTANT && mStatic) {
            memoryAllocSuccess = backend->onAcquireBuffer(dst, Backend::DYNAMIC_SEPERATE);
            if (memoryAllocSuccess) {
                converter->onCopyBuffer(src, dst);
                TensorUtils::getDescribe(dst)->usage = TensorUtils::getDescribe(src)->usage;
            }
        } else {
            memoryAllocSuccess = backend->onAcquireBuffer(dst, Backend::DYNAMIC);
        }
    }
    if (!memoryAllocSuccess) {
        return OUT_OF_MEMORY;
    }

    // do resize
    auto result = mExecution->onResize(mWrapInputTensors, outputs);

    // release memory
    for (auto& iter : mInputMaps) {
        auto backend = std::get<0>(iter.second);
        auto dst     = std::get<2>(iter.second).get();

        if (TensorUtils::getDescribe(dst)->usage == TensorUsage::CONSTANT && mStatic) {
            backend->onReleaseBuffer(dst, Backend::DYNAMIC_SEPERATE);
        } else {
            backend->onReleaseBuffer(dst, Backend::DYNAMIC);
        }
    }
    return result;
}

ErrorCode WrapExecution::onExecute(const std::vector<Tensor*>& inputs, const std::vector<Tensor*>& outputs) {
    MNN_ASSERT(mWrapInputTensors.size() == inputs.size());

    // copy variant tensors
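    // (constants were already copied during onResize when mStatic is true, so only non-constant
    //  inputs need to be copied again on each execution)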
    for (auto& iter : mInputMaps) {
        auto converter = std::get<1>(iter.second);
        auto src       = iter.first;
        auto dst       = std::get<2>(iter.second).get();
        if (TensorUtils::getDescribe(src)->usage != TensorUsage::CONSTANT || (!mStatic)) {
            converter->onCopyBuffer(src, dst);
        }
    }
    auto code = mExecution->onExecute(mWrapInputTensors, outputs);
    return code;
}

} // namespace MNN