MNN/source/shape/SizeComputer.cpp

//
//  SizeComputer.cpp
//  MNN
//
//  Created by MNN on 2019/01/10.
//  Copyright © 2018, Alibaba Group Holding Limited
//

#include "shape/SizeComputer.hpp"
#include <stdlib.h>
#include <mutex>
#include "core/Macro.h"
#include "core/TensorUtils.hpp"
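// Uncomment to print the input/output shapes of each op after its registered
// SizeComputer has run (see SizeComputer::computeOutputSize).
// #define MNN_DEBUG_TENSOR_SIZE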
namespace MNN {
// Forward declaration only; the definition is not part of this file section.
// SizeComputerSuite::init() calls it right after allocating the registry
// (presumably to insert the per-op computers -- confirm against its definition).
void registerShapeOps();
// Global suite pointer. Null until SizeComputerSuite::init() creates the instance.
SizeComputerSuite* SizeComputerSuite::gInstance = nullptr;

// Frees every computer stored in the registry. Slots that were never filled
// hold a null pointer, and deleting a null pointer does nothing.
SizeComputerSuite::~SizeComputerSuite() {
    for (auto computer : mRegistry) {
        delete computer;
    }
}

// Creates the global suite the first time it is called; later calls return
// immediately because gInstance is already set.
// The registry gets one slot per OpType value (index 0 .. OpType_MAX), all
// empty, and registerShapeOps() is then invoked.
// NOTE(review): the gInstance check is not synchronized here; callers appear
// to be responsible for calling init() before any concurrent use -- confirm.
void SizeComputerSuite::init() {
    if (nullptr != gInstance) {
        return;
    }
    gInstance = new SizeComputerSuite;
    // assign() stores genuine null pointers in every slot, which avoids a raw
    // memset over pointer storage (and the <string.h> dependency it needs).
    gInstance->mRegistry.assign(static_cast<size_t>(OpType_MAX) + 1, nullptr);
    registerShapeOps();
}

// Returns the global suite pointer. This is nullptr until init() has created
// the instance; no lazy initialization happens here.
SizeComputerSuite* SizeComputerSuite::get() {
    return gInstance;
}

// Registers `t` as the computer for op `type` by storing it in that slot of
// mRegistry. A pointer already stored in the slot is overwritten without being
// deleted. `type` is used directly as the index with no range check; init()
// sizes the table to OpType_MAX + 1 entries.
void SizeComputerSuite::insert(SizeComputer* t, OpType type) {
    mRegistry[type] = t;
}

// Returns the computer registered for op type `name`, or nullptr when the slot
// is empty. `name` indexes mRegistry directly, without a range check.
SizeComputer* SizeComputerSuite::search(OpType name) {
    // An empty slot already contains nullptr, so the slot value is the result
    // in both the "found" and the "not found" case.
    return mRegistry[name];
}
// Default cost estimate: the element count of the first output tensor divided
// by 1024 twice. `op` and `inputs` are not consulted by this base version.
// Requires at least one output (checked with MNN_ASSERT only).
float SizeComputer::onComputeFlops(const MNN::Op* op, const std::vector<Tensor*>& inputs,
                                   const std::vector<Tensor*>& outputs) const {
    MNN_ASSERT(outputs.size() >= 1);
    auto firstOutput         = outputs[0];
    const float elementCount = static_cast<float>(firstOutput->elementSize());
    return elementCount / 1024.0f / 1024.0f;
}

// Estimates the cost of `op`, in the same unit as onComputeFlops (element
// counts divided by 1024 twice).
//
// Resolution order:
//   1. If a SizeComputer is registered for op->type(), delegate to its
//      onComputeFlops().
//   2. If the op is a While op carrying a LoopParam, sum size[0]*size[1]*size[2]
//      over all of its region commands and multiply by the loop number.
//   3. Otherwise sum the element counts of all outputs.
//
// `op` must not be null and SizeComputerSuite::init() must have run already;
// neither is checked here.
float SizeComputer::computeFlops(const MNN::Op* op, const std::vector<Tensor*>& inputs,
                                 const std::vector<Tensor*>& outputs) {
    auto computeFactory = SizeComputerSuite::get();
    auto computer       = computeFactory->search(op->type());
    if (nullptr != computer) {
        return computer->onComputeFlops(op, inputs, outputs);
    }
    if (op->type() == OpType_While && op->main_type() == OpParameter_LoopParam) {
        auto sumFlops = 0.0f;
        auto loop     = op->main_as_LoopParam();
        auto commands = loop->commands();
        // A vector field that is absent from the serialized table is returned
        // as nullptr, so a loop without commands contributes nothing.
        if (nullptr != commands) {
            auto cmdSize = commands->size();
            for (decltype(cmdSize) i = 0; i < cmdSize; ++i) {
                auto cmd = commands->GetAs<RegionCommand>(i);
                if (nullptr == cmd) {
                    continue;
                }
                auto sizeVec = cmd->size();
                // Three extents are read below; skip commands that do not provide them.
                if (nullptr == sizeVec || sizeVec->size() < 3u) {
                    continue;
                }
                auto size = sizeVec->data();
                sumFlops += (float)size[0] * (float)size[1] * (float)size[2] / 1024.0f / 1024.0f;
            }
        }
        return sumFlops * (float)loop->loopNumber();
    }
    auto sumFlops = 0.0f;
    for (auto output : outputs) {
        sumFlops += (float)output->elementSize() / 1024.0f / 1024.0f;
    }
    return sumFlops;
}

// Computes the shapes of `outputs` for `op` given `inputs`.
//
// - `op` may be nullptr, which denotes a copy op; it then goes straight to the
//   default "same shape as input" path.
// - While / If ops are rejected (returns false).
// - Any input with a negative extent makes the call return false.
// - If a SizeComputer is registered for the op type, its onComputeSize()
//   result is returned.
// - Otherwise, when there is one output or as many outputs as inputs, output i
//   receives the dims, dimension count, type and dimension format of input i.
//   If inputs[0] and outputs[0] are the same tensor nothing is copied.
//
// Returns true when the output shapes were determined, false otherwise.
bool SizeComputer::computeOutputSize(const MNN::Op* op, const std::vector<Tensor*>& inputs,
                                     const std::vector<Tensor*>& outputs) {
    auto computeFactory = SizeComputerSuite::get();
    // When op is nullptr, it means a copy op
    if (nullptr != op) {
        // Don't support compute shape for control flow op
        if (op->type() == OpType_While || op->type() == OpType_If) {
            return false;
        }
        // Check -1 input
        for (auto& t : inputs) {
            for (int i = 0; i < t->dimensions(); ++i) {
                if (t->length(i) < 0) {
                    return false;
                }
            }
        }
        auto computer = computeFactory->search(op->type());
        if (nullptr != computer) {
            bool ret = computer->onComputeSize(op, inputs, outputs);
#ifdef MNN_DEBUG_TENSOR_SIZE
            // Debug dump of the op and every input/output shape.
            if (op->name() != nullptr) {
                MNN_PRINT("===> compute shape: %s, [%s]\n", op->name()->c_str(), MNN::EnumNameOpType(op->type()));
            } else {
                MNN_PRINT("===> compute shape:[%s]\n", MNN::EnumNameOpType(op->type()));
            }
            if (inputs.size()) {
                MNN_PRINT("\tInputs:\n");
                for (auto o : inputs) {
                    MNN_PRINT("\tptr=%p, format=%s, datatype=%d;\t", o, EnumNameMNN_DATA_FORMAT(TensorUtils::getDescribe(o)->dimensionFormat), o->getType().code);
                    if (o->dimensions() == 0) {
                        MNN_PRINT("\t*Scalar*");
                    }
                    for (int i = 0; i < o->dimensions(); ++i) {
                        MNN_PRINT("%d, ", o->length(i));
                    }
                    MNN_PRINT("\n");
                }
            }
            MNN_PRINT("\tOutputs:\n");
            for (auto o : outputs) {
                MNN_PRINT("\tptr=:%p, format=%s, datatype=%d;\t",o, EnumNameMNN_DATA_FORMAT(TensorUtils::getDescribe(o)->dimensionFormat), o->getType().code);
                if (o->dimensions() == 0) {
                    MNN_PRINT("\t*Scalar*");
                }
                for (int i = 0; i < o->dimensions(); ++i) {
                    MNN_PRINT("%d, ", o->length(i));
                }
                MNN_PRINT("\n");
            }
#endif
            return ret;
        }
    }

    // Default Set to the same
    if (inputs.size() >= 1 && (outputs.size() == 1 || outputs.size() == inputs.size())) {
        if (inputs[0] == outputs[0]) {
            return true;
        }
        // The condition above guarantees outputs.size() <= inputs.size(), so
        // inputs[i] is valid for every output index.
        for (size_t i = 0; i < outputs.size(); ++i) {
            const auto& ib = inputs[i]->buffer();
            auto& ob       = outputs[i]->buffer();
            memcpy(ob.dim, ib.dim, sizeof(halide_dimension_t) * ib.dimensions);
            ob.dimensions                                         = ib.dimensions;
            ob.type                                               = ib.type;
            TensorUtils::getDescribe(outputs[i])->dimensionFormat = TensorUtils::getDescribe(inputs[i])->dimensionFormat;
        }
        return true;
    }
    // Not Support
    if (nullptr == op) {
        // A copy op has no type or name to report; never dereference the null op.
        MNN_PRINT("Can't compute size for copy op (op is nullptr)\n");
        return false;
    }
    MNN_PRINT("Can't compute size for %d, name=%s\n", op->type(), op->name() ? op->name()->c_str() : "");

    return false;
}

// Returns the indices of the inputs whose content (not just shape) is needed
// for `op`. `inputSize` is the number of inputs the op has.
//
// - op == nullptr (copy op): empty list.
// - Deconvolution whose Convolution2D common block has hasOutputShape set:
//   the last input (inputSize - 1).
// - Squeeze / Unsqueeze with more than one input, and CumSum: input 1.
// - Otherwise: the mNeedContentInputIndex of the registered computer, or an
//   empty list when none is registered.
std::vector<int> SizeComputer::needInputContent(const MNN::Op* op, int inputSize) {
    // When op is nullptr, it means a copy op
    if (nullptr == op) {
        return std::vector<int>();
    }
    const auto opType = op->type();

    // when hasOutputShape = true, deconv last is outputShape
    if (OpType_Deconvolution == opType) {
        auto conv2D = op->main_as_Convolution2D();
        if (nullptr != conv2D && nullptr != conv2D->common() && conv2D->common()->hasOutputShape()) {
            return std::vector<int>(1, inputSize - 1);
        }
    }

    const bool isSqueezeLike = (OpType_Squeeze == opType) || (OpType_Unsqueeze == opType);
    if ((isSqueezeLike && inputSize > 1) || OpType_CumSum == opType) {
        return std::vector<int>(1, 1);
    }

    auto registered = SizeComputerSuite::get()->search(opType);
    if (nullptr == registered) {
        return std::vector<int>();
    }
    return registered->mNeedContentInputIndex;
}
// Computes the broadcast shape of all `inputs` and writes it to outputs[0]
// (dimension count and per-dimension extents only; type and format are left
// untouched). `op` is not used.
//
// The input with the most dimensions provides the initial shape. Every other
// input is aligned to it on the trailing dimensions; for each aligned pair the
// extents must be equal or one of them must be 1, and the result takes the
// extent that is not 1.
//
// Returns false (after logging) when two extents are incompatible, and false
// when `inputs` or `outputs` is empty; true otherwise.
bool SizeComputer::computeBroadCastDims(const MNN::Op* op, const std::vector<Tensor*>& inputs,
                                 const std::vector<Tensor*>& outputs) {
    if (inputs.empty() || outputs.empty()) {
        return false;
    }
    // Locate the input with the highest rank (first one wins on ties).
    int maxDimensions = inputs[0]->dimensions();
    size_t maxIndex   = 0;
    for (size_t index = 1; index < inputs.size(); ++index) {
        if (inputs[index]->dimensions() > maxDimensions) {
            maxDimensions = inputs[index]->dimensions();
            maxIndex      = index;
        }
    }
    int outputDims[MNN_MAX_TENSOR_DIM];
    for (int i = 0; i < maxDimensions; i++) {
        outputDims[i] = inputs[maxIndex]->length(i);
    }
    for (size_t index = 0; index < inputs.size(); ++index) {
        if (index == maxIndex) {
            continue;
        }
        auto input1 = inputs[index];
        // Lower-rank inputs are right-aligned against the output shape.
        const int diffDimension = maxDimensions - input1->dimensions();
        for (int i = diffDimension; i < maxDimensions; i++) {
            const int dim1 = input1->buffer().dim[i - diffDimension].extent;
            if (dim1 == outputDims[i]) {
                continue;
            }
            if (dim1 != 1 && outputDims[i] != 1) {
                MNN_ERROR("Broad cast error, dim1 = %d, dim2 = %d\n", dim1, outputDims[i]);
                return false;
            }
            // Exactly one side is 1 here, so the product equals the other extent.
            outputDims[i] = outputDims[i] * dim1;
        }
    }
    auto& ob      = outputs[0]->buffer();
    ob.dimensions = maxDimensions;
    for (int i = 0; i < maxDimensions; i++) {
        ob.dim[i].extent = outputDims[i];
    }
    return true;
}
} // namespace MNN
beta 0.1.0 2019-04-17 10:49:11 +08:00			`//`
			`// SizeComputer.cpp`
			`// MNN`
			`//`
			`// Created by MNN on 2019/01/10.`
			`// Copyright © 2018, Alibaba Group Holding Limited`
			`//`

Github release 1.1.0 2020-11-05 16:41:56 +08:00			`#include "shape/SizeComputer.hpp"`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`#include <stdlib.h>`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`#include <mutex>`
Update 2019-12-27 22:16:57 +08:00			`#include "core/Macro.h"`
			`#include "core/TensorUtils.hpp"`
[MNN:Sync] Sync internal gitlab 2022-06-10 10:39:50 +08:00			`// #define MNN_DEBUG_TENSOR_SIZE`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`namespace MNN {`
fix backend/op/sizer register 2019-05-09 19:39:33 +08:00			`void registerShapeOps();`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`SizeComputerSuite* SizeComputerSuite::gInstance = nullptr;`

			`SizeComputerSuite::~SizeComputerSuite() {`
			`for (auto& iter : mRegistry) {`
[MNN:Sync] Sync internal gitlab Main Feature: 1. Add OpenCV API and Numpy API Support 2. Protobuf move into MNN 3. Add more op for torchscript convert 4. Add recompute to speed up geometry compute 5. Add ModuleBasic Test 2021-11-30 10:10:53 +08:00			`delete iter;`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`}`
			`}`

- build: - unify schema building in core and converter; - add more build script for android; - add linux build script for python; - ops impl: - add floor mod support in binary; - use eltwise impl in add/max/sub/mul binary for optimization; - remove fake double support in cast; - fix 5d support for concat; - add adjX and adjY support for batch matmul; - optimize conv2d back prop filter; - add pad mode support for conv3d; - fix bug in conv2d & conv depthwise with very small feature map; - optimize binary without broacast; - add data types support for gather; - add gather ND support; - use uint8 data type in gather v2; - add transpose support for matmul; - add matrix band part; - add dim != 4 support for padding, reshape & tensor convert; - add pad type support for pool3d; - make ops based on TensorFlow Lite quantization optional; - add all & any support for reduction; - use type in parameter as output type in reduction; - add int support for unary; - add variable weight support for conv2d; - fix conv2d depthwise weights initialization; - fix type support for transpose; - fix grad outputs count for reduce grad and reshape grad; - fix priorbox & detection output; - fix metal softmax error; - python: - add runSessionWithCallBackInfo interface; - add max nodes limit (1400) for visualization tool; - fix save error in python3; - align default dim; - convert: - add extra design for optimization; - add more post converting optimizers; - add caffe v1 weights blob support; - add cast, unary, conv transpose support for onnx model; - optimize batchnorm, conv with variable weights, prelu, reshape, slice, upsample for onnx model; - add cos/sin/atan/tan support for unary for tensorflow model; - add any/all support for reduction for tensorflow model; - add elu, conv3d, pool3d support for tensorflow model; - optimize argmax, batchnorm, concat, batch to space, conv with variable weights, prelu, slice for tensorflow model; - others: - fix size computer lock; - fix thread pool deadlock; 
- add express & parameters in express; - rewrite blitter chooser without static map; - add tests for expr; 2019-10-29 13:37:26 +08:00			`void SizeComputerSuite::init() {`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`if (nullptr != gInstance) {`
			`return;`
			`}`
			`gInstance = new SizeComputerSuite;`
[MNN:Sync] Sync internal gitlab Main Feature: 1. Add OpenCV API and Numpy API Support 2. Protobuf move into MNN 3. Add more op for torchscript convert 4. Add recompute to speed up geometry compute 5. Add ModuleBasic Test 2021-11-30 10:10:53 +08:00			`gInstance->mRegistry.resize(OpType_MAX + 1);`
			`::memset(gInstance->mRegistry.data(), 0, gInstance->mRegistry.size() * sizeof(SizeComputer*));`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`registerShapeOps();`
- build: - unify schema building in core and converter; - add more build script for android; - add linux build script for python; - ops impl: - add floor mod support in binary; - use eltwise impl in add/max/sub/mul binary for optimization; - remove fake double support in cast; - fix 5d support for concat; - add adjX and adjY support for batch matmul; - optimize conv2d back prop filter; - add pad mode support for conv3d; - fix bug in conv2d & conv depthwise with very small feature map; - optimize binary without broacast; - add data types support for gather; - add gather ND support; - use uint8 data type in gather v2; - add transpose support for matmul; - add matrix band part; - add dim != 4 support for padding, reshape & tensor convert; - add pad type support for pool3d; - make ops based on TensorFlow Lite quantization optional; - add all & any support for reduction; - use type in parameter as output type in reduction; - add int support for unary; - add variable weight support for conv2d; - fix conv2d depthwise weights initialization; - fix type support for transpose; - fix grad outputs count for reduce grad and reshape grad; - fix priorbox & detection output; - fix metal softmax error; - python: - add runSessionWithCallBackInfo interface; - add max nodes limit (1400) for visualization tool; - fix save error in python3; - align default dim; - convert: - add extra design for optimization; - add more post converting optimizers; - add caffe v1 weights blob support; - add cast, unary, conv transpose support for onnx model; - optimize batchnorm, conv with variable weights, prelu, reshape, slice, upsample for onnx model; - add cos/sin/atan/tan support for unary for tensorflow model; - add any/all support for reduction for tensorflow model; - add elu, conv3d, pool3d support for tensorflow model; - optimize argmax, batchnorm, concat, batch to space, conv with variable weights, prelu, slice for tensorflow model; - others: - fix size computer lock; - fix thread pool deadlock; 
- add express & parameters in express; - rewrite blitter chooser without static map; - add tests for expr; 2019-10-29 13:37:26 +08:00			`}`

			`SizeComputerSuite* SizeComputerSuite::get() {`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`return gInstance;`
			`}`

			`void SizeComputerSuite::insert(SizeComputer* t, OpType type) {`
[MNN:Sync] Sync internal gitlab Main Feature: 1. Add OpenCV API and Numpy API Support 2. Protobuf move into MNN 3. Add more op for torchscript convert 4. Add recompute to speed up geometry compute 5. Add ModuleBasic Test 2021-11-30 10:10:53 +08:00			`mRegistry[type] = t;`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`}`

			`SizeComputer* SizeComputerSuite::search(OpType name) {`
[MNN:Sync] Sync internal gitlab Main Feature: 1. Add OpenCV API and Numpy API Support 2. Protobuf move into MNN 3. Add more op for torchscript convert 4. Add recompute to speed up geometry compute 5. Add ModuleBasic Test 2021-11-30 10:10:53 +08:00			`auto iter = mRegistry[name];`
			`if (iter == nullptr) {`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`return nullptr;`
			`}`
[MNN:Sync] Sync internal gitlab Main Feature: 1. Add OpenCV API and Numpy API Support 2. Protobuf move into MNN 3. Add more op for torchscript convert 4. Add recompute to speed up geometry compute 5. Add ModuleBasic Test 2021-11-30 10:10:53 +08:00			`return iter;`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`}`
			`float SizeComputer::onComputeFlops(const MNN::Op* op, const std::vector<Tensor*>& inputs,`
fix backend/op/sizer register 2019-05-09 19:39:33 +08:00			`const std::vector<Tensor*>& outputs) const {`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`MNN_ASSERT(outputs.size() >= 1);`
			`return (float)outputs[0]->elementSize() / 1024.0f / 1024.0f;`
			`}`
[MNN:Sync] Sync internal Gitlab 2021-04-08 15:34:23 +08:00
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`float SizeComputer::computeFlops(const MNN::Op* op, const std::vector<Tensor*>& inputs,`
			`const std::vector<Tensor*>& outputs) {`
- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`auto computeFactory = SizeComputerSuite::get();`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`auto computer = computeFactory->search(op->type());`
- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`if (nullptr != computer) {`
			`return computer->onComputeFlops(op, inputs, outputs);`
			`}`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`if (op->type() == OpType_While && op->main_type() == OpParameter_LoopParam) {`
			`auto sumFlops = 0.0f;`
			`auto loop = op->main_as_LoopParam();`
			`auto cmdSize = loop->commands()->size();`
			`for (int i=0; i<cmdSize; ++i) {`
			`auto cmd = loop->commands()->GetAs<RegionCommand>(i);`
			`auto size = cmd->size()->data();`
			`sumFlops += (float)size[0] * (float)size[1] * (float)size[2] / 1024.0f / 1024.0f;`
			`}`
			`return sumFlops * (float)loop->loopNumber();`
			`}`
Update 2019-12-27 22:16:57 +08:00			`auto sumFlops = 0.0f;`
			`for (auto output : outputs) {`
			`sumFlops += (float)output->elementSize() / 1024.0f / 1024.0f;`
			`}`
			`return sumFlops;`
- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`}`

beta 0.1.0 2019-04-17 10:49:11 +08:00			`bool SizeComputer::computeOutputSize(const MNN::Op* op, const std::vector<Tensor*>& inputs,`
			`const std::vector<Tensor*>& outputs) {`
			`auto computeFactory = SizeComputerSuite::get();`
			`// When op is nullptr, it means a copy op`
			`if (nullptr != op) {`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`// Don't support compute shape for control flow op`
			`if (op->type() == OpType_While \|\| op->type() == OpType_If) {`
			`return false;`
			`}`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`// Check -1 input`
			`for (auto& t : inputs) {`
			`for (int i=0; i < t->dimensions(); ++i) {`
			`if (t->length(i) < 0) {`
			`return false;`
			`}`
			`}`
			`}`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`auto computer = computeFactory->search(op->type());`
			`if (nullptr != computer) {`
			`bool ret = computer->onComputeSize(op, inputs, outputs);`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`#ifdef MNN_DEBUG_TENSOR_SIZE`
[Sync] Sync Internal 2.1.2 2022-09-30 10:02:52 +08:00
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`if (op->name() != nullptr) {`
[MNN:Sync] Sync internal gitlab 2022-06-10 10:39:50 +08:00			`MNN_PRINT("===> compute shape: %s, [%s]\n", op->name()->c_str(), MNN::EnumNameOpType(op->type()));`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`} else {`
[MNN:Sync] Sync internal gitlab 2022-06-10 10:39:50 +08:00			`MNN_PRINT("===> compute shape:[%s]\n", MNN::EnumNameOpType(op->type()));`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`}`
			`if (inputs.size()) {`
[MNN:Sync] Sync internal gitlab 2022-06-10 10:39:50 +08:00			`MNN_PRINT("\tInputs:\n");`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`for (auto o : inputs) {`
[Sync] Sync Internal 2.1.2 2022-09-30 10:02:52 +08:00			`MNN_PRINT("\tptr=%p, format=%s, datatype=%d;\t", o, EnumNameMNN_DATA_FORMAT(TensorUtils::getDescribe(o)->dimensionFormat), o->getType().code);`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`if (o->dimensions() == 0) {`
			`MNN_PRINT("\tScalar");`
			`}`
			`for (int i = 0; i < o->dimensions(); ++i) {`
			`MNN_PRINT("%d, ", o->length(i));`
			`}`
			`MNN_PRINT("\n");`
			`}`
			`}`
[MNN:Sync] Sync internal gitlab 2022-06-10 10:39:50 +08:00			`MNN_PRINT("\tOutputs:\n");`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`for (auto o : outputs) {`
[Sync] Sync Internal 2.1.2 2022-09-30 10:02:52 +08:00			`MNN_PRINT("\tptr=:%p, format=%s, datatype=%d;\t",o, EnumNameMNN_DATA_FORMAT(TensorUtils::getDescribe(o)->dimensionFormat), o->getType().code);`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`if (o->dimensions() == 0) {`
			`MNN_PRINT("\tScalar");`
			`}`
			`for (int i = 0; i < o->dimensions(); ++i) {`
			`MNN_PRINT("%d, ", o->length(i));`
			`}`
			`MNN_PRINT("\n");`
			`}`
[Sync] Sync Internal 2.1.2 2022-09-30 10:02:52 +08:00			`// }`

Github release 1.1.0 2020-11-05 16:41:56 +08:00			`#endif`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`return ret;`
			`}`
			`}`

			`// Default Set to the same`
[Sync] Sync Internal 2.2.2 2022-11-18 22:35:31 +08:00			`if (inputs.size() >= 1 && (outputs.size() == 1 \|\| outputs.size() == inputs.size())) {`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`if (inputs[0] == outputs[0]) {`
			`return true;`
			`}`
[Sync] Sync Internal 2.2.2 2022-11-18 22:35:31 +08:00			`for (int i=0; i<outputs.size(); ++i) {`
			`const auto& ib = inputs[i]->buffer();`
			`auto& ob = outputs[i]->buffer();`
			`memcpy(ob.dim, ib.dim, sizeof(halide_dimension_t) * ib.dimensions);`
			`ob.dimensions = ib.dimensions;`
			`ob.type = ib.type;`
			`TensorUtils::getDescribe(outputs[i])->dimensionFormat = TensorUtils::getDescribe(inputs[i])->dimensionFormat;`
			`}`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`return true;`
			`}`
			`// Not Support`
Update 2019-12-27 22:16:57 +08:00			`MNN_PRINT("Can't compute size for %d, name=%s\n", op->type(), op->name() ? op->name()->c_str() : "");`
beta 0.1.0 2019-04-17 10:49:11 +08:00
			`return false;`
			`}`
beta 0.2.0.8 - add NaN check-up - add quantification support for ScaleAdd Op - add binary to eltwise optimization - add console logs for quantization tool - better document for quantization tool - replace redundant dimension flags with dimension format - optimize performance of TensorFlow Lite Quantized Convolution - fix axis support for ONNX softmax - fix get performance compile error on Windows 2019-08-22 20:13:46 +08:00
[MNN:Sync] Sync internal Gitlab 2021-04-08 15:34:23 +08:00			`std::vector<int> SizeComputer::needInputContent(const MNN::Op* op, int inputSize) {`
beta 0.2.0.8 - add NaN check-up - add quantification support for ScaleAdd Op - add binary to eltwise optimization - add console logs for quantization tool - better document for quantization tool - replace redundant dimension flags with dimension format - optimize performance of TensorFlow Lite Quantized Convolution - fix axis support for ONNX softmax - fix get performance compile error on Windows 2019-08-22 20:13:46 +08:00			`auto computeFactory = SizeComputerSuite::get();`
			`// When op is nullptr, it means a copy op`
			`if (nullptr != op) {`
[MNN:Sync] Sync internal Gitlab 2021-04-08 15:34:23 +08:00			`// when hasOutputShape = true, deconv last is outputShape`
			`if (op->type() == OpType_Deconvolution && op->main_as_Convolution2D() && op->main_as_Convolution2D()->common()) {`
			`if (op->main_as_Convolution2D()->common()->hasOutputShape()) {`
			`return std::vector<int>{ inputSize - 1 };`
			`}`
			`}`
[MNN:Sync] Sync internal Gitlab 2021-09-18 15:52:30 +08:00			`if (inputSize > 1 && (op->type() == OpType_Squeeze \|\| op->type() == OpType_Unsqueeze)) {`
			`return std::vector<int>{1};`
			`}`
[MNN:Sync] Sync internal gitlab 2022-01-04 10:50:40 +08:00			`if (op->type() == OpType_CumSum) {`
			`return std::vector<int>{1};`
			`}`
beta 0.2.0.8 - add NaN check-up - add quantification support for ScaleAdd Op - add binary to eltwise optimization - add console logs for quantization tool - better document for quantization tool - replace redundant dimension flags with dimension format - optimize performance of TensorFlow Lite Quantized Convolution - fix axis support for ONNX softmax - fix get performance compile error on Windows 2019-08-22 20:13:46 +08:00			`auto computer = computeFactory->search(op->type());`
			`if (nullptr != computer) {`
			`return computer->mNeedContentInputIndex;`
			`}`
			`}`
			`return std::vector<int>{};`
			`}`
[MNN:Sync] Sync internal Gitlab 2021-04-08 15:34:23 +08:00			`bool SizeComputer::computeBroadCastDims(const MNN::Op* op, const std::vector<Tensor*>& inputs,`
			`const std::vector<Tensor*>& outputs) {`
			`int maxDimensions = inputs[0]->dimensions();`
			`int maxIndex = 0;`
			`for (int index=1; index < inputs.size(); ++index) {`
			`if (inputs[index]->dimensions() > maxDimensions) {`
			`maxDimensions = inputs[index]->dimensions();`
			`maxIndex = index;`
			`}`
			`}`
			`int outputDims[MNN_MAX_TENSOR_DIM];`
			`for (int i = 0; i < maxDimensions; i++) {`
			`outputDims[i] = inputs[maxIndex]->length(i);`
			`}`
			`for (int index=0; index < inputs.size(); ++index) {`
			`if (index == maxIndex) {`
			`continue;`
			`}`
			`auto input1 = inputs[index];`
			`auto input0 = inputs[maxIndex];`
			`const int diffDimension = maxDimensions - input1->dimensions();`
			`for (int i = diffDimension; i < maxDimensions; i++) {`
			`const int input1Index = i - diffDimension;`
			`int dim1 = input1->buffer().dim[input1Index].extent;`
			`if (dim1 != outputDims[i] && (dim1 != 1 && outputDims[i] != 1)) {`
[MNN:Sync] Sync internal gitlab 2021-04-16 14:50:43 +08:00			`MNN_ERROR("Broad cast error, dim1 = %d, dim2 = %d\n", dim1, outputDims[i]);`
[MNN:Sync] Sync internal Gitlab 2021-04-08 15:34:23 +08:00			`return false;`
			`}`
			`if (dim1 == outputDims[i]) {`
			`continue;`
			`}`
			`if (dim1 != outputDims[i] && (dim1 == 1 \|\| outputDims[i] == 1)) {`
			`outputDims[i] = outputDims[i] * dim1;`
			`} else {`
			`return false;`
			`}`
			`}`
			`}`
			`auto& ob = outputs[0]->buffer();`
			`ob.dimensions = maxDimensions;`
			`for (int i = 0; i < maxDimensions; i++) {`
			`ob.dim[i].extent = outputDims[i];`
			`}`
			`return true;`
			`}`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`} // namespace MNN`