2019-04-17 10:49:11 +08:00
|
|
|
//
|
|
|
|
// ShapeBinaryOp.cpp
|
|
|
|
// MNN
|
|
|
|
//
|
|
|
|
// Created by MNN on 2019/01/10.
|
|
|
|
// Copyright © 2018, Alibaba Group Holding Limited
|
|
|
|
//
|
|
|
|
|
|
|
|
#include "Macro.h"
|
|
|
|
#include "SizeComputer.hpp"
|
|
|
|
namespace MNN {
|
|
|
|
class BinaryOpComputer : public SizeComputer {
|
|
|
|
public:
|
- dynamic computation graph (beta)
- add supports (/express)
- add tests
- add benchmarks with it (/benchmark/exprModels)
- Python
- MNN engine and tools were submitted to pip
- available on Windows/macOS/Linux
- Engine/Converter
- add supports for each op benchmarking
- refactor optimizer by separating steps
- CPU
- add supports for Conv3D, Pool3D, ELU, ReverseSequence
- fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf
- OpenCL
- add half transform in CPU
- add broadcast supports for binary
- optimize Conv2D, Reshape, Eltwise, Gemm, etc.
- OpenGL
- add sub, real div supports for binary
- add supports for unary
- optimize Conv2D, Reshape
- Vulkan
- add max supports for eltwise
- Metal
- fix metallib missing problem
- Train/Quantization
- use express to refactor training codes
2019-09-26 21:02:07 +08:00
|
|
|
static bool outputBool(int operation) {
|
|
|
|
if (operation == BinaryOpOperation_GREATER_EQUAL) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
if (operation == BinaryOpOperation_GREATER) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
if (operation == BinaryOpOperation_LESS) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
if (operation == BinaryOpOperation_LESS_EQUAL) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
if (operation == BinaryOpOperation_EQUAL) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
2019-08-15 17:30:39 +08:00
|
|
|
virtual bool onComputeSize(const Op* op, const std::vector<Tensor*>& inputs,
|
2019-04-17 10:49:11 +08:00
|
|
|
const std::vector<Tensor*>& outputs) const override {
|
|
|
|
MNN_ASSERT(2 == inputs.size());
|
|
|
|
MNN_ASSERT(1 == outputs.size());
|
2019-08-15 17:30:39 +08:00
|
|
|
// set output type & format
|
|
|
|
auto input0 = inputs[0], input1 = inputs[1], output = outputs[0];
|
|
|
|
auto &buffer = output->buffer();
|
2019-04-17 10:49:11 +08:00
|
|
|
const auto opType = op->main_as_BinaryOp()->opType();
|
- dynamic computation graph (beta)
- add supports (/express)
- add tests
- add benchmarks with it (/benchmark/exprModels)
- Python
- MNN engine and tools were submitted to pip
- available on Windows/macOS/Linux
- Engine/Converter
- add supports for each op benchmarking
- refactor optimizer by separating steps
- CPU
- add supports for Conv3D, Pool3D, ELU, ReverseSequence
- fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf
- OpenCL
- add half transform in CPU
- add broadcast supports for binary
- optimize Conv2D, Reshape, Eltwise, Gemm, etc.
- OpenGL
- add sub, real div supports for binary
- add supports for unary
- optimize Conv2D, Reshape
- Vulkan
- add max supports for eltwise
- Metal
- fix metallib missing problem
- Train/Quantization
- use express to refactor training codes
2019-09-26 21:02:07 +08:00
|
|
|
if (outputBool(opType)) {
|
2019-08-15 17:30:39 +08:00
|
|
|
buffer.type = halide_type_of<int32_t>();
|
2019-04-17 10:49:11 +08:00
|
|
|
} else {
|
2019-08-15 17:30:39 +08:00
|
|
|
buffer.type = input0->getType();
|
2019-04-17 10:49:11 +08:00
|
|
|
}
|
2019-08-15 17:30:39 +08:00
|
|
|
TensorUtils::getDescribe(output)->dimensionFormat = TensorUtils::getDescribe(input0)->dimensionFormat;
|
- dynamic computation graph (beta)
- add supports (/express)
- add tests
- add benchmarks with it (/benchmark/exprModels)
- Python
- MNN engine and tools were submitted to pip
- available on Windows/macOS/Linux
- Engine/Converter
- add supports for each op benchmarking
- refactor optimizer by separating steps
- CPU
- add supports for Conv3D, Pool3D, ELU, ReverseSequence
- fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf
- OpenCL
- add half transform in CPU
- add broadcast supports for binary
- optimize Conv2D, Reshape, Eltwise, Gemm, etc.
- OpenGL
- add sub, real div supports for binary
- add supports for unary
- optimize Conv2D, Reshape
- Vulkan
- add max supports for eltwise
- Metal
- fix metallib missing problem
- Train/Quantization
- use express to refactor training codes
2019-09-26 21:02:07 +08:00
|
|
|
if (input0->dimensions() < input1->dimensions()) {
|
|
|
|
auto temp = input0;
|
|
|
|
input0 = input1;
|
|
|
|
input1 = temp;
|
|
|
|
}
|
2019-04-17 10:49:11 +08:00
|
|
|
|
2019-08-15 17:30:39 +08:00
|
|
|
// if scalar input -> just copy the other
|
|
|
|
if (input1->dimensions() == 0) {
|
|
|
|
TensorUtils::copyShape(input0, output);
|
|
|
|
return true;
|
|
|
|
}
|
- dynamic computation graph (beta)
- add supports (/express)
- add tests
- add benchmarks with it (/benchmark/exprModels)
- Python
- MNN engine and tools were submitted to pip
- available on Windows/macOS/Linux
- Engine/Converter
- add supports for each op benchmarking
- refactor optimizer by separating steps
- CPU
- add supports for Conv3D, Pool3D, ELU, ReverseSequence
- fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf
- OpenCL
- add half transform in CPU
- add broadcast supports for binary
- optimize Conv2D, Reshape, Eltwise, Gemm, etc.
- OpenGL
- add sub, real div supports for binary
- add supports for unary
- optimize Conv2D, Reshape
- Vulkan
- add max supports for eltwise
- Metal
- fix metallib missing problem
- Train/Quantization
- use express to refactor training codes
2019-09-26 21:02:07 +08:00
|
|
|
|
2019-08-15 17:30:39 +08:00
|
|
|
// else if inputs shape equals -> just copy any one
|
|
|
|
bool sameShape = input0->elementSize() == input1->elementSize();
|
|
|
|
if (sameShape) {
|
|
|
|
TensorUtils::copyShape(input0, output);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
// else if broadcast NOT supported -> failed
|
- dynamic computation graph (beta)
- add supports (/express)
- add tests
- add benchmarks with it (/benchmark/exprModels)
- Python
- MNN engine and tools were submitted to pip
- available on Windows/macOS/Linux
- Engine/Converter
- add supports for each op benchmarking
- refactor optimizer by separating steps
- CPU
- add supports for Conv3D, Pool3D, ELU, ReverseSequence
- fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf
- OpenCL
- add half transform in CPU
- add broadcast supports for binary
- optimize Conv2D, Reshape, Eltwise, Gemm, etc.
- OpenGL
- add sub, real div supports for binary
- add supports for unary
- optimize Conv2D, Reshape
- Vulkan
- add max supports for eltwise
- Metal
- fix metallib missing problem
- Train/Quantization
- use express to refactor training codes
2019-09-26 21:02:07 +08:00
|
|
|
const int maxDimensions = input0->dimensions();
|
|
|
|
const int diffDimension = input0->dimensions() - input1->dimensions();
|
2019-08-15 17:30:39 +08:00
|
|
|
|
|
|
|
// else broadcast
|
- dynamic computation graph (beta)
- add supports (/express)
- add tests
- add benchmarks with it (/benchmark/exprModels)
- Python
- MNN engine and tools were submitted to pip
- available on Windows/macOS/Linux
- Engine/Converter
- add supports for each op benchmarking
- refactor optimizer by separating steps
- CPU
- add supports for Conv3D, Pool3D, ELU, ReverseSequence
- fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf
- OpenCL
- add half transform in CPU
- add broadcast supports for binary
- optimize Conv2D, Reshape, Eltwise, Gemm, etc.
- OpenGL
- add sub, real div supports for binary
- add supports for unary
- optimize Conv2D, Reshape
- Vulkan
- add max supports for eltwise
- Metal
- fix metallib missing problem
- Train/Quantization
- use express to refactor training codes
2019-09-26 21:02:07 +08:00
|
|
|
for (int i = maxDimensions-1; i >=0 ; --i) {
|
|
|
|
auto input0Length = input0->length(i);
|
|
|
|
auto input1Length = 1;
|
|
|
|
if (i >= diffDimension) {
|
|
|
|
input1Length = input1->length(i-diffDimension);
|
|
|
|
}
|
|
|
|
if (input0Length != input1Length && input1Length != 1 && input0Length != 1) {
|
|
|
|
MNN_PRINT("%d, %d\n", input1Length, input0Length);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
buffer.dim[i].extent = std::max(input0Length, input1Length);
|
2019-08-15 17:30:39 +08:00
|
|
|
}
|
|
|
|
buffer.dimensions = maxDimensions;
|
2019-04-17 10:49:11 +08:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
// Associates BinaryOpComputer with OpType_BinaryOp for shape inference.
// NOTE(review): presumably REGISTER_SHAPE defines a static registrar object; confirm in SizeComputer.hpp.
REGISTER_SHAPE(BinaryOpComputer, OpType_BinaryOp);
|
|
|
|
} // namespace MNN
|