MNN/source/backend/opengl/GLBinary.cpp

//
//  GLBinary.cpp
//  MNN
//
//  Created by MNN on 2019/01/31.
//  Copyright © 2018, Alibaba Group Holding Limited
//

#include "backend/opengl/GLBinary.hpp"
#include <sstream>
#include "AllShader.hpp"
#include "backend/opengl/GLBackend.hpp"
#include "core/Macro.h"
#include "core/TensorUtils.hpp"

namespace MNN {
namespace OpenGL {
/**
 * Creates a binary-op execution attached to backend `bn`.
 *
 * Only the operation type stored in the op's BinaryOp parameter is read and
 * remembered in mType; `inputs` is not used during construction.
 *
 * @param inputs input tensors of the op (unused here).
 * @param op     op description; its main table is read as a BinaryOp.
 * @param bn     backend forwarded to the Execution base class.
 */
GLBinary::GLBinary(const std::vector<Tensor *> &inputs, const Op *op, Backend *bn) : Execution(bn) {
    const auto *binaryParam = op->main_as_BinaryOp();
    mType                   = binaryParam->opType();
}

// Nothing is released by hand in this destructor, so the compiler-generated one suffices.
GLBinary::~GLBinary() = default;

/**
 * Picks the shader variant for the configured binary operation and asks the
 * backend for the matching program.
 *
 * The shared binary shader source is specialised by appending a
 * "#define <OP>" line to the prefix list; the local work-group size
 * (8, 8, 1) is set up through setLocalSize before that.
 *
 * @param inputs  input tensors (not inspected here).
 * @param outputs output tensors (not inspected here).
 * @return NO_ERROR when a program was requested for a supported operation;
 *         NOT_SUPPORT when mType has no shader variant. Previously this case
 *         also returned NO_ERROR, leaving mProgram unset for onExecute to
 *         dereference.
 */
ErrorCode GLBinary::onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) {
    std::vector<std::string> prefix;
    setLocalSize(prefix, mLocalSize, 8, 8, 1);

    // Map the operation type to its program cache key and shader define.
    const char *programName = nullptr;
    const char *opDefine    = nullptr;
    switch (mType) {
        case BinaryOpOperation_ADD:
            programName = "binary_add";
            opDefine    = "#define ADD";
            break;
        case BinaryOpOperation_MUL:
            programName = "binary_mul";
            opDefine    = "#define MUL";
            break;
        case BinaryOpOperation_SUB:
            programName = "binary_sub";
            opDefine    = "#define SUB";
            break;
        case BinaryOpOperation_REALDIV:
            programName = "binary_realdiv";
            opDefine    = "#define REALDIV";
            break;
        default:
            MNN_PRINT("Not Supported Binary Operation: %d\n", mType);
            // Report the failure instead of pretending the resize succeeded.
            return NOT_SUPPORT;
    }

    prefix.push_back(opDefine);
    mProgram = static_cast<GLBackend *>(backend())->getProgram(programName, glsl_binary_glsl, prefix);
    return NO_ERROR;
}

/**
 * Runs the element-wise binary shader over the two inputs.
 *
 * Bindings used by the dispatch (as set below):
 *   - image unit 0      : output texture, write-only, layered
 *   - uniform location 1: sampler for input 0 (texture unit 0)
 *   - uniform location 2: sampler for input 1 (texture unit 1)
 *   - uniform location 3: ivec4 (width, height, channel/4 rounded up, 1)
 *
 * @param inputs  exactly two tensors; sizes are taken from inputs[0] only.
 * @param outputs exactly one tensor receiving the result.
 * @return NO_ERROR after the dispatch has been issued; NOT_SUPPORT when no
 *         program is available (onResize did not build one) or the tensor
 *         counts are not 2 inputs / 1 output.
 */
ErrorCode GLBinary::onExecute(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) {
    MNN_ASSERT(2 == inputs.size());
    MNN_ASSERT(1 == outputs.size());

    // Runtime guards: the asserts above may be compiled out, and dereferencing
    // an unset program or indexing past the end of the vectors must be avoided.
    if (!mProgram || inputs.size() != 2 || outputs.size() != 1) {
        return NOT_SUPPORT;
    }

    auto input0 = inputs[0];
    auto input1 = inputs[1];
    auto output = outputs[0];

    MNN_ASSERT(input0->getType().code == halide_type_float);
    MNN_ASSERT(input0->dimensions() == input1->dimensions());

    // Only height, width and channel of the formatted shape (indices 1..3) drive the dispatch.
    const std::vector<int> inputShape = tensorShapeFormat(input0);
    const int ih   = inputShape.at(1);
    const int iw   = inputShape.at(2);
    const int ic   = inputShape.at(3);
    const int ic_4 = UP_DIV(ic, 4);

    auto glBackend = static_cast<GLBackend *>(backend());

    mProgram->useProgram();
    glBindImageTexture(0, output->deviceId(), 0, GL_TRUE, 0, GL_WRITE_ONLY, glBackend->getTextrueFormat());
    {
        int texId = 0;
        glActiveTexture(GL_TEXTURE0 + texId);
        glUniform1i(1, texId);
        glBindTexture(GL_TEXTURE_3D, input0->deviceId());
        OPENGL_CHECK_ERROR;
    }
    {
        int texId = 1;
        glActiveTexture(GL_TEXTURE0 + texId);
        glUniform1i(2, texId);
        glBindTexture(GL_TEXTURE_3D, input1->deviceId());
        OPENGL_CHECK_ERROR;
    }
    glUniform4i(3, iw, ih, ic_4, 1);
    OPENGL_CHECK_ERROR;

    // One work group per mLocalSize-sized tile, rounded up on every axis.
    glBackend->compute(UP_DIV(iw, mLocalSize[0]), UP_DIV(ih, mLocalSize[1]), UP_DIV(ic_4, mLocalSize[2]));

    return NO_ERROR;
}

/**
 * Creator that builds GLBinary executions for binary ops.
 *
 * onCreate returns nullptr when this implementation cannot run the op:
 *   - fewer than two inputs,
 *   - an operation type other than ADD / MUL / SUB / REALDIV (the only
 *     variants GLBinary builds a shader for),
 *   - inputs whose dimension count or per-axis lengths differ (broadcasting
 *     is not supported).
 */
class BinaryCreator : public GLBackend::Creator {
public:
    virtual ~BinaryCreator() = default;

    /**
     * @param inputs  input tensors of the op; all must have identical shapes.
     * @param outputs output tensors (not inspected here).
     * @param op      op description, read as a BinaryOp.
     * @param backend backend the execution is created for.
     * @return a newly allocated GLBinary, or nullptr when the op is not supported.
     */
    virtual Execution *onCreate(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs,
                                const MNN::Op *op, Backend *backend) const override {
        MNN_ASSERT(inputs.size() > 1);
        // The assert may be compiled out; never index an input that is not there.
        if (inputs.size() < 2) {
            return nullptr;
        }

        // Reject operation types GLBinary has no shader variant for, so that
        // an execution which cannot run is never handed out.
        const auto *binaryParam = op->main_as_BinaryOp();
        if (nullptr == binaryParam) {
            return nullptr;
        }
        switch (binaryParam->opType()) {
            case BinaryOpOperation_ADD:
            case BinaryOpOperation_MUL:
            case BinaryOpOperation_SUB:
            case BinaryOpOperation_REALDIV:
                break;
            default:
                MNN_PRINT("Not Supported Binary Operation: %d\n", static_cast<int>(binaryParam->opType()));
                return nullptr;
        }

        auto input0    = inputs[0];
        const int dim  = input0->dimensions();
        // Broadcasting is not supported: every input must match inputs[0] exactly.
        for (size_t i = 1; i < inputs.size(); ++i) {
            auto input = inputs[i];
            if (dim != input->dimensions()) {
                MNN_PRINT("dimensions : [%d, %d] \n", input0->dimensions(), input->dimensions());
                MNN_PRINT("opengl binary don't support broatcast !!! \n");
                return nullptr;
            }
            for (int l = 0; l < dim; ++l) {
                if (input0->length(l) != input->length(l)) {
                    MNN_PRINT("length : [%d, %d] \n", input0->length(l), input->length(l));
                    MNN_PRINT("opengl binary don't support broatcast !!! \n");
                    return nullptr;
                }
            }
        }

        return new GLBinary(inputs, op, backend);
    }
};
// Namespace-scope registrar object constructed with OpType_BinaryOp. Presumably its constructor
// registers a BinaryCreator with the OpenGL backend for that op type -- confirm in GLCreatorRegister.
GLCreatorRegister<BinaryCreator> __binary_op(OpType_BinaryOp);
} // namespace OpenGL
} // namespace MNN
beta 0.2.0.1 - support both armv7/arm64 in podspec (pod version >= 1.5.0 required) - refactor neg axis support - fix memory overlap in de-conv - fix CONVOLUTION_TILED_NUMBER spell error - fix few warnings - add binary / interp / permute / relu / reshape / softmax support and optimize conv for OpenGL backend - add clean in nmake build script 2019-06-24 11:32:41 +08:00			`//`
			`// GLBinary.cpp`
			`// MNN`
			`//`
			`// Created by MNN on 2019/01/31.`
			`// Copyright © 2018, Alibaba Group Holding Limited`
			`//`

Sync. Fix OpenGL related building issues. Build the whole suite on Android CI (#580) * Sync code with latest internal version * Update CMake * Fix logging issues * Fix OpenGL Building * Bump CMakeLists version. Update Podspec * Update MetalLib Lookup logic * Fix Windows Build 2020-01-15 13:33:47 +08:00			`#include "backend/opengl/GLBinary.hpp"`
beta 0.2.0.1 - support both armv7/arm64 in podspec (pod version >= 1.5.0 required) - refactor neg axis support - fix memory overlap in de-conv - fix CONVOLUTION_TILED_NUMBER spell error - fix few warnings - add binary / interp / permute / relu / reshape / softmax support and optimize conv for OpenGL backend - add clean in nmake build script 2019-06-24 11:32:41 +08:00			`#include <sstream>`
Sync. Fix OpenGL related building issues. Build the whole suite on Android CI (#580) * Sync code with latest internal version * Update CMake * Fix logging issues * Fix OpenGL Building * Bump CMakeLists version. Update Podspec * Update MetalLib Lookup logic * Fix Windows Build 2020-01-15 13:33:47 +08:00			`#include "AllShader.hpp"`
Update 2019-12-27 22:16:57 +08:00			`#include "backend/opengl/GLBackend.hpp"`
			`#include "core/Macro.h"`
			`#include "core/TensorUtils.hpp"`
beta 0.2.0.1 - support both armv7/arm64 in podspec (pod version >= 1.5.0 required) - refactor neg axis support - fix memory overlap in de-conv - fix CONVOLUTION_TILED_NUMBER spell error - fix few warnings - add binary / interp / permute / relu / reshape / softmax support and optimize conv for OpenGL backend - add clean in nmake build script 2019-06-24 11:32:41 +08:00
			`namespace MNN {`
			`namespace OpenGL {`
			`GLBinary::GLBinary(const std::vector<Tensor > &inputs, const Op op, Backend *bn) : Execution(bn) {`
			`mType = op->main_as_BinaryOp()->opType();`
			`}`

			`GLBinary::~GLBinary() {`
Update 2019-12-27 22:16:57 +08:00
beta 0.2.0.1 - support both armv7/arm64 in podspec (pod version >= 1.5.0 required) - refactor neg axis support - fix memory overlap in de-conv - fix CONVOLUTION_TILED_NUMBER spell error - fix few warnings - add binary / interp / permute / relu / reshape / softmax support and optimize conv for OpenGL backend - add clean in nmake build script 2019-06-24 11:32:41 +08:00			`}`
Update 2019-12-27 22:16:57 +08:00
beta 0.2.0.1 - support both armv7/arm64 in podspec (pod version >= 1.5.0 required) - refactor neg axis support - fix memory overlap in de-conv - fix CONVOLUTION_TILED_NUMBER spell error - fix few warnings - add binary / interp / permute / relu / reshape / softmax support and optimize conv for OpenGL backend - add clean in nmake build script 2019-06-24 11:32:41 +08:00			`ErrorCode GLBinary::onResize(const std::vector<Tensor > &inputs, const std::vector<Tensor > &outputs) {`
			`std::vector<std::string> prefix;`
			`setLocalSize(prefix, mLocalSize, 8, 8, 1);`
			`if (BinaryOpOperation_ADD == mType) {`
			`prefix.push_back("#define ADD");`
			`mProgram = ((GLBackend *)backend())->getProgram("binary_add", glsl_binary_glsl, prefix);`
			`}else if(BinaryOpOperation_MUL == mType) {`
			`prefix.push_back("#define MUL");`
- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`mProgram = ((GLBackend *)backend())->getProgram("binary_mul", glsl_binary_glsl, prefix);`
			`}else if(BinaryOpOperation_SUB == mType) {`
			`prefix.push_back("#define SUB");`
			`mProgram = ((GLBackend *)backend())->getProgram("binary_sub", glsl_binary_glsl, prefix);`
			`}else if(BinaryOpOperation_REALDIV == mType) {`
			`prefix.push_back("#define REALDIV");`
			`mProgram = ((GLBackend *)backend())->getProgram("binary_realdiv", glsl_binary_glsl, prefix);`
beta 0.2.0.1 - support both armv7/arm64 in podspec (pod version >= 1.5.0 required) - refactor neg axis support - fix memory overlap in de-conv - fix CONVOLUTION_TILED_NUMBER spell error - fix few warnings - add binary / interp / permute / relu / reshape / softmax support and optimize conv for OpenGL backend - add clean in nmake build script 2019-06-24 11:32:41 +08:00			`}else{`
			`MNN_PRINT("Not Supported Binary Operation: %d\n", mType);`
			`}`
			`return NO_ERROR;`
			`}`

			`ErrorCode GLBinary::onExecute(const std::vector<Tensor > &inputs, const std::vector<Tensor > &outputs) {`
			`MNN_ASSERT(2 == inputs.size());`
			`MNN_ASSERT(1 == outputs.size());`
Update 2019-12-27 22:16:57 +08:00
beta 0.2.0.1 - support both armv7/arm64 in podspec (pod version >= 1.5.0 required) - refactor neg axis support - fix memory overlap in de-conv - fix CONVOLUTION_TILED_NUMBER spell error - fix few warnings - add binary / interp / permute / relu / reshape / softmax support and optimize conv for OpenGL backend - add clean in nmake build script 2019-06-24 11:32:41 +08:00			`auto input0 = inputs[0];`
			`auto input1 = inputs[1];`
			`auto output = outputs[0];`
Update 2019-12-27 22:16:57 +08:00
beta 0.2.0.2 - CPU - add padding support - fix bug in permute when channel % 4 != 0 - fix bug in exp with extreme value - OpenCL - add protecting logics - OpenGL - add protecting logics - support NCHW format in Squeeze and Reshape - Converter - add ShuffleChannel support for Caffe - add Clip/Transpose/Unary/Pad supports for ONNX 2019-07-02 18:01:08 +08:00			`std::vector<int> inputShape = tensorShapeFormat(input0);`
			`std::vector<int> outputShape = tensorShapeFormat(output);`
Update 2019-12-27 22:16:57 +08:00
beta 0.2.0.2 - CPU - add padding support - fix bug in permute when channel % 4 != 0 - fix bug in exp with extreme value - OpenCL - add protecting logics - OpenGL - add protecting logics - support NCHW format in Squeeze and Reshape - Converter - add ShuffleChannel support for Caffe - add Clip/Transpose/Unary/Pad supports for ONNX 2019-07-02 18:01:08 +08:00			`int ib = inputShape.at(0);`
			`int ih = inputShape.at(1);`
			`int iw = inputShape.at(2);`
			`int ic = inputShape.at(3);`
			`int ic_4 = UP_DIV(ic, 4);`
Update 2019-12-27 22:16:57 +08:00
beta 0.2.0.2 - CPU - add padding support - fix bug in permute when channel % 4 != 0 - fix bug in exp with extreme value - OpenCL - add protecting logics - OpenGL - add protecting logics - support NCHW format in Squeeze and Reshape - Converter - add ShuffleChannel support for Caffe - add Clip/Transpose/Unary/Pad supports for ONNX 2019-07-02 18:01:08 +08:00			`int ob = outputShape.at(0);`
			`int oh = outputShape.at(1);`
			`int ow = outputShape.at(2);`
			`int oc = outputShape.at(3);`
			`int oc_4 = UP_DIV(oc, 4);`
Update 2019-12-27 22:16:57 +08:00
beta 0.2.0.2 - CPU - add padding support - fix bug in permute when channel % 4 != 0 - fix bug in exp with extreme value - OpenCL - add protecting logics - OpenGL - add protecting logics - support NCHW format in Squeeze and Reshape - Converter - add ShuffleChannel support for Caffe - add Clip/Transpose/Unary/Pad supports for ONNX 2019-07-02 18:01:08 +08:00			`MNN_ASSERT(input0->getType().code == halide_type_float);`
beta 0.2.0.1 - support both armv7/arm64 in podspec (pod version >= 1.5.0 required) - refactor neg axis support - fix memory overlap in de-conv - fix CONVOLUTION_TILED_NUMBER spell error - fix few warnings - add binary / interp / permute / relu / reshape / softmax support and optimize conv for OpenGL backend - add clean in nmake build script 2019-06-24 11:32:41 +08:00			`MNN_ASSERT(input0->dimensions() == input1->dimensions());`

			`const auto intputFormat = TensorUtils::getDescribe(input0)->dimensionFormat;`
Update 2019-12-27 22:16:57 +08:00
- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`mProgram->useProgram();`
			`glBindImageTexture(0, output->deviceId(), 0, GL_TRUE, 0, GL_WRITE_ONLY, ((GLBackend *)backend())->getTextrueFormat());`
			`{`
			`int texId = 0;`
			`glActiveTexture(GL_TEXTURE0 + texId);`
			`glUniform1i(1, texId);`
			`glBindTexture(GL_TEXTURE_3D, input0->deviceId());`
			`OPENGL_CHECK_ERROR;`
			`}`
			`{`
			`int texId = 1;`
			`glActiveTexture(GL_TEXTURE0 + texId);`
			`glUniform1i(2, texId);`
			`glBindTexture(GL_TEXTURE_3D, input1->deviceId());`
beta 0.2.0.1 - support both armv7/arm64 in podspec (pod version >= 1.5.0 required) - refactor neg axis support - fix memory overlap in de-conv - fix CONVOLUTION_TILED_NUMBER spell error - fix few warnings - add binary / interp / permute / relu / reshape / softmax support and optimize conv for OpenGL backend - add clean in nmake build script 2019-06-24 11:32:41 +08:00			`OPENGL_CHECK_ERROR;`
			`}`
- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`glUniform4i(3, iw, ih, ic_4, 1);`
			`OPENGL_CHECK_ERROR;`
			`((GLBackend *)backend())->compute(UP_DIV(iw, mLocalSize[0]), UP_DIV(ih, mLocalSize[1]), UP_DIV(ic_4, mLocalSize[2]));`
beta 0.2.0.2 - CPU - add padding support - fix bug in permute when channel % 4 != 0 - fix bug in exp with extreme value - OpenCL - add protecting logics - OpenGL - add protecting logics - support NCHW format in Squeeze and Reshape - Converter - add ShuffleChannel support for Caffe - add Clip/Transpose/Unary/Pad supports for ONNX 2019-07-02 18:01:08 +08:00
beta 0.2.0.1 - support both armv7/arm64 in podspec (pod version >= 1.5.0 required) - refactor neg axis support - fix memory overlap in de-conv - fix CONVOLUTION_TILED_NUMBER spell error - fix few warnings - add binary / interp / permute / relu / reshape / softmax support and optimize conv for OpenGL backend - add clean in nmake build script 2019-06-24 11:32:41 +08:00			`return NO_ERROR;`
			`}`
Update 2019-12-27 22:16:57 +08:00
- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`class BinaryCreator : public GLBackend::Creator {`
			`public:`
			`virtual ~BinaryCreator() = default;`
			`virtual Execution onCreate(const std::vector<Tensor > &inputs, const std::vector<Tensor *> &outputs,`
			`const MNN::Op op, Backend backend) const override {`
Update 2019-12-27 22:16:57 +08:00
- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`MNN_ASSERT(inputs.size() > 1);`
			`auto input0 = inputs[0];`
			`// Don't support broatcast`
			`for (int i = 1; i < inputs.size(); ++i) {`
			`auto input = inputs[i];`
			`if (input0->dimensions() != input->dimensions()) {`
			`MNN_PRINT("dimensions : [%d, %d] \n", input0->dimensions(), input->dimensions());`
			`MNN_PRINT("opengl binary don't support broatcast !!! \n");`
			`return nullptr;`
			`}`
			`auto dim = input0->dimensions();`
			`for (int l = 0; l < dim; ++l) {`
			`if (input0->length(l) != input->length(l)) {`
			`MNN_PRINT("length : [%d, %d] \n", input0->length(l), input->length(l));`
			`MNN_PRINT("opengl binary don't support broatcast !!! \n");`
			`return nullptr;`
			`}`
			`}`
			`}`
Update 2019-12-27 22:16:57 +08:00
- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`return new GLBinary(inputs, op, backend);`
			`}`
			`};`
			`GLCreatorRegister<BinaryCreator> __binary_op(OpType_BinaryOp);`
beta 0.2.0.1 - support both armv7/arm64 in podspec (pod version >= 1.5.0 required) - refactor neg axis support - fix memory overlap in de-conv - fix CONVOLUTION_TILED_NUMBER spell error - fix few warnings - add binary / interp / permute / relu / reshape / softmax support and optimize conv for OpenGL backend - add clean in nmake build script 2019-06-24 11:32:41 +08:00			`} // namespace OpenGL`
			`} // namespace MNN`