MNN/source/shape/ShapeTFQuantizedConv2D.cpp

//
//  ShapeTFQuantizedConv2D.cpp
//  MNN
//
//  Created by MNN on 2019/01/10.
//  Copyright © 2018, Alibaba Group Holding Limited
//
#ifdef MNN_SUPPORT_TFLITE_QUAN
#include <math.h>
#include "Macro.h"
#include "SizeComputer.hpp"

namespace MNN {
class TFQuantizedConv2DComputer : public SizeComputer {
    virtual bool onComputeSize(const MNN::Op* op, const std::vector<Tensor*>& inputs,
                               const std::vector<Tensor*>& outputs) const override {
        auto layer = op->main_as_TfQuantizedConv2D()->common();

        MNN_ASSERT(layer->dilateX() == 1);
        MNN_ASSERT(layer->dilateY() == 1);
        MNN_ASSERT(layer->strideX() == layer->strideY());

        int kernel_width  = layer->dilateX() * (layer->kernelX() - 1) + 1;
        int kernel_height = layer->dilateY() * (layer->kernelY() - 1) + 1;

        int output_width  = 1;
        int output_height = 1;

        auto input = inputs[0];

        if (layer->padMode() == PadMode_SAME) {                                     // Tensorflow padding mode SAME
            output_width  = ceil((float)input->width() / (float)layer->strideX());  // NHWC for tensorflow
            output_height = ceil((float)input->height() / (float)layer->strideY()); // the default layout is NCHW
        } else if (layer->padMode() == PadMode_VALID) {                             // Tensorflow padding mode VALID
            output_width  = ceil((float)(input->width() - kernel_width + 1) / (float)layer->strideX());
            output_height = ceil((float)(input->height() - kernel_height + 1) / (float)layer->strideY());
        } else {
            MNN_ASSERT(false); // unsupported type
        }

        // output：NCHW
        auto& outputBuffer         = outputs[0]->buffer();
        outputBuffer.dimensions    = input->buffer().dimensions;
        outputBuffer.dim[0].extent = input->buffer().dim[0].extent;
        outputBuffer.dim[1].extent = layer->outputCount();
        outputBuffer.dim[2].extent = output_height;
        outputBuffer.dim[3].extent = output_width;

        outputs[0]->buffer().type = halide_type_of<uint8_t>();
        TensorUtils::getDescribe(outputs[0])->dimensionFormat = TensorUtils::getDescribe(inputs[0])->dimensionFormat;
        return true;
    }

    virtual float onComputeFlops(const MNN::Op* op, const std::vector<Tensor*>& inputs,
                                 const std::vector<Tensor*>& outputs) const override {
        auto layer = op->main_as_TfQuantizedConv2D()->common();
        auto kw    = layer->kernelX();
        auto kh    = layer->kernelY();
        int group  = 1;
        if (op->type() == OpType_QuantizedDepthwiseConv2D) {
            group = inputs[0]->channel();
        }
        auto ic    = inputs[0]->channel();
        auto oc    = outputs[0]->channel();
        auto oSize = outputs[0]->width() * outputs[0]->height() * outputs[0]->batch();

        return (float)oSize * kw * kh * (ic * oc / group) / FLOPS_M;
    }
};

REGISTER_SHAPE(TFQuantizedConv2DComputer, OpType_TfQuantizedConv2D);
REGISTER_SHAPE(TFQuantizedConv2DComputer, OpType_QuantizedDepthwiseConv2D);
} // namespace MNN
#endif
-												beta 0.1.0

											
										
										
											2019-04-17 10:49:11 +08:00
+								//
 								//  ShapeTFQuantizedConv2D.cpp
 								//  MNN
 								//
 								//  Created by MNN on 2019/01/10.
 								//  Copyright © 2018, Alibaba Group Holding Limited
 								//
-												- build:
	- unify schema building in core and converter;
	- add more build script for android;
	- add linux build script for python;

- ops impl:
	- add floor mod support in binary;
	- use eltwise impl in add/max/sub/mul binary for optimization;
	- remove fake double support in cast;
	- fix 5d support for concat;
	- add adjX and adjY support for batch matmul;
	- optimize conv2d back prop filter;
	- add pad mode support for conv3d;
	- fix bug in conv2d & conv depthwise with very small feature map;
	- optimize binary without broacast;
	- add data types support for gather;
	- add gather ND support;
	- use uint8 data type in gather v2;
	- add transpose support for matmul;
	- add matrix band part;
	- add dim != 4 support for padding, reshape & tensor convert;
	- add pad type support for pool3d;
	- make ops based on TensorFlow Lite quantization optional;
	- add all & any support for reduction;
	- use type in parameter as output type in reduction;
	- add int support for unary;
	- add variable weight support for conv2d;
	- fix conv2d depthwise weights initialization;
	- fix type support for transpose;
	- fix grad outputs count for  reduce grad and reshape grad;
	- fix priorbox & detection output;
	- fix metal softmax error;

- python:
	- add runSessionWithCallBackInfo interface;
	- add max nodes limit (1400) for visualization tool;
	- fix save error in python3;
	- align default dim;

- convert:
	- add extra design for optimization;
	- add more post converting optimizers;
	- add caffe v1 weights blob support;
	- add cast, unary, conv transpose support for onnx model;
	- optimize batchnorm, conv with variable weights, prelu, reshape, slice, upsample for onnx model;
	- add cos/sin/atan/tan support for unary for tensorflow model;
	- add any/all support for reduction for tensorflow model;
	- add elu, conv3d, pool3d support for tensorflow model;
	- optimize argmax, batchnorm, concat, batch to space, conv with variable weights, prelu, slice for tensorflow model;

- others:
	- fix size computer lock;
	- fix thread pool deadlock;
	- add express & parameters in express;
	- rewrite blitter chooser without static map;
	- add tests for expr;

											
										
										
											2019-10-29 13:37:26 +08:00
+								#ifdef MNN_SUPPORT_TFLITE_QUAN
-												beta 0.1.0

											
										
										
											2019-04-17 10:49:11 +08:00
+								#include <math.h>
 								#include "Macro.h"
 								#include "SizeComputer.hpp"
 								namespace MNN {
 								class TFQuantizedConv2DComputer : public SizeComputer {
 								    virtual bool onComputeSize(const MNN::Op* op, const std::vector<Tensor*>& inputs,
 								                               const std::vector<Tensor*>& outputs) const override {
 								        auto layer = op->main_as_TfQuantizedConv2D()->common();
 								        MNN_ASSERT(layer->dilateX() == 1);
 								        MNN_ASSERT(layer->dilateY() == 1);
 								        MNN_ASSERT(layer->strideX() == layer->strideY());
 								        int kernel_width  = layer->dilateX() * (layer->kernelX() - 1) + 1;
 								        int kernel_height = layer->dilateY() * (layer->kernelY() - 1) + 1;
 								        int output_width  = 1;
 								        int output_height = 1;
 								        auto input = inputs[0];
 								        if (layer->padMode() == PadMode_SAME) {                                     // Tensorflow padding mode SAME
 								            output_width  = ceil((float)input->width() / (float)layer->strideX());  // NHWC for tensorflow
 								            output_height = ceil((float)input->height() / (float)layer->strideY()); // the default layout is NCHW
 								        } else if (layer->padMode() == PadMode_VALID) {                             // Tensorflow padding mode VALID
 								            output_width  = ceil((float)(input->width() - kernel_width + 1) / (float)layer->strideX());
 								            output_height = ceil((float)(input->height() - kernel_height + 1) / (float)layer->strideY());
 								        } else {
 								            MNN_ASSERT(false); // unsupported type
 								        }
 								        // output：NCHW
 								        auto& outputBuffer         = outputs[0]->buffer();
 								        outputBuffer.dimensions    = input->buffer().dimensions;
 								        outputBuffer.dim[0].extent = input->buffer().dim[0].extent;
 								        outputBuffer.dim[1].extent = layer->outputCount();
 								        outputBuffer.dim[2].extent = output_height;
 								        outputBuffer.dim[3].extent = output_width;
 								        outputs[0]->buffer().type = halide_type_of<uint8_t>();
-												beta 0.2.0.8
- add NaN check-up
- add quantification support for ScaleAdd Op
- add binary to eltwise optimization
- add console logs for quantization tool
- better document for quantization tool
- replace redundant dimension flags with dimension format
- optimize performance of TensorFlow Lite Quantized Convolution
- fix axis support for ONNX softmax
- fix get performance compile error on Windows

											
										
										
											2019-08-22 20:13:46 +08:00
+								        TensorUtils::getDescribe(outputs[0])->dimensionFormat = TensorUtils::getDescribe(inputs[0])->dimensionFormat;
-												beta 0.1.0

											
										
										
											2019-04-17 10:49:11 +08:00
+								        return true;
 								    }
 								    virtual float onComputeFlops(const MNN::Op* op, const std::vector<Tensor*>& inputs,
 								                                 const std::vector<Tensor*>& outputs) const override {
 								        auto layer = op->main_as_TfQuantizedConv2D()->common();
 								        auto kw    = layer->kernelX();
 								        auto kh    = layer->kernelY();
 								        int group  = 1;
 								        if (op->type() == OpType_QuantizedDepthwiseConv2D) {
 								            group = inputs[0]->channel();
 								        }
 								        auto ic    = inputs[0]->channel();
 								        auto oc    = outputs[0]->channel();
 								        auto oSize = outputs[0]->width() * outputs[0]->height() * outputs[0]->batch();
 								        return (float)oSize * kw * kh * (ic * oc / group) / FLOPS_M;
 								    }
 								};
 								REGISTER_SHAPE(TFQuantizedConv2DComputer, OpType_TfQuantizedConv2D);
 								REGISTER_SHAPE(TFQuantizedConv2DComputer, OpType_QuantizedDepthwiseConv2D);
 								} // namespace MNN
-												- build:
	- unify schema building in core and converter;
	- add more build script for android;
	- add linux build script for python;

- ops impl:
	- add floor mod support in binary;
	- use eltwise impl in add/max/sub/mul binary for optimization;
	- remove fake double support in cast;
	- fix 5d support for concat;
	- add adjX and adjY support for batch matmul;
	- optimize conv2d back prop filter;
	- add pad mode support for conv3d;
	- fix bug in conv2d & conv depthwise with very small feature map;
	- optimize binary without broacast;
	- add data types support for gather;
	- add gather ND support;
	- use uint8 data type in gather v2;
	- add transpose support for matmul;
	- add matrix band part;
	- add dim != 4 support for padding, reshape & tensor convert;
	- add pad type support for pool3d;
	- make ops based on TensorFlow Lite quantization optional;
	- add all & any support for reduction;
	- use type in parameter as output type in reduction;
	- add int support for unary;
	- add variable weight support for conv2d;
	- fix conv2d depthwise weights initialization;
	- fix type support for transpose;
	- fix grad outputs count for  reduce grad and reshape grad;
	- fix priorbox & detection output;
	- fix metal softmax error;

- python:
	- add runSessionWithCallBackInfo interface;
	- add max nodes limit (1400) for visualization tool;
	- fix save error in python3;
	- align default dim;

- convert:
	- add extra design for optimization;
	- add more post converting optimizers;
	- add caffe v1 weights blob support;
	- add cast, unary, conv transpose support for onnx model;
	- optimize batchnorm, conv with variable weights, prelu, reshape, slice, upsample for onnx model;
	- add cos/sin/atan/tan support for unary for tensorflow model;
	- add any/all support for reduction for tensorflow model;
	- add elu, conv3d, pool3d support for tensorflow model;
	- optimize argmax, batchnorm, concat, batch to space, conv with variable weights, prelu, slice for tensorflow model;

- others:
	- fix size computer lock;
	- fix thread pool deadlock;
	- add express & parameters in express;
	- rewrite blitter chooser without static map;
	- add tests for expr;

											
										
										
											2019-10-29 13:37:26 +08:00
+								#endif