//
// quantizeWeight.hpp
// MNN
//
// Created by MNN on 2019/04/21.
// Copyright © 2018, Alibaba Group Holding Limited
//

#ifndef QUANTIZEWEIGHT_HPP
#define QUANTIZEWEIGHT_HPP
#include <stdint.h>
#include <vector>
#include <string>

// default: quantize weight per channel
int SymmetricQuantizeWeight(const float* weight, const int size, int8_t* quantizedWeight, float* scale,
                            const int channels, float weightClampValue);
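
// a minimal sketch of what symmetric per-channel quantization computes (illustrative only,
// not necessarily the exact MNN implementation): for each channel c,
//   scale[c]           = max(|w| over channel c) / weightClampValue   // weightClampValue is typically 127.0f
//   quantizedWeight[i] = round(weight[i] / scale[c]), clamped to [-weightClampValue, weightClampValue]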
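
// ADMM = Alternating Direction Method of Multipliers; alpha presumably receives the
// per-kernel scaling factors (a reading of the signature, not documented in the original header)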
int QuantizeWeightADMM(const float* weight, const int weightNum, int8_t* quantizedWeight, float* alpha,
                       const int kernelNum, const float weightClampValue);

// quantize convolution weight per channel
// first, multiply the float weight by input_scale, then quantize the result to get input_scale*weight_scale
// second, divide input_scale*weight_scale by output_scale
int QuantizeConvPerChannel(const float* weight, const int size, const float* bias, int8_t* quantizedWeight,
                           int32_t* quantizedBias, float* scale, const float inputScale, const float outputScale,
                           const int inputChannel, const int outputChannel, std::string method, float weightClampValue, bool mergeChannel = true);
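
// worked example of the two steps above (assumed illustrative values, not taken from MNN):
//   inputScale = 0.05f, per-channel weightScale = 0.01f, outputScale = 0.1f
//   step 1: quantizing inputScale * weight gives a combined scale of inputScale * weightScale = 0.0005
//   step 2: dividing by outputScale yields 0.0005 / 0.1 = 0.005, the per-channel requantization
//           factor that is presumably what gets written into scale[]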
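
// presumably the same two-step input_scale/output_scale scheme as QuantizeConvPerChannel,
// specialized for depthwise convolution weights (inferred from the matching signature)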
int QuantizeDepthwiseConv(const float* weight, const int size, const float* bias, int8_t* quantizedWeight,
                          int32_t* quantizedBias, float* scale, const float inputScale, const float outputScale,
                          const int inputChannel, const int outputChannel, std::string method, float weightClampValue, bool mergeChannel = true);
#endif // QUANTIZEWEIGHT_HPP