#include <armnn/Exceptions.hpp>

Include dependency graph for TosaRescaleOperatorUtils.hpp:

This graph shows which files directly or indirectly include this file:

Functions
void	CreateRawRescaleTosaOperator (const std::string &inputName, const std::string &outputName, const std::vector< int32_t > &multipliers, const std::vector< int32_t > &shifts, int32_t input_zp, int32_t output_zp, bool input_unsigned, bool output_unsigned, bool double_round, bool scale32, bool per_channel, TosaSerializationOperator **op)

void	ComputeMultiplierAndShiftTosaScale32 (double scale, int32_t &multiplier, int32_t &shift)
	The following is taken from mlir/lib/Dialect/Tosa/Utils/QuantUtils.cpp in the LLVM project. From a scale value, it generates multiplier and shift values, where the mantissa is in [-1.0, -0.5] or [0.5, 1.0], such that multiplier = mantissa*2^shift for 32-bit scaling. More...

void	ComputeMultiplierAndShiftTosaScale16 (double scale, int32_t &multiplier, int32_t &shift)
	The following is taken from mlir/lib/Dialect/Tosa/Utils/QuantUtils.cpp in the LLVM project. From a scale value, it generates multiplier and shift values, where the mantissa is in [-1.0, -0.5] or [0.5, 1.0], such that multiplier = mantissa*2^shift for 16-bit scaling. More...

void	CreateRescaleTosaOperator (const std::string &inputName, const std::string &outputName, double scale, int32_t input_zp, int32_t output_zp, bool input_unsigned, bool output_unsigned, bool double_round, bool scale32, TosaSerializationOperator **op)

void	CreateRescaleTosaOperatorForWeights (const std::string &inputName, const std::string &outputName, int32_t input_zp, int32_t output_zp, bool input_unsigned, bool output_unsigned, bool double_round, bool scale32, double input_scale, double output_scale, const std::vector< float > &weight_scales, TosaSerializationOperator **op)

Function Documentation

◆ ComputeMultiplierAndShiftTosaScale16()

void ComputeMultiplierAndShiftTosaScale16	(	double	scale,
		int32_t &	multiplier,
		int32_t &	shift
	)

inline

The following is taken from mlir/lib/Dialect/Tosa/Utils/QuantUtils.cpp in the LLVM project. From a scale value, it generates multiplier and shift values, where the mantissa is in [-1.0, -0.5] or [0.5, 1.0], such that multiplier = mantissa*2^shift for 16-bit scaling.

Definition at line 123 of file TosaRescaleOperatorUtils.hpp.

 {
     const double mantissa = std::frexp(scale, &shift);
     auto shiftedM = std::round(mantissa * (int64_t(1) << 15));
  
     // Can't be greater than 1.0.
     if (!(shiftedM <= (int64_t(1) << 15)))
     {
         throw armnn::Exception("Shifted mantissa exceeds 16 signed bits");
     }
  
     if (shiftedM == (int64_t(1) << 15))
     {
         shiftedM /= 2;
         shift++;
     }
  
     // TOSA expects right shift to be positive and embed (1 << 15) into right
     // shift bits.
     shift = (-shift) + 15;
  
     if (!(shiftedM <= std::numeric_limits<int32_t>::max()))
     {
         throw armnn::Exception("Shifted mantissa exceeds 32-bit signed output type");
     }
  
     multiplier = static_cast<int32_t>(shiftedM);
  
     // Shifting tops out at 62 bits. Right shift to make 62 bits the max.
     // The limit of 62 on shift allows the shift to be decomposed as
     // two right shifts of 31.
     if (shift > 62)
     {
         // Shifting the multiplier by more than 31-bits is unnecessary.
         multiplier = multiplier >> std::min<int32_t>(31, shift - 62);
         shift = 62;
     }
 }

Referenced by CreateRescaleTosaOperator(), and CreateRescaleTosaOperatorForWeights().

◆ ComputeMultiplierAndShiftTosaScale32()

void ComputeMultiplierAndShiftTosaScale32	(	double	scale,
		int32_t &	multiplier,
		int32_t &	shift
	)

inline

The following is taken from mlir/lib/Dialect/Tosa/Utils/QuantUtils.cpp in the LLVM project. From a scale value, it generates multiplier and shift values, where the mantissa is in [-1.0, -0.5] or [0.5, 1.0], such that multiplier = mantissa*2^shift for 32-bit scaling.

Definition at line 78 of file TosaRescaleOperatorUtils.hpp.

 {
     const double mantissa = std::frexp(scale, &shift);
     auto shiftedM = std::round(mantissa * (int64_t(1) << 31));
  
     // Can't be greater than 1.0.
     if (!(shiftedM <= (int64_t(1) << 31)))
     {
         throw armnn::Exception("Shifted mantissa exceeds 32 signed bits");
     }
  
     if (shiftedM == (int64_t(1) << 31))
     {
         shiftedM /= 2;
         shift++;
     }
  
     // TOSA expects right shift to be positive, and embed (1 << 31) into right
     // shift bits.
     shift = (-shift) + 31;
  
     if (!(shiftedM <= std::numeric_limits<int32_t>::max()))
     {
         throw armnn::Exception("Shifted mantissa exceeds 32-bit signed output type");
     }
  
     multiplier = static_cast<int32_t>(shiftedM);
  
     // Shifting tops out at 62 bits. Right shift to make 62 bits the max.
     // The limit of 62 on shift allows the shift to be decomposed as
     // two right shifts of 31.
     if (shift > 62)
     {
         // Shifting the multiplier by more than 32-bits is unnecessary.
         multiplier = multiplier >> std::min<int32_t>(31, shift - 62);
         shift = 62;
     }
 }

Referenced by CreateRescaleTosaOperator(), and CreateRescaleTosaOperatorForWeights().

◆ CreateRawRescaleTosaOperator()

void CreateRawRescaleTosaOperator	(	const std::string &	inputName,
		const std::string &	outputName,
		const std::vector< int32_t > &	multipliers,
		const std::vector< int32_t > &	shifts,
		int32_t	input_zp,
		int32_t	output_zp,
		bool	input_unsigned,
		bool	output_unsigned,
		bool	double_round,
		bool	scale32,
		bool	per_channel,
		TosaSerializationOperator **	op
	)

inline

Definition at line 10 of file TosaRescaleOperatorUtils.hpp.

 {
     if (!op)
     {
         throw armnn::Exception("CreateRawRescaleTosaOperator: nullptr op.");
     }
  
     if (multipliers.empty())
     {
         throw armnn::Exception("CreateRawRescaleTosaOperator: multipliers is empty.");
     }
  
     if (multipliers.size() != shifts.size())
     {
         throw armnn::Exception("CreateRawRescaleTosaOperator: multipliers and shift not same size.");
     }
  
     if (multipliers.size() == 1 && per_channel)
     {
         throw armnn::Exception("CreateRawRescaleTosaOperator: \
                                 multipliers must be greater than 1 if per_channel is true.");
     }
  
     if (multipliers.size() == 1 && per_channel)
     {
         throw armnn::Exception("CreateRawRescaleTosaOperator: \
                                 multipliers size must be greater than 1 if per_channel is true.");
     }
  
     if (multipliers.size() > 1 && !per_channel)
     {
         throw armnn::Exception("CreateRawRescaleTosaOperator: \
                                 multipliers size must be 1 if per_channel is false.");
     }
  
     TosaRescaleAttribute attribute(input_zp,
                                    output_zp,
                                    multipliers,
                                    shifts,
                                    scale32,
                                    double_round,
                                    per_channel,
                                    input_unsigned,
                                    output_unsigned);
  
     // op
     *op = new TosaSerializationOperator(Op_RESCALE, Attribute_RescaleAttribute, &attribute, {inputName}, {outputName});
     if (!(*op))
     {
         throw armnn::Exception("CreateRescaleTosaOperator: failed to created operator");
     }
 }

Referenced by CreateRescaleTosaOperator(), and CreateRescaleTosaOperatorForWeights().

◆ CreateRescaleTosaOperator()

void CreateRescaleTosaOperator	(	const std::string &	inputName,
		const std::string &	outputName,
		double	scale,
		int32_t	input_zp,
		int32_t	output_zp,
		bool	input_unsigned,
		bool	output_unsigned,
		bool	double_round,
		bool	scale32,
		TosaSerializationOperator **	op
	)

inline

Definition at line 164 of file TosaRescaleOperatorUtils.hpp.

 {
     int32_t multiplier;
     int32_t shift;
  
     if (scale32)
     {
         ComputeMultiplierAndShiftTosaScale32(scale, multiplier, shift);
     }
     else
     {
         ComputeMultiplierAndShiftTosaScale16(scale, multiplier, shift);
     }
  
     const std::vector<int32_t> multipliers{multiplier};
     const std::vector<int32_t> shifts{shift};
     CreateRawRescaleTosaOperator(inputName, outputName, multipliers, shifts,
                                  input_zp, output_zp, input_unsigned, output_unsigned,
                                  double_round, scale32, false, op);
 }

References ComputeMultiplierAndShiftTosaScale16(), ComputeMultiplierAndShiftTosaScale32(), and CreateRawRescaleTosaOperator().

Referenced by ConvertQuantizeToTosaOperator(), and ConvertSoftmaxToTosaOperator().

◆ CreateRescaleTosaOperatorForWeights()

void CreateRescaleTosaOperatorForWeights	(	const std::string &	inputName,
		const std::string &	outputName,
		int32_t	input_zp,
		int32_t	output_zp,
		bool	input_unsigned,
		bool	output_unsigned,
		bool	double_round,
		bool	scale32,
		double	input_scale,
		double	output_scale,
		const std::vector< float > &	weight_scales,
		TosaSerializationOperator **	op
	)

inline

Definition at line 194 of file TosaRescaleOperatorUtils.hpp.

 {
     std::vector<int32_t> op_tensor_multipliers;
     std::vector<int32_t> op_tensor_shifts;
     op_tensor_multipliers.reserve(weight_scales.size());
     op_tensor_shifts.reserve(weight_scales.size());
  
     for (const float& weight_scale : weight_scales)
     {
         double op_tensor_scale = (input_scale * weight_scale) / output_scale;
         int32_t multiplier;
         int32_t shift;
  
         if (scale32)
         {
             ComputeMultiplierAndShiftTosaScale32(op_tensor_scale, multiplier, shift);
         }
         else
         {
             ComputeMultiplierAndShiftTosaScale16(op_tensor_scale, multiplier, shift);
         }
  
         op_tensor_multipliers.push_back(multiplier);
         op_tensor_shifts.push_back(shift);
     }
  
     bool per_channel = weight_scales.size() == 1 ? false : true;
     CreateRawRescaleTosaOperator(inputName, outputName, op_tensor_multipliers, op_tensor_shifts,
                                  input_zp, output_zp, input_unsigned, output_unsigned, double_round,
                                  scale32, per_channel, op);
 }

References ComputeMultiplierAndShiftTosaScale16(), ComputeMultiplierAndShiftTosaScale32(), and CreateRawRescaleTosaOperator().

Functions

Function Documentation

◆ ComputeMultiplierAndShiftTosaScale16()

◆ ComputeMultiplierAndShiftTosaScale32()

◆ CreateRawRescaleTosaOperator()

◆ CreateRescaleTosaOperator()

◆ CreateRescaleTosaOperatorForWeights()