ArmNN
 25.02
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
MaxMinIntoBoundedRelu.hpp
Go to the documentation of this file.
1 //
2 // Copyright © 2024 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
6 #pragma once
7 
8 #include "Optimization.hpp"
9 
10 namespace armnn::optimizations
11 {
12 
14 {
15 public:
    /// Run for every exclusive connection between any Max & Min layers
    /// The Max, Min and its associated constant inputs will be removed, and replaced with a BoundedRelu Activation
    ///
    /// BoundedReLu computes min(a, max(b, input)), so the Min layer's scalar becomes the
    /// upper bound (a) and the Max layer's scalar becomes the lower bound (b).
    ///
    /// @param graph      Graph being optimized; used to insert the replacement ActivationLayer.
    /// @param connection InputSlot on the Min layer that is fed by the Max layer's output.
    static void Run(Graph& graph, InputSlot& connection)
    {
        // base = the layer producing the connection (expected Max); child = the layer
        // consuming it (expected Min).
        Layer& base = connection.GetConnectedOutputSlot()->GetOwningLayer();
        Layer& child = connection.GetOwningLayer();

        // NOTE(review): the downcasts are unchecked — presumably the exclusive-connection
        // matcher only invokes Run for ElementwiseBinary/ElementwiseBinary pairs; confirm.
        auto& maxLayer = *PolymorphicDowncast<ElementwiseBinaryLayer*>(&base);
        if (maxLayer.GetParameters().m_Operation != BinaryOperation::Maximum)
        {
            return;
        }
        auto& minLayer = *PolymorphicDowncast<ElementwiseBinaryLayer*>(&child);
        if (minLayer.GetParameters().m_Operation != BinaryOperation::Minimum)
        {
            return;
        }

        // Leave mixed-precision Max/Min pairs untouched.
        if (maxLayer.GetDataType() != minLayer.GetDataType())
        {
            return;
        }

        // get max and min values; abandon the rewrite unless each layer has a
        // single-element constant input to serve as a scalar bound.
        float_t maxValue;
        if (!GetValue(maxLayer, maxValue))
        {
            return;
        }
        float_t minValue;
        if (!GetValue(minLayer, minValue))
        {
            return;
        }

        // Save original parent output slot of the max layer
        OutputSlot& parentOut = *maxLayer.GetInputSlot(0).GetConnectedOutputSlot();

        // Insert activation layer between max layer and its parent layer.
        // Descriptor args: a = minValue (upper clamp), b = maxValue (lower clamp).
        ActivationDescriptor boundedReluDescriptor(ActivationFunction::BoundedReLu, minValue, maxValue);
        const std::string name = std::string("replaced-") + maxLayer.GetName() + std::string("-") + minLayer.GetName()
                                 + std::string("-with-BoundedRelu");
        auto& boundedReluLayer = *graph.InsertNewLayer<ActivationLayer>(maxLayer.GetInputSlot(0),
                                                                        boundedReluDescriptor,
                                                                        name.c_str());

        // Reconnects with original parent.
        boundedReluLayer.GetOutputSlot().MoveAllConnections(parentOut);

        // Moves connections in min layer output to parent layer.
        // Min layer will be removed as it's left unconnected.
        // Max layer will be removed if left unconnected.
        minLayer.GetOutputSlot().MoveAllConnections(boundedReluLayer.GetOutputSlot());
    }
70 
71 protected:
74 
75 private:
76  static float_t GetConstTensorValue(Layer& layer)
77  {
78  auto& constLayer = *PolymorphicDowncast<ConstantLayer*>(&layer);
79  switch (constLayer.GetDataType())
80  {
81  case DataType::Float32:
82  return *constLayer.m_LayerOutput->GetConstTensor<float>();
83  case DataType::BFloat16:
84  return static_cast<float_t>(*constLayer.m_LayerOutput->GetConstTensor<BFloat16>());
85  case DataType::Float16:
86  return static_cast<float_t>(*constLayer.m_LayerOutput->GetConstTensor<half_float::half>());
87  case DataType::QAsymmU8:
88  case DataType::Boolean:
89  return static_cast<float_t>(*constLayer.m_LayerOutput->GetConstTensor<uint8_t>());
90  case DataType::QAsymmS8:
91  case DataType::QSymmS8:
92  return static_cast<float_t>(*constLayer.m_LayerOutput->GetConstTensor<int8_t>());
93  case DataType::QSymmS16:
94  return static_cast<float_t>(*constLayer.m_LayerOutput->GetConstTensor<int16_t>());
95  case DataType::Signed32:
96  return static_cast<float_t>(*constLayer.m_LayerOutput->GetConstTensor<int32_t>());
97  case DataType::Signed64:
98  return static_cast<float_t>(*constLayer.m_LayerOutput->GetConstTensor<int64_t>());
99  default:
100  throw InvalidArgumentException("No supported Data Type");
101  }
102  }
103 
    /// Tries to extract a scalar bound from one of @p layer's two inputs.
    /// Succeeds when either feeding layer is a Constant holding exactly one element.
    ///
    /// @param layer     The ElementwiseBinary (Max or Min) layer being inspected.
    /// @param value     [out] Receives the constant's value (via GetConstTensorValue) on success.
    /// @return true when a single-element constant input was found; false otherwise
    ///         (value is left unmodified in that case).
    static bool GetValue(Layer& layer, float_t& value)
    {
        // NOTE(review): the declarations of input0/input1 are missing from this excerpt —
        // presumably the layers feeding layer's two input slots, e.g.
        // layer.GetInputSlot(n).GetConnectedOutputSlot()->GetOwningLayer(); confirm
        // against the full file before relying on this documentation.
        if (input0.GetType() == LayerType::Constant)
        {
            // Only a single-element (scalar) constant can serve as a ReLu bound.
            if (input0.GetOutputSlot(0).GetTensorInfo().GetNumElements() != 1)
            {
                return false;
            }
            value = GetConstTensorValue(input0);
        }
        else if (input1.GetType() == LayerType::Constant)
        {
            if (input1.GetOutputSlot(0).GetTensorInfo().GetNumElements() != 1)
            {
                return false;
            }
            value = GetConstTensorValue(input1);
        }
        else
        {
            // Neither input is a constant — the Max/Min pattern does not apply.
            return false;
        }
        return true;
    };
130 };
131 
135 
136 } // namespace armnn::optimizations
This layer represents an activation operation with the specified activation function.
This layer represents a elementwiseBinary operation.
LayerT * InsertNewLayer(InputSlot &insertBefore, Args &&... args)
Inserts a new layer between the output slot currently connected to insertBefore and insertBefore itse...
Definition: Graph.hpp:481
Layer & GetOwningLayer() const
Definition: Layer.hpp:53
const OutputSlot * GetConnectedOutputSlot() const
Definition: Layer.hpp:56
const OutputSlot & GetOutputSlot(unsigned int index=0) const override
Get the const output slot handle by slot index.
Definition: Layer.hpp:339
const InputSlot & GetInputSlot(unsigned int index) const override
Get a const input slot handle by slot index.
Definition: Layer.hpp:337
LayerType GetType() const override
Returns the armnn::LayerType of this layer.
Definition: Layer.hpp:286
void MoveAllConnections(OutputSlot &destination)
Moves all connections to another OutputSlot.
Definition: Layer.cpp:156
Layer & GetOwningLayer() const
Definition: Layer.hpp:132
const TensorInfo & GetTensorInfo() const override
Definition: Layer.cpp:100
unsigned int GetNumElements() const
Definition: Tensor.hpp:198
static void Run(Graph &graph, InputSlot &connection)
Run for every exclusive connection between any Max & Min layers The Max, Min and its associated const...
@ BoundedReLu
min(a, max(b, input)) ReLu1 & ReLu6.
An ActivationDescriptor for the ActivationLayer.
Definition: Descriptors.hpp:37