ArmNN 25.11
TurboConvertConstDequantisationLayersToConstLayers.hpp
//
// Copyright © 2024 Arm Ltd and Contributors.
// SPDX-License-Identifier: MIT
//
#pragma once

#include "Optimization.hpp"
#include "NetworkUtils.hpp"

#include <armnn/Logging.hpp>
#include <armnnUtils/Permute.hpp>

namespace armnn
{
namespace optimizations
{

class TurboConvertConstDequantisationLayersToConstLayersImpl
{
public:
    void Run(Graph& graph, InputSlot& connection) const
    {
        Layer& base = connection.GetConnectedOutputSlot()->GetOwningLayer();
        Layer& child = connection.GetOwningLayer();

        // Check that the basic criteria for the optimization are met.
        if ((base.GetType() == LayerType::Constant) && (child.GetType() == LayerType::Dequantize))
        {
            ReplaceConstDequantisationLayer(graph,
                                            PolymorphicDowncast<ConstantLayer*>(&base),
                                            PolymorphicDowncast<DequantizeLayer*>(&child));
        }
    }
protected:
    TurboConvertConstDequantisationLayersToConstLayersImpl() = default;
    ~TurboConvertConstDequantisationLayersToConstLayersImpl() = default;
private:

    static void ReplaceConstDequantisationLayer(Graph&,
                                                ConstantLayer* constantLayer,
                                                DequantizeLayer* dequantizeLayer)
    {
        ARMNN_LOG(info) << "TurboConvertConstDequantisationLayersToConstLayersImpl::ReplaceConstDequantisationLayer()";
        /**
         * This optimisation finds situations where a constant set of inputs is being provided to a Dequantize
         * layer. In that case we don't want the overhead of dequantizing the values on every inference; instead we
         * want to dequantize them once and store them in a Const layer to be used every time, as they will not change.
         */
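        // In graph terms the rewrite collapses
        //     ConstantLayer -> DequantizeLayer -> <consumers>
        // into
        //     ConstantLayer -> <consumers>
        // leaving the DequantizeLayer unconnected so that a later optimizer step can remove it.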
        TensorInfo constantInfo = constantLayer->GetOutputSlot(0).GetTensorInfo();
        TensorInfo inputDequantizeInfo = dequantizeLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo();
        TensorInfo outputDequantizeInfo = dequantizeLayer->GetOutputSlot(0).GetTensorInfo();

        bool requiresPermute = false;

        auto connection = dequantizeLayer->GetOutputSlot(0).GetConnection(0);
        if (connection)
        {
            if (connection->GetOwningLayer().GetType() == LayerType::Convolution2d)
            {
                /**
                 * ArmNN does not currently support non-fixed weights or bias.
                 * The NNAPI filter is always OHWI [depth_out, filter_height, filter_width, depth_in],
                 * but ArmNN expects the filter's height and width indices to match the input's height
                 * and width indices, so we permute it to OIHW if the DataLayout is NCHW.
                 */
                ARMNN_LOG(info) << "TurboConvertConstDequantisationLayersToConstLayersImpl:: Connected to "
                                   "Convolution layer.";
                auto conv2dLayer = PolymorphicDowncast<Convolution2dLayer*>(&connection->GetOwningLayer());
                if (conv2dLayer->GetParameters().m_DataLayout == DataLayout::NCHW)
                {
                    ARMNN_LOG(info) << "TurboConvertConstDequantisationLayersToConstLayersImpl:: Connected to "
                                       "Convolution layer and requires permute on weights.";
                    requiresPermute = true;
                }
            }
        }

        auto numConnections = constantLayer->GetOutputSlot(0).GetNumConnections();

        ARMNN_LOG(info) << "constantInfo datatype:" << armnn::GetDataTypeName(constantInfo.GetDataType())
                        << " inputDequantizeInfo datatype:" << armnn::GetDataTypeName(inputDequantizeInfo.GetDataType())
                        << " outputDequantizeInfo datatype:" << armnn::GetDataTypeName(outputDequantizeInfo.GetDataType());

        TensorInfo newInfo = inputDequantizeInfo;
        newInfo.SetConstant(true);
        if (requiresPermute)
        {
            ARMNN_LOG(info) << "TurboConvertConstDequantisationLayersToConstLayersImpl:: Permuting the constant data.";
            const PermutationVector OHWIToOIHW = {0, 2, 3, 1};
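            // PermutationVector semantics (added note): source dimension i is mapped to destination
            // dimension mappings[i], so {0, 2, 3, 1} sends O->0, H->2, W->3, I->1, turning an OHWI
            // filter of shape [O, H, W, I] into an OIHW filter of shape [O, I, H, W].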
            // Here Permute weights
            std::vector<Half> permutedValues(outputDequantizeInfo.GetNumElements());
            armnnUtils::Permute(outputDequantizeInfo.GetShape(), OHWIToOIHW,
                                constantLayer->m_LayerOutput->Map(true), permutedValues.data(),
                                GetDataTypeSize(outputDequantizeInfo.GetDataType()));
            ConstTensor newInput(newInfo, permutedValues);
            constantLayer->m_LayerOutput.reset(new ScopedTensorHandle(newInput));
        }
        else
        {
            ConstTensor newInput(newInfo, constantLayer->m_LayerOutput->Map(true));
            constantLayer->m_LayerOutput.reset(new ScopedTensorHandle(newInput));
        }

        // Move connections in the dequantize output to the constant layer.
        // The dequantize layer will be removed if left unconnected.
        dequantizeLayer->GetOutputSlot().MoveAllConnections(constantLayer->GetOutputSlot());

        // Update the output tensor info.
        constantLayer->GetOutputSlot(0).SetTensorInfo(newInfo);
        ARMNN_ASSERT(constantLayer->GetOutputSlot(0).GetTensorInfo().IsConstant() == true);

        // Set isConstant to true in the input tensor infos of the layers that constantLayer is now connected to.
        for (unsigned int i = numConnections; i < constantLayer->GetOutputSlot(0).GetNumConnections(); ++i)
        {
            auto info = constantLayer->GetOutputSlot(0).GetConnection(i)->GetOwningLayer().GetInputSlot(0)
                            .GetConnectedOutputSlot()->GetTensorInfo();
            info.SetConstant();
            constantLayer->GetOutputSlot(0).GetConnection(i)->GetOwningLayer().GetInputSlot(0)
                .GetConnectedOutputSlot()->SetTensorInfo(info);
        }
    }

};

using TurboConvertConstDequantisationLayersToConstLayers =
    OptimizeForConnection<ConstantLayer, DequantizeLayer, TurboConvertConstDequantisationLayersToConstLayersImpl>;

} // namespace optimizations
} // namespace armnn
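The using-declaration above wires the Impl class into ArmNN's OptimizeForConnection template, which calls Run() on every matching ConstantLayer -> DequantizeLayer connection in a graph. The sketch below shows how such an optimization is typically applied, assuming the Optimizer::Pass / MakeOptimizations pattern used by ArmNN's other graph optimizations; the helper function name and include paths are illustrative, not taken from this file.

#include "Optimizer.hpp"
#include "optimizations/TurboConvertConstDequantisationLayersToConstLayers.hpp"

// Hypothetical helper (not part of this file): folds Constant -> Dequantize patterns in a graph.
void FoldConstantDequantize(armnn::Graph& graph)
{
    using namespace armnn;
    using namespace armnn::optimizations;

    // Rewrites every Constant -> Dequantize connection so the constant layer feeds the
    // dequantize layer's consumers directly; the orphaned Dequantize layers are then
    // cleaned up by the optimizer.
    Optimizer::Pass(graph, MakeOptimizations(TurboConvertConstDequantisationLayersToConstLayers()));
}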
Cross-references (symbols used in this file):

ARMNN_ASSERT(COND) - Definition: Assert.hpp:14
ARMNN_LOG(severity) - Definition: Logging.hpp:212
armnn::ConstTensor - A tensor defined by a TensorInfo (shape and data type) and an immutable backing store. Definition: Tensor.hpp:330
armnn::ConstantLayer - A layer that the constant data can be bound to; holds std::shared_ptr<ConstTensorHandle> m_LayerOutput.
armnn::DequantizeLayer - This layer dequantizes the input tensor.
armnn::InputSlot::GetOwningLayer() const - Definition: Layer.hpp:53
armnn::InputSlot::GetConnectedOutputSlot() const - Definition: Layer.hpp:56
armnn::Layer::GetInputSlot(unsigned int index) const - Get a const input slot handle by slot index. Definition: Layer.hpp:337
armnn::Layer::GetOutputSlot(unsigned int index = 0) const - Get the const output slot handle by slot index. Definition: Layer.hpp:339
armnn::Layer::GetType() const - Returns the armnn::LayerType of this layer. Definition: Layer.hpp:286
armnn::OutputSlot::GetConnection(unsigned int index) const - Definition: Layer.cpp:83
armnn::OutputSlot::MoveAllConnections(OutputSlot& destination) - Moves all connections to another OutputSlot. Definition: Layer.cpp:156
armnn::OutputSlot::GetNumConnections() const - Definition: Layer.hpp:158
armnn::OutputSlot::SetTensorInfo(const TensorInfo& tensorInfo) - Definition: Layer.cpp:95
armnn::OutputSlot::GetOwningLayer() const - Definition: Layer.hpp:132
armnn::OutputSlot::GetTensorInfo() const - Definition: Layer.cpp:100
armnn::TensorInfo::GetShape() const - Definition: Tensor.hpp:193
armnn::TensorInfo::GetNumElements() const - Definition: Tensor.hpp:198
armnn::TensorInfo::SetConstant(const bool IsConstant = true) - Marks the data corresponding to this tensor info as constant. Definition: Tensor.cpp:518
armnn::TensorInfo::IsConstant() const - Definition: Tensor.cpp:513
armnn::TensorInfo::GetDataType() const - Definition: Tensor.hpp:200
armnn::optimizations::TurboConvertConstDequantisationLayersToConstLayers - OptimizeForConnection<ConstantLayer, DequantizeLayer, TurboConvertConstDequantisationLayersToConstLayersImpl>
armnn (namespace) - Copyright (c) 2021 ARM Limited and Contributors.
armnn::GetDataTypeName(DataType dataType) - constexpr const char*
armnn::GetDataTypeSize(DataType dataType) - constexpr unsigned int
armnn::PolymorphicDowncast(SourceType* value) - Polymorphic downcast for built-in pointers only.