ArmNN
 25.02
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
NetworkUtils.cpp
Go to the documentation of this file.
1 //
2 // Copyright © 2022,2024 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
5 
6 #include "NetworkUtils.hpp"
7 
9 
10 #include <armnn/Exceptions.hpp>
12 
13 namespace armnn
14 {
15 
16 namespace
17 {
18 
19 void UpdateOutputSlotToFp32(OutputSlot& outputSlot)
20 {
21  const TensorInfo& origTensorInfo = outputSlot.GetTensorInfo();
22  TensorInfo newTensorInfo(origTensorInfo);
23  newTensorInfo.SetDataType(DataType::Float32);
24  outputSlot.SetTensorInfo(newTensorInfo);
25 }
26 
27 void ChangeOutputFp16ToFp32(Layer& layer)
28 {
29  for (auto&& outputSlot = layer.BeginOutputSlots(); outputSlot != layer.EndOutputSlots(); ++outputSlot)
30  {
31  if (outputSlot->GetTensorInfo().GetDataType() == DataType::Float16)
32  {
33  UpdateOutputSlotToFp32(*outputSlot);
34  }
35  }
36 }
37 
38 } // anonymous namespace
39 
40 std::vector<ConvertFp16ToFp32Layer*> InsertConvertFp16ToFp32LayersBefore(Graph& graph,
41  Layer& layer,
42  bool expectCorrectInputType)
43 {
44  std::vector<ConvertFp16ToFp32Layer*> convertLayers;
45  convertLayers.reserve(layer.GetNumInputSlots());
46 
47  // Insert a ConvertFp16ToFp32Layer before each input slot
48  for (auto&& inputSlot = layer.BeginInputSlots(); inputSlot != layer.EndInputSlots(); ++inputSlot)
49  {
50  bool allowInsert = true;
51  if (expectCorrectInputType)
52  {
53  // Only insert ConvertFp16ToFp32Layer before FP16 input slots
54  OutputSlot* connectedOutputSlot = inputSlot->GetConnectedOutputSlot();
55  allowInsert =
56  connectedOutputSlot && connectedOutputSlot->GetTensorInfo().GetDataType() == DataType::Float16;
57  }
58 
59  if (allowInsert)
60  {
61  const std::string name =
62  std::string("convert_fp16_to_fp32-" + std::to_string(inputSlot->GetSlotIndex()) + "-") +
63  layer.GetName();
64  ConvertFp16ToFp32Layer* convertLayer =
65  graph.InsertNewLayer<ConvertFp16ToFp32Layer>(*inputSlot, name.c_str());
66 
67  TensorInfo convertInfo = convertLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo();
68  convertInfo.SetDataType(DataType::Float32);
69 
70  convertLayer->GetOutputSlot().SetTensorInfo(convertInfo);
71 
72  convertLayers.emplace_back(convertLayer);
73  }
74  }
75 
76  return convertLayers;
77 }
78 
79 std::vector<ConvertFp32ToFp16Layer*> InsertConvertFp32ToFp16LayersAfter(Graph& graph, Layer& layer)
80 {
81  const unsigned int numOutputSlots = layer.GetNumOutputSlots();
82 
83  std::vector<ConvertFp32ToFp16Layer*> convertLayers;
84  convertLayers.reserve(numOutputSlots);
85 
86  // Update FP16 output slots to FP32 on current layer
87  ChangeOutputFp16ToFp32(layer);
88 
89  // Insert a ConvertFp32ToFp16Layer after each FP32 output slot
90  for (unsigned int slotIndex = 0u; slotIndex < numOutputSlots; ++slotIndex)
91  {
92  OutputSlot& outputSlot = layer.GetOutputSlot(slotIndex);
93  if(outputSlot.GetTensorInfo().GetDataType() == DataType::Float32)
94  {
95  const std::string name =
96  std::string("convert_fp32_to_fp16-" + std::to_string(slotIndex) + "-") + layer.GetName();
97  ConvertFp32ToFp16Layer* convertLayer =
98  graph.InsertNewLayer<ConvertFp32ToFp16Layer>(outputSlot, name.c_str());
99 
100  TensorInfo convertInfo = convertLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo();
101  convertInfo.SetDataType(DataType::Float16);
102 
103  convertLayer->GetOutputSlot().SetTensorInfo(convertInfo);
104 
105  convertLayers.emplace_back(convertLayer);
106  }
107  }
108 
109  return convertLayers;
110 }
111 
112 std::vector<DebugLayer*> InsertDebugLayerAfter(Graph& graph, Layer& layer, bool toFile)
113 {
114  std::vector<DebugLayer*> debugLayers;
115  debugLayers.reserve(layer.GetNumOutputSlots());
116 
117  // Connect a DebugLayer to each output slot of the layer
118  uint32_t outputSlotIdx = 0;
119  for (auto outputSlot = layer.BeginOutputSlots(); outputSlot != layer.EndOutputSlots(); ++outputSlot)
120  {
121  const std::string debugName = std::string("DebugLayerAfter") + layer.GetNameStr() + "_" +
122  std::to_string(outputSlotIdx);
123 
124  DebugLayer* debugLayer =
125  graph.InsertNewLayer<DebugLayer>(*outputSlot, debugName.c_str(), toFile);
126 
127  // Sets output tensor info for the debug layer.
128  if (debugLayer->GetInputSlot(0).GetConnectedOutputSlot() != &(*outputSlot))
129  {
130  throw armnn::Exception("unable to set output tensor info for the debug layer.");
131  }
132 
133  TensorInfo debugInfo = debugLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo();
134 
135  debugLayer->GetOutputSlot().SetTensorInfo(debugInfo);
136 
137  // NOTE: It is OK to do this because DebugLayer is only supported on CpuRef
138  debugLayer->SetBackendId(Compute::CpuRef);
139 
140  debugLayers.emplace_back(debugLayer);
141 
142  ++outputSlotIdx;
143  }
144 
145  return debugLayers;
146 }
147 
148 } // namespace armnn
This layer converts data type Float16 to Float32.
This layer converts data type Float32 to Float16.
This layer visualizes the data flowing through the network.
Definition: DebugLayer.hpp:14
Base class for all ArmNN exceptions so that users can filter to just those.
Definition: Exceptions.hpp:47
LayerT * InsertNewLayer(InputSlot &insertBefore, Args &&... args)
Inserts a new layer between the output slot currently connected to insertBefore and insertBefore itself.
Definition: Graph.hpp:481
const OutputSlot * GetConnectedOutputSlot() const
Definition: Layer.hpp:56
const OutputSlot & GetOutputSlot(unsigned int index=0) const override
Get the const output slot handle by slot index.
Definition: Layer.hpp:339
unsigned int GetNumOutputSlots() const override
Returns the number of connectable output slots.
Definition: Layer.hpp:335
void SetBackendId(const BackendId &id) override
Set the backend of the IConnectableLayer.
Definition: Layer.hpp:291
std::vector< OutputSlot >::iterator EndOutputSlots()
Definition: Layer.hpp:267
const char * GetName() const override
Returns the name of the layer.
Definition: Layer.hpp:332
std::vector< OutputSlot >::iterator BeginOutputSlots()
Definition: Layer.hpp:266
std::vector< InputSlot >::iterator EndInputSlots()
Definition: Layer.hpp:263
const std::string & GetNameStr() const
Definition: Layer.hpp:240
unsigned int GetNumInputSlots() const override
Returns the number of connectable input slots.
Definition: Layer.hpp:334
const InputSlot & GetInputSlot(unsigned int index) const override
Get a const input slot handle by slot index.
Definition: Layer.hpp:337
std::vector< InputSlot >::iterator BeginInputSlots()
Definition: Layer.hpp:262
void SetTensorInfo(const TensorInfo &tensorInfo) override
Definition: Layer.cpp:95
const TensorInfo & GetTensorInfo() const override
Definition: Layer.cpp:100
void SetDataType(DataType type)
Definition: Tensor.hpp:201
DataType GetDataType() const
Definition: Tensor.hpp:200
Copyright (c) 2021 ARM Limited and Contributors.
std::vector< DebugLayer * > InsertDebugLayerAfter(Graph &graph, Layer &layer, bool toFile)
std::vector< ConvertFp32ToFp16Layer * > InsertConvertFp32ToFp16LayersAfter(Graph &graph, Layer &layer)
std::vector< ConvertFp16ToFp32Layer * > InsertConvertFp16ToFp32LayersBefore(Graph &graph, Layer &layer, bool expectCorrectInputType)
@ CpuRef
CPU Execution: Reference C++ kernels.