ArmNN
 25.02
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
ConcatLayer.cpp
Go to the documentation of this file.
1 //
2 // Copyright © 2017-2024 Arm Ltd and Contributors. All rights reserved.
3 // SPDX-License-Identifier: MIT
4 //
#include "ConcatLayer.hpp"
#include "LayerCloneBase.hpp"

#include <armnn/TypesUtils.hpp>
#include <armnn/backends/WorkloadData.hpp>
#include <armnn/backends/WorkloadFactory.hpp>

#include <algorithm>
#include <limits>
#include <queue>
14 
15 namespace armnn
16 {
17 
18 ConcatLayer::ConcatLayer(const OriginsDescriptor& param, const char* name)
19  : LayerWithParameters(param.GetNumViews(), 1, LayerType::Concat, param, name)
20 {
21 }
22 
23 std::unique_ptr<IWorkload> ConcatLayer::CreateWorkload(const IWorkloadFactory& factory) const
24 {
25  ConcatQueueDescriptor descriptor;
26 
27  // Copies the view origins to the descriptor.
28  descriptor.m_ViewOrigins.reserve(m_Param.GetNumViews());
29  for (unsigned int i = 0; i < m_Param.GetNumViews(); ++i)
30  {
31  descriptor.m_ViewOrigins.emplace_back(
32  std::vector<unsigned int>(m_Param.GetViewOrigin(i), m_Param.GetViewOrigin(i) + m_Param.GetNumDimensions()));
33  }
34  SetAdditionalInfo(descriptor);
35 
36  return factory.CreateWorkload(LayerType::Concat, descriptor, PrepInfoAndDesc(descriptor));
37 }
38 
39 template<typename FactoryType>
40 void ConcatLayer::CreateTensors(const TensorHandleFactoryRegistry& registry,
41  const FactoryType& factory,
42  bool isMemoryManaged)
43 {
44  //If sub tensors are supported then the concat
45  //just needs to make sure that the outputs of the prev layer
46  //are made subtensors of the output of the concat layer.
47  m_OutputHandlers[0].CreateTensorHandles(factory, isMemoryManaged);
48 
49  if (factory.SupportsSubTensors())
50  {
51  // check if concat is along the x or y (2 innermost dimensions)
52  uint32_t concatAxis = m_Param.GetConcatAxis();
53  auto numberOfDimensions = m_Param.GetNumDimensions();
54  bool isConcatOnXorY = m_Param.GetNumDimensions() >= 3
55  && ((concatAxis == numberOfDimensions - 1) || (concatAxis == numberOfDimensions - 2));
56 
58 
59  std::queue<ConcatLayer*> m_ConcatLayers;
60 
61  m_ConcatLayers.push(this);
62  while (!m_ConcatLayers.empty())
63  {
64  ConcatLayer* currentLayer = m_ConcatLayers.front();
65  ITensorHandle* parentTensor = currentLayer->GetOutputHandler(0).GetData();
66  const TensorInfo& parentInfo = currentLayer->GetOutputHandler(0).GetTensorInfo();
67  m_ConcatLayers.pop();
68 
69  const unsigned int numInputSlots = currentLayer->GetNumInputSlots();
70 
71  // if concat along x or y (2 innermost dimensions) and the previous layers do not require padding
72  bool canUseSubTensorOnXorY = true;
73  bool isTensorHandleFactory = std::is_same<armnn::ITensorHandleFactory, FactoryType>::value;
74  if (isTensorHandleFactory)
75  {
76  for (unsigned int i = 0; i < numInputSlots; ++i)
77  {
78  OutputSlot* slot = currentLayer->GetInputSlot(i).GetConnectedOutputSlot();
79  ITensorHandleFactory* handleFactory = registry.GetFactory(factoryId);
80  std::vector<Capability> capabilities =
81  handleFactory->GetCapabilities(&(slot->GetOwningLayer()),
82  currentLayer,
84  if (isConcatOnXorY)
85  {
86  canUseSubTensorOnXorY = false;
87  if (capabilities.empty())
88  {
89  canUseSubTensorOnXorY = true;
90  }
91  }
92 
93  // Splitter layer outputs are subtensors on the inputs whereas concat inputs are subtensors on
94  // the output. If the parent is a Splitter layer we cannot use subtensors.
95  if ((PolymorphicDowncast<const Layer*>(&(slot->GetOwningLayer())))->GetType() == LayerType::Splitter
96  && (PolymorphicDowncast<const Layer*>(currentLayer))->GetType() == LayerType::Concat)
97  {
98  canUseSubTensorOnXorY = false;
99  }
100 
101  if (!canUseSubTensorOnXorY)
102  {
103  break;
104  }
105  }
106  }
107  // First go through all the input slots and verify that we can sub-tensor all the inputs.
108  std::vector<std::unique_ptr<ITensorHandle>> subTensors(0);
109  subTensors.reserve(numInputSlots);
110  for (unsigned int i = 0; i < numInputSlots; ++i)
111  {
112  OutputSlot* slot = currentLayer->GetInputSlot(i).GetConnectedOutputSlot();
113  const TensorInfo& info = currentLayer->GetInputSlot(i).GetTensorInfo();
114 
115  auto CreateSubTensor = [&]()
116  {
117  // Make sure:
118  // 1) quantization parameters are in the same space
119  // 2) the same TensorHandleFactory is used for input and Concat layer output
120  // 3) the input does not come from a Constant layer or input layer
121  // 4) the input is only read by this concat layer
122  // 5) if concat along x or y (2 innermost dimensions) and the previous layers do not require padding
123  // 6) neither the inputs nor the output have an Overridden TensorInfo
124  if (slot &&
125  parentInfo.IsTypeSpaceMatch(info) && //(1)
126  factoryId == slot->GetTensorHandleFactoryId() && //(2)
127  slot->GetOwningLayer().GetType() != LayerType::Constant && //(3)
128  slot->GetOwningLayer().GetType() != LayerType::Input && //(3)
129  slot->GetNumConnections() == 1 &&
130  canUseSubTensorOnXorY && //(5)
132  !currentLayer->GetInputSlot(i).IsTensorInfoOverridden()) //(6)
133  {
135  return factory.CreateSubTensorHandle(*parentTensor,
136  info.GetShape(),
137  currentLayer->m_Param.GetViewOrigin(i));
139  }
140  return std::unique_ptr<ITensorHandle>();
141  };
142 
143  auto subTensor = CreateSubTensor();
144  if (!subTensor)
145  {
146  break; //Failed to create a valid sub-tensor, so stop trying with the rest of the inputs.
147  }
148  else
149  {
150  subTensors.push_back(std::move(subTensor)); // store the valid sub-tensor.
151  }
152  }
153 
154  // Ensure that ALL inputs can be substituted with valid sub-tensors
155  if (subTensors.size() < numInputSlots)
156  {
157  continue; // Don't optimize this Concat layer with sub-tensors
158  }
159 
160  // Substitute input tensors with sub-tensors by replacing the output tensors on the connected layers.
161  unsigned int i=0;
162  for (auto& subTensor : subTensors)
163  {
164  OutputSlot* slot = currentLayer->GetInputSlot(i).GetConnectedOutputSlot();
165  OutputHandler& outputHandler = slot->GetOutputHandler();
166 
167  if (!subTensor)
168  {
169  throw armnn::Exception("ConcatLayer: Expected a valid sub-tensor for substitution.");
170  }
171 
172  outputHandler.SetData(std::move(subTensor));
173 
174  Layer& inputLayer = slot->GetOwningLayer();
175  if (inputLayer.GetType() == LayerType::Concat)
176  {
177  // Continue with the substitution if the connected inputs are also concat layers
178  m_ConcatLayers.push(PolymorphicDowncast<ConcatLayer*>(&inputLayer));
179  }
180  ++i;
181  }
182  }
183  }
184 }
185 
187  const IWorkloadFactory& workloadFactory,
188  const bool isMemoryManaged)
189 {
190  OutputSlot& slot = GetOutputSlot(0);
192 
193  if (factoryId == ITensorHandleFactory::LegacyFactoryId)
194  {
195  CreateTensors(registry, workloadFactory, isMemoryManaged);
196  }
197  else
198  {
199  ITensorHandleFactory* handleFactory = registry.GetFactory(factoryId);
200  if (!handleFactory)
201  {
202  throw armnn::NullPointerException("handleFactory is returning a nullptr.");
203  }
204  CreateTensors(registry, *handleFactory, isMemoryManaged);
205  }
206 }
207 
209 {
210  return CloneBase<ConcatLayer>(graph, m_Param, GetName());
211 }
212 
213 std::vector<TensorShape> ConcatLayer::InferOutputShapes(const std::vector<TensorShape>& inputShapes) const
214 {
215  if (inputShapes.size() != m_Param.GetNumViews())
216  {
217  throw armnn::Exception("inputShapes' and m_NumViews' sizes do not match (\""
218  + std::to_string(inputShapes.size()) +
219  "\" vs \""
220  + std::to_string(m_Param.GetNumViews()) + "\")");
221  }
222 
223  unsigned int numDims = m_Param.GetNumDimensions();
224  for (unsigned int i=0; i< inputShapes.size(); i++)
225  {
226  auto& inputShape = inputShapes[i];
227 
228  ConditionalThrowIfNotEqual<LayerValidationException>(
229  "ConcatLayer: Num Dimensions must match all inputs.",
230  numDims,
231  inputShape.GetNumDimensions());
232  }
233 
234  // Finds the bounding box (extents) of all the views.
235  std::vector<unsigned int> extentMin(numDims);
236  std::vector<unsigned int> extentMax(numDims);
237  for (unsigned int i = 0; i < inputShapes.size(); i++)
238  {
239  const uint32_t* origin = m_Param.GetViewOrigin(i);
240  const armnn::TensorShape& shape = inputShapes[i];
241  for (unsigned int d = 0; d < numDims; d++)
242  {
243  extentMin[d] = std::min(extentMin[d], origin[d]);
244  extentMax[d] = std::max(extentMax[d], origin[d] + shape[d]);
245  }
246  }
247 
248  // Checks that the bounding box starts at the origin.
249  if (!std::all_of(extentMin.begin(), extentMin.end(), [](unsigned int s) { return s == 0; }))
250  {
251  throw LayerValidationException("ConcatLayer: there is no view that starts at the origin");
252  }
253 
254  // Checks that there are no overlaps of views (this would lead to undefined output at those locations).
255  // Checks each pair of views against each other
256  // (and doesn't bother to check against self, or check the same pair both ways round).
257  for (unsigned int a = 0; a < inputShapes.size(); a++)
258  {
259  const uint32_t* aOrigin = m_Param.GetViewOrigin(a);
260  const armnn::TensorShape& aShape = inputShapes[a];
261  for (unsigned int b = 0; b < a; b++)
262  {
263  const uint32_t* bOrigin = m_Param.GetViewOrigin(b);
264  const armnn::TensorShape& bShape = inputShapes[b];
265 
266  bool allAxesOverlap = true;
267  for (unsigned int d = 0; d < numDims && allAxesOverlap; d++)
268  {
269  unsigned int a1 = aOrigin[d];
270  unsigned int a2 = aOrigin[d] + aShape[d];
271 
272  unsigned int b1 = bOrigin[d];
273  unsigned int b2 = bOrigin[d] + bShape[d];
274 
275  if (a2 <= b1 || b2 <= a1)
276  {
277  allAxesOverlap = false;
278  }
279  }
280  if (allAxesOverlap)
281  {
282  throw LayerValidationException("ConcatLayer: Some views overlap.");
283  }
284  }
285  }
286 
287  // Checks that there are no "holes", i.e. regions of the output which is not covered by a view.
288  // Because we already checked that there are no overlaps, this can be done simply by checking that
289  // the total 'volume' of the views is the same as the output.
290  unsigned int totalViewsVolume = 0;
291  for (unsigned int i = 0; i < inputShapes.size(); i++)
292  {
293  totalViewsVolume += inputShapes[i].GetNumElements();
294  }
295  unsigned int outputVolume = 1;
296  for (unsigned int d = 0; d < numDims; d++)
297  {
298  outputVolume *= (extentMax[d] - extentMin[d]);
299  }
300 
301  ConditionalThrowIfNotEqual<LayerValidationException>(
302  "ConcatLayer: there are some gaps between views",
303  totalViewsVolume,
304  outputVolume);
305 
306  return std::vector<TensorShape>({ TensorShape({numDims, extentMax.data()}) });
307 }
308 
310 {
311  // Validates Concat layer.
312  ConditionalThrowIfNotEqual<LayerValidationException>(
313  "ConcatLayer: Num Inputs must match num views.",
315  GetNumInputSlots());
316 
318 
319  const TensorShape& outputShape = GetOutputSlot(0).GetTensorInfo().GetShape();
320 
322 
323  std::vector<TensorShape> inputShapes;
324  for (unsigned int i = 0; i < GetNumInputSlots(); ++i)
325  {
326  inputShapes.push_back(GetInputSlot(i).GetTensorInfo().GetShape());
327  }
328 
329  auto inferredShapes = InferOutputShapes(inputShapes);
330 
331  if (inferredShapes.size() != 1)
332  {
333  throw armnn::Exception("inferredShapes has "
334  + std::to_string(inferredShapes.size()) +
335  " elements - should only have 1.");
336  }
337 
338  ValidateAndCopyShape(outputShape, inferredShapes[0], m_ShapeInferenceMethod, "ConcatLayer");
339 }
340 
342 {
343  strategy.ExecuteStrategy(this, GetParameters(), {}, GetName());
344 }
345 
} // namespace armnn
#define ARMNN_NO_DEPRECATE_WARN_BEGIN
Definition: Deprecated.hpp:33
#define ARMNN_NO_DEPRECATE_WARN_END
Definition: Deprecated.hpp:34
#define CHECK_LOCATION()
Definition: Exceptions.hpp:203
This layer represents a merge operation.
Definition: ConcatLayer.hpp:14
void ExecuteStrategy(IStrategy &strategy) const override
Apply a visitor to this layer.
std::vector< TensorShape > InferOutputShapes(const std::vector< TensorShape > &inputShapes) const override
By default returns inputShapes if the number of inputs are equal to number of outputs,...
virtual void CreateTensorHandles(const TensorHandleFactoryRegistry &registry, const IWorkloadFactory &factory, const bool IsMemoryManaged=true) override
Set the outputs to be appropriate sub tensors of the input if sub tensors are supported otherwise cre...
void ValidateTensorShapesFromInputs() override
Check if the input tensor shape(s) will lead to a valid configuration of ConcatLayer.
ConcatLayer * Clone(Graph &graph) const override
Creates a dynamically-allocated copy of this layer.
ConcatLayer(const OriginsDescriptor &param, const char *name)
Constructor to create a ConcatLayer.
Definition: ConcatLayer.cpp:18
virtual std::unique_ptr< IWorkload > CreateWorkload(const IWorkloadFactory &factory) const override
Makes a workload for the Concat type.
Definition: ConcatLayer.cpp:23
Base class for all ArmNN exceptions so that users can filter to just those.
Definition: Exceptions.hpp:47
virtual void ExecuteStrategy(const IConnectableLayer *layer, const armnn::BaseDescriptor &descriptor, const std::vector< armnn::ConstTensor > &constants, const char *name, const armnn::LayerBindingId id=0)=0
virtual std::vector< Capability > GetCapabilities(const IConnectableLayer *layer, const IConnectableLayer *connectedLayer, CapabilityClass capabilityClass)
static const FactoryId LegacyFactoryId
virtual std::unique_ptr< IWorkload > CreateWorkload(LayerType type, const QueueDescriptor &descriptor, const WorkloadInfo &info) const =0
Backends should implement their own CreateWorkload function with a switch statement.
bool IsTensorInfoOverridden() const override
Returns true if this InputSlot has an overridden TensorInfo that was set through a call to SetTensorI...
Definition: Layer.cpp:631
const OutputSlot * GetConnectedOutputSlot() const
Definition: Layer.hpp:56
const TensorInfo & GetTensorInfo() const override
Gets the TensorInfo for this InputSlot.
Definition: Layer.cpp:614
void VerifyLayerConnections(unsigned int expectedConnections, const CheckLocation &location) const
Definition: Layer.cpp:410
const OutputSlot & GetOutputSlot(unsigned int index=0) const override
Get the const output slot handle by slot index.
Definition: Layer.hpp:339
void VerifyShapeInferenceType(const TensorShape &outputShape, ShapeInferenceMethod shapeInferenceMethod)
Definition: Layer.cpp:526
Layer(unsigned int numInputSlots, unsigned int numOutputSlots, LayerType type, const char *name)
Definition: Layer.cpp:260
const char * GetName() const override
Returns the name of the layer.
Definition: Layer.hpp:332
std::vector< OutputHandler > m_OutputHandlers
Definition: Layer.hpp:440
unsigned int GetNumInputSlots() const override
Returns the number of connectable input slots.
Definition: Layer.hpp:334
const InputSlot & GetInputSlot(unsigned int index) const override
Get a const input slot handle by slot index.
Definition: Layer.hpp:337
void ValidateAndCopyShape(const TensorShape &outputShape, const TensorShape &inferredShape, const ShapeInferenceMethod shapeInferenceMethod, const std::string &layerName, const unsigned int outputSlotIndex=0)
Definition: Layer.cpp:457
const OutputHandler & GetOutputHandler(unsigned int i=0) const
Definition: Layer.hpp:245
void SetAdditionalInfo(QueueDescriptor &descriptor) const
Definition: Layer.cpp:303
ShapeInferenceMethod m_ShapeInferenceMethod
Definition: Layer.hpp:441
WorkloadInfo PrepInfoAndDesc(QueueDescriptor &descriptor) const
Helper function to reduce duplication in *Layer::CreateWorkload.
OriginsDescriptor m_Param
The parameters for the layer (not including tensor-valued weights etc.).
const OriginsDescriptor & GetParameters() const override
const TensorInfo & GetTensorInfo() const
Gets the matching TensorInfo for the output.
ITensorHandle * GetData() const
Gets the allocated tensor memory.
const InputSlot * GetConnection(unsigned int index) const override
Definition: Layer.cpp:83
Layer & GetOwningLayer() const
Definition: Layer.hpp:132
const OutputHandler & GetOutputHandler() const
Definition: Layer.hpp:139
const TensorInfo & GetTensorInfo() const override
Definition: Layer.cpp:100
ITensorHandleFactory::FactoryId GetTensorHandleFactoryId() const
Definition: Layer.cpp:218
ITensorHandleFactory * GetFactory(ITensorHandleFactory::FactoryId id) const
Find a TensorHandleFactory by Id Returns nullptr if not found.
bool IsTypeSpaceMatch(const TensorInfo &other) const
Check that the types are the same and, if quantize, that the quantization parameters are the same.
Definition: Tensor.cpp:432
const TensorShape & GetShape() const
Definition: Tensor.hpp:193
Copyright (c) 2021 ARM Limited and Contributors.
LayerType
When adding a new layer, adapt also the LastLayer enum value in the enum class LayerType below.
Definition: Types.hpp:494
std::vector< ViewOrigin > m_ViewOrigins
An OriginsDescriptor for the ConcatLayer.
uint32_t GetNumViews() const
Get the number of views.
unsigned int GetConcatAxis() const
Get the concatenation axis value.
uint32_t GetNumDimensions() const
Get the number of dimensions.
const uint32_t * GetViewOrigin(uint32_t idx) const
Return the view origin at the int value idx.