BatchMatMulLayer.cpp
//
// Copyright © 2022-2024 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//
#include "BatchMatMulLayer.hpp"

#include <armnn/backends/WorkloadFactory.hpp>
#include <armnnUtils/Permute.hpp>
#include "layers/LayerCloneBase.hpp"

namespace armnn
{

BatchMatMulLayer::BatchMatMulLayer(const BatchMatMulDescriptor& param, const char* name)
    : LayerWithParameters(2, 1, LayerType::BatchMatMul, param, name)
{}

std::unique_ptr<IWorkload> BatchMatMulLayer::CreateWorkload(const IWorkloadFactory& factory) const
{
    BatchMatMulQueueDescriptor descriptor;
    SetAdditionalInfo(descriptor);

    return factory.CreateWorkload(LayerType::BatchMatMul, descriptor, PrepInfoAndDesc(descriptor));
}

BatchMatMulLayer* BatchMatMulLayer::Clone(Graph& graph) const
{
    auto layer = CloneBase<BatchMatMulLayer>(graph, m_Param, GetName());

    return std::move(layer);
}

std::vector<TensorShape> BatchMatMulLayer::InferOutputShapes(const std::vector<TensorShape>& inputShapes) const
{
    if (inputShapes.size() != 2)
    {
        throw armnn::LayerValidationException("inputShapes' size is \"" + std::to_string(inputShapes.size()) +
                                              "\" - should be \"2\".");
    }

    TensorShape inputXShape = inputShapes[0];
    TensorShape inputYShape = inputShapes[1];

    // Adjoint is assumed to be square, but we will apply the permute anyway
    if (m_Param.m_TransposeX || m_Param.m_AdjointX)
    {
        auto permuteVec = BatchMatMulDescriptor::GetPermuteVec(m_Param.m_DataLayoutX,
                                                               inputXShape);
        inputXShape = armnnUtils::Permuted(inputXShape, permuteVec);
    }
    if (m_Param.m_TransposeY || m_Param.m_AdjointY)
    {
        auto permuteVec = BatchMatMulDescriptor::GetPermuteVec(m_Param.m_DataLayoutY,
                                                               inputYShape);
        inputYShape = armnnUtils::Permuted(inputYShape, permuteVec);
    }

    TensorShape& longerInput = inputXShape.GetNumDimensions() >= inputYShape.GetNumDimensions() ?
                               inputXShape : inputYShape;
    TensorShape& shorterInput = inputXShape.GetNumDimensions() >= inputYShape.GetNumDimensions() ?
                                inputYShape : inputXShape;

    unsigned int inputNumDimsOffset = longerInput.GetNumDimensions() - shorterInput.GetNumDimensions();

    unsigned int outputNumDimensions = longerInput.GetNumDimensions();

    std::vector<unsigned int> tensorDimensions(outputNumDimensions, 0);

    const auto& longerInputDataLayout = inputXShape.GetNumDimensions() >= inputYShape.GetNumDimensions() ?
                                        m_Param.m_DataLayoutX : m_Param.m_DataLayoutY;
    auto longerAxesToMul = BatchMatMulDescriptor::GetAxesToMul(longerInputDataLayout,
                                                               longerInput);

    for (unsigned int i = 0; i < outputNumDimensions; ++i)
    {
        if (i == longerAxesToMul.first)
        {
            tensorDimensions[i] = &shorterInput == &inputXShape ? inputXShape[i - inputNumDimsOffset] : inputXShape[i];
        }
        else if (i == longerAxesToMul.second)
        {
            tensorDimensions[i] = &shorterInput == &inputYShape ? inputYShape[i - inputNumDimsOffset] : inputYShape[i];
        }
        else // The other dimensions not to be multiplied (but may be broadcasted)
        {
            // Does NOT validate whether it's a valid broadcast - that's done in the validate func in WorkloadData.cpp
            tensorDimensions[i] = static_cast<int>(i) - static_cast<int>(inputNumDimsOffset) < 0 ?
                                  longerInput[i] :
                                  std::max(longerInput[i], shorterInput[i - inputNumDimsOffset]);
        }
    }

    auto outputShape = TensorShape(outputNumDimensions, tensorDimensions.data());
    return std::vector<TensorShape>({ outputShape });
}

void BatchMatMulLayer::ValidateTensorShapesFromInputs()
{
    VerifyLayerConnections(2, CHECK_LOCATION());

    const TensorShape& outputShape = GetOutputSlot(0).GetTensorInfo().GetShape();

    VerifyShapeInferenceType(outputShape, m_ShapeInferenceMethod);

    auto inferredShapes = InferOutputShapes({
        GetInputSlot(0).GetTensorInfo().GetShape(),
        GetInputSlot(1).GetTensorInfo().GetShape() });

    if (inferredShapes.size() != 1)
    {
        throw armnn::LayerValidationException("inferredShapes has "
                                              + std::to_string(inferredShapes.size()) +
                                              " elements - should only have 1.");
    }

    ValidateAndCopyShape(outputShape, inferredShapes[0], m_ShapeInferenceMethod, "BatchMatMulLayer");
}

} // namespace armnn
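For reference, the broadcast rule that InferOutputShapes implements can be illustrated with a small standalone sketch. This is not part of Arm NN: it assumes the default data layouts with no transpose/adjoint permutation, the matrix axes in the last two positions, and the helper name InferBatchMatMulShape is invented for the example. The output takes M from the first input, N from the second, and the larger of each pair of batch dimensions after right-aligning the two shapes (equivalent to the inputNumDimsOffset handling above when every dimension is at least 1).

#include <algorithm>
#include <cassert>
#include <iostream>
#include <vector>

// Hypothetical standalone helper mirroring the shape rule of
// BatchMatMulLayer::InferOutputShapes for the default-layout, no-transpose case.
std::vector<unsigned int> InferBatchMatMulShape(std::vector<unsigned int> x,
                                                std::vector<unsigned int> y)
{
    // Left-pad the shorter shape with 1s so both ranks match.
    while (x.size() < y.size()) { x.insert(x.begin(), 1u); }
    while (y.size() < x.size()) { y.insert(y.begin(), 1u); }

    const size_t rank = x.size();
    assert(rank >= 2);

    std::vector<unsigned int> out(rank, 0u);
    for (size_t i = 0; i < rank - 2; ++i)
    {
        // Batch dimensions broadcast; whether the broadcast is valid is checked
        // later during workload validation (WorkloadData.cpp), not here.
        out[i] = std::max(x[i], y[i]);
    }
    out[rank - 2] = x[rank - 2]; // M comes from the first input
    out[rank - 1] = y[rank - 1]; // N comes from the second input
    return out;
}

int main()
{
    // [2, 3, 4] x [5, 1, 4, 6] -> [5, 2, 3, 6]
    for (auto d : InferBatchMatMulShape({2, 3, 4}, {5, 1, 4, 6}))
    {
        std::cout << d << ' ';
    }
    std::cout << '\n';
    return 0;
}

When m_TransposeX/m_TransposeY or m_AdjointX/m_AdjointY are set, the real implementation first permutes the corresponding input shape with BatchMatMulDescriptor::GetPermuteVec before applying this rule.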