ArmNN 25.11
NeonGatherNdWorkload.cpp
//
// Copyright © 2022-2024 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

namespace armnn
{
arm_compute::Status NeonGatherNdWorkloadValidate(const TensorInfo& paramsInfo,
                                                 const TensorInfo& indicesInfo,
                                                 const TensorInfo& outputInfo)
{
    // Calculate ND, K, W, C.
    std::map<std::string, unsigned int> keyIndices = CalculateGatherNdKeyIndices(paramsInfo, indicesInfo);
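    // Illustrative example (added for clarity, not in the original source): for params of shape
    // { 5, 4, 3, 2 } and indices of shape { 6, 3 }, ND = 3 (index components per tuple),
    // W = 6 (number of index tuples), K = 5 * 4 * 3 = 60 (rows of the flattened params) and
    // C = 2 (elements gathered per row).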

    /// Validate Mul
    // Indices with shape { W, ND }
    armnn::TensorInfo indices_W_ND_Info = indicesInfo;
    indices_W_ND_Info.SetShape({ keyIndices["W"], keyIndices["ND"] });
    const arm_compute::TensorInfo aclIndicesInfo = BuildArmComputeTensorInfo(indices_W_ND_Info);

    // Flattened coefficients with shape { ND }
    armnn::TensorInfo flattenedCoeff_Info = indicesInfo;
    flattenedCoeff_Info.SetShape({ keyIndices["ND"] });
    const arm_compute::TensorInfo aclFlattenedCoeffInfo = BuildArmComputeTensorInfo(flattenedCoeff_Info);

    // Output of Mul with shape { W, ND }
    const arm_compute::TensorInfo aclOutputMulInfo = BuildArmComputeTensorInfo(indices_W_ND_Info);

    auto statusMul = arm_compute::NEPixelWiseMultiplication::validate(&aclIndicesInfo,
                                                                      &aclFlattenedCoeffInfo,
                                                                      &aclOutputMulInfo,
                                                                      1.0f,
                                                                      arm_compute::ConvertPolicy::WRAP,
                                                                      arm_compute::RoundingPolicy::TO_ZERO,
                                                                      arm_compute::ActivationLayerInfo());

    /// Validate ReduceSum
    // Flattened indices with shape { W }
    armnn::TensorInfo flattenedIndices_Info = indicesInfo;
    flattenedIndices_Info.SetShape({ keyIndices["W"] });
    const arm_compute::TensorInfo aclFlattenedIndicesInfo = BuildArmComputeTensorInfo(flattenedIndices_Info);

    const std::vector<unsigned int> armnnReduceAxes(1, 1);
    arm_compute::Coordinates coords = BuildArmComputeReductionCoordinates(aclOutputMulInfo.num_dimensions(),
                                                                          indices_W_ND_Info.GetNumDimensions(),
                                                                          armnnReduceAxes);
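    // Note (added for clarity): ArmNN orders dimensions left-to-right while ACL orders them
    // right-to-left, so reducing ArmNN axis 1 of the rank-2 { W, ND } tensor maps to ACL
    // dimension 0, i.e. the sum runs over the ND components of each index tuple.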

    auto statusReduceSum = arm_compute::NEReductionOperation::validate(&aclOutputMulInfo,
                                                                       &aclFlattenedIndicesInfo,
                                                                       static_cast<unsigned int>(coords[0]),
                                                                       arm_compute::ReductionOperation::SUM,
                                                                       false);

    /// Validate Gather
    // Params with shape { K, C }
    armnn::TensorInfo params_K_C_Info = paramsInfo;
    params_K_C_Info.SetShape({ keyIndices["K"], keyIndices["C"] });
    const arm_compute::TensorInfo aclParamsInfo = BuildArmComputeTensorInfo(params_K_C_Info);

    // Output of gather with shape { W, C }
    armnn::TensorInfo outputGather_Info = outputInfo;
    outputGather_Info.SetShape({ keyIndices["W"], keyIndices["C"] });
    const arm_compute::TensorInfo aclOutputGatherInfo = BuildArmComputeTensorInfo(outputGather_Info);

    auto aclAxis = ComputeAclAxis(0, params_K_C_Info);
    auto statusGather =
        arm_compute::NEGather::validate(&aclParamsInfo, &aclFlattenedIndicesInfo, &aclOutputGatherInfo, aclAxis);

    /// Validate Reshape
    const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(outputInfo);
    const arm_compute::TensorInfo aclParamsOriginalShapeInfo = BuildArmComputeTensorInfo(paramsInfo);
    const arm_compute::TensorInfo aclIndicesOriginalShapeInfo = BuildArmComputeTensorInfo(indicesInfo);
    const arm_compute::TensorInfo aclParamsReshapeInfo = BuildArmComputeTensorInfo(paramsInfo);
    const arm_compute::TensorInfo aclIndicesReshapeInfo = BuildArmComputeTensorInfo(indicesInfo);

    auto statusOutputReshape = arm_compute::NEReshapeLayer::validate(&aclOutputGatherInfo, &aclOutputInfo);
    auto statusParamsReshape = arm_compute::NEReshapeLayer::validate(&aclParamsOriginalShapeInfo,
                                                                     &aclParamsReshapeInfo);
    auto statusIndicesReshape = arm_compute::NEReshapeLayer::validate(&aclIndicesOriginalShapeInfo,
                                                                      &aclIndicesReshapeInfo);

    /// Return OK if all the layers are valid
    auto okCode = arm_compute::ErrorCode::OK;
    if (statusMul.error_code() == okCode &&
        statusReduceSum.error_code() == okCode &&
        statusGather.error_code() == okCode &&
        statusParamsReshape.error_code() == okCode &&
        statusIndicesReshape.error_code() == okCode &&
        statusOutputReshape.error_code() == okCode)
    {
        return arm_compute::Status(arm_compute::ErrorCode::OK,
                                   "All GatherND layers validate status OK.");
    }
    else
    {
        return arm_compute::Status(arm_compute::ErrorCode::RUNTIME_ERROR,
                                   "GatherND layer validate status failed.");
    }
}

NeonGatherNdWorkload::NeonGatherNdWorkload(const GatherNdQueueDescriptor& descriptor,
                                           const WorkloadInfo& info)
    : NeonBaseWorkload<GatherNdQueueDescriptor>(descriptor, info)
{
    m_Data.ValidateInputsOutputs("NeonGatherNdWorkload", 2, 1);

    TensorInfo paramsInfo = info.m_InputTensorInfos[0];
    TensorInfo indicesInfo = info.m_InputTensorInfos[1];
    TensorInfo outputInfo = info.m_OutputTensorInfos[0];

    arm_compute::ITensor& input = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
    arm_compute::ITensor& indices = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();
    arm_compute::ITensor& output = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();

    // Calculate ND, K, W, C.
    std::map<std::string, unsigned int> keyIndices = CalculateGatherNdKeyIndices(paramsInfo, indicesInfo);

    /// Calculate flattened indices: m_FlattenedIndices = indices * m_FlattenedCoeff.
    /// This could be done using MatMul instead of multiplication followed by reduce sum operation,
    /// but GeMM does not support s32 at the moment.

    // Prepare the tensor to store the output of the reduce_sum operation
    armnn::TensorInfo flattenedIndices_Info = indicesInfo;
    flattenedIndices_Info.SetShape({ keyIndices["W"] });
    BuildArmComputeTensor(m_FlattenedIndices, flattenedIndices_Info);
    armcomputetensorutils::InitialiseArmComputeTensorEmpty(m_FlattenedIndices);

    // Reshape indices into { W, ND }
    armnn::TensorInfo indicesInfoReshape = indicesInfo;
    indicesInfoReshape.SetShape({ keyIndices["W"], keyIndices["ND"] });
    BuildArmComputeTensor(m_IndicesReshaped, indicesInfoReshape);
    armcomputetensorutils::InitialiseArmComputeTensorEmpty(m_IndicesReshaped);

    // Calculate the m_FlattenedCoeff
    TensorShape paramsShape = paramsInfo.GetShape();
    std::vector<int32_t> flattenedCoeff(keyIndices["ND"], 1);
    for (unsigned int i = 1; i < keyIndices["ND"]; ++i)
    {
        flattenedCoeff[i - 1] = static_cast<int32_t>(paramsShape[i]);
    }
    for (unsigned int i = keyIndices["ND"] - 1; i > 0; --i)
    {
        flattenedCoeff[i - 1] *= flattenedCoeff[i];
    }
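    // Illustrative example (added for clarity, not in the original source): for params of shape
    // { 5, 4, 3, 2 } and ND = 3, the two loops above leave flattenedCoeff = { 12, 3, 1 }, the
    // row-major strides of the first ND dimensions. Multiplying each index tuple by these
    // coefficients and summing turns, say, { 2, 1, 0 } into 2*12 + 1*3 + 0*1 = 27, its row
    // offset into params reshaped to { K, C }.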
    armnn::TensorInfo flattenedCoeff_Info = indicesInfo;
    flattenedCoeff_Info.SetShape({ keyIndices["ND"] });
    BuildArmComputeTensor(m_FlattenedCoeff, flattenedCoeff_Info);
    armcomputetensorutils::InitialiseArmComputeTensorEmpty(m_FlattenedCoeff);
    CopyArmComputeITensorData<int32_t>(flattenedCoeff.data(), m_FlattenedCoeff);

    // Prepare the tensor to store the output of the multiplication
    armnn::TensorInfo outputMul_Info = indicesInfo;
    outputMul_Info.SetShape({ keyIndices["W"], keyIndices["ND"] });
    BuildArmComputeTensor(m_OutputMul, outputMul_Info);
    armcomputetensorutils::InitialiseArmComputeTensorEmpty(m_OutputMul);

    // Reshape indices to the mul layer input shape
    m_ReshapeIndicesLayer.configure(&indices, &m_IndicesReshaped);

    // Multiply
    m_MulLayer.configure(&m_IndicesReshaped,
                         &m_FlattenedCoeff,
                         &m_OutputMul,
                         1.0f,
                         arm_compute::ConvertPolicy::WRAP,
                         arm_compute::RoundingPolicy::TO_ZERO,
                         arm_compute::ActivationLayerInfo());

    // Reduce Sum
    const std::vector<unsigned int> armnnReduceAxes(1, 1);
    arm_compute::Coordinates coords = BuildArmComputeReductionCoordinates(m_OutputMul.info()->num_dimensions(),
                                                                          outputMul_Info.GetNumDimensions(),
                                                                          armnnReduceAxes);
    m_ReduceSumLayer.configure(&m_OutputMul,
                               &m_FlattenedIndices,
                               static_cast<unsigned int>(coords[0]),
                               arm_compute::ReductionOperation::SUM,
                               false);

    /// Call Gather with adequate shapes
    // Reshape params into { K, C }
    armnn::TensorInfo paramsInfoReshape = paramsInfo;
    paramsInfoReshape.SetShape({ keyIndices["K"], keyIndices["C"] });
    BuildArmComputeTensor(m_InputGather, paramsInfoReshape);
    armcomputetensorutils::InitialiseArmComputeTensorEmpty(m_InputGather);

    // Reshape input to the gather params input shape
    m_ReshapeInputLayer.configure(&input, &m_InputGather);

    // Reshape output to have the shape given by gather { W, C }
    // (the original outputInfo has the shape given by gatherNd)
    armnn::TensorInfo outputGather_Info = outputInfo;
    outputGather_Info.SetShape({ keyIndices["W"], keyIndices["C"] });
    BuildArmComputeTensor(m_OutputGather, outputGather_Info);
    armcomputetensorutils::InitialiseArmComputeTensorEmpty(m_OutputGather);

    m_GatherLayer.configure(&m_InputGather,
                            &m_FlattenedIndices,
                            &m_OutputGather,
                            ComputeAclAxis(0, paramsInfoReshape));

    // Reshape output to the original output shape
    m_ReshapeOutputLayer.configure(&m_OutputGather, &output);
}

void NeonGatherNdWorkload::Execute() const
{
    ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID("NeonGatherNdWorkload_Execute");
    m_ReshapeInputLayer.run();
    m_ReshapeIndicesLayer.run();
    m_MulLayer.run();
    m_ReduceSumLayer.run();
    m_GatherLayer.run();
    m_ReshapeOutputLayer.run();
}
} //namespace armnn
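
// Minimal usage sketch (illustrative, not part of the original file). The shapes and data types
// are assumptions chosen to satisfy GatherNd; the call asks the NEON backend whether the
// decomposed workload is supported before creating it.
//
//     armnn::TensorInfo params(armnn::TensorShape({ 5, 4, 3, 2 }), armnn::DataType::Float32);
//     armnn::TensorInfo indices(armnn::TensorShape({ 6, 3 }), armnn::DataType::Signed32);
//     armnn::TensorInfo output(armnn::TensorShape({ 6, 2 }), armnn::DataType::Float32);
//
//     arm_compute::Status status = armnn::NeonGatherNdWorkloadValidate(params, indices, output);
//     bool supported = (status.error_code() == arm_compute::ErrorCode::OK);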