armnn/latest/_neon_fully_connected_workload_8cpp_source.html

//

// Copyright © 2017-2024 Arm Ltd and Contributors. All rights reserved.

// SPDX-License-Identifier: MIT

//


#include "NeonFullyConnectedWorkload.hpp"


#include "NeonWorkloadUtils.hpp"


#include <aclCommon/ArmComputeTensorUtils.hpp>

#include <aclCommon/ArmComputeUtils.hpp>


#include <armnn/utility/PolymorphicDowncast.hpp>


#include <armnn/backends/TensorHandle.hpp>


#include <arm_compute/runtime/NEON/functions/NEFullyConnectedLayer.h>


namespace armnn

{

// Make the names in armcomputetensorutils usable without qualification in this file.
using namespace armcomputetensorutils;

// Shorthand for the shared pointer to the ACL on-demand memory manager taken by the workload constructor.
using ACLMemManagerOnDemand = std::shared_ptr<arm_compute::MemoryManagerOnDemand>;


/// Asks arm_compute::NEFullyConnectedLayer::validate whether it accepts the given configuration.
///
/// @param input                Arm NN description of the input tensor.
/// @param output               Arm NN description of the output tensor.
/// @param weights              Arm NN description of the weights tensor; its IsConstant() flag is
///                             forwarded to the ACL tensor info.
/// @param biases               Optional description of the bias tensor. Must hold a value when
///                             descriptor.m_BiasEnabled is true.
/// @param descriptor           Fully connected layer parameters.
/// @param activationDescriptor Optional activation descriptor, passed through to the ACL layer-info conversion.
/// @return The arm_compute::Status produced by NEFullyConnectedLayer::validate.
/// @note ARMNN_THROW_INVALIDARG_MSG_IF_FALSE is triggered when bias is enabled but no bias info is supplied.
arm_compute::Status NeonFullyConnectedWorkloadValidate(const TensorInfo& input,
                                                       const TensorInfo& output,
                                                       const TensorInfo& weights,
                                                       const Optional<TensorInfo>& biases,
                                                       const FullyConnectedDescriptor& descriptor,
                                                       const ActivationDescriptor* activationDescriptor)
{
    // Translate the Arm NN tensor descriptions into their ACL equivalents.
    const arm_compute::TensorInfo inputInfo  = BuildArmComputeTensorInfo(input);
    const arm_compute::TensorInfo outputInfo = BuildArmComputeTensorInfo(output);

    arm_compute::TensorInfo weightsInfo = BuildArmComputeTensorInfo(weights);
    weightsInfo.set_are_values_constant(weights.IsConstant());

    // The bias info is only populated when the descriptor enables bias.
    const bool biasEnabled = descriptor.m_BiasEnabled;
    arm_compute::TensorInfo biasInfo;
    if (biasEnabled)
    {
        ARMNN_THROW_INVALIDARG_MSG_IF_FALSE(
            biases.has_value(),
            "NeonFullyConnectedWorkload: Bias was enabled in the descriptor but no value was supplied.");

        const TensorInfo& suppliedBias = biases.value();
        biasInfo = BuildArmComputeTensorInfo(suppliedBias);
        biasInfo.set_are_values_constant(suppliedBias.IsConstant());
    }

    // A null bias pointer is handed to validate() when bias is disabled.
    const arm_compute::TensorInfo* biasInfoPtr = biasEnabled ? &biasInfo : nullptr;

    const arm_compute::FullyConnectedLayerInfo layerInfo =
        ConvertFullyConnectedDescriptorToAclFullyConnectedLayerInfo(descriptor, activationDescriptor);

    return arm_compute::NEFullyConnectedLayer::validate(&inputInfo,
                                                        &weightsInfo,
                                                        biasInfoPtr,
                                                        &outputInfo,
                                                        layerInfo);
}


/// Builds and configures the underlying arm_compute::NEFullyConnectedLayer.
///
/// @param descriptor    Queue descriptor carrying the layer parameters and the input/output handles.
/// @param info          Tensor infos for the workload; index 1 of the inputs is read as the weights
///                      info and, when bias is enabled, index 2 as the bias info.
/// @param memoryManager ACL memory manager handed to the NEFullyConnectedLayer constructor.
///
/// When the weights are flagged constant the layer is configured against a workload-owned ACL
/// tensor (m_WeightsTensor); otherwise it is configured directly against the tensor behind input
/// handle 1. The workload-owned tensors receive their data later, on the first Execute() call.
NeonFullyConnectedWorkload::NeonFullyConnectedWorkload(const FullyConnectedQueueDescriptor& descriptor,
                                                       const WorkloadInfo& info,
                                                       ACLMemManagerOnDemand& memoryManager)
    : NeonBaseWorkload<FullyConnectedQueueDescriptor>(descriptor, info)
{
    m_Data.ValidateInputsOutputs("NeonFullyConnectedWorkload", descriptor.m_Parameters.GetNumInputs(), 1);

    // Resolve the ACL tensors that sit behind the workload's handles.
    arm_compute::ITensor& inputTensor = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
    arm_compute::ITensor& weightsHandleTensor =
        PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();

    m_WeightsTensorInfo = info.m_InputTensorInfos[1];
    const bool weightsAreConstant = m_WeightsTensorInfo.IsConstant();
    weightsHandleTensor.info()->set_are_values_constant(weightsAreConstant);

    arm_compute::ITensor& outputTensor = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();

    if (weightsAreConstant)
    {
        // Constant weights get a dedicated ACL tensor owned by this workload.
        m_WeightsTensor = std::make_unique<arm_compute::Tensor>();
        BuildArmComputeTensor(*m_WeightsTensor, m_WeightsTensorInfo);
        m_WeightsTensor->info()->set_are_values_constant(weightsAreConstant);
    }

    if (m_Data.m_Parameters.m_BiasEnabled)
    {
        // Bias likewise gets a workload-owned ACL tensor, described by input info 2.
        m_BiasesTensor = std::make_unique<arm_compute::Tensor>();
        m_BiasesTensorInfo = info.m_InputTensorInfos[2];
        BuildArmComputeTensor(*m_BiasesTensor, m_BiasesTensorInfo);
        m_BiasesTensor->info()->set_are_values_constant(m_BiasesTensorInfo.IsConstant());
    }

    const arm_compute::ActivationLayerInfo activationInfo = ConvertAdditionalInfoToAclActivationLayerInfo(descriptor);
    arm_compute::FullyConnectedLayerInfo layerInfo =
        ConvertFullyConnectedDescriptorToAclFullyConnectedLayerInfo(descriptor.m_Parameters, activationInfo);

    // Choose which weights tensor the layer is wired to: the owned copy or the handle's tensor.
    arm_compute::ITensor* layerWeights = weightsAreConstant ? m_WeightsTensor.get() : &weightsHandleTensor;

    auto fullyConnected = std::make_unique<arm_compute::NEFullyConnectedLayer>(memoryManager);
    // m_BiasesTensor.get() is null when bias is disabled.
    fullyConnected->configure(&inputTensor, layerWeights, m_BiasesTensor.get(), &outputTensor, layerInfo);
    m_FullyConnectedLayer.reset(fullyConnected.release());

    // Gather the tensor infos that accompany the profiling description.
    WorkloadInfo detailsInfo;
    detailsInfo.m_InputTensorInfos  = info.m_InputTensorInfos;
    detailsInfo.m_OutputTensorInfos = info.m_OutputTensorInfos;

    // Report Profiling Details
    ARMNN_REPORT_PROFILING_WORKLOAD_DESC("NeonFullyConnectedWorkload_Construct",
                                         descriptor.m_Parameters,
                                         detailsInfo,
                                         this->GetGuid());
}


/// Runs the configured fully connected layer.
///
/// On the first call (while `prepared` is false) the workload-owned weights and bias tensors are
/// initialised from input handles 1 and 2, then passed to FreeTensorIfUnused, and `prepared` is
/// set so this one-off step is skipped on later calls. Every call ends by running the ACL layer.
void NeonFullyConnectedWorkload::Execute() const
{
    ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID("NeonFullyConnectedWorkload_Execute");

    // The constant tensors may not be fully in place until the workload is Executed,
    // so their data is pulled in lazily here rather than in the constructor.
    if (!prepared)
    {
        const bool weightsAreConstant = m_WeightsTensorInfo.IsConstant();
        const bool biasEnabled        = m_Data.m_Parameters.m_BiasEnabled;

        if (weightsAreConstant)
        {
            InitializeArmComputeTensorData(*m_WeightsTensor, m_WeightsTensorInfo, m_Data.m_Inputs[1]);
            m_WeightsTensor->info()->set_are_values_constant(weightsAreConstant);
        }

        if (biasEnabled)
        {
            InitializeArmComputeTensorData(*m_BiasesTensor, m_BiasesTensorInfo, m_Data.m_Inputs[2]);
            m_BiasesTensor->info()->set_are_values_constant(m_BiasesTensorInfo.IsConstant());
        }

        // Both tensors are initialised before either is offered for release.
        if (weightsAreConstant)
        {
            FreeTensorIfUnused(m_WeightsTensor);
        }

        // Note: gated on the bias info's constant flag, not on m_BiasEnabled.
        if (m_BiasesTensorInfo.IsConstant())
        {
            FreeTensorIfUnused(m_BiasesTensor);
        }

        prepared = true;
    }

    m_FullyConnectedLayer->run();
}


} //namespace armnn

ArmComputeTensorUtils.hpp

ArmComputeUtils.hpp

ARMNN_THROW_INVALIDARG_MSG_IF_FALSE
#define ARMNN_THROW_INVALIDARG_MSG_IF_FALSE(_cond, _str)
Definition Exceptions.hpp:210

NeonFullyConnectedWorkload.hpp

NeonWorkloadUtils.hpp

ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID
#define ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID(label)
Creates a profiling event that uses GetGuid() and GetName() from the calling class.
Definition NeonWorkloadUtils.hpp:33

PolymorphicDowncast.hpp

ARMNN_REPORT_PROFILING_WORKLOAD_DESC
#define ARMNN_REPORT_PROFILING_WORKLOAD_DESC(name, desc, infos, guid)
Definition Profiling.hpp:227

TensorHandle.hpp

armnn::BaseWorkload< FullyConnectedQueueDescriptor >::m_Data
FullyConnectedQueueDescriptor m_Data
Definition Workload.hpp:74

armnn::NeonBaseWorkload< FullyConnectedQueueDescriptor >::NeonBaseWorkload
NeonBaseWorkload(const FullyConnectedQueueDescriptor &descriptor, const WorkloadInfo &info)
Definition NeonBaseWorkload.hpp:16

armnn::NeonFullyConnectedWorkload::NeonFullyConnectedWorkload
NeonFullyConnectedWorkload(const FullyConnectedQueueDescriptor &descriptor, const WorkloadInfo &info, std::shared_ptr< arm_compute::MemoryManagerOnDemand > &memoryManager)
Definition NeonFullyConnectedWorkload.cpp:57

armnn::NeonFullyConnectedWorkload::Execute
virtual void Execute() const override
Definition NeonFullyConnectedWorkload.cpp:114

armnn::OptionalBase::has_value
bool has_value() const noexcept
Definition Optional.hpp:53

armnn::Optional
Definition Optional.hpp:271

armnn::OptionalReferenceSwitch::value
const T & value() const
Definition Optional.hpp:146

armnn::TensorInfo
Definition Tensor.hpp:153

armnn::TensorInfo::IsConstant
bool IsConstant() const
Definition Tensor.cpp:513

armnn
Copyright (c) 2021 ARM Limited and Contributors.
Definition 01_00_quick_start.dox:7

armnn::BoostLogSeverityMapping::info
@ info
Definition Logging.hpp:200

armnn::ConvertAdditionalInfoToAclActivationLayerInfo
arm_compute::ActivationLayerInfo ConvertAdditionalInfoToAclActivationLayerInfo(const QueueDescriptor &queueDescriptor)
Definition ArmComputeUtils.hpp:105

armnn::PolymorphicDowncast
DestType PolymorphicDowncast(SourceType *value)
Polymorphic downcast for built-in pointers only.
Definition PolymorphicDowncast.hpp:74

armnn::InitializeArmComputeTensorData
void InitializeArmComputeTensorData(arm_compute::Tensor &tensor, TensorInfo tensorInfo, const ITensorHandle *handle)
Definition NeonWorkloadUtils.hpp:69

armnn::ConvertFullyConnectedDescriptorToAclFullyConnectedLayerInfo
arm_compute::FullyConnectedLayerInfo ConvertFullyConnectedDescriptorToAclFullyConnectedLayerInfo(const FullyConnectedDescriptor &fullyConnectedDesc, const ActivationDescriptor *activationDesc)
Definition ArmComputeUtils.hpp:194

armnn::NeonFullyConnectedWorkloadValidate
arm_compute::Status NeonFullyConnectedWorkloadValidate(const TensorInfo &input, const TensorInfo &output, const TensorInfo &weights, const Optional< TensorInfo > &biases, const FullyConnectedDescriptor &descriptor, const ActivationDescriptor *activationDescriptor)
Definition NeonFullyConnectedWorkload.cpp:24

armnn::ACLMemManagerOnDemand
std::shared_ptr< arm_compute::MemoryManagerOnDemand > ACLMemManagerOnDemand
Definition NeonFullyConnectedWorkload.cpp:22

armnn::ActivationDescriptor
An ActivationDescriptor for the ActivationLayer.
Definition Descriptors.hpp:37

armnn::FullyConnectedDescriptor
A FullyConnectedDescriptor for the FullyConnectedLayer.
Definition Descriptors.hpp:508

armnn::FullyConnectedDescriptor::GetNumInputs
uint32_t GetNumInputs() const
Get the number of inputs.
Definition Descriptors.cpp:475

armnn::FullyConnectedDescriptor::m_BiasEnabled
bool m_BiasEnabled
Enable/disable bias.
Definition Descriptors.hpp:526

armnn::FullyConnectedQueueDescriptor
Definition WorkloadData.hpp:181

armnn::QueueDescriptorWithParameters::m_Parameters
LayerDescriptor m_Parameters
Definition WorkloadData.hpp:66

armnn::WorkloadInfo
Contains information about TensorInfos of a layer.
Definition WorkloadInfo.hpp:17

armnn::WorkloadInfo::m_OutputTensorInfos
std::vector< TensorInfo > m_OutputTensorInfos
Definition WorkloadInfo.hpp:19

armnn::WorkloadInfo::m_InputTensorInfos
std::vector< TensorInfo > m_InputTensorInfos
Definition WorkloadInfo.hpp:18