ArmNN
 25.11
Loading...
Searching...
No Matches
ClFullyConnectedWorkload.cpp
Go to the documentation of this file.
1//
2// Copyright © 2017-2018,2020-2024 Arm Ltd and Contributors. All rights reserved.
3// SPDX-License-Identifier: MIT
4//
5
11#include <cl/ClLayerSupport.hpp>
12
13#include "ClWorkloadUtils.hpp"
14
15namespace armnn
16{
17using namespace armcomputetensorutils;
18
19arm_compute::Status ClFullyConnectedWorkloadValidate(const TensorInfo& input,
20 const TensorInfo& output,
21 const TensorInfo& weights,
22 const Optional<TensorInfo>& biases,
23 const FullyConnectedDescriptor& descriptor,
24 const ActivationDescriptor* activationDescriptor)
25{
26 const arm_compute::TensorInfo aclInput = BuildArmComputeTensorInfo(input);
27 const arm_compute::TensorInfo aclOutput = BuildArmComputeTensorInfo(output);
28 arm_compute::TensorInfo aclWeights = BuildArmComputeTensorInfo(weights);
29 aclWeights.set_are_values_constant(weights.IsConstant());
30
31 arm_compute::TensorInfo aclBiases;
32 arm_compute::TensorInfo* optionalAclBiases = nullptr;
33 if (descriptor.m_BiasEnabled)
34 {
36 biases.has_value(),
37 "ClFullyConnectedWorkload: Bias was enabled in the descriptor but no value was supplied.");
38 aclBiases = BuildArmComputeTensorInfo(biases.value());
39 aclBiases.set_are_values_constant(biases.value().IsConstant());
40 optionalAclBiases = &aclBiases;
41 }
42
43 const arm_compute::FullyConnectedLayerInfo fullyConnectedLayerInfo =
45
46 return arm_compute::CLFullyConnectedLayer::validate(&aclInput,
47 &aclWeights,
48 optionalAclBiases,
49 &aclOutput,
50 fullyConnectedLayerInfo);
51}
52
54 const FullyConnectedQueueDescriptor& descriptor,
55 const WorkloadInfo& info,
56 std::shared_ptr<arm_compute::MemoryManagerOnDemand>& memoryManager,
57 const arm_compute::CLCompileContext& clCompileContext)
58 : ClBaseWorkload<FullyConnectedQueueDescriptor>(descriptor, info), m_FullyConnectedLayer(memoryManager)
59{
60 m_Data.ValidateInputsOutputs("ClFullyConnectedWorkload", descriptor.m_Parameters.GetNumInputs(), 1);
61
62 arm_compute::ICLTensor& input = PolymorphicDowncast<IClTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
63 arm_compute::ICLTensor& output = PolymorphicDowncast<IClTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
64 arm_compute::ICLTensor& weights = PolymorphicDowncast<IClTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();
65
66 weights.info()->set_are_values_constant(info.m_InputTensorInfos[1].IsConstant());
67
68 arm_compute::ICLTensor* bias = nullptr;
69 if (m_Data.m_Parameters.m_BiasEnabled)
70 {
71 bias = &PolymorphicDowncast<IClTensorHandle*>(m_Data.m_Inputs[2])->GetTensor();
72 bias->info()->set_are_values_constant(info.m_InputTensorInfos[2].IsConstant());
73 }
74
75 const arm_compute::ActivationLayerInfo activationInfo = ConvertAdditionalInfoToAclActivationLayerInfo(descriptor);
76
77 arm_compute::FullyConnectedLayerInfo fc_info =
79 activationInfo);
80
81 {
82 ARMNN_SCOPED_PROFILING_EVENT_CL_NAME_GUID("ClFullyConnectedWorkload_configure");
83 m_FullyConnectedLayer.configure(clCompileContext,
84 &input,
85 &weights,
86 bias,
87 &output,
88 fc_info);
89 }
90
91 // Add details for profiling output
92 WorkloadInfo detailsInfo;
93
94 detailsInfo.m_InputTensorInfos = info.m_InputTensorInfos;
95 detailsInfo.m_OutputTensorInfos = info.m_OutputTensorInfos;
96
97 // Report Profiling Details
98 ARMNN_REPORT_PROFILING_WORKLOAD_DESC("ClFullyConnectedWorkload_Construct",
99 descriptor.m_Parameters,
100 detailsInfo,
101 this->GetGuid());
102}
103
105{
106 ARMNN_SCOPED_PROFILING_EVENT_CL_NAME_GUID("ClFullyConnectedWorkload_Execute");
107 RunClFunction(m_FullyConnectedLayer, CHECK_LOCATION());
108}
109
110} //namespace armnn
#define ARMNN_SCOPED_PROFILING_EVENT_CL_NAME_GUID(label)
Creates a profiling event that uses GetGuid() and GetName() from the calling class.
#define ARMNN_THROW_INVALIDARG_MSG_IF_FALSE(_cond, _str)
#define CHECK_LOCATION()
#define ARMNN_REPORT_PROFILING_WORKLOAD_DESC(name, desc, infos, guid)
ClBaseWorkload(const FullyConnectedQueueDescriptor &descriptor, const WorkloadInfo &info)
ClFullyConnectedWorkload(const FullyConnectedQueueDescriptor &descriptor, const WorkloadInfo &info, std::shared_ptr< arm_compute::MemoryManagerOnDemand > &memoryManager, const arm_compute::CLCompileContext &clCompileContext)
bool has_value() const noexcept
Definition Optional.hpp:53
bool IsConstant() const
Definition Tensor.cpp:513
Copyright (c) 2021 ARM Limited and Contributors.
arm_compute::Status ClFullyConnectedWorkloadValidate(const TensorInfo &input, const TensorInfo &output, const TensorInfo &weights, const Optional< TensorInfo > &biases, const FullyConnectedDescriptor &descriptor, const ActivationDescriptor *activationDescriptor)
void RunClFunction(arm_compute::IFunction &function, const CheckLocation &location)
arm_compute::ActivationLayerInfo ConvertAdditionalInfoToAclActivationLayerInfo(const QueueDescriptor &queueDescriptor)
DestType PolymorphicDowncast(SourceType *value)
Polymorphic downcast for built-in pointers only.
arm_compute::FullyConnectedLayerInfo ConvertFullyConnectedDescriptorToAclFullyConnectedLayerInfo(const FullyConnectedDescriptor &fullyConnectedDesc, const ActivationDescriptor *activationDesc)
An ActivationDescriptor for the ActivationLayer.
A FullyConnectedDescriptor for the FullyConnectedLayer.
uint32_t GetNumInputs() const
Get the number of inputs.
bool m_BiasEnabled
Enable/disable bias.
Contains information about TensorInfos of a layer.
std::vector< TensorInfo > m_OutputTensorInfos
std::vector< TensorInfo > m_InputTensorInfos