ArmNN
 25.11
Loading...
Searching...
No Matches
ClSplitterWorkload.cpp
Go to the documentation of this file.
1//
2// Copyright © 2019-2024 Arm Ltd and Contributors. All rights reserved.
3// SPDX-License-Identifier: MIT
4//
5
7
8#include "ClWorkloadUtils.hpp"
9
15#include <cl/ClTensorHandle.hpp>
16
17
18namespace armnn
19{
20
21using namespace armcomputetensorutils;
22
23namespace
24{
/// Mirrors a split axis index so that it is counted from the opposite end of the dimension list.
///
/// @param numDimensions Total number of dimensions.
/// @param splitAxis     Axis index counted from the front (0 .. numDimensions - 1).
/// @return              numDimensions - 1 - splitAxis, i.e. the same axis counted from the back.
///
/// NOTE(review): judging by the name this is the axis index handed to Arm Compute Library - confirm
/// the dimension-ordering convention against the ACL documentation.
/// NOTE(review): the arithmetic is unsigned, so splitAxis >= numDimensions wraps around rather than
/// failing; callers appear to be expected to pass an in-range axis.
unsigned int CalcAclAxis(unsigned int numDimensions, unsigned int splitAxis)
{
    const unsigned int lastAxisIndex = numDimensions - 1;
    return lastAxisIndex - splitAxis;
}
29
30} //namespace
31
32arm_compute::Status ClSplitterWorkloadValidate(const TensorInfo& input,
33 const std::vector<std::reference_wrapper<TensorInfo>>& outputs,
34 unsigned int splitAxis)
35{
36 const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input);
37
38 size_t numOutputs = outputs.size();
39
40 std::vector<arm_compute::TensorInfo> aclOutputs;
41 aclOutputs.reserve(numOutputs);
42
43 std::vector<arm_compute::ITensorInfo*> aclOutputPtr;
44 aclOutputPtr.reserve(numOutputs);
45
46 for (size_t i = 0u; i < outputs.size(); ++i)
47 {
48 aclOutputs.emplace_back(BuildArmComputeTensorInfo(outputs[i]));
49 aclOutputPtr.emplace_back(&aclOutputs.back());
50 }
51
52 unsigned int aclAxis = CalcAclAxis(input.GetNumDimensions(), splitAxis);
53 return arm_compute::CLSplit::validate(&aclInputInfo, aclOutputPtr, aclAxis);
54}
55
57 const WorkloadInfo& info,
58 const arm_compute::CLCompileContext&)
60{
61 // Report Profiling Details
62 ARMNN_REPORT_PROFILING_WORKLOAD_DESC("ClSplitterWorkload_Construct",
63 descriptor.m_Parameters,
64 info,
65 this->GetGuid());
66 bool allOutputsAreSubtensors = true;
67
68 // Check that all outputs are sub-tensors
69 for (auto output : m_Data.m_Outputs)
70 {
71 if (output && !output->GetParent())
72 {
73 // Non sub-tensor output found so we need to execute the split function
74 allOutputsAreSubtensors = false;
75 break;
76 }
77 }
78
79 if (allOutputsAreSubtensors)
80 {
81 // Can skip configuring the split function since it's not executed
82 return;
83 }
84
85 arm_compute::ICLTensor& input = armnn::PolymorphicPointerDowncast<IClTensorHandle>(
86 m_Data.m_Inputs[0])->GetTensor();
87
88 std::vector<arm_compute::ICLTensor *> aclOutputs;
89 for (auto output : m_Data.m_Outputs)
90 {
91 arm_compute::ICLTensor& aclOutput = armnn::PolymorphicPointerDowncast<IClTensorHandle>(output)->GetTensor();
92 aclOutputs.emplace_back(&aclOutput);
93 }
94
95 // Create the layer function
96
97 // Configure input and output tensors
98 std::set<unsigned int> splitAxis = ComputeSplitAxis(descriptor.m_Parameters, m_Data.m_Inputs[0]->GetShape());
99 if (splitAxis.size() != 1)
100 {
101 throw InvalidArgumentException("Cannot derive split axis from SplitterDescriptor");
102 }
103
104 unsigned int aclAxis = CalcAclAxis(descriptor.m_Parameters.GetNumDimensions(), *splitAxis.begin());
105 auto layer = std::make_unique<arm_compute::CLSplit>();
106 {
107 ARMNN_SCOPED_PROFILING_EVENT_CL_NAME_GUID("ClSplitterWorkload_configure");
108 layer->configure(&input, aclOutputs, aclAxis);
109 }
110
111 // Prepare
112 layer->prepare();
113
114 m_Layer = std::move(layer);
115}
116
118{
119 if (m_Layer)
120 {
121 ARMNN_SCOPED_PROFILING_EVENT_CL_NAME_GUID("ClSplitterWorkload_Execute");
122 m_Layer->run();
123 }
124}
125
126} //namespace armnn
#define ARMNN_SCOPED_PROFILING_EVENT_CL_NAME_GUID(label)
Creates a profiling event that uses GetGuid() and GetName() from the calling class.
#define ARMNN_REPORT_PROFILING_WORKLOAD_DESC(name, desc, infos, guid)
ClBaseWorkload(const SplitterQueueDescriptor &descriptor, const WorkloadInfo &info)
ClSplitterWorkload(const SplitterQueueDescriptor &descriptor, const WorkloadInfo &info, const arm_compute::CLCompileContext &clCompileContext)
void Execute() const override
unsigned int GetNumDimensions() const
Definition Tensor.hpp:197
Copyright (c) 2021 ARM Limited and Contributors.
std::set< unsigned int > ComputeSplitAxis(const armnn::SplitterDescriptor &desc, const TensorShape &input)
Calculates the axis values for split operation.
auto PolymorphicPointerDowncast(const SourceType &value)
Polymorphic downcast for shared pointers and built-in pointers.
arm_compute::Status ClSplitterWorkloadValidate(const TensorInfo &input, const std::vector< std::reference_wrapper< TensorInfo > > &outputs, unsigned int splitAxis)
uint32_t GetNumDimensions() const
Get the number of dimensions.
Contains information about TensorInfos of a layer.