8#include <arm_compute/runtime/NEON/functions/NESplit.h>
22using namespace armcomputetensorutils;
/// Mirrors an axis index within a tensor's dimension list.
///
/// Axis 0 maps to (numDimensions - 1), axis (numDimensions - 1) maps to 0,
/// and so on; i.e. the result is the same axis counted from the opposite end.
/// NOTE(review): the name suggests this converts to the axis ordering expected
/// by the Arm Compute Library - confirm against the callers.
///
/// @param numDimensions Total number of dimensions of the tensor.
/// @param splitAxis     Axis index to mirror; must be < numDimensions.
/// @return The mirrored axis index.
///
/// The arithmetic is unsigned, so a splitAxis >= numDimensions does not yield
/// a negative value but wraps around to a very large one. Callers are
/// responsible for passing an in-range axis.
unsigned int CalcAclAxis(unsigned int numDimensions, unsigned int splitAxis)
{
    return (numDimensions - splitAxis) - 1;
}
34 const std::vector<std::reference_wrapper<TensorInfo>>& outputs,
35 unsigned int splitAxis)
37 const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input);
39 size_t numOutputs = outputs.size();
41 std::vector<arm_compute::TensorInfo> aclOutputs;
42 aclOutputs.reserve(numOutputs);
44 std::vector<arm_compute::ITensorInfo*> aclOutputPtr;
45 aclOutputPtr.reserve(numOutputs);
47 for (
size_t i = 0u; i < outputs.size(); ++i)
49 aclOutputs.emplace_back(BuildArmComputeTensorInfo(outputs[i]));
50 aclOutputPtr.emplace_back(&aclOutputs.back());
54 return arm_compute::NESplit::validate(&aclInputInfo, aclOutputPtr, aclAxis);
66 bool allOutputsAreSubtensors =
true;
69 for (
auto output :
m_Data.m_Outputs)
71 if (output && !output->GetParent())
74 allOutputsAreSubtensors =
false;
79 if (allOutputsAreSubtensors)
87 std::vector<arm_compute::ITensor *> aclOutputs;
88 for (
auto output :
m_Data.m_Outputs)
91 aclOutputs.emplace_back(&aclOutput);
95 std::unique_ptr<arm_compute::NESplit> layer(
new arm_compute::NESplit());
99 if (splitAxis.size() != 1)
105 layer->configure(&input, aclOutputs, aclAxis);
109 m_Layer.reset(layer.release());
#define ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID(label)
Creates a profiling event that uses GetGuid() and GetName() from the calling class.
#define ARMNN_REPORT_PROFILING_WORKLOAD_DESC(name, desc, infos, guid)
SplitterQueueDescriptor m_Data
NeonBaseWorkload(const SplitterQueueDescriptor &descriptor, const WorkloadInfo &info)
NeonSplitterWorkload(const SplitterQueueDescriptor &descriptor, const WorkloadInfo &info)
void Execute() const override
unsigned int GetNumDimensions() const
Copyright (c) 2021 ARM Limited and Contributors.
std::set< unsigned int > ComputeSplitAxis(const armnn::SplitterDescriptor &desc, const TensorShape &input)
Calculates the axis values for split operation.
auto PolymorphicPointerDowncast(const SourceType &value)
Polymorphic downcast for shared pointers and built-in pointers.
arm_compute::Status NeonSplitterWorkloadValidate(const TensorInfo &input, const std::vector< std::reference_wrapper< TensorInfo > > &outputs, unsigned int splitAxis)
DestType PolymorphicDowncast(SourceType *value)
Polymorphic downcast for built-in pointers only.
LayerDescriptor m_Parameters
uint32_t GetNumDimensions() const
Get the number of dimensions.
Contains information about TensorInfos of a layer.