ArmNN
 25.11
Loading...
Searching...
No Matches
NeonTileWorkload.cpp
Go to the documentation of this file.
1//
2// Copyright © 2023-2024 Arm Ltd and Contributors. All rights reserved.
3// SPDX-License-Identifier: MIT
4//
8#include <vector>
9#include <algorithm>
10
11using namespace armnn::armcomputetensorutils;
12namespace armnn
13{
14arm_compute::Status NeonTileWorkloadValidate(const TensorInfo& input,
15 const TensorInfo& output,
16 const TileDescriptor& descriptor)
17{
18 if(input.GetDataType() == DataType::Boolean)
19 {
20 return arm_compute::Status{arm_compute::ErrorCode::RUNTIME_ERROR,
21 "NeonTileWorkloadValidate: Unsupported Boolean DataType"};
22 }
23
24 const arm_compute::TensorInfo aclInput = BuildArmComputeTensorInfo(input);
25 const arm_compute::TensorInfo aclOutput = BuildArmComputeTensorInfo(output);
26
27 std::vector<unsigned int> aclMultiples = descriptor.m_Multiples;
28 std::reverse(aclMultiples.begin(),aclMultiples.end());
29
30 return arm_compute::NETile::validate(&aclInput, &aclOutput, aclMultiples);
31}
32
36{
37 m_Data.ValidateInputsOutputs("NeonTileWorkload", 1, 1);
38
39 std::vector<unsigned int> aclMultiples = descriptor.m_Parameters.m_Multiples;
40 std::reverse(aclMultiples.begin(),aclMultiples.end());
41
42 arm_compute::ITensor& input = static_cast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
43 arm_compute::ITensor& output = static_cast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
44 m_Layer.configure(&input, &output, aclMultiples);
45}
46
48{
49 ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID("NeonTileWorkload_Execute");
50 m_Layer.run();
51}
52} //namespace armnn
#define ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID(label)
Creates a profiling event that uses GetGuid() and GetName() from the calling class.
BaseWorkload(const TileQueueDescriptor &descriptor, const WorkloadInfo &info)
Definition Workload.hpp:35
void Execute() const override
NeonTileWorkload(const TileQueueDescriptor &descriptor, const WorkloadInfo &info)
DataType GetDataType() const
Definition Tensor.hpp:200
Copyright (c) 2021 ARM Limited and Contributors.
arm_compute::Status NeonTileWorkloadValidate(const TensorInfo &input, const TensorInfo &output, const TileDescriptor &descriptor)
std::vector< uint32_t > m_Multiples
The vector to multiply the input shape by.
Contains information about TensorInfos of a layer.