20using namespace armcomputetensorutils;
27 const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input, dataLayout);
31 const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(output, dataLayout);
33 const arm_compute::Status aclStatus = arm_compute::CLDepthToSpaceLayer::validate(&aclInputInfo,
41 const arm_compute::CLCompileContext& clCompileContext)
50 m_Data.ValidateInputsOutputs(
"ClDepthToSpaceWorkload", 1, 1);
52 arm_compute::DataLayout aclDataLayout = ConvertDataLayout(
m_Data.m_Parameters.m_DataLayout);
54 arm_compute::ICLTensor& input =
56 input.info()->set_data_layout(aclDataLayout);
60 arm_compute::ICLTensor& output =
62 output.info()->set_data_layout(aclDataLayout);
66 m_Layer.configure(clCompileContext, &input, &output, blockSize);
#define ARMNN_SCOPED_PROFILING_EVENT_CL_NAME_GUID(label)
Creates a profiling event that uses GetGuid() and GetName() from the calling class.
#define ARMNN_REPORT_PROFILING_WORKLOAD_DESC(name, desc, infos, guid)
DepthToSpaceQueueDescriptor m_Data
ClBaseWorkload(const DepthToSpaceQueueDescriptor &descriptor, const WorkloadInfo &info)
ClDepthToSpaceWorkload(const DepthToSpaceQueueDescriptor &descriptor, const WorkloadInfo &info, const arm_compute::CLCompileContext &clCompileContext)
void Execute() const override
Copyright (c) 2021 ARM Limited and Contributors.
auto PolymorphicPointerDowncast(const SourceType &value)
Polymorphic downcast for shared pointers and built-in pointers.
void RunClFunction(arm_compute::IFunction &function, const CheckLocation &location)
SpaceToDepthDescriptor DepthToSpaceDescriptor
A DepthToSpaceDescriptor for the DepthToSpaceLayer.
std::enable_if_t< std::is_unsigned< Source >::value &&std::is_unsigned< Dest >::value, Dest > numeric_cast(Source source)
arm_compute::Status ClDepthToSpaceWorkloadValidate(const TensorInfo &input, const TensorInfo &output, const DepthToSpaceDescriptor &descriptor)
LayerDescriptor m_Parameters
DataLayout m_DataLayout
The data layout to be used (NCHW, NHWC).
unsigned int m_BlockSize
Scalar specifying the input block size. It must be >= 1.
Contains information about TensorInfos of a layer.