Interface for the kernel to perform Direct Convolution Layer. More...

#include <CpuDirectConv2dKernel.h>

Collaboration diagram for CpuDirectConv2dKernel:

Data Structures
struct	DirectConv2dKernel

Public Member Functions
	CpuDirectConv2dKernel ()=default

	ARM_COMPUTE_DISALLOW_COPY_ALLOW_MOVE (CpuDirectConv2dKernel)

void	configure (ITensorInfo *src, ITensorInfo *weights, ITensorInfo *dst, const PadStrideInfo &conv_info)
	Set the src, weights, and dst tensors. More...

void	run_op (ITensorPack &tensors, const Window &window, const ThreadInfo &info) override
	Execute the kernel on the passed window. More...

const char *	name () const override
	Name of the kernel. More...

Public Member Functions inherited from ICPPKernel
virtual	~ICPPKernel ()=default
	Default destructor. More...

virtual void	run (const Window &window, const ThreadInfo &info)
	Execute the kernel on the passed window. More...

virtual void	run_nd (const Window &window, const ThreadInfo &info, const Window &thread_locator)
	Legacy compatibility layer for implementations which do not support thread_locator. In these cases we simply narrow the interface down to the legacy version. More...

virtual size_t	get_mws (const CPUInfo &platform, size_t thread_count) const
	Return minimum workload size of the relevant kernel. More...

Public Member Functions inherited from IKernel
	IKernel ()
	Constructor. More...

virtual	~IKernel ()=default
	Destructor. More...

virtual bool	is_parallelisable () const
	Indicates whether or not the kernel is parallelisable. More...

virtual BorderSize	border_size () const
	The size of the border for that kernel. More...

const Window &	window () const
	The maximum window the kernel can be executed on. More...

bool	is_window_configured () const
	Function to check if the embedded window of this kernel has been configured. More...

Static Public Member Functions
static Status	validate (const ITensorInfo *src, const ITensorInfo *weights, const ITensorInfo *dst, const PadStrideInfo &conv_info)
	Static function to check if given info will lead to a valid configuration. More...

static const std::vector< DirectConv2dKernel > &	get_available_kernels ()

Static Public Member Functions inherited from ICpuKernel< CpuDirectConv2dKernel >
static const auto *	get_implementation (const SelectorType &selector, KernelSelectionType selection_type=KernelSelectionType::Supported)
	Micro-kernel selector. More...

Additional Inherited Members
Static Public Attributes inherited from ICPPKernel
static constexpr size_t	default_mws = 1

Detailed Description

Interface for the kernel to perform Direct Convolution Layer.

Definition at line 37 of file CpuDirectConv2dKernel.h.

Constructor & Destructor Documentation

◆ CpuDirectConv2dKernel()

CpuDirectConv2dKernel ( )

default

Member Function Documentation

◆ ARM_COMPUTE_DISALLOW_COPY_ALLOW_MOVE()

ARM_COMPUTE_DISALLOW_COPY_ALLOW_MOVE ( CpuDirectConv2dKernel )

◆ configure()

void configure	(	ITensorInfo *	src,
		ITensorInfo *	weights,
		ITensorInfo *	dst,
		const PadStrideInfo &	conv_info
	)

Set the src, weights, and dst tensors.

Note: DirectConvolution only works in the following configurations: 1x1 convolution with stride_x = 1/2/3, stride_y = 1/2/3; 3x3 convolution with stride_x = 1/2/3, stride_y = 1/2/3.

Parameters

[in]	src	The input tensor to convolve. The 3 lower dimensions represent a single input [width, height, IFM], while every optional dimension from 4 and above represents a batch of inputs. Data types supported: F16/F32.
[in]	weights	Weights tensor. Weights are a 4D tensor with dimensions [kernel_x, kernel_y, IFM, OFM]. The 3rd dimension must be the same as the 3rd dimension of the input volume. Data type supported: Same as `src`.
[out]	dst	Output tensor. The 3rd dimension must be equal to the 4th dimension of the `weights` tensor. Data types supported: F16/F32.
[in]	conv_info	Contains padding and stride information described in PadStrideInfo.

Definition at line 108 of file CpuDirectConv2dKernel.cpp.

 {
     ARM_COMPUTE_ERROR_ON_NULLPTR(src, weights, dst);
  
     _conv_info   = conv_info;
     _data_layout = src->data_layout();
     _kernel_size = weights->dimension(get_data_layout_dimension_index(_data_layout, DataLayoutDimension::WIDTH));
  
     // Get convolved dimensions
     TensorShape output_shape = misc::shape_calculator::compute_deep_convolution_shape(*src, *weights, conv_info);
  
     DataType data_type = src->data_type();
  
     // Output auto inizialitation if not yet initialized
     auto_init_if_empty(*dst, output_shape, 1, data_type);
  
     // Perform validation step
     ARM_COMPUTE_ERROR_THROW_ON(validate_arguments(src, weights, dst, conv_info));
  
     // Configure kernel window
     auto win_config = validate_and_configure_window(src, dst);
     ARM_COMPUTE_ERROR_THROW_ON(win_config.first);
     ICpuKernel::configure(win_config.second);
 }

References ARM_COMPUTE_ERROR_ON_NULLPTR, ARM_COMPUTE_ERROR_THROW_ON, arm_compute::auto_init_if_empty(), arm_compute::misc::shape_calculator::compute_deep_convolution_shape(), arm_compute::test::validation::configure(), arm_compute::test::validation::conv_info, arm_compute::test::validation::data_type, ITensorInfo::dimension(), arm_compute::test::validation::dst, arm_compute::get_data_layout_dimension_index(), arm_compute::test::validation::output_shape, arm_compute::test::validation::src, arm_compute::cpu::kernels::validate_and_configure_window(), arm_compute::cpu::kernels::validate_arguments(), and arm_compute::WIDTH.

◆ get_available_kernels()

const std::vector< CpuDirectConv2dKernel::DirectConv2dKernel > & get_available_kernels ( )

static

Definition at line 168 of file CpuDirectConv2dKernel.cpp.

 {
     return available_kernels;
 }

◆ name()

const char * name ( ) const

overridevirtual

Name of the kernel.

Returns: Kernel name

Implements ICPPKernel.

Definition at line 163 of file CpuDirectConv2dKernel.cpp.

 {
     return "CpuDirectConvolutionLayerKernel";
 }

◆ run_op()

void run_op	(	ITensorPack &	tensors,
		const Window &	window,
		const ThreadInfo &	info
	)

overridevirtual

Execute the kernel on the passed window.

Warning: If is_parallelisable() returns false then the passed window must be equal to window()

Note: The window has to be a region within the window returned by the window() method; The width of the window has to be a multiple of num_elems_processed_per_iteration().

Parameters

[in]	tensors	A vector containing the tensors to operate on.
[in]	window	Region on which to execute the kernel. (Must be a region of the window returned by window())
[in]	info	Info about executing thread and CPU.

Reimplemented from ICPPKernel.

Definition at line 147 of file CpuDirectConv2dKernel.cpp.

 {
     ARM_COMPUTE_UNUSED(info);
     ARM_COMPUTE_ERROR_ON_UNCONFIGURED_KERNEL(this);
     ARM_COMPUTE_ERROR_ON_INVALID_SUBWINDOW(ICpuKernel::window(), window);
  
     auto src     = tensors.get_const_tensor(TensorType::ACL_SRC_0);
     auto weights = tensors.get_const_tensor(TensorType::ACL_SRC_1);
     auto dst     = tensors.get_tensor(TensorType::ACL_DST);
  
     const auto *uk = CpuDirectConv2dKernel::get_implementation(
         DataTypeDataLayoutISASelectorData{src->info()->data_type(), _data_layout, CPUInfo::get().get_isa()});
     ARM_COMPUTE_ERROR_ON(uk == nullptr);
  
     uk->ukernel(window, src, weights, dst, _conv_info);
 }

References arm_compute::ACL_DST, arm_compute::ACL_SRC_0, arm_compute::ACL_SRC_1, ARM_COMPUTE_ERROR_ON, ARM_COMPUTE_ERROR_ON_INVALID_SUBWINDOW, ARM_COMPUTE_ERROR_ON_UNCONFIGURED_KERNEL, ARM_COMPUTE_UNUSED, arm_compute::test::validation::data_type, arm_compute::test::validation::dst, CPUInfo::get(), ITensorPack::get_const_tensor(), ITensorPack::get_tensor(), arm_compute::test::validation::info, and arm_compute::test::validation::src.

◆ validate()

Status validate	(	const ITensorInfo *	src,
		const ITensorInfo *	weights,
		const ITensorInfo *	dst,
		const PadStrideInfo &	conv_info
	)

static

Static function to check if given info will lead to a valid configuration.

Returns: a status

Definition at line 136 of file CpuDirectConv2dKernel.cpp.

 {
     ARM_COMPUTE_RETURN_ON_ERROR(validate_arguments(src, weights, dst, conv_info));
     ARM_COMPUTE_RETURN_ON_ERROR(validate_and_configure_window(src->clone().get(), dst->clone().get()).first);
  
     return Status{};
 }

References ARM_COMPUTE_RETURN_ON_ERROR, arm_compute::test::validation::conv_info, arm_compute::test::validation::dst, arm_compute::test::validation::src, arm_compute::cpu::kernels::validate_and_configure_window(), and arm_compute::cpu::kernels::validate_arguments().

Referenced by CpuDirectConv2d::validate().

The documentation for this class was generated from the following files:

src/cpu/kernels/CpuDirectConv2dKernel.h
src/cpu/kernels/CpuDirectConv2dKernel.cpp

Data Structures

Public Member Functions

Static Public Member Functions

Additional Inherited Members