24 #ifndef ARM_COMPUTE_CLDEPTHWISECONVOLUTIONLAYERNATIVEKERNEL_H 25 #define ARM_COMPUTE_CLDEPTHWISECONVOLUTIONLAYERNATIVEKERNEL_H 70 const ICLTensor *output_multipliers =
nullptr,
const ICLTensor *output_shifts =
nullptr);
92 const ICLTensor *output_multipliers =
nullptr,
const ICLTensor *output_shifts =
nullptr);
125 unsigned int _depth_multiplier;
const Window & window() const
The maximum window the kernel can be executed on.
CLDepthwiseConvolutionLayerNativeKernel()
Default Constructor.
Store the tensor's metadata.
Common interface for all the OpenCL kernels.
Copyright (c) 2017-2021 Arm Limited.
void run(const Window &window, cl::CommandQueue &queue) override
Enqueue the OpenCL kernel to process the given window on the passed OpenCL command queue.
Descriptor used by the depthwise convolution kernels.
Padding and stride information class.
void configure(const ICLTensor *input, const ICLTensor *weights, const ICLTensor *biases, ICLTensor *output, const DWCWeightsKernelInfo &dwc_weights_info, const DWCKernelInfo &dwc_info, const PadStrideInfo &conv_info, unsigned int depth_multiplier=1, const Size2D &dilation=Size2D(1U, 1U), const ICLTensor *output_multipliers=nullptr, const ICLTensor *output_shifts=nullptr)
Initialize the function's source, destination and parameters.
Descriptor used by the depthwise convolution kernels to retrieve the number of output elements processed by each thread.
CLDepthwiseConvolutionLayerNativeKernel & operator=(const CLDepthwiseConvolutionLayerNativeKernel &)=delete
Prevent instances of this class from being copied (as this class contains pointers).
Interface for OpenCL tensor.
Class for specifying the size of an image or rectangle.
Describe a multidimensional execution window.
static Status validate(const ITensorInfo *input, const ITensorInfo *weights, const ITensorInfo *biases, const ITensorInfo *output, const DWCWeightsKernelInfo &dwc_weights_info, const DWCKernelInfo &dwc_info, const PadStrideInfo &conv_info, unsigned int depth_multiplier=1, const Size2D &dilation=Size2D(1U, 1U), const ITensorInfo *output_multipliers=nullptr, const ITensorInfo *output_shifts=nullptr)
Static function to check if given info will lead to a valid configuration of CLDepthwiseConvolutionLayerNativeKernel.
Interface for the kernel to run a MxN depthwise convolution.