23.11
|
Go to the documentation of this file.
37 namespace cl_direct_conv
53 &ClDirectConvDefaultConfigBifrost::configure_G71_f32, &ClDirectConvDefaultConfigBifrost::configure_G71_f16,
54 &ClDirectConvDefaultConfigBifrost::configure_G71_u8);
57 &ClDirectConvDefaultConfigBifrost::configure_default_f32,
58 &ClDirectConvDefaultConfigBifrost::configure_default_f16, &ClDirectConvDefaultConfigBifrost::configure_G71_u8);
60 ConfigurationFunctionExecutorPtr func =
nullptr;
101 DirectConvComputeKernelInfo ClDirectConvDefaultConfigBifrost::configure_G71_f16(
const ITensorInfo *
src,
102 const ITensorInfo *wei,
105 DirectConvComputeKernelInfo desc;
121 desc.export_weights_to_cl_image =
false;
127 DirectConvComputeKernelInfo ClDirectConvDefaultConfigBifrost::configure_G71_u8(
const ITensorInfo *
src,
128 const ITensorInfo *wei,
131 DirectConvComputeKernelInfo desc;
147 desc.export_weights_to_cl_image =
false;
153 DirectConvComputeKernelInfo ClDirectConvDefaultConfigBifrost::configure_default_f32(
const ITensorInfo *
src,
154 const ITensorInfo *wei,
157 DirectConvComputeKernelInfo desc;
179 DirectConvComputeKernelInfo ClDirectConvDefaultConfigBifrost::configure_default_f16(
const ITensorInfo *
src,
180 const ITensorInfo *wei,
183 DirectConvComputeKernelInfo desc;
SimpleTensor< float > src
bool export_to_cl_image(const ITensorInfo *tensor)
ClDirectConvDefaultConfigBifrost(GPUTarget gpu)
Constructor.
@ NHWC
Num samples, height, width, channels.
Bifrost based OpenCL direct convolution configuration.
Basic interface for the Direct convolution kernel configuration.
Manages all the OpenCL kernels compilation and caching, provides accessors for the OpenCL Context.
int32_t n0
Number of columns to be processed by the kernel.
#define ARM_COMPUTE_ERROR_ON_MSG(cond, msg)
Basic container for the OpenCL direct convolution configuration functions.
int32_t m0
Number of rows to be processed by the kernel.
DirectConvComputeKernelInfo configure(const ITensorInfo *src, const ITensorInfo *wei, const PadStrideInfo &conv_info) override
This method returns the DirectConvComputeKernelInfo for the given inputs.
GPUTarget
Available GPU Targets.
Copyright (c) 2017-2023 Arm Limited.
bool export_weights_to_cl_image
Flag to export the weights to cl_image.
Store the tensor's metadata.
T get_function(DataType data_type)
Method to return the direct convolution configuration function based on data type.
TensorShape compute_deep_convolution_shape(const TensorShape &input_shape, DataLayout input_data_layout, const TensorShape &weights_shape, const PadStrideInfo &conv_info)
Calculate the output tensor shape of a deep convolution.
int32_t k0
Number of partial accumulations to be processed in a single iteration by the kernel.
Compute descriptor used by the direct convolution kernel.