23.08
|
Go to the source code of this file.
Functions | |
__kernel void | direct_convolution_nchw (__global uchar *src_ptr, uint src_stride_x, uint src_step_x, uint src_stride_y, uint src_step_y, uint src_stride_z, uint src_step_z, uint src_offset_first_element_in_bytes, __global uchar *dst_ptr, uint dst_stride_x, uint dst_step_x, uint dst_stride_y, uint dst_step_y, uint dst_stride_z, uint dst_step_z, uint dst_offset_first_element_in_bytes, __global uchar *weights_ptr, uint weights_stride_x, uint weights_step_x, uint weights_stride_y, uint weights_step_y, uint weights_stride_z, uint weights_step_z, uint weights_offset_first_element_in_bytes, __global uchar *biases_ptr, uint biases_stride_x, uint biases_step_x, uint biases_offset_first_element_in_bytes, unsigned int weights_stride_w) |
This kernel performs a direct convolution to convolve the low three dimensions. More... | |
__kernel void direct_convolution_nchw | ( | __global uchar * | src_ptr, |
uint | src_stride_x, | ||
uint | src_step_x, | ||
uint | src_stride_y, | ||
uint | src_step_y, | ||
uint | src_stride_z, | ||
uint | src_step_z, | ||
uint | src_offset_first_element_in_bytes, | ||
__global uchar * | dst_ptr, | ||
uint | dst_stride_x, | ||
uint | dst_step_x, | ||
uint | dst_stride_y, | ||
uint | dst_step_y, | ||
uint | dst_stride_z, | ||
uint | dst_step_z, | ||
uint | dst_offset_first_element_in_bytes, | ||
__global uchar * | weights_ptr, | ||
uint | weights_stride_x, | ||
uint | weights_step_x, | ||
uint | weights_stride_y, | ||
uint | weights_step_y, | ||
uint | weights_stride_z, | ||
uint | weights_step_z, | ||
uint | weights_offset_first_element_in_bytes, | ||
__global uchar * | biases_ptr, | ||
uint | biases_stride_x, | ||
uint | biases_step_x, | ||
uint | biases_offset_first_element_in_bytes, | ||
unsigned int | weights_stride_w | ||
) |
This kernel performs a direct convolution to convolve the low three dimensions.
[in] | src_ptr | Pointer to the source tensor. Supported data types: F16/F32 |
[in] | src_stride_x | Stride of the source tensor in X dimension (in bytes) |
[in] | src_step_x | src_stride_x * number of elements along X processed per workitem(in bytes) |
[in] | src_stride_y | Stride of the source tensor in Y dimension (in bytes) |
[in] | src_step_y | src_stride_y * number of elements along Y processed per workitem(in bytes) |
[in] | src_stride_z | Stride of the source tensor in Z dimension (in bytes) |
[in] | src_step_z | src_stride_z * number of elements along Z processed per workitem(in bytes) |
[in] | src_offset_first_element_in_bytes | The offset of the first element in the source tensor |
[out] | dst_ptr | Pointer to the destination tensor. Supported data types: same as src_ptr |
[in] | dst_stride_x | Stride of the destination tensor in X dimension (in bytes) |
[in] | dst_step_x | dst_stride_x * number of elements along X processed per workitem(in bytes) |
[in] | dst_stride_y | Stride of the destination tensor in Y dimension (in bytes) |
[in] | dst_step_y | dst_stride_y * number of elements along Y processed per workitem(in bytes) |
[in] | dst_stride_z | Stride of the destination tensor in Z dimension (in bytes) |
[in] | dst_step_z | dst_stride_z * number of elements along Z processed per workitem(in bytes) |
[in] | dst_offset_first_element_in_bytes | The offset of the first element in the destination tensor |
[in] | weights_ptr | Pointer to the weights tensor. Supported data types: same as src_ptr |
[in] | weights_stride_x | Stride of the weights tensor in X dimension (in bytes) |
[in] | weights_step_x | weights_stride_x * number of elements along X processed per workitem(in bytes) |
[in] | weights_stride_y | Stride of the weights tensor in Y dimension (in bytes) |
[in] | weights_step_y | weights_stride_y * number of elements along Y processed per workitem(in bytes) |
[in] | weights_stride_z | Stride of the weights tensor in Z dimension (in bytes) |
[in] | weights_step_z | weights_stride_z * number of elements along Z processed per workitem(in bytes) |
[in] | weights_offset_first_element_in_bytes | The offset of the first element in the weights tensor |
[in] | biases_ptr | Pointer to the biases tensor. Supported data types: same as src_ptr |
[in] | biases_stride_x | Stride of the biases tensor in X dimension (in bytes) |
[in] | biases_step_x | biases_stride_x * number of elements along X processed per workitem(in bytes) |
[in] | biases_offset_first_element_in_bytes | The offset of the first element in the biases tensor |
[in] | weights_stride_w | Stride of the weights tensor in the 4th dimension |
Definition at line 69 of file direct_convolution.cl.
References ASYMM_MULT_BY_QUANT_MULTIPLIER_GREATER_THAN_ONE, ASYMM_MULT_BY_QUANT_MULTIPLIER_LESS_THAN_ONE, bias, CONVERT_SAT, CONVERT_TO_VECTOR_STRUCT_NO_STEP, arm_compute::test::validation::input, VEC_SIZE, vector_offset(), and weights_stride_z.