24.02
|
Namespaces | |
kernel | |
kernels | |
Data Structures | |
struct | ActFpImplParams |
Constant parameters needed by the activation implementation. More... | |
struct | AsmGemmInfo |
class | CpuActivation |
Basic function to run kernels::CpuActivationKernel. More... | |
class | CpuAdd |
Basic function to run kernels::CpuAddKernel. More... | |
class | CpuAddMulAdd |
Basic function to run kernels::CpuAddMulAddKernel. More... | |
class | CpuAuxTensorHandler |
struct | CpuCapabilities |
Structure that encodes the CPU capabilities to be used. More... | |
class | CpuCast |
Basic function to run kernels::CpuCastKernel. More... | |
class | CpuComplexMul |
Basic function to run kernels::CpuComplexMulKernel. More... | |
class | CpuConcatenate |
Basic function to execute concatenate tensors along a given axis. More... | |
class | CpuContext |
CPU context implementation class. More... | |
class | CpuConv2d |
Basic function to simulate a convolution layer. More... | |
class | CpuConvertFullyConnectedWeights |
Basic function to run kernels::CpuConvertFullyConnectedWeightsKernel. More... | |
class | CpuCopy |
Basic function to run kernels::CpuCopyKernel. More... | |
class | CpuDepthwiseConv2d |
Function to execute a depthwise convolution. More... | |
class | CpuDepthwiseConv2dAssemblyDispatch |
Depthwise convolution assembly kernel glue. More... | |
class | CpuDequantize |
Basic function to run kernels::CpuDequantizeKernel that dequantizes an input tensor. More... | |
class | CpuDirectConv2d |
Function to run the direct convolution. More... | |
class | CpuDirectConv3d |
Function to run the direct convolution. More... | |
class | CpuElementwiseArithmetic |
Class to run cpu::kernels::CpuArithmeticKernel except for division and power. More... | |
class | CpuElementwiseBase |
class | CpuElementwiseComparison |
Basic function to run cpu::kernels::CpuComparisonKernel. More... | |
class | CpuElementwiseComparisonStatic |
Basic function to run cpu::kernels::CpuComparisonKernel. More... | |
class | CpuElementwiseDivision |
Basic function to run cpu::kernels::CpuArithmeticKernel for division. More... | |
class | CpuElementwisePower |
Basic function to run cpu::kernels::CpuArithmeticKernel for power. More... | |
class | CpuElementwiseUnary |
class | CpuFill |
Basic function to run kernels::CpuFillKernel. More... | |
class | CpuFlatten |
Basic function to flatten a given input. More... | |
class | CpuFloor |
Basic function to run kernels::CpuFloorKernel. More... | |
class | CpuFullyConnected |
Basic function to compute a Fully Connected layer. More... | |
class | CpuGemm |
Basic function to execute GEMM. More... | |
class | CpuGemmAssemblyDispatch |
Assembly kernel glue. More... | |
class | CpuGemmConv2d |
Basic function to compute the convolution layer. More... | |
class | CpuGemmDirectConv2d |
class | CpuGemmLowpMatrixMultiplyCore |
Basic function to execute GEMMLowpMatrixMultiplyCore. More... | |
class | CpuGemmLowpOutputStage |
Basic function to execute GEMMLowpQuantizeDown kernels. More... | |
class | CpuMatMul |
Function to execute MatMul Operation. More... | |
class | CpuMaxUnpooling |
Basic function to run kernels::CpuMaxUnpoolingLayerKernel. More... | |
class | CpuMul |
Basic function to run kernels::CpuMulKernel. More... | |
class | CpuPermute |
Basic function to run kernels::CpuPermuteKernel. More... | |
class | CpuPool2d |
Basic function to simulate a pooling layer with the specified pooling operation. More... | |
class | CpuPool3d |
Basic function to simulate a pooling layer with the specified pooling operation. More... | |
class | CpuQuantize |
Basic function to run kernels::CpuQuantizeKernel that quantizes an input tensor. More... | |
class | CpuQueue |
CPU queue implementation class. More... | |
class | CpuReshape |
Basic function to run kernels::CpuReshapeKernel. More... | |
class | CpuScale |
Basic function to compute Scale. More... | |
class | CpuSoftmaxGeneric |
Basic function to compute a SoftmaxLayer and a Log SoftmaxLayer. More... | |
class | CpuSub |
Basic function to run kernels::CpuSubKernel. More... | |
class | CpuTensor |
CPU tensor implementation class. More... | |
class | CpuTranspose |
Basic function to run kernels::CpuTransposeKernel. More... | |
class | CpuWinogradConv2d |
class | CpuWinogradConv2dTransformInputKernel |
class | CpuWinogradConv2dTransformOutputKernel |
struct | DepthwiseConvolutionRunInfo |
class | ICpuKernel |
Enumerations | |
enum | KernelSelectionType { Preferred, Supported } |
enum | AsmConvMethod { Im2Col, Indirect, Conv } |
Functions | |
void | fp16_neon_batch_normalization (ITensor *src, ITensor *dst, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo &act_info, const Window &window) |
void | fp16_sve_batch_normalization (ITensor *src, ITensor *dst, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo &act_info, const Window &window) |
void | fp32_neon_batch_normalization (ITensor *src, ITensor *dst, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo &act_info, const Window &window) |
void | fp32_sve_batch_normalization (ITensor *src, ITensor *dst, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo &act_info, const Window &window) |
void | fp16_batch_normalization_nchw_non_fused (const Window &window, ITensor *input, ITensor *output, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo act_info) |
void | fp32_batch_normalization_nchw_non_fused (const Window &window, ITensor *input, ITensor *output, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo act_info) |
void | fp16_batch_normalization_nchw_non_fused_relu (const Window &window, ITensor *input, ITensor *output, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo act_info) |
void | fp16_batch_normalization_nchw_non_fused_brelu (const Window &window, ITensor *input, ITensor *output, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo act_info) |
void | fp16_batch_normalization_nchw_non_fused_lubrelu (const Window &window, ITensor *input, ITensor *output, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo act_info) |
void | fp32_batch_normalization_nchw_non_fused_relu (const Window &window, ITensor *input, ITensor *output, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo act_info) |
void | fp32_batch_normalization_nchw_non_fused_brelu (const Window &window, ITensor *input, ITensor *output, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo act_info) |
void | fp32_batch_normalization_nchw_non_fused_lubrelu (const Window &window, ITensor *input, ITensor *output, const ITensor *mean, const ITensor *var, const ITensor *beta, const ITensor *gamma, float epsilon, ActivationLayerInfo act_info) |
void | neon_fp32_activation (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
float32x4_t | mask_float_vector (const float32x4_t &in, const uint32x4_t &mask) |
template<typename T , const ActFpImplParams & P> | |
void | fp_neon_activation_impl (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | neon_qasymm8_activation (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | neon_qasymm8_signed_activation (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | neon_qsymm16_activation (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | sve_fp32_activation (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | sve2_qasymm8_activation (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | sve2_qasymm8_signed_activation (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | sve2_qsymm16_activation (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | sve2_q8_activation_lut (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | sve_fp16_activation (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | sve_fp16_activation_lut (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | neon_fp16_activation (const ITensor *src, ITensor *dst, const ActivationLayerInfo &act_info, const Window &window) |
void | add_fp32_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
bool | sub_q8_neon_fixedpoint_possible (const ITensorInfo *src0, const ITensorInfo *src1, const ITensorInfo *dst) |
bool | add_q8_neon_fixedpoint_possible (const ITensorInfo *src0, const ITensorInfo *src1, const ITensorInfo *dst) |
bool | add_sub_q8_neon_fixedpoint_possible (const ITensorInfo *src0, const ITensorInfo *src1, const ITensorInfo *dst, bool is_addition) |
template<typename ScalarType > | |
void | add_q8_neon_fixedpoint (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
template<typename ScalarType > | |
void | add_sub_q8_neon_fixedpoint (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window, bool is_addition) |
void | add_sub_qasymm8_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window, bool is_addition) |
void | add_sub_qasymm8_signed_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window, bool is_addition) |
template void | add_q8_neon_fixedpoint< int8_t > (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
template void | add_q8_neon_fixedpoint< uint8_t > (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
template void | add_sub_q8_neon_fixedpoint< int8_t > (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window, bool is_addition) |
template void | add_sub_q8_neon_fixedpoint< uint8_t > (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window, bool is_addition) |
template<typename ScalarType > | |
void | add_same_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_u8_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_s16_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_s32_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_qasymm8_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_qasymm8_signed_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_qsymm16_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_fp32_sve (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
template<typename ScalarType > | |
void | add_same_sve (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
template void | add_same_sve< float > (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
template void | add_same_sve< uint8_t > (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
template void | add_same_sve< int16_t > (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
template void | add_same_sve< int32_t > (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_u8_sve (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_s16_sve (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_s32_sve (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_qasymm8_sve2 (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_qasymm8_signed_sve2 (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_qsymm16_sve2 (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_fp16_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_fp16_sve (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | add_mul_add_fp32_neon (const ITensor *input1, const ITensor *input2, const ITensor *bn_mul, const ITensor *bn_add, ITensor *add_output, ITensor *final_output, ConvertPolicy policy, const ActivationLayerInfo &act_info, const Window &window) |
void | add_mul_add_fp16_neon (const ITensor *input1, const ITensor *input2, const ITensor *bn_mul, const ITensor *bn_add, ITensor *add_output, ITensor *final_output, ConvertPolicy policy, const ActivationLayerInfo &act_info, const Window &window) |
void | add_mul_add_u8_neon (const ITensor *input1, const ITensor *input2, const ITensor *bn_mul, const ITensor *bn_add, ITensor *add_output, ITensor *final_output, ConvertPolicy policy, const ActivationLayerInfo &act_info, const Window &window) |
void | add_mul_add_s8_neon (const ITensor *input1, const ITensor *input2, const ITensor *bn_mul, const ITensor *bn_add, ITensor *add_output, ITensor *final_output, ConvertPolicy policy, const ActivationLayerInfo &act_info, const Window &window) |
void | neon_fp32_boundingboxtransform (const ITensor *boxes, ITensor *pred_boxes, const ITensor *deltas, BoundingBoxTransformInfo bbinfo, const Window &window) |
void | bounding_box_transform_qsymm16 (const ITensor *boxes, ITensor *pred_boxes, const ITensor *deltas, BoundingBoxTransformInfo bbinfo, const Window &window) |
template<typename T > | |
void | bounding_box_transform (const ITensor *boxes, ITensor *pred_boxes, const ITensor *deltas, BoundingBoxTransformInfo bbinfo, const Window &window) |
void | neon_qu16_boundingboxtransform (const ITensor *boxes, ITensor *pred_boxes, const ITensor *deltas, BoundingBoxTransformInfo bbinfo, const Window &window) |
void | neon_fp16_boundingboxtransform (const ITensor *boxes, ITensor *pred_boxes, const ITensor *deltas, BoundingBoxTransformInfo bbinfo, const Window &window) |
void | neon_fp32_to_fp16_cast (const ITensor *_src, ITensor *_dst, const ThreadInfo &tensor, ConvertPolicy _policy, const Window &window) |
void | neon_u8_to_fp16_cast (const ITensor *_src, ITensor *_dst, const ThreadInfo &tensor, ConvertPolicy _policy, const Window &window) |
void | neon_fp16_to_other_dt_cast (const ITensor *_src, ITensor *_dst, const ThreadInfo &tensor, ConvertPolicy _policy, const Window &window) |
void | neon_s32_to_fp16_cast (const ITensor *_src, ITensor *_dst, const ThreadInfo &tensor, ConvertPolicy _policy, const Window &window) |
void | neon_qasymm8_signed_to_fp16_cast (const ITensor *_src, ITensor *_dst, const ThreadInfo &tensor, ConvertPolicy _policy, const Window &window) |
void | neon_fp32_to_bfloat16_cast (const ITensor *_src, ITensor *_dst, const ThreadInfo &tensor, ConvertPolicy _policy, const Window &window) |
void | neon_bfloat16_to_fp32_cast (const ITensor *_src, ITensor *_dst, const ThreadInfo &tensor, ConvertPolicy _policy, const Window &window) |
template<typename T > | |
void | directconv3d_float_neon_ndhwc (const ITensor *src0, const ITensor *src1, const ITensor *src2, ITensor *dst, const Conv3dInfo &conv_info, const Window &window) |
template<typename T > | |
void | directconv3d_quantized_neon_ndhwc (const ITensor *src0, const ITensor *src1, const ITensor *src2, ITensor *dst, const Conv3dInfo &conv_info, const Window &window) |
template<typename T > | |
float32x4_t | load_as_f32 (T *ptr) |
template<> | |
float32x4_t | load_as_f32 (float *ptr) |
template<> | |
float32x4_t | load_as_f32 (int32_t *ptr) |
template<> | |
float32x4_t | load_as_f32 (uint32_t *ptr) |
template<> | |
float32x4_t | load_as_f32 (int16_t *ptr) |
template<> | |
float32x4_t | load_as_f32 (uint16_t *ptr) |
template<> | |
float32x4_t | load_as_f32 (uint8_t *ptr) |
void | fp32_in_bounds_crop_window (const ITensor *input, const ITensor *output, float *output_ptr, Coordinates input_offset, int32_t window_step_x, int32_t output_width_start, int32_t output_width_limit, bool input_has_single_channel, bool is_width_flipped) |
template<typename T > | |
void | in_bounds_crop_window (const ITensor *input, const ITensor *output, float *output_ptr, Coordinates input_offset, int32_t window_step_x, int32_t output_width_start, int32_t output_width_limit, bool input_has_single_channel, bool is_width_flipped) |
void | u8_in_bounds_crop_window (const ITensor *input, const ITensor *output, float *output_ptr, Coordinates input_offset, int32_t window_step_x, int32_t output_width_start, int32_t output_width_limit, bool input_has_single_channel, bool is_width_flipped) |
void | u16_in_bounds_crop_window (const ITensor *input, const ITensor *output, float *output_ptr, Coordinates input_offset, int32_t window_step_x, int32_t output_width_start, int32_t output_width_limit, bool input_has_single_channel, bool is_width_flipped) |
void | u32_in_bounds_crop_window (const ITensor *input, const ITensor *output, float *output_ptr, Coordinates input_offset, int32_t window_step_x, int32_t output_width_start, int32_t output_width_limit, bool input_has_single_channel, bool is_width_flipped) |
void | s8_in_bounds_crop_window (const ITensor *input, const ITensor *output, float *output_ptr, Coordinates input_offset, int32_t window_step_x, int32_t output_width_start, int32_t output_width_limit, bool input_has_single_channel, bool is_width_flipped) |
void | s16_in_bounds_crop_window (const ITensor *input, const ITensor *output, float *output_ptr, Coordinates input_offset, int32_t window_step_x, int32_t output_width_start, int32_t output_width_limit, bool input_has_single_channel, bool is_width_flipped) |
void | s32_in_bounds_crop_window (const ITensor *input, const ITensor *output, float *output_ptr, Coordinates input_offset, int32_t window_step_x, int32_t output_width_start, int32_t output_width_limit, bool input_has_single_channel, bool is_width_flipped) |
void | fp16_in_bounds_crop_window (const ITensor *input, const ITensor *output, float *output_ptr, Coordinates input_offset, int32_t window_step_x, int32_t output_width_start, int32_t output_width_limit, bool input_has_single_channel, bool is_width_flipped) |
void | depth_to_space_nhwc_any (const uint8_t *src, uint8_t *dst, const uintptr_t src_shape[4], const uintptr_t src_strides[4], const uintptr_t dst_strides[4], uintptr_t element_size, uintptr_t block_size) |
void | depth_to_space_nchw_any (const uint8_t *src, uint8_t *dst, const uintptr_t src_shape[4], const uintptr_t src_strides[4], const uintptr_t dst_strides[4], uintptr_t element_size, uintptr_t block_size) |
void | neon_fp32_deptwiseconv2dnative (const ITensor *src, const ITensor *weights, const ITensor *bias, ITensor *dst, const Window &window, bool has_biases, const ConvolutionInfo &info) |
int32x4_t | saturating_doubling_high_mul (const int32x4_t &a, const int32_t &b) |
int32_t | saturating_doubling_high_mul (const int32_t &a, const int32_t &b) |
int32x4_t | rounding_divide_by_exp2 (const int32x4_t &x, const int exponent) |
int32x2_t | rounding_divide_by_exp2 (const int32x2_t &x, const int exponent) |
int32_t | rounding_divide_by_exp2 (const int32_t &x, const int exponent) |
template<typename T , typename TW > | |
void | run_depthwise_quanitized8bit (const ITensor *src, const ITensor *weights, const ITensor *biases, ITensor *dst, const Window &window, bool has_biases, const ConvolutionInfo &info) |
template void | run_depthwise_quanitized8bit< uint8_t, uint8_t > (const ITensor *src, const ITensor *weights, const ITensor *biases, ITensor *dst, const Window &window, bool has_biases, const ConvolutionInfo &info) |
template void | run_depthwise_quanitized8bit< int8_t, int8_t > (const ITensor *src, const ITensor *weights, const ITensor *biases, ITensor *dst, const Window &window, bool has_biases, const ConvolutionInfo &info) |
template void | run_depthwise_quanitized8bit< uint8_t, int8_t > (const ITensor *src, const ITensor *weights, const ITensor *biases, ITensor *dst, const Window &window, bool has_biases, const ConvolutionInfo &info) |
bool | is_valid_input_region (int32_t base_w, uint32_t base_h, uint32_t w, uint32_t h, const DepthwiseConvolutionRunInfo &run_info, const Size2D &dilation) |
template<typename T > | |
void | depthwise_loop_multiplier1_fp (const ITensor *src, const ITensor *weights, const ITensor *biases, ITensor *dst, const PadStrideInfo &conv_info, const Size2D &dilation, const Window &window, bool has_biases) |
template<typename T > | |
void | depthwise_loop_generic_fp (const ITensor *src, const ITensor *weights, const ITensor *biases, ITensor *dst, const PadStrideInfo &conv_info, const Size2D &dilation, unsigned int depth_multiplier, const Window &window, bool has_biases) |
template<typename T , typename TW > | |
void | run_depthwise_float (const ITensor *src, const ITensor *weights, const ITensor *biases, ITensor *dst, const Window &window, bool has_biases, const ConvolutionInfo &info) |
void | neon_qu8_deptwiseconv2dnative (const ITensor *src, const ITensor *weights, const ITensor *bias, ITensor *dst, const Window &window, bool has_biases, const ConvolutionInfo &info) |
void | neon_qp8_qu8_deptwiseconv2dnative (const ITensor *src, const ITensor *weights, const ITensor *bias, ITensor *dst, const Window &window, bool has_biases, const ConvolutionInfo &info) |
void | neon_qs8_deptwiseconv2dnative (const ITensor *src, const ITensor *weights, const ITensor *bias, ITensor *dst, const Window &window, bool has_biases, const ConvolutionInfo &info) |
void | neon_qp8_qs8_deptwiseconv2dnative (const ITensor *src, const ITensor *weights, const ITensor *bias, ITensor *dst, const Window &window, bool has_biases, const ConvolutionInfo &info) |
void | neon_fp16_deptwiseconv2dnative (const ITensor *src, const ITensor *weights, const ITensor *bias, ITensor *dst, const Window &window, bool has_biases, const ConvolutionInfo &info) |
template<ArithmeticOperation op> | |
void | neon_fp32_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_elementwise_binary< ArithmeticOperation::ADD > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_elementwise_binary< ArithmeticOperation::SUB > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_elementwise_binary< ArithmeticOperation::DIV > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_elementwise_binary< ArithmeticOperation::MIN > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_elementwise_binary< ArithmeticOperation::MAX > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_elementwise_binary< ArithmeticOperation::POWER > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_elementwise_binary< ArithmeticOperation::PRELU > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | neon_fp32_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_fp32_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ArithmeticOperation op, typename VectorType > | |
VectorType::type | elementwise_arithm_op (const typename VectorType::type &a, const typename VectorType::type &b) |
template<ArithmeticOperation op, typename ScalarType , typename VectorType > | |
VectorType::type | elementwise_arithm_op_broadcast (const typename VectorType::type &a, const ScalarType &broadcast_value, const bool reorder) |
template<typename InputScalarType , typename OutputScalarType , typename InputVectorType > | |
void | elementwise_op (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window, OutputScalarType(*scalar_func)(const InputScalarType &, const InputScalarType &), int(*broadcast_func)(int, int, int, const InputScalarType *, const InputScalarType &, OutputScalarType *, const bool), int(*neon_func)(int, int, int, const InputScalarType *, const InputScalarType *, OutputScalarType *)) |
template<ArithmeticOperation op, typename ScalarType > | |
ScalarType | elementwise_arithm_op_scalar (const ScalarType &a, const ScalarType &b) |
template<> | |
int32x4_t | elementwise_arithm_op< ArithmeticOperation::DIV, typename wrapper::traits::neon_vector< int32_t, 4 > > (const int32x4_t &a, const int32x4_t &b) |
template<> | |
float32x4_t | elementwise_arithm_op< ArithmeticOperation::DIV, typename wrapper::traits::neon_vector< float, 4 > > (const float32x4_t &a, const float32x4_t &b) |
template<> | |
float32x4_t | elementwise_arithm_op< ArithmeticOperation::POWER, typename wrapper::traits::neon_vector< float, 4 > > (const float32x4_t &a, const float32x4_t &b) |
template<ArithmeticOperation op, typename ScalarType , typename VectorType > | |
int | elementwise_arithm_op_loop (int window_start_x, int window_end_x, int window_step_x, const ScalarType *input1_ptr, const ScalarType *input2_ptr, ScalarType *output_ptr) |
template<ArithmeticOperation op, typename ScalarType , typename VectorType > | |
int | elementwise_arithm_op_broadcast_loop (int window_start_x, int window_end_x, int window_step_x, const ScalarType *non_broadcast_input_ptr, const ScalarType &broadcast_value, ScalarType *output_ptr, const bool reorder) |
template<ArithmeticOperation op, typename VectorType > | |
void | elementwise_arithm_op (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op, typename InputScalarType > | |
uint8_t | elementwise_comp_op_scalar (const InputScalarType &a, const InputScalarType &b) |
template<ComparisonOperation op, typename InputVectorType , typename OutputVectorType > | |
OutputVectorType | elementwise_comp_op (const InputVectorType &a, const InputVectorType &b) |
template<ComparisonOperation op, typename InputScalarType , typename InputVectorType , typename OutputVectorType > | |
OutputVectorType | elementwise_comp_op_broadcast (const InputVectorType &a, const InputScalarType &broadcast_value, const bool reorder) |
template<ComparisonOperation op, typename InputScalarType , typename InputVectorType > | |
int | elementwise_comp_op_broadcast_8_loop (int window_start_x, int window_end_x, int window_step_x, const InputScalarType *non_broadcast_input_ptr, const InputScalarType &broadcast_value, uint8_t *output_ptr, const bool reorder) |
template<ComparisonOperation op, typename InputScalarType , typename InputVectorType > | |
int | elementwise_comp_op_broadcast_16_loop (int window_start_x, int window_end_x, int window_step_x, const InputScalarType *non_broadcast_input_ptr, const InputScalarType &broadcast_value, uint8_t *output_ptr, const bool reorder) |
template<ComparisonOperation op, typename InputScalarType , typename InputVectorType > | |
int | elementwise_comp_op_broadcast_32_loop (int window_start_x, int window_end_x, int window_step_x, const InputScalarType *non_broadcast_input_ptr, const InputScalarType &broadcast_value, uint8_t *output_ptr, const bool reorder) |
template<ComparisonOperation op, typename InputScalarType , typename InputVectorType > | |
int | elementwise_comp_op_8_loop (int window_start_x, int window_end_x, int window_step_x, const InputScalarType *input1_ptr, const InputScalarType *input2_ptr, uint8_t *output_ptr) |
template<ComparisonOperation op, typename InputScalarType , typename InputVectorType > | |
int | elementwise_comp_op_16_loop (int window_start_x, int window_end_x, int window_step_x, const InputScalarType *input1_ptr, const InputScalarType *input2_ptr, uint8_t *output_ptr) |
template<ComparisonOperation op, typename InputScalarType , typename InputVectorType > | |
int | elementwise_comp_op_32_loop (int window_start_x, int window_end_x, int window_step_x, const InputScalarType *input1_ptr, const InputScalarType *input2_ptr, uint8_t *output_ptr) |
template<ComparisonOperation op, typename InputScalarType , typename InputVectorType > | |
void | elementwise_comp_op_8 (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op, typename InputScalarType , typename InputVectorType > | |
void | elementwise_comp_op_16 (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op, typename InputScalarType , typename InputVectorType > | |
void | elementwise_comp_op_32 (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
float32x4x4_t | load_quantized (const uint8_t *input1_ptr, const int32x4_t &offset, const float32x4_t &scale) |
float32x4x4_t | load_quantized_signed (const int8_t *input1_ptr, const int32x4_t &offset, const float32x4_t &scale) |
void | store_quantized (uint8_t *output_ptr, const uint32x4x4_t &out) |
void | store_quantized (uint8_t *output_ptr, const int32x4x4_t &out) |
void | store_quantized (uint8_t *output_ptr, const float32x4x4_t &rf, const float32x4_t &offset, const float32x4_t &invscale) |
void | store_quantized_signed (int8_t *output_ptr, const int32x4x4_t &out) |
void | store_quantized_signed (int8_t *output_ptr, const float32x4x4_t &rf, const float32x4_t &offset, const float32x4_t &invscale) |
template<ArithmeticOperation op> | |
uint8_t | elementwise_arithm_op_quantized_scalar (const float &a, const float &b, UniformQuantizationInfo qinfo) |
template<ArithmeticOperation op> | |
int8_t | elementwise_arithm_op_quantized_signed_scalar (const float &a, const float &b, UniformQuantizationInfo qinfo) |
template<ArithmeticOperation op> | |
float32x4x4_t | elementwise_arithm_op (const float32x4x4_t &a, const float32x4x4_t &b) |
template<ComparisonOperation op> | |
uint8_t | elementwise_comp_op_quantized_scalar (const float &a, const float &b, UniformQuantizationInfo qinfo) |
template<ComparisonOperation op> | |
uint32x4x4_t | elementwise_comp_op (const float32x4x4_t &a, const float32x4x4_t &b) |
template<ArithmeticOperation op> | |
int | elementwise_arithm_op_quantized_loop (int window_start_x, int window_end_x, int window_step_x, const uint8_t *input1_ptr, const uint8_t *input2_ptr, uint8_t *output_ptr, int32x4_t voffset1, int32x4_t voffset2, float32x4_t vscale1, float32x4_t vscale2, float32x4_t voffseto, float32x4_t invvscaleo) |
template<ArithmeticOperation op> | |
int | elementwise_arithm_op_quantized_singed_loop (int window_start_x, int window_end_x, int window_step_x, const int8_t *input1_ptr, const int8_t *input2_ptr, int8_t *output_ptr, int32x4_t voffset1, int32x4_t voffset2, float32x4_t vscale1, float32x4_t vscale2, float32x4_t voffseto, float32x4_t invvscaleo) |
template<ArithmeticOperation op> | |
int | elementwise_arithm_op_quantized_broadcast_loop (int window_start_x, int window_end_x, int window_step_x, const uint8_t *non_broadcast_input_ptr, float32x4x4_t broadcast_vector, uint8_t *output_ptr, int32x4_t voffset_non_broadcast, float32x4_t vscale_non_broadcast, float32x4_t voffseto, float32x4_t invvscaleo, bool reorder) |
template<ArithmeticOperation op> | |
int | elementwise_arithm_op_quantized_signed_broadcast_loop (int window_start_x, int window_end_x, int window_step_x, const int8_t *non_broadcast_input_ptr, float32x4x4_t broadcast_vector, int8_t *output_ptr, int32x4_t voffset_non_broadcast, float32x4_t vscale_non_broadcast, float32x4_t voffseto, float32x4_t invvscaleo, bool reorder) |
template<ComparisonOperation op> | |
int | elementwise_comp_op_quantized_loop (int window_start_x, int window_end_x, int window_step_x, const uint8_t *input1_ptr, const uint8_t *input2_ptr, uint8_t *output_ptr, int32x4_t voffset1, int32x4_t voffset2, float32x4_t vscale1, float32x4_t vscale2, float32x4_t voffseto, float32x4_t invvscaleo) |
template<ComparisonOperation op> | |
int | elementwise_comp_op_quantized_signed_loop (int window_start_x, int window_end_x, int window_step_x, const int8_t *input1_ptr, const int8_t *input2_ptr, uint8_t *output_ptr, int32x4_t voffset1, int32x4_t voffset2, float32x4_t vscale1, float32x4_t vscale2, float32x4_t voffseto, float32x4_t invvscaleo) |
template<ComparisonOperation op> | |
int | elementwise_comp_op_quantized_broadcast_loop (int window_start_x, int window_end_x, int window_step_x, const uint8_t *non_broadcast_input_ptr, float32x4x4_t broadcast_vector, uint8_t *output_ptr, int32x4_t voffset_non_broadcast, float32x4_t vscale_non_broadcast, float32x4_t voffseto, float32x4_t invvscaleo, bool reorder) |
template<ComparisonOperation op> | |
int | elementwise_comp_op_quantized_signed_broadcast_loop (int window_start_x, int window_end_x, int window_step_x, const int8_t *non_broadcast_input_ptr, float32x4x4_t broadcast_vector, uint8_t *output_ptr, int32x4_t voffset_non_broadcast, float32x4_t vscale_non_broadcast, float32x4_t voffseto, float32x4_t invvscaleo, bool reorder) |
void | elementwise_op_quantized (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window, uint8_t(*scalar_func)(const float &, const float &, UniformQuantizationInfo), int(*broadcast_func)(int, int, int, const uint8_t *, float32x4x4_t, uint8_t *, int32x4_t, float32x4_t, float32x4_t, float32x4_t, const bool), int(*neon_func)(int, int, int, const uint8_t *, const uint8_t *, uint8_t *, int32x4_t, int32x4_t, float32x4_t, float32x4_t, float32x4_t, float32x4_t)) |
void | elementwise_comp_quantized_signed (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window, uint8_t(*scalar_func)(const float &, const float &, UniformQuantizationInfo), int(*broadcast_func)(int, int, int, const int8_t *, float32x4x4_t, uint8_t *, int32x4_t, float32x4_t, float32x4_t, float32x4_t, const bool), int(*neon_func)(int, int, int, const int8_t *, const int8_t *, uint8_t *, int32x4_t, int32x4_t, float32x4_t, float32x4_t, float32x4_t, float32x4_t)) |
void | elementwise_op_quantized_signed (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window, int8_t(*scalar_func)(const float &, const float &, UniformQuantizationInfo), int(*broadcast_func)(int, int, int, const int8_t *, float32x4x4_t, int8_t *, int32x4_t, float32x4_t, float32x4_t, float32x4_t, const bool), int(*neon_func)(int, int, int, const int8_t *, const int8_t *, int8_t *, int32x4_t, int32x4_t, float32x4_t, float32x4_t, float32x4_t, float32x4_t)) |
template<ArithmeticOperation op> | |
void | elementwise_arithm_op_quantized (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ArithmeticOperation op> | |
void | elementwise_arithm_op_quantized_signed (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | elementwise_comp_op_quantized (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | elementwise_comp_op_quantized_signed (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ArithmeticOperation op> | |
void | neon_s32_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_elementwise_binary< ArithmeticOperation::ADD > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_elementwise_binary< ArithmeticOperation::SUB > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_elementwise_binary< ArithmeticOperation::DIV > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_elementwise_binary< ArithmeticOperation::MIN > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_elementwise_binary< ArithmeticOperation::MAX > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_elementwise_binary< ArithmeticOperation::POWER > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_elementwise_binary< ArithmeticOperation::PRELU > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ArithmeticOperation op> | |
void | neon_s16_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_elementwise_binary< ArithmeticOperation::ADD > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_elementwise_binary< ArithmeticOperation::SUB > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_elementwise_binary< ArithmeticOperation::DIV > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_elementwise_binary< ArithmeticOperation::MIN > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_elementwise_binary< ArithmeticOperation::MAX > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_elementwise_binary< ArithmeticOperation::POWER > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_elementwise_binary< ArithmeticOperation::PRELU > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | neon_u8_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_u8_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_u8_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_u8_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_u8_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_u8_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_u8_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | neon_s16_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s16_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | neon_s32_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_s32_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ArithmeticOperation op> | |
void | neon_qasymm8_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_elementwise_binary< ArithmeticOperation::ADD > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_elementwise_binary< ArithmeticOperation::SUB > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_elementwise_binary< ArithmeticOperation::DIV > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_elementwise_binary< ArithmeticOperation::MIN > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_elementwise_binary< ArithmeticOperation::MAX > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_elementwise_binary< ArithmeticOperation::POWER > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_elementwise_binary< ArithmeticOperation::PRELU > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | neon_qasymm8_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ArithmeticOperation op> | |
void | neon_qasymm8_signed_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::ADD > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::SUB > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::DIV > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::MIN > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::MAX > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::POWER > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::PRELU > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | neon_qasymm8_signed_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ArithmeticOperation op> | |
void | sve_fp32_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_elementwise_binary< ArithmeticOperation::ADD > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_elementwise_binary< ArithmeticOperation::SUB > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_elementwise_binary< ArithmeticOperation::DIV > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_elementwise_binary< ArithmeticOperation::MIN > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_elementwise_binary< ArithmeticOperation::MAX > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_elementwise_binary< ArithmeticOperation::POWER > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_elementwise_binary< ArithmeticOperation::PRELU > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | sve_fp32_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_fp32_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<typename ScalarType > | |
void | elementwise_arithmetic_op (const ITensor *in1, const ITensor *in2, ITensor *out, ArithmeticOperation op, const Window &window) |
template void | elementwise_arithmetic_op< float32_t > (const ITensor *in1, const ITensor *in2, ITensor *out, const ArithmeticOperation op, const Window &window) |
template void | elementwise_arithmetic_op< float16_t > (const ITensor *in1, const ITensor *in2, ITensor *out, const ArithmeticOperation op, const Window &window) |
template void | elementwise_arithmetic_op< int16_t > (const ITensor *in1, const ITensor *in2, ITensor *out, const ArithmeticOperation op, const Window &window) |
template void | elementwise_arithmetic_op< int32_t > (const ITensor *in1, const ITensor *in2, ITensor *out, const ArithmeticOperation op, const Window &window) |
template<typename InputScalarType , typename OutputScalarType > | |
void | elementwise_comparison_op (const ITensor *in1, const ITensor *in2, ITensor *out, ComparisonOperation op, const Window &window) |
template void | elementwise_comparison_op< float32_t > (const ITensor *in1, const ITensor *in2, ITensor *out, const ComparisonOperation op, const Window &window) |
template void | elementwise_comparison_op< float16_t > (const ITensor *in1, const ITensor *in2, ITensor *out, const ComparisonOperation op, const Window &window) |
template void | elementwise_comparison_op< uint8_t > (const ITensor *in1, const ITensor *in2, ITensor *out, const ComparisonOperation op, const Window &window) |
template void | elementwise_comparison_op< int16_t > (const ITensor *in1, const ITensor *in2, ITensor *out, const ComparisonOperation op, const Window &window) |
template void | elementwise_comparison_op< int32_t > (const ITensor *in1, const ITensor *in2, ITensor *out, const ComparisonOperation op, const Window &window) |
template<> | |
svint32_t | elementwise_pow< svint32_t > (svbool_t &pg, const svint32_t &a, const svint32_t &b) |
template<> | |
svint32_t | elementwise_div< svint32_t > (svbool_t &pg, const svint32_t &a, const svint32_t &b) |
template<> | |
svint16_t | elementwise_div< svint16_t > (svbool_t &pg, const svint16_t &a, const svint16_t &b) |
template<typename VectorType > | |
VectorType | elementwise_pow (svbool_t &pg, const VectorType &a, const VectorType &b) |
template<typename VectorType > | |
VectorType | elementwise_div (svbool_t &pg, const VectorType &a, const VectorType &b) |
template<uint32_t bytewidth> | |
svbool_t | narrow_to_byte_predicate (svbool_t pg) |
template<typename VectorType > | |
VectorType | elementwise_arithmetic_op (svbool_t &pg, const VectorType &a, const VectorType &b, ArithmeticOperation op) |
template<typename InputVectorType , typename OutputVectorType > | |
OutputVectorType | elementwise_comparison_op (svbool_t &pg, const InputVectorType &a, const InputVectorType &b, ComparisonOperation op) |
template<ArithmeticOperation op> | |
void | sve_s32_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_elementwise_binary< ArithmeticOperation::ADD > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_elementwise_binary< ArithmeticOperation::SUB > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_elementwise_binary< ArithmeticOperation::DIV > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_elementwise_binary< ArithmeticOperation::MIN > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_elementwise_binary< ArithmeticOperation::MAX > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_elementwise_binary< ArithmeticOperation::POWER > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_elementwise_binary< ArithmeticOperation::PRELU > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ArithmeticOperation op> | |
void | sve_s16_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_elementwise_binary< ArithmeticOperation::ADD > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_elementwise_binary< ArithmeticOperation::SUB > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_elementwise_binary< ArithmeticOperation::DIV > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_elementwise_binary< ArithmeticOperation::MIN > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_elementwise_binary< ArithmeticOperation::MAX > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_elementwise_binary< ArithmeticOperation::POWER > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_elementwise_binary< ArithmeticOperation::PRELU > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | sve_u8_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_u8_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_u8_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_u8_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_u8_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_u8_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_u8_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | sve_s16_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s16_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | sve_s32_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve_s32_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
svfloat32x4_t | load_quantized (const int8_t *ptr, svbool_t pg, const svint32_t &offset, const svfloat32_t &scale) |
svfloat32x4_t | load_quantized (const uint8_t *ptr, svbool_t pg, const svint32_t &offset, const svfloat32_t &scale) |
void | store_quantized (uint8_t *ptr, svbool_t pg, svfloat32x4_t data, const svint32_t &offset, const svfloat32_t &inv_scale) |
void | store_quantized (int8_t *ptr, svbool_t pg, svfloat32x4_t data, const svint32_t &offset, const svfloat32_t &inv_scale) |
template<typename ScalarType > | |
void | elementwise_arithmetic_quantized_op (const ITensor *in1, const ITensor *in2, ITensor *out, ArithmeticOperation op, const Window &window) |
template<typename InputScalarType , typename OutputScalarType = uint8_t> | |
void | elementwise_comparison_quantized_op (const ITensor *in1, const ITensor *in2, ITensor *out, ComparisonOperation op, const Window &window) |
template<ArithmeticOperation op> | |
void | sve2_qasymm8_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_elementwise_binary< ArithmeticOperation::ADD > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_elementwise_binary< ArithmeticOperation::SUB > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_elementwise_binary< ArithmeticOperation::DIV > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_elementwise_binary< ArithmeticOperation::MIN > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_elementwise_binary< ArithmeticOperation::MAX > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_elementwise_binary< ArithmeticOperation::POWER > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_elementwise_binary< ArithmeticOperation::PRELU > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | sve2_qasymm8_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ArithmeticOperation op> | |
void | sve2_qasymm8_signed_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::ADD > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::SUB > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::DIV > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::MIN > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::MAX > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::POWER > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::PRELU > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | sve2_qasymm8_signed_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Equal > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::NotEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Greater > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Less > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template void | sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::LessEqual > (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ArithmeticOperation op> | |
void | sve_fp16_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ArithmeticOperation op> | |
void | neon_fp16_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | sve_fp16_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<ComparisonOperation op> | |
void | neon_fp16_comparison_elementwise_binary (const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
void | neon_fp32_elementwise_unary (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) |
template<typename ScalarType > | |
ScalarType | elementwise_op_scalar_imp (ElementWiseUnary op, const ScalarType &a) |
template<typename ScalarType , typename VectorType > | |
VectorType | elementwise_op_imp (ElementWiseUnary op, const VectorType &a) |
template<typename ScalarType > | |
void | elementwise_op (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op) |
template<> | |
void | elementwise_op< int8_t > (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op) |
template<> | |
void | elementwise_op< uint8_t > (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op) |
void | neon_s32_elementwise_unary (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) |
void | neon_qasymm8_elementwise_unary (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) |
void | neon_qasymm8_signed_elementwise_unary (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) |
void | sve_fp32_elementwise_unary (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) |
template<typename ScalarType , typename VectorType > | |
std::enable_if< utils::traits::is_floating_point< ScalarType >::value, VectorType >::type | elementwise_op_sve_imp (svbool_t pg, ElementWiseUnary op, const VectorType &a) |
template<typename ScalarType , typename VectorType > | |
std::enable_if< std::is_integral< ScalarType >::value, VectorType >::type | elementwise_op_sve_imp (svbool_t pg, ElementWiseUnary op, const VectorType &a) |
template<typename ScalarType > | |
void | elementwise_sve_op (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op) |
template void | elementwise_sve_op< float16_t > (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op) |
template void | elementwise_sve_op< float32_t > (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op) |
template void | elementwise_sve_op< int32_t > (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op) |
void | sve_s32_elementwise_unary (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) |
void | sve2_q8_elementwise_unary (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) |
void | sve_fp16_elementwise_unary (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) |
void | neon_fp16_elementwise_unary (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) |
void | neon_q8_elementwise_unary (const ITensor *in, ITensor *out, const Window &window, ElementWiseUnary op, const uint8_t *lut) |
void | fp16_neon_floor (const void *src, void *dst, int len) |
void | fp32_neon_floor (const void *src, void *dst, int len) |
void | fused_batch_normalization_conv_f32 (const ITensor *conv_weights, const ITensor *conv_bias, ITensor *fused_weights, ITensor *fused_bias, const ITensor *bn_mean, const ITensor *bn_var, const ITensor *bn_beta, const ITensor *bn_gamma, float epsilon, const Window &window) |
template<typename T , bool fused_activation, typename F > | |
void | batch_normalization_nchw (const Window &window, ITensor *in, ITensor *out, const ITensor *in_mean, const ITensor *in_var, const ITensor *in_beta, const ITensor *in_gamma, float epsilon, ActivationLayerInfo act_info) |
template<typename T > | |
void | fused_batch_normalization_conv (const ITensor *conv_weights, const ITensor *conv_bias, ITensor *fused_weights, ITensor *fused_bias, const ITensor *bn_mean, const ITensor *bn_var, const ITensor *bn_beta, const ITensor *bn_gamma, float epsilon, const Window &window) |
template<typename T > | |
void | fused_batch_normalization_dwc_nchw (const ITensor *dwc_weights, const ITensor *dwc_bias, ITensor *fused_weights, ITensor *fused_bias, const ITensor *bn_mean, const ITensor *bn_var, const ITensor *bn_beta, const ITensor *bn_gamma, float epsilon, const Window &window) |
void | fused_batch_normalization_conv_f16 (const ITensor *conv_weights, const ITensor *conv_bias, ITensor *fused_weights, ITensor *fused_bias, const ITensor *bn_mean, const ITensor *bn_var, const ITensor *bn_beta, const ITensor *bn_gamma, float epsilon, const Window &window) |
void | fused_batch_normalization_dwc_nhwc_f16 (const ITensor *dwc_weights, const ITensor *dwc_bias, ITensor *fused_weights, ITensor *fused_bias, const ITensor *bn_mean, const ITensor *bn_var, const ITensor *bn_beta, const ITensor *bn_gamma, float epsilon, const Window &window) |
void | fused_batch_normalization_dwc_nhwc_f32 (const ITensor *dwc_weights, const ITensor *dwc_bias, ITensor *fused_weights, ITensor *fused_bias, const ITensor *bn_mean, const ITensor *bn_var, const ITensor *bn_beta, const ITensor *bn_gamma, float epsilon, const Window &window) |
void | fused_batch_normalization_dwc_nchw_f16 (const ITensor *dwc_weights, const ITensor *dwc_bias, ITensor *fused_weights, ITensor *fused_bias, const ITensor *bn_mean, const ITensor *bn_var, const ITensor *bn_beta, const ITensor *bn_gamma, float epsilon, const Window &window) |
void | fused_batch_normalization_dwc_nchw_f32 (const ITensor *dwc_weights, const ITensor *dwc_bias, ITensor *fused_weights, ITensor *fused_bias, const ITensor *bn_mean, const ITensor *bn_var, const ITensor *bn_beta, const ITensor *bn_gamma, float epsilon, const Window &window) |
template<typename T > | |
void | fused_batch_normalization_dwc_nhwc (const ITensor *dwc_weights, const ITensor *dwc_bias, ITensor *fused_weights, ITensor *fused_bias, const ITensor *bn_mean, const ITensor *bn_var, const ITensor *bn_beta, const ITensor *bn_gamma, float epsilon, const Window &window) |
void | neon_fp32_gemm_matrix_add (const ITensor *src, ITensor *dst, const Window &window, float beta) |
void | matrix_addition_f32 (const ITensor *src, ITensor *dst, const Window &window, float beta) |
void | neon_fp16_gemm_matrix_add (const ITensor *src, ITensor *dst, const Window &window, float beta) |
void | neon_fp32_gemm_matrix_mul (const ITensor *lhs, const ITensor *rhs, ITensor *dst, const Window &window, const ThreadInfo &info, float alpha, const bool is_dst_vector) |
void | vector_matrix_multiply_f32 (const ITensor *lhs, const ITensor *rhs, ITensor *dst, const Window &window, const ThreadInfo &info, float alpha) |
void | matrix_matrix_multiply_f32 (const ITensor *lhs, const ITensor *rhs, ITensor *dst, const Window &window, const ThreadInfo &info, float alpha) |
void | neon_fp16_gemm_matrix_mul (const ITensor *lhs, const ITensor *rhs, ITensor *dst, const Window &window, const ThreadInfo &info, float alpha, const bool is_dst_vector) |
void | neon_fp32_computeallanchors (const ITensor *anchors, ITensor *all_anchors, ComputeAnchorsInfo anchors_info, const Window &window) |
void | compute_all_anchors_qasymm16 (const ITensor *anchors, ITensor *all_anchors, ComputeAnchorsInfo anchors_info, const Window &window) |
template<typename T > | |
void | compute_all_anchors (const ITensor *anchors, ITensor *all_anchors, ComputeAnchorsInfo anchors_info, const Window &window) |
void | neon_qu16_computeallanchors (const ITensor *anchors, ITensor *all_anchors, ComputeAnchorsInfo anchors_info, const Window &window) |
void | neon_fp16_computeallanchors (const ITensor *anchors, ITensor *all_anchors, ComputeAnchorsInfo anchors_info, const Window &window) |
void | neon_fp32_instancenorm (ITensor *input, ITensor *output, float gamma, float beta, float epsilon, bool use_mixed_precision, const Window &window) |
template<typename InputType , typename AccType > | |
void | vector_float_sum (AccType &result, AccType &result_square, const InputType &inputs) |
template<typename InputType , typename AccType > | |
InputType | vector_float_norm (const InputType &inputs, const AccType &vec_mean, const AccType &vec_multip, const AccType &vec_beta) |
template<typename T , typename AccType > | |
void | instance_normalization_nchw (ITensor *input, ITensor *output, float gamma, float beta, float epsilon, const Window &window) |
template void | instance_normalization_nchw< float > (ITensor *input, ITensor *output, float gamma, float beta, float epsilon, const Window &window) |
void | neon_fp16_instancenorm (ITensor *input, ITensor *output, float gamma, float beta, float epsilon, bool use_mixed_precision, const Window &window) |
void | neon_fp32_l2_normalize_x (const ITensor *in, const ITensor *sum, ITensor *out, float epsilon, const Window &window, size_t unused_axis) |
void | neon_fp32_l2_normalize_yz (const ITensor *in, const ITensor *sum, ITensor *out, float epsilon, const Window &window, size_t axis) |
template<typename T , int S> | |
void | l2_normalize_x (const ITensor *in, const ITensor *sum, ITensor *out, float epsilon, const Window &window) |
template<typename T , int S> | |
void | l2_normalize_yz (const ITensor *in, const ITensor *sum, ITensor *out, float epsilon, const Window &window, size_t axis) |
void | neon_fp16_l2_normalize_x (const ITensor *in, const ITensor *sum, ITensor *out, float epsilon, const Window &window, size_t axis) |
void | neon_fp16_l2_normalize_yz (const ITensor *in, const ITensor *sum, ITensor *out, float epsilon, const Window &window, size_t axis) |
void | neon_fp32_maxunpooling (const ITensor *input, const ITensor *indices, ITensor *output, const Window &window) |
template<typename T > | |
void | max_unpooling (const ITensor *input, const ITensor *indices, ITensor *output, const Window &window) |
void | neon_qs8_maxunpooling (const ITensor *input, const ITensor *indices, ITensor *output, const Window &window) |
void | neon_qu8_maxunpooling (const ITensor *input, const ITensor *indices, ITensor *output, const Window &window) |
void | neon_fp16_maxunpooling (const ITensor *input, const ITensor *indices, ITensor *output, const Window &window) |
void | neon_fp32_meanstddevnorm (ITensor *input, ITensor *output, float epsilon, const Window &window) |
template<typename ScalarType , int size> | |
void | mean_stddev_normalization (ITensor *input, ITensor *output, float epsilon, const Window &window) |
template void | mean_stddev_normalization< float, 4 > (ITensor *input, ITensor *output, float epsilon, const Window &window) |
void | neon_qasymm8_meanstddevnorm (ITensor *input, ITensor *output, float epsilon, const Window &window) |
void | neon_fp16_meanstddevnorm (ITensor *input, ITensor *output, float epsilon, const Window &window) |
void | mul_F32_F32_F32 (const ITensor *src1, const ITensor *src2, ITensor *out, const Window &window, float scale) |
void | mul_F16_F16_F16 (const ITensor *src1, const ITensor *src2, ITensor *out, const Window &window, float scale) |
void | neon_normalize_float32_4_0_2D (const Window &window, const ITensor *in, const ITensor *in_squared, ITensor *out, NormalizationLayerInfo ninfo) |
void | neon_normalize_float32_4_0 (const Window &window, const ITensor *in, const ITensor *in_squared, ITensor *out, NormalizationLayerInfo ninfo) |
void | neon_normalize_float32_4_1_2D (const Window &window, const ITensor *in, const ITensor *in_squared, ITensor *out, NormalizationLayerInfo ninfo) |
void | neon_normalize_float32_4_1 (const Window &window, const ITensor *in, const ITensor *in_squared, ITensor *out, NormalizationLayerInfo ninfo) |
void | neon_normalize_float32_4_2 (const Window &window, const ITensor *in, const ITensor *in_squared, ITensor *out, NormalizationLayerInfo ninfo) |
void | neon_normalize_float16_8_0_2D (const Window &window, const ITensor *in, const ITensor *in_squared, ITensor *out, NormalizationLayerInfo ninfo) |
void | neon_normalize_float16_8_0 (const Window &window, const ITensor *in, const ITensor *in_squared, ITensor *out, NormalizationLayerInfo ninfo) |
void | neon_normalize_float16_8_1_2D (const Window &window, const ITensor *in, const ITensor *in_squared, ITensor *out, NormalizationLayerInfo ninfo) |
void | neon_normalize_float16_8_1 (const Window &window, const ITensor *in, const ITensor *in_squared, ITensor *out, NormalizationLayerInfo ninfo) |
void | neon_normalize_float16_8_2 (const Window &window, const ITensor *in, const ITensor *in_squared, ITensor *out, NormalizationLayerInfo ninfo) |
void | poolingMxN_fp32_neon_nhwc_kernel_indices (const ITensor *src, ITensor *dst0, ITensor *dst1, const PoolingLayerInfo &pool_info, const Window &window) |
void | poolingMxN_fp32_neon_nhwc (const ITensor *src, ITensor *dst0, ITensor *dst1, PoolingLayerInfo &pool_info, const Window &window_src, const Window &window) |
void | poolingMxN_qasymm8_neon_nhwc (const ITensor *src0, ITensor *dst0, ITensor *dst1, PoolingLayerInfo &, const Window &window_src, const Window &window) |
void | poolingMxN_qasymm8_signed_neon_nhwc (const ITensor *src0, ITensor *dst0, ITensor *dst1, PoolingLayerInfo &, const Window &window_src, const Window &window) |
void | poolingMxN_fp16_neon_nhwc (const ITensor *src0, ITensor *dst0, ITensor *dst1, PoolingLayerInfo &, const Window &window_src, const Window &window) |
template<typename T > | |
T | get_initial_min (bool use_inf_as_limit) |
template<typename T > | |
uint32_t | offset_no_padding (uint32_t padded_offset, const Coordinates &id, const ITensorInfo &info, int pool_stride_x, int pool_stride_y, DataLayout data_layout) |
template<typename T > | |
void | poolingMxN_q8_neon_nhwc (const ITensor *src, ITensor *dst0, ITensor *dst1, PoolingLayerInfo &pool_info, const Window &window_src, const Window &window) |
void | neon_q8_pool3d (const ITensor *src0, ITensor *dst0, Pooling3dLayerInfo &, const Window &window) |
void | neon_q8_signed_pool3d (const ITensor *src0, ITensor *dst0, Pooling3dLayerInfo &, const Window &window) |
void | neon_fp16_pool3d (const ITensor *src0, ITensor *dst0, Pooling3dLayerInfo &, const Window &window) |
void | neon_fp32_pool3d (const ITensor *src0, ITensor *dst0, Pooling3dLayerInfo &, const Window &window) |
template<typename T > | |
void | poolingMxNxD_fp_neon_ndhwc (const ITensor *src, ITensor *dst0, Pooling3dLayerInfo &pool_info, const Window &window) |
template<typename T > | |
void | poolingMxNxD_q8_neon_ndhwc (const ITensor *src, ITensor *dst0, Pooling3dLayerInfo &pool_info, const Window &window) |
template<typename T > | |
void | avg_poolingMxNxD_q8_neon_ndhwc (const ITensor *src, ITensor *dst0, Pooling3dLayerInfo &pool_info, const Window &window_out, const int window_step_x) |
template<typename T > | |
void | max_poolingMxNxD_q8_neon_ndhwc (const ITensor *src, ITensor *dst0, Pooling3dLayerInfo &pool_info, const Window &window_out, const int window_step_x) |
void | fp32_neon_range_function (ITensor *output, float start, float step, const Window &window) |
template<typename T > | |
void | neon_range_function (ITensor *output, float start, float step, const Window &window) |
void | u8_neon_range_function (ITensor *output, float start, float step, const Window &window) |
void | u16_neon_range_function (ITensor *output, float start, float step, const Window &window) |
void | u32_neon_range_function (ITensor *output, float start, float step, const Window &window) |
void | s8_neon_range_function (ITensor *output, float start, float step, const Window &window) |
void | s16_neon_range_function (ITensor *output, float start, float step, const Window &window) |
void | s32_neon_range_function (ITensor *output, float start, float step, const Window &window) |
void | fp16_neon_range_function (ITensor *output, float start, float step, const Window &window) |
void | neon_fp32_roialign (const ITensor *input, ITensor *output, const ITensor *rois, ROIPoolingLayerInfo pool_info, const Window &window, const ThreadInfo &info) |
template<typename input_data_type > | |
input_data_type | roi_align_1x1 (const ITensor *input, unsigned int roi_batch, float region_start_x, float bin_size_x, int grid_size_x, float region_end_x, float region_start_y, float bin_size_y, int grid_size_y, float region_end_y, int pz) |
Average pooling over an aligned window. More... | |
template<typename input_data_type > | |
input_data_type | roi_align_1x1_qasymm8 (const ITensor *input, unsigned int roi_batch, float region_start_x, float bin_size_x, int grid_size_x, float region_end_x, float region_start_y, float bin_size_y, int grid_size_y, float region_end_y, int pz, const QuantizationInfo &out_qinfo) |
Average pooling over an aligned window. More... | |
float | compute_region_coordinate (int p, float bin_size, float roi_anchor, float max_value) |
template<typename input_data_type , typename roi_data_type > | |
void | roi_align (const ITensor *input, ITensor *output, const ITensor *rois, ROIPoolingLayerInfo pool_info, const Window &window, const ThreadInfo &info) |
void | neon_qu8_roialign (const ITensor *input, ITensor *output, const ITensor *rois, ROIPoolingLayerInfo pool_info, const Window &window, const ThreadInfo &info) |
void | neon_qs8_roialign (const ITensor *input, ITensor *output, const ITensor *rois, ROIPoolingLayerInfo pool_info, const Window &window, const ThreadInfo &info) |
void | neon_fp16_roialign (const ITensor *input, ITensor *output, const ITensor *rois, ROIPoolingLayerInfo pool_info, const Window &window, const ThreadInfo &info) |
void | s8_neon_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | u8_neon_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | s16_neon_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | qasymm8_neon_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | qasymm8_signed_neon_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | fp16_common_neon_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | fp16_bilinear_neon_scale_nchw (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | fp16_nearest_neon_scale_nchw (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
template<typename T > | |
void | nearest_neon_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, float sampling_offset, bool align_corners, const Window &window) |
template<typename T > | |
void | bilinear_neon_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
template<typename T > | |
void | common_neon_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | fp32_sve_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | u8_sve_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | s16_sve_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | fp16_sve_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | qasymm8_sve_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | qasymm8_signed_sve_scale (const ITensor *src, ITensor *dst, const ITensor *offsets, const ITensor *dx, const ITensor *dy, InterpolationPolicy policy, BorderMode border_mode, PixelValue constant_border_value, float sampling_offset, bool align_corners, const Window &window) |
void | neon_f32_select_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_f32_select_not_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
template<typename ScalarType , typename VectorType > | |
void | select_op (const ITensor *cond, const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window, const int window_step_x, const int window_start_x, const int window_end_x, const int limit, VectorType(*condition_conversion)(const uint8_t *)) |
template<typename ScalarType , typename VectorType > | |
void | select_op_8 (const ITensor *cond, const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<typename ScalarType , typename VectorType > | |
void | select_op_16 (const ITensor *cond, const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<typename ScalarType , typename VectorType > | |
void | select_op_32 (const ITensor *cond, const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
template<typename ScalarType > | |
void | select_op_not_same_rank (const ITensor *cond, const ITensor *in1, const ITensor *in2, ITensor *out, const Window &window) |
void | neon_s8_select_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_s16_select_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_s32_select_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_s8_select_not_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_s16_select_not_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_s32_select_not_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_u8_select_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_u16_select_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_u32_select_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_u8_select_not_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_u16_select_not_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_u32_select_not_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_f16_select_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
void | neon_f16_select_not_same_rank (const ITensor *c, const ITensor *x, const ITensor *y, ITensor *output, const Window &window) |
template<bool IS_LOG> | |
void | neon_fp32_softmax (const ITensor *in, void *const tmp, ITensor *out, const float beta, const Window &window) |
template void | neon_fp32_softmax< true > (const ITensor *in, void *const tmp, ITensor *out, const float beta, const Window &window) |
template void | neon_fp32_softmax< false > (const ITensor *in, void *const tmp, ITensor *out, const float beta, const Window &window) |
template<typename T , bool IS_LOG> | |
void | neon_softmax_quantized (const ITensor *in, void *const tmp, ITensor *out, float beta, const Window &window) |
template void | neon_softmax_quantized< qasymm8_signed_t, true > (const ITensor *in, void *const tmp, ITensor *out, float beta, const Window &window) |
template void | neon_softmax_quantized< qasymm8_signed_t, false > (const ITensor *in, void *const tmp, ITensor *out, float beta, const Window &window) |
template void | neon_softmax_quantized< qasymm8_t, true > (const ITensor *in, void *const tmp, ITensor *out, float beta, const Window &window) |
template void | neon_softmax_quantized< qasymm8_t, false > (const ITensor *in, void *const tmp, ITensor *out, float beta, const Window &window) |
template<typename T , bool IS_LOG> | |
void | neon_softmax_float (const ITensor *in, void *const tmp, ITensor *out, float beta, const Window &window) |
template<bool IS_LOG> | |
void | neon_qasymm8_softmax (const ITensor *in, void *const tmp, ITensor *out, const float beta, const Window &window) |
template void | neon_qasymm8_softmax< true > (const ITensor *in, void *const tmp, ITensor *out, const float beta, const Window &window) |
template void | neon_qasymm8_softmax< false > (const ITensor *in, void *const tmp, ITensor *out, const float beta, const Window &window) |
template<bool IS_LOG> | |
void | neon_qasymm8_signed_softmax (const ITensor *in, void *const tmp, ITensor *out, const float beta, const Window &window) |
template void | neon_qasymm8_signed_softmax< true > (const ITensor *in, void *const tmp, ITensor *out, const float beta, const Window &window) |
template void | neon_qasymm8_signed_softmax< false > (const ITensor *in, void *const tmp, ITensor *out, const float beta, const Window &window) |
template<typename ScalarType > | |
void | sve_logits_1d_max (const ITensor *in, ITensor *out, const Window &window) |
TODO: (COMPMID-6505) Similar to Neon(TM), this implementation should be converted to a single kernel that performs the softmax operation. More... |
template<typename ScalarType > | |
void | sve_softmax_logits_1d_float (const ITensor *in, const ITensor *max, void *const tmp, ITensor *out, const float beta, bool is_log, const Window &window) |
template<typename ScalarType > | |
void | sve2_softmax_logits_1d_quantized (const ITensor *in, const ITensor *max, void *const tmp, ITensor *out, float beta, bool is_log, const Window &window) |
TODO: (COMPMID-6505) Similar to Neon(TM), this implementation should be converted to a single kernel that performs the softmax operation. More... |
template<bool IS_LOG> | |
void | neon_fp16_softmax (const ITensor *in, void *const tmp, ITensor *out, const float beta, const Window &window) |
template<typename T > | |
void | sub_same_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | sub_qasymm8_neon_fixedpoint (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | sub_qasymm8_signed_neon_fixedpoint (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | sub_qasymm8_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | sub_qasymm8_signed_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | sub_qsymm16_neon (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
void | sub_same_neon_fp16 (const ITensor *src0, const ITensor *src1, ITensor *dst, const ConvertPolicy &policy, const Window &window) |
Variables | |
constexpr auto | data_layout = DataLayout::NHWC |
const size_t | width_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::WIDTH) |
const size_t | height_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::HEIGHT) |
const size_t | channel_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::CHANNEL) |
constexpr auto | dim_manual_loop = Window::Dimension(0, 0, 0) |
constexpr auto | dim_single_unit_step = Window::Dimension(0, 1, 1) |
constexpr size_t | vector_size = 8 |
constexpr int | step = 4 |
Class to run cpu::kernels::CpuArithmeticKernel except for maximum operation.
Definition at line 65 of file CpuElementwise.h.
Class to run cpu::kernels::CpuArithmeticKernel except for minimum operation.
Definition at line 67 of file CpuElementwise.h.
Class to run cpu::kernels::CpuArithmeticKernel except for squared difference operation.
Definition at line 69 of file CpuElementwise.h.
Class to run cpu::kernels::CpuArithmeticKernel except for PRelu operation.
Definition at line 34 of file CpuPRelu.h.
Definition at line 33 of file ICpuOperator.h.
Definition at line 34 of file CpuElementwiseUnary.cpp.
Basic function to run equal comparison.
Definition at line 172 of file CpuElementwise.h.
Basic function to run greater comparison.
Definition at line 176 of file CpuElementwise.h.
Basic function to run greater-equal comparison.
Definition at line 178 of file CpuElementwise.h.
Basic function to run less comparison.
Definition at line 180 of file CpuElementwise.h.
Basic function to run less-equal comparison.
Definition at line 182 of file CpuElementwise.h.
Basic function to run not equal comparison.
Definition at line 174 of file CpuElementwise.h.
|
strong |
Enumerator | |
---|---|
Im2Col | |
Indirect | |
Conv |
Definition at line 37 of file CpuGemmAssemblyDispatch.h.
|
strong |
Definition at line 35 of file ICpuKernel.h.
void arm_compute::cpu::add_fp16_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
void arm_compute::cpu::add_fp16_sve | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
void add_fp32_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 31 of file fp32.cpp.
References arm_compute::test::validation::dst.
Referenced by CpuAddKernel::get_mws().
void add_fp32_sve | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 34 of file fp32.cpp.
References add_same_sve< float >(), and arm_compute::test::validation::dst.
void arm_compute::cpu::add_mul_add_fp16_neon | ( | const ITensor * | input1, |
const ITensor * | input2, | ||
const ITensor * | bn_mul, | ||
const ITensor * | bn_add, | ||
ITensor * | add_output, | ||
ITensor * | final_output, | ||
ConvertPolicy | policy, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
void arm_compute::cpu::add_mul_add_fp32_neon | ( | const ITensor * | input1, |
const ITensor * | input2, | ||
const ITensor * | bn_mul, | ||
const ITensor * | bn_add, | ||
ITensor * | add_output, | ||
ITensor * | final_output, | ||
ConvertPolicy | policy, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
void arm_compute::cpu::add_mul_add_s8_neon | ( | const ITensor * | input1, |
const ITensor * | input2, | ||
const ITensor * | bn_mul, | ||
const ITensor * | bn_add, | ||
ITensor * | add_output, | ||
ITensor * | final_output, | ||
ConvertPolicy | policy, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
void arm_compute::cpu::add_mul_add_u8_neon | ( | const ITensor * | input1, |
const ITensor * | input2, | ||
const ITensor * | bn_mul, | ||
const ITensor * | bn_add, | ||
ITensor * | add_output, | ||
ITensor * | final_output, | ||
ConvertPolicy | policy, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
void add_q8_neon_fixedpoint | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::add_q8_neon_fixedpoint< int8_t > | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::add_q8_neon_fixedpoint< uint8_t > | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
bool add_q8_neon_fixedpoint_possible | ( | const ITensorInfo * | src0, |
const ITensorInfo * | src1, | ||
const ITensorInfo * | dst | ||
) |
Definition at line 40 of file impl.cpp.
References add_sub_q8_neon_fixedpoint_possible(), and arm_compute::test::validation::dst.
Referenced by CpuAddKernel::configure().
void add_qasymm8_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 33 of file qasymm8.cpp.
References add_sub_qasymm8_neon(), and arm_compute::test::validation::dst.
void add_qasymm8_signed_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 33 of file qasymm8_signed.cpp.
References add_sub_qasymm8_signed_neon(), and arm_compute::test::validation::dst.
void add_qasymm8_signed_sve2 | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 39 of file qasymm8_signed.cpp.
References ARM_COMPUTE_UNUSED, arm_compute::test::validation::b, Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), UniformQuantizationInfo::offset, Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), QuantizationInfo::uniform(), Dimensions< T >::x(), and Window::x().
void add_qasymm8_sve2 | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 39 of file qasymm8.cpp.
References ARM_COMPUTE_UNUSED, arm_compute::test::validation::b, Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), UniformQuantizationInfo::offset, Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), QuantizationInfo::uniform(), Dimensions< T >::x(), and Window::x().
void add_qsymm16_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 36 of file qsymm16.cpp.
References ARM_COMPUTE_UNUSED, arm_compute::test::validation::b, arm_compute::graph::bfs(), Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::for(), ITensor::info(), Iterator::ptr(), ITensorInfo::quantization_info(), arm_compute::quantize_qsymm16(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), QuantizationInfo::uniform(), Dimensions< T >::x(), and Window::x().
void add_qsymm16_sve2 | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 39 of file qsymm16.cpp.
References ARM_COMPUTE_UNUSED, arm_compute::test::validation::b, Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), QuantizationInfo::uniform(), Dimensions< T >::x(), and Window::x().
void add_s16_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 37 of file integer.cpp.
References arm_compute::test::validation::dst.
void add_s16_sve | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 40 of file integer.cpp.
References add_same_sve< int16_t >(), and arm_compute::test::validation::dst.
void add_s32_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 43 of file integer.cpp.
References arm_compute::test::validation::dst.
void add_s32_sve | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 46 of file integer.cpp.
References add_same_sve< int32_t >(), and arm_compute::test::validation::dst.
void arm_compute::cpu::add_same_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
SIMD vector tag type.
Definition at line 39 of file impl.h.
References arm_compute::wrapper::add_sat(), Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), arm_compute::SATURATE, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vqadd(), arm_compute::wrapper::vstore(), Dimensions< T >::x(), and Window::x().
void add_same_sve | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 39 of file impl.cpp.
References Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), arm_compute::SATURATE, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), Dimensions< T >::x(), and Window::x().
template void arm_compute::cpu::add_same_sve< float > | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Referenced by add_fp32_sve().
template void arm_compute::cpu::add_same_sve< int16_t > | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Referenced by add_s16_sve().
template void arm_compute::cpu::add_same_sve< int32_t > | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Referenced by add_s32_sve().
template void arm_compute::cpu::add_same_sve< uint8_t > | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Referenced by add_u8_sve().
void add_sub_q8_neon_fixedpoint | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window, | ||
bool | is_addition | ||
) |
Definition at line 85 of file impl.cpp.
References ARM_COMPUTE_UNUSED, Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), arm_compute::support::cpp11::lround(), offset(), Iterator::ptr(), Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), arm_compute::wrapper::vcombine(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vgethigh(), arm_compute::wrapper::vgetlow(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmlal(), arm_compute::wrapper::vmovl(), arm_compute::wrapper::vreinterpret(), arm_compute::wrapper::vstore(), and Window::x().
template void arm_compute::cpu::add_sub_q8_neon_fixedpoint< int8_t > | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window, | ||
bool | is_addition | ||
) |
Referenced by sub_qasymm8_signed_neon_fixedpoint().
template void arm_compute::cpu::add_sub_q8_neon_fixedpoint< uint8_t > | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window, | ||
bool | is_addition | ||
) |
Referenced by sub_qasymm8_neon_fixedpoint().
bool add_sub_q8_neon_fixedpoint_possible | ( | const ITensorInfo * | src0, |
const ITensorInfo * | src1, | ||
const ITensorInfo * | dst, | ||
bool | is_addition | ||
) |
Definition at line 45 of file impl.cpp.
References arm_compute::test::validation::dst, offset(), ITensorInfo::quantization_info(), and QuantizationInfo::uniform().
Referenced by add_q8_neon_fixedpoint_possible(), and sub_q8_neon_fixedpoint_possible().
void add_sub_qasymm8_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window, | ||
bool | is_addition | ||
) |
Definition at line 311 of file impl.cpp.
References ARM_COMPUTE_UNUSED, arm_compute::test::validation::b, arm_compute::graph::bfs(), Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), arm_compute::support::cpp11::lround(), UniformQuantizationInfo::offset, offset(), Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), arm_compute::support::cpp11::trunc(), QuantizationInfo::uniform(), Dimensions< T >::x(), and Window::x().
Referenced by add_qasymm8_neon(), and sub_qasymm8_neon().
void add_sub_qasymm8_signed_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window, | ||
bool | is_addition | ||
) |
Definition at line 501 of file impl.cpp.
References ARM_COMPUTE_UNUSED, arm_compute::test::validation::b, arm_compute::graph::bfs(), Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), arm_compute::support::cpp11::lround(), UniformQuantizationInfo::offset, offset(), Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), arm_compute::support::cpp11::trunc(), QuantizationInfo::uniform(), Dimensions< T >::x(), and Window::x().
Referenced by add_qasymm8_signed_neon(), and sub_qasymm8_signed_neon().
void add_u8_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 31 of file integer.cpp.
References arm_compute::test::validation::dst.
void add_u8_sve | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 34 of file integer.cpp.
References add_same_sve< uint8_t >(), and arm_compute::test::validation::dst.
void arm_compute::cpu::avg_poolingMxNxD_q8_neon_ndhwc | ( | const ITensor * | src, |
ITensor * | dst0, | ||
Pooling3dLayerInfo & | pool_info, | ||
const Window & | window_out, | ||
const int | window_step_x | ||
) |
Definition at line 39 of file quantized.h.
References Padding3D::back, Padding3D::bottom, Size3D::depth, Pooling3dLayerInfo::exclude_padding, arm_compute::execute_window_loop(), Padding3D::front, Size3D::height, ITensor::info(), Pooling3dLayerInfo::is_global_pooling, Padding3D::left, UniformQuantizationInfo::offset, Pooling3dLayerInfo::padding, Pooling3dLayerInfo::pool_size, Iterator::ptr(), ITensorInfo::quantization_info(), Padding3D::right, UniformQuantizationInfo::scale, arm_compute::test::validation::scale, arm_compute::test::validation::src, Pooling3dLayerInfo::stride, Padding3D::top, QuantizationInfo::uniform(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vcombine(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vgethigh(), arm_compute::wrapper::vgetlow(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmla(), arm_compute::wrapper::vmovl(), arm_compute::wrapper::vmovn(), arm_compute::wrapper::vstore(), and Size3D::width.
void arm_compute::cpu::batch_normalization_nchw | ( | const Window & | window, |
ITensor * | in, | ||
ITensor * | out, | ||
const ITensor * | in_mean, | ||
const ITensor * | in_var, | ||
const ITensor * | in_beta, | ||
const ITensor * | in_gamma, | ||
float | epsilon, | ||
ActivationLayerInfo | act_info | ||
) |
SIMD vector tag type.
Definition at line 36 of file impl.h.
References arm_compute::test::validation::act_info, Window::DimX, Window::Dimension::end(), arm_compute::quantization::epsilon, arm_compute::execute_window_loop(), arm_compute::test::validation::input, Iterator::ptr(), ITensor::ptr_to_element(), Window::set(), arm_compute::test::validation::reference::slice(), Window::Dimension::start(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vgetlane(), arm_compute::wrapper::vinvsqrt(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmla(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vstore(), arm_compute::wrapper::vsub(), and Window::x().
void arm_compute::cpu::bilinear_neon_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 315 of file list.h.
References ARM_COMPUTE_ERROR, ARM_COMPUTE_UNUSED, arm_compute::test::validation::b, arm_compute::scale_utils::calculate_resize_ratio(), arm_compute::CONSTANT, Window::DimX, Window::DimY, Window::DimZ, arm_compute::test::validation::dst, Window::Dimension::end(), PixelValue::get(), offset(), Iterator::ptr(), arm_compute::REPLICATE, arm_compute::test::validation::scale_x, arm_compute::test::validation::scale_y, Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), Window::Dimension::step(), type, arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmla(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vstore(), Window::y(), and Window::z().
void arm_compute::cpu::bounding_box_transform | ( | const ITensor * | boxes, |
ITensor * | pred_boxes, | ||
const ITensor * | deltas, | ||
BoundingBoxTransformInfo | bbinfo, | ||
const Window & | window | ||
) |
Definition at line 33 of file impl.h.
References BoundingBoxTransformInfo::apply_scale(), ARM_COMPUTE_ERROR_ON, BoundingBoxTransformInfo::bbox_xform_clip(), ITensor::buffer(), BoundingBoxTransformInfo::correct_transform_coords(), arm_compute::execute_window_loop(), BoundingBoxTransformInfo::img_height(), BoundingBoxTransformInfo::img_width(), ITensor::info(), offset(), ITensorInfo::offset_first_element_in_bytes(), Iterator::ptr(), BoundingBoxTransformInfo::scale(), ITensorInfo::tensor_shape(), and BoundingBoxTransformInfo::weights().
void bounding_box_transform_qsymm16 | ( | const ITensor * | boxes, |
ITensor * | pred_boxes, | ||
const ITensor * | deltas, | ||
BoundingBoxTransformInfo | bbinfo, | ||
const Window & | window | ||
) |
Definition at line 32 of file impl.cpp.
References BoundingBoxTransformInfo::apply_scale(), BoundingBoxTransformInfo::bbox_xform_clip(), ITensor::buffer(), BoundingBoxTransformInfo::correct_transform_coords(), arm_compute::dequantize_qasymm16(), arm_compute::dequantize_qasymm8(), arm_compute::execute_window_loop(), BoundingBoxTransformInfo::img_height(), BoundingBoxTransformInfo::img_width(), ITensor::info(), offset(), ITensorInfo::offset_first_element_in_bytes(), Iterator::ptr(), ITensorInfo::quantization_info(), arm_compute::quantize_qasymm16(), BoundingBoxTransformInfo::scale(), ITensorInfo::tensor_shape(), QuantizationInfo::uniform(), and BoundingBoxTransformInfo::weights().
Referenced by neon_qu16_boundingboxtransform().
void arm_compute::cpu::common_neon_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 592 of file list.h.
References arm_compute::BILINEAR, arm_compute::test::validation::dst, arm_compute::NEAREST_NEIGHBOR, and arm_compute::test::validation::src.
void arm_compute::cpu::compute_all_anchors | ( | const ITensor * | anchors, |
ITensor * | all_anchors, | ||
ComputeAnchorsInfo | anchors_info, | ||
const Window & | window | ||
) |
Definition at line 36 of file impl.h.
References ITensorInfo::dimension(), arm_compute::execute_window_loop(), ComputeAnchorsInfo::feat_width(), ITensor::info(), Iterator::ptr(), ITensor::ptr_to_element(), ComputeAnchorsInfo::spatial_scale(), and Window::y().
void compute_all_anchors_qasymm16 | ( | const ITensor * | anchors, |
ITensor * | all_anchors, | ||
ComputeAnchorsInfo | anchors_info, | ||
const Window & | window | ||
) |
Definition at line 31 of file impl.cpp.
References arm_compute::dequantize_qsymm16(), ITensorInfo::dimension(), arm_compute::execute_window_loop(), ComputeAnchorsInfo::feat_width(), ITensor::info(), Iterator::ptr(), ITensor::ptr_to_element(), arm_compute::test::validation::qinfo, ITensorInfo::quantization_info(), arm_compute::quantize_qsymm16(), QuantizationInfo::scale(), ComputeAnchorsInfo::spatial_scale(), QuantizationInfo::uniform(), and Window::y().
Referenced by neon_qu16_computeallanchors().
|
inline |
Definition at line 267 of file impl.h.
References arm_compute::utility::clamp().
Referenced by roi_align().
void depth_to_space_nchw_any | ( | const uint8_t * | src, |
uint8_t * | dst, | ||
const uintptr_t | src_shape[4], | ||
const uintptr_t | src_strides[4], | ||
const uintptr_t | dst_strides[4], | ||
uintptr_t | element_size, | ||
uintptr_t | block_size | ||
) |
Definition at line 35 of file impl.cpp.
References ARM_COMPUTE_ERROR_ON, arm_compute::test::validation::dst, and arm_compute::test::validation::src.
Referenced by NEDepthToSpaceLayerKernel::run().
void depth_to_space_nhwc_any | ( | const uint8_t * | src, |
uint8_t * | dst, | ||
const uintptr_t | src_shape[4], | ||
const uintptr_t | src_strides[4], | ||
const uintptr_t | dst_strides[4], | ||
uintptr_t | element_size, | ||
uintptr_t | block_size | ||
) |
Definition at line 35 of file impl.cpp.
References ARM_COMPUTE_ERROR_ON, arm_compute::test::validation::dst, and arm_compute::test::validation::src.
Referenced by NEDepthToSpaceLayerKernel::run().
void arm_compute::cpu::depthwise_loop_generic_fp | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | biases, | ||
ITensor * | dst, | ||
const PadStrideInfo & | conv_info, | ||
const Size2D & | dilation, | ||
unsigned int | depth_multiplier, | ||
const Window & | window, | ||
bool | has_biases | ||
) |
Definition at line 244 of file impl.h.
References arm_compute::test::validation::conv_info, dim_manual_loop, Window::DimW, Window::DimX, Window::DimY, Window::DimZ, arm_compute::test::validation::dst, arm_compute::execute_window_loop(), arm_compute::support::cpp11::fma(), ITensor::info(), is_valid_input_region(), Iterator::ptr(), Window::set(), Window::set_dimension_step(), arm_compute::test::validation::src, arm_compute::test::validation::w, Size2D::x(), and Size2D::y().
void arm_compute::cpu::depthwise_loop_multiplier1_fp | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | biases, | ||
ITensor * | dst, | ||
const PadStrideInfo & | conv_info, | ||
const Size2D & | dilation, | ||
const Window & | window, | ||
bool | has_biases | ||
) |
Definition at line 114 of file impl.h.
References arm_compute::test::validation::conv_info, dim_manual_loop, dim_single_unit_step, Window::DimW, Window::DimX, Window::DimY, Window::DimZ, arm_compute::test::validation::dst, arm_compute::execute_window_loop(), arm_compute::test::validation::for(), ITensor::info(), is_valid_input_region(), Iterator::ptr(), Window::set(), arm_compute::test::validation::src, arm_compute::wrapper::vadd(), arm_compute::wrapper::vdup_n(), vector_size, arm_compute::wrapper::vload(), arm_compute::wrapper::vmla(), arm_compute::wrapper::vstore(), arm_compute::test::validation::w, Size2D::x(), and Size2D::y().
void arm_compute::cpu::directconv3d_float_neon_ndhwc | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
const ITensor * | src2, | ||
ITensor * | dst, | ||
const Conv3dInfo & | conv_info, | ||
const Window & | window | ||
) |
Definition at line 40 of file list.h.
References ITensor::buffer(), arm_compute::calculate_max_window(), arm_compute::test::validation::conv_info, ITensorInfo::dimension(), Window::DimW, Window::DimX, Window::DimY, Window::DimZ, arm_compute::test::validation::dst, arm_compute::execute_window_loop(), ITensor::info(), ITensorInfo::offset_first_element_in_bytes(), Iterator::ptr(), Window::set(), arm_compute::test::validation::src, ITensorInfo::strides_in_bytes(), type, arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmla(), arm_compute::vreduce(), and arm_compute::wrapper::vsetlane().
void arm_compute::cpu::directconv3d_quantized_neon_ndhwc | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
const ITensor * | src2, | ||
ITensor * | dst, | ||
const Conv3dInfo & | conv_info, | ||
const Window & | window | ||
) |
Definition at line 41 of file quantized.h.
References ITensor::buffer(), arm_compute::calculate_max_window(), arm_compute::quantization::calculate_quantized_multiplier(), arm_compute::test::validation::conv_info, ITensorInfo::dimension(), Window::DimW, Window::DimX, Window::DimY, Window::DimZ, arm_compute::test::validation::dst, arm_compute::execute_window_loop(), arm_compute::finalize_quantization(), ITensor::info(), UniformQuantizationInfo::offset, ITensorInfo::offset_first_element_in_bytes(), Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), arm_compute::test::validation::src, ITensorInfo::strides_in_bytes(), type, QuantizationInfo::uniform(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vgethigh(), arm_compute::wrapper::vgetlane(), arm_compute::wrapper::vgetlow(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmla(), arm_compute::wrapper::vmovl(), arm_compute::wrapper::vpadd(), and arm_compute::wrapper::vsetlane().
float32x4x4_t arm_compute::cpu::elementwise_arithm_op | ( | const float32x4x4_t & | a, |
const float32x4x4_t & | b | ||
) |
void arm_compute::cpu::elementwise_arithm_op | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
VectorType::type arm_compute::cpu::elementwise_arithm_op | ( | const typename VectorType::type & | a, |
const typename VectorType::type & | b | ||
) |
Definition at line 34 of file impl.h.
References ARM_COMPUTE_ERROR, arm_compute::test::validation::b, arm_compute::MAX, arm_compute::MIN, arm_compute::PRELU, arm_compute::SQUARED_DIFF, type, arm_compute::wrapper::vbsl(), arm_compute::wrapper::vcgt(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vmax(), arm_compute::wrapper::vmin(), arm_compute::wrapper::vmul(), and arm_compute::wrapper::vsub().
|
inline |
Definition at line 232 of file impl.h.
References arm_compute::test::validation::b, and arm_compute::wrapper::vdiv().
|
inline |
Definition at line 224 of file impl.h.
References arm_compute::test::validation::b, arm_compute::wrapper::vdiv(), and arm_compute::vfloorq_f32().
|
inline |
Definition at line 240 of file impl.h.
References arm_compute::test::validation::b, and arm_compute::wrapper::vpow().
VectorType::type arm_compute::cpu::elementwise_arithm_op_broadcast | ( | const typename VectorType::type & | a, |
const ScalarType & | broadcast_value, | ||
const bool | reorder | ||
) |
Definition at line 74 of file impl.h.
References type, and arm_compute::wrapper::vdup_n().
|
inline |
Definition at line 282 of file impl.h.
References arm_compute::wrapper::vloadq(), and arm_compute::wrapper::vstore().
|
inline |
Definition at line 264 of file impl.h.
References arm_compute::test::validation::b, arm_compute::wrapper::vloadq(), and arm_compute::wrapper::vstore().
void arm_compute::cpu::elementwise_arithm_op_quantized | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
|
inline |
|
inline |
|
inline |
Definition at line 630 of file impl.h.
References arm_compute::test::validation::b, arm_compute::test::validation::qinfo, and arm_compute::quantize_qasymm8().
void arm_compute::cpu::elementwise_arithm_op_quantized_signed | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 1291 of file impl.h.
References elementwise_op_quantized_signed().
|
inline |
Definition at line 749 of file impl.h.
References load_quantized_signed(), and store_quantized_signed().
|
inline |
Definition at line 637 of file impl.h.
References arm_compute::test::validation::b, arm_compute::test::validation::qinfo, and arm_compute::quantize_qasymm8_signed().
|
inline |
Definition at line 699 of file impl.h.
References load_quantized_signed(), and store_quantized_signed().
|
inline |
Definition at line 176 of file impl.h.
References ARM_COMPUTE_ERROR, arm_compute::test::validation::b, arm_compute::DIV, arm_compute::MAX, arm_compute::MIN, arm_compute::POWER, arm_compute::PRELU, and arm_compute::SQUARED_DIFF.
void elementwise_arithmetic_op | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
ArithmeticOperation | op, | ||
const Window & | window | ||
) |
Definition at line 38 of file impl.cpp.
References Window::broadcast_if_dimension_le_one(), Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), type, Dimensions< T >::x(), and Window::x().
VectorType arm_compute::cpu::elementwise_arithmetic_op(
    svbool_t &pg,
    const VectorType &a,
    const VectorType &b,
    ArithmeticOperation op)
Definition at line 73 of file impl.h.
References ARM_COMPUTE_ERROR, arm_compute::test::validation::b, arm_compute::DIV, elementwise_div(), elementwise_pow(), arm_compute::MAX, arm_compute::MIN, arm_compute::POWER, arm_compute::PRELU, arm_compute::SQUARED_DIFF, and type.
template void arm_compute::cpu::elementwise_arithmetic_op< float16_t > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const ArithmeticOperation | op, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::elementwise_arithmetic_op< float32_t > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const ArithmeticOperation | op, | ||
const Window & | window | ||
) |
Referenced by sve_fp32_elementwise_binary().
template void arm_compute::cpu::elementwise_arithmetic_op< int16_t > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const ArithmeticOperation | op, | ||
const Window & | window | ||
) |
Referenced by sve_s16_elementwise_binary().
template void arm_compute::cpu::elementwise_arithmetic_op< int32_t > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const ArithmeticOperation | op, | ||
const Window & | window | ||
) |
Referenced by sve_s32_elementwise_binary().
void arm_compute::cpu::elementwise_arithmetic_quantized_op | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
ArithmeticOperation | op, | ||
const Window & | window | ||
) |
Definition at line 96 of file impl.h.
References Window::broadcast_if_dimension_le_one(), Qasymm8QuantizationHelper< QUANTIZED_TYPE >::dequantize(), Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), load_quantized(), UniformQuantizationInfo::offset, Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), store_quantized(), ITensorInfo::tensor_shape(), QuantizationInfo::uniform(), Dimensions< T >::x(), and Window::x().
|
inline |
|
inline |
Definition at line 343 of file impl.h.
References ARM_COMPUTE_ERROR, arm_compute::test::validation::b, arm_compute::Equal, arm_compute::Greater, arm_compute::GreaterEqual, arm_compute::Less, arm_compute::LessEqual, arm_compute::NotEqual, arm_compute::wrapper::vceq(), arm_compute::wrapper::vcge(), arm_compute::wrapper::vcgt(), and arm_compute::wrapper::vnot().
void arm_compute::cpu::elementwise_comp_op_16 | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
|
inline |
Definition at line 472 of file impl.h.
References arm_compute::test::validation::b, arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmovn(), and arm_compute::wrapper::vstore().
void arm_compute::cpu::elementwise_comp_op_32 | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
|
inline |
Definition at line 491 of file impl.h.
References arm_compute::test::validation::b, arm_compute::wrapper::vcombine(), arm_compute::wrapper::vgetlane(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmovn(), and arm_compute::wrapper::vstore().
void arm_compute::cpu::elementwise_comp_op_8 | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
|
inline |
Definition at line 453 of file impl.h.
References arm_compute::test::validation::b, arm_compute::wrapper::vloadq(), and arm_compute::wrapper::vstore().
|
inline |
Definition at line 376 of file impl.h.
References arm_compute::wrapper::vdup_n().
|
inline |
Definition at line 403 of file impl.h.
References arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmovn(), and arm_compute::wrapper::vstore().
|
inline |
Definition at line 422 of file impl.h.
References arm_compute::test::validation::b, arm_compute::wrapper::vcombine(), arm_compute::wrapper::vgetlane(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmovn(), and arm_compute::wrapper::vstore().
|
inline |
Definition at line 384 of file impl.h.
References arm_compute::wrapper::vloadq(), and arm_compute::wrapper::vstore().
void arm_compute::cpu::elementwise_comp_op_quantized | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
|
inline |
Definition at line 826 of file impl.h.
References ARM_COMPUTE_UNUSED, load_quantized(), and store_quantized().
|
inline |
Definition at line 774 of file impl.h.
References ARM_COMPUTE_UNUSED, load_quantized(), and store_quantized().
|
inline |
Definition at line 656 of file impl.h.
References ARM_COMPUTE_UNUSED, arm_compute::test::validation::b, and arm_compute::test::validation::qinfo.
void arm_compute::cpu::elementwise_comp_op_quantized_signed | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 1307 of file impl.h.
References elementwise_comp_quantized_signed().
|
inline |
Definition at line 852 of file impl.h.
References ARM_COMPUTE_UNUSED, load_quantized_signed(), and store_quantized().
|
inline |
Definition at line 800 of file impl.h.
References ARM_COMPUTE_UNUSED, load_quantized_signed(), and store_quantized().
|
inline |
Definition at line 312 of file impl.h.
References ARM_COMPUTE_ERROR, arm_compute::test::validation::b, arm_compute::Equal, arm_compute::Greater, arm_compute::GreaterEqual, arm_compute::Less, arm_compute::LessEqual, and arm_compute::NotEqual.
|
inline |
Definition at line 1013 of file impl.h.
References arm_compute::graph::bfs(), Window::broadcast_if_dimension_le_one(), arm_compute::dequantize_qasymm8_signed(), Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), UniformQuantizationInfo::offset, Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), QuantizationInfo::uniform(), arm_compute::vdequantize(), Dimensions< T >::x(), and Window::x().
Referenced by elementwise_comp_op_quantized_signed().
void elementwise_comparison_op | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
ComparisonOperation | op, | ||
const Window & | window | ||
) |
Definition at line 152 of file impl.cpp.
References Window::broadcast_if_dimension_le_one(), Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), type, Dimensions< T >::x(), and Window::x().
OutputVectorType arm_compute::cpu::elementwise_comparison_op | ( | svbool_t & | pg, |
const InputVectorType & | a, | ||
const InputVectorType & | b, | ||
ComparisonOperation | op | ||
) |
Definition at line 119 of file impl.h.
References ARM_COMPUTE_ERROR, arm_compute::test::validation::b, arm_compute::Equal, arm_compute::Greater, arm_compute::GreaterEqual, arm_compute::Less, arm_compute::LessEqual, arm_compute::NotEqual, and type.
template void arm_compute::cpu::elementwise_comparison_op< float16_t > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const ComparisonOperation | op, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::elementwise_comparison_op< float32_t > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const ComparisonOperation | op, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::elementwise_comparison_op< int16_t > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const ComparisonOperation | op, | ||
const Window & | window | ||
) |
Referenced by sve_s16_comparison_elementwise_binary().
template void arm_compute::cpu::elementwise_comparison_op< int32_t > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const ComparisonOperation | op, | ||
const Window & | window | ||
) |
Referenced by sve_s32_comparison_elementwise_binary().
template void arm_compute::cpu::elementwise_comparison_op< uint8_t > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const ComparisonOperation | op, | ||
const Window & | window | ||
) |
Referenced by sve_u8_comparison_elementwise_binary().
void arm_compute::cpu::elementwise_comparison_quantized_op | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
ComparisonOperation | op, | ||
const Window & | window | ||
) |
Definition at line 235 of file impl.h.
References Window::broadcast_if_dimension_le_one(), Qasymm8QuantizationHelper< QUANTIZED_TYPE >::dequantize(), Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), load_quantized(), UniformQuantizationInfo::offset, Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), type, QuantizationInfo::uniform(), Dimensions< T >::x(), and Window::x().
VectorType arm_compute::cpu::elementwise_div(
    svbool_t &pg,
    const VectorType &a,
    const VectorType &b)
Definition at line 45 of file impl.h.
References arm_compute::test::validation::b.
Referenced by elementwise_arithmetic_op().
svint16_t arm_compute::cpu::elementwise_div<svint16_t>(
    svbool_t &pg,
    const svint16_t &a,
    const svint16_t &b)
Definition at line 290 of file impl.cpp.
References ARM_COMPUTE_ERROR, ARM_COMPUTE_UNUSED, and arm_compute::test::validation::b.
svint32_t arm_compute::cpu::elementwise_div<svint32_t>(
    svbool_t &pg,
    const svint32_t &a,
    const svint32_t &b)
Definition at line 284 of file impl.cpp.
References arm_compute::test::validation::b.
|
inline |
Definition at line 86 of file impl.h.
References Window::DimX, elementwise_op_scalar_imp(), Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::input, Iterator::ptr(), Window::set(), Window::Dimension::start(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vstore(), and Window::x().
void arm_compute::cpu::elementwise_op(
    const ITensor *in1,
    const ITensor *in2,
    ITensor *out,
    const Window &window,
    OutputScalarType (*scalar_func)(const InputScalarType &, const InputScalarType &),
    int (*broadcast_func)(int, int, int, const InputScalarType *, const InputScalarType &, OutputScalarType *, const bool),
    int (*neon_func)(int, int, int, const InputScalarType *, const InputScalarType *, OutputScalarType *))
Definition at line 86 of file impl.h.
References arm_compute::test::validation::b, Window::broadcast_if_dimension_le_one(), Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), Dimensions< T >::x(), and Window::x().
|
inline |
Definition at line 119 of file impl.h.
References arm_compute::dequantize_qasymm8_signed(), Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), arm_compute::test::validation::input, arm_compute::LOG, UniformQuantizationInfo::offset, Iterator::ptr(), ITensorInfo::quantization_info(), arm_compute::quantize_qasymm8_signed(), arm_compute::RSQRT, UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), arm_compute::TO_ZERO, QuantizationInfo::uniform(), arm_compute::vdequantize(), arm_compute::wrapper::vloadq(), arm_compute::vquantize_signed(), arm_compute::wrapper::vstore(), and Window::x().
Referenced by neon_qasymm8_signed_elementwise_unary().
|
inline |
Definition at line 211 of file impl.h.
References arm_compute::dequantize_qasymm8(), Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), arm_compute::test::validation::input, arm_compute::LOG, UniformQuantizationInfo::offset, Iterator::ptr(), ITensorInfo::quantization_info(), arm_compute::quantize_qasymm8(), arm_compute::RSQRT, UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), arm_compute::TO_ZERO, QuantizationInfo::uniform(), arm_compute::vdequantize(), arm_compute::wrapper::vloadq(), arm_compute::vquantize(), arm_compute::wrapper::vstore(), and Window::x().
Referenced by neon_qasymm8_elementwise_unary().
|
inline |
Definition at line 62 of file impl.h.
References arm_compute::ABS, ARM_COMPUTE_ERROR, arm_compute::EXP, arm_compute::LOG, arm_compute::NEG, arm_compute::ROUND, arm_compute::RSQRT, arm_compute::SIN, arm_compute::wrapper::vabs(), arm_compute::wrapper::vexpq(), arm_compute::wrapper::vinvsqrt(), arm_compute::wrapper::vlog(), arm_compute::wrapper::vneg(), arm_compute::wrapper::vround(), and arm_compute::wrapper::vsin().
|
inline |
Definition at line 877 of file impl.h.
References arm_compute::graph::bfs(), Window::broadcast_if_dimension_le_one(), arm_compute::dequantize_qasymm8(), Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), UniformQuantizationInfo::offset, Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), QuantizationInfo::uniform(), arm_compute::vdequantize(), Dimensions< T >::x(), and Window::x().
Referenced by elementwise_arithm_op_quantized(), and elementwise_comp_op_quantized().
|
inline |
Definition at line 1148 of file impl.h.
References arm_compute::graph::bfs(), Window::broadcast_if_dimension_le_one(), arm_compute::dequantize_qasymm8_signed(), Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), UniformQuantizationInfo::offset, Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), QuantizationInfo::uniform(), arm_compute::vdequantize(), Dimensions< T >::x(), and Window::x().
Referenced by elementwise_arithm_op_quantized_signed().
|
inline |
Definition at line 38 of file impl.h.
References arm_compute::ABS, ARM_COMPUTE_ERROR, arm_compute::EXP, arm_compute::LOG, arm_compute::support::cpp11::nearbyint(), arm_compute::NEG, arm_compute::ROUND, arm_compute::RSQRT, and arm_compute::SIN.
Referenced by elementwise_op().
|
inline |
Definition at line 36 of file impl.cpp.
References arm_compute::ABS, ARM_COMPUTE_ERROR, arm_compute::EXP, arm_compute::LOG, arm_compute::NEG, arm_compute::ROUND, arm_compute::RSQRT, and arm_compute::SIN.
Referenced by elementwise_sve_op().
|
inline |
Definition at line 61 of file impl.cpp.
References arm_compute::ABS, ARM_COMPUTE_ERROR, and arm_compute::NEG.
VectorType arm_compute::cpu::elementwise_pow(
    svbool_t &pg,
    const VectorType &a,
    const VectorType &b)
Definition at line 39 of file impl.h.
References arm_compute::test::validation::b.
Referenced by elementwise_arithmetic_op().
svint32_t arm_compute::cpu::elementwise_pow<svint32_t>(
    svbool_t &pg,
    const svint32_t &a,
    const svint32_t &b)
Definition at line 278 of file impl.cpp.
References arm_compute::test::validation::b.
void elementwise_sve_op(
    const ITensor *in,
    ITensor *out,
    const Window &window,
    ElementWiseUnary op)
Definition at line 75 of file impl.cpp.
References Window::DimX, elementwise_op_sve_imp(), Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::input, Iterator::ptr(), Window::set(), Window::Dimension::start(), and Window::x().
template void arm_compute::cpu::elementwise_sve_op<float16_t>(
    const ITensor *in,
    ITensor *out,
    const Window &window,
    ElementWiseUnary op)
template void arm_compute::cpu::elementwise_sve_op< float32_t > | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op | ||
) |
Referenced by sve_fp32_elementwise_unary().
template void arm_compute::cpu::elementwise_sve_op< int32_t > | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op | ||
) |
Referenced by sve_s32_elementwise_unary().
void arm_compute::cpu::fp16_batch_normalization_nchw_non_fused | ( | const Window & | window, |
ITensor * | input, | ||
ITensor * | output, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo | act_info | ||
) |
void arm_compute::cpu::fp16_batch_normalization_nchw_non_fused_brelu | ( | const Window & | window, |
ITensor * | input, | ||
ITensor * | output, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo | act_info | ||
) |
void arm_compute::cpu::fp16_batch_normalization_nchw_non_fused_lubrelu | ( | const Window & | window, |
ITensor * | input, | ||
ITensor * | output, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo | act_info | ||
) |
void arm_compute::cpu::fp16_batch_normalization_nchw_non_fused_relu | ( | const Window & | window, |
ITensor * | input, | ||
ITensor * | output, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo | act_info | ||
) |
void arm_compute::cpu::fp16_bilinear_neon_scale_nchw | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Referenced by CpuScaleKernel::configure().
void arm_compute::cpu::fp16_common_neon_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
void arm_compute::cpu::fp16_in_bounds_crop_window | ( | const ITensor * | input, |
const ITensor * | output, | ||
float * | output_ptr, | ||
Coordinates | input_offset, | ||
int32_t | window_step_x, | ||
int32_t | output_width_start, | ||
int32_t | output_width_limit, | ||
bool | input_has_single_channel, | ||
bool | is_width_flipped | ||
) |
void arm_compute::cpu::fp16_nearest_neon_scale_nchw | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Referenced by CpuScaleKernel::configure().
void arm_compute::cpu::fp16_neon_batch_normalization | ( | ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
void arm_compute::cpu::fp16_neon_floor(
    const void *src,
    void *dst,
    int len)
void arm_compute::cpu::fp16_neon_range_function(
    ITensor *output,
    float start,
    float step,
    const Window &window)
void arm_compute::cpu::fp16_sve_batch_normalization | ( | ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
void arm_compute::cpu::fp16_sve_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
void fp32_batch_normalization_nchw_non_fused | ( | const Window & | window, |
ITensor * | input, | ||
ITensor * | output, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo | act_info | ||
) |
Definition at line 37 of file fp32.cpp.
References arm_compute::test::validation::act_info, arm_compute::quantization::epsilon, and arm_compute::test::validation::input.
void fp32_batch_normalization_nchw_non_fused_brelu | ( | const Window & | window, |
ITensor * | input, | ||
ITensor * | output, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo | act_info | ||
) |
Definition at line 65 of file fp32.cpp.
References arm_compute::test::validation::act_info, arm_compute::quantization::epsilon, and arm_compute::test::validation::input.
void fp32_batch_normalization_nchw_non_fused_lubrelu | ( | const Window & | window, |
ITensor * | input, | ||
ITensor * | output, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo | act_info | ||
) |
Definition at line 79 of file fp32.cpp.
References arm_compute::test::validation::act_info, arm_compute::quantization::epsilon, and arm_compute::test::validation::input.
void fp32_batch_normalization_nchw_non_fused_relu | ( | const Window & | window, |
ITensor * | input, | ||
ITensor * | output, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo | act_info | ||
) |
Definition at line 51 of file fp32.cpp.
References arm_compute::test::validation::act_info, arm_compute::quantization::epsilon, and arm_compute::test::validation::input.
void fp32_in_bounds_crop_window | ( | const ITensor * | input, |
const ITensor * | output, | ||
float * | output_ptr, | ||
Coordinates | input_offset, | ||
int32_t | window_step_x, | ||
int32_t | output_width_start, | ||
int32_t | output_width_limit, | ||
bool | input_has_single_channel, | ||
bool | is_width_flipped | ||
) |
Definition at line 31 of file fp32.cpp.
References arm_compute::test::validation::input.
void fp32_neon_batch_normalization | ( | ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
Definition at line 156 of file fp32.cpp.
References arm_compute::test::validation::act_info, arm_compute::test::validation::dst, arm_compute::quantization::epsilon, and arm_compute::test::validation::src.
void fp32_neon_floor(
    const void *src,
    void *dst,
    int len)
Definition at line 37 of file fp32.cpp.
References ARM_COMPUTE_ASSERT, ARM_COMPUTE_ASSERT_NOT_NULLPTR, arm_compute::test::validation::dst, arm_compute::test::validation::src, step, and arm_compute::vfloorq_f32().
void arm_compute::cpu::fp32_sve_batch_normalization | ( | ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | mean, | ||
const ITensor * | var, | ||
const ITensor * | beta, | ||
const ITensor * | gamma, | ||
float | epsilon, | ||
ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
void fp32_sve_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 97 of file fp32.cpp.
References ARM_COMPUTE_ERROR, ARM_COMPUTE_UNUSED, arm_compute::test::validation::dst, arm_compute::NEAREST_NEIGHBOR, and arm_compute::test::validation::src.
void arm_compute::cpu::fp_neon_activation_impl(
    const ITensor *src,
    ITensor *dst,
    const ActivationLayerInfo &act_info,
    const Window &window)
SIMD vector tag type.
Definition at line 60 of file impl.h.
References arm_compute::test::validation::act_info, ARM_COMPUTE_ERROR, arm_compute::test::validation::b, Window::collapse_if_possible(), Window::DimX, Window::DimZ, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::input, mask_float_vector(), Iterator::ptr(), Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), arm_compute::wrapper::vabs(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vbsl(), arm_compute::wrapper::vceq(), arm_compute::wrapper::vcge(), arm_compute::wrapper::vcgt(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::verf(), arm_compute::wrapper::vexpq(), arm_compute::wrapper::vinv(), arm_compute::wrapper::vinvsqrt(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vlog(), arm_compute::wrapper::vmax(), arm_compute::wrapper::vmin(), arm_compute::wrapper::vmla(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vneg(), arm_compute::wrapper::vnot(), arm_compute::wrapper::vstore(), arm_compute::wrapper::vsub(), arm_compute::wrapper::vtanh(), and Window::x().
void arm_compute::cpu::fused_batch_normalization_conv | ( | const ITensor * | conv_weights, |
const ITensor * | conv_bias, | ||
ITensor * | fused_weights, | ||
ITensor * | fused_bias, | ||
const ITensor * | bn_mean, | ||
const ITensor * | bn_var, | ||
const ITensor * | bn_beta, | ||
const ITensor * | bn_gamma, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Definition at line 154 of file impl.h.
References Window::DimX, ITensorInfo::element_size(), Window::Dimension::end(), arm_compute::quantization::epsilon, arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), ITensor::ptr_to_element(), Window::set(), Window::Dimension::start(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vinvsqrt(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vstore(), and Window::x().
void arm_compute::cpu::fused_batch_normalization_conv_f16 | ( | const ITensor * | conv_weights, |
const ITensor * | conv_bias, | ||
ITensor * | fused_weights, | ||
ITensor * | fused_bias, | ||
const ITensor * | bn_mean, | ||
const ITensor * | bn_var, | ||
const ITensor * | bn_beta, | ||
const ITensor * | bn_gamma, | ||
float | epsilon, | ||
const Window & | window | ||
) |
void fused_batch_normalization_conv_f32 | ( | const ITensor * | conv_weights, |
const ITensor * | conv_bias, | ||
ITensor * | fused_weights, | ||
ITensor * | fused_bias, | ||
const ITensor * | bn_mean, | ||
const ITensor * | bn_var, | ||
const ITensor * | bn_beta, | ||
const ITensor * | bn_gamma, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Definition at line 31 of file fp32.cpp.
References arm_compute::quantization::epsilon.
void arm_compute::cpu::fused_batch_normalization_dwc_nchw | ( | const ITensor * | dwc_weights, |
const ITensor * | dwc_bias, | ||
ITensor * | fused_weights, | ||
ITensor * | fused_bias, | ||
const ITensor * | bn_mean, | ||
const ITensor * | bn_var, | ||
const ITensor * | bn_beta, | ||
const ITensor * | bn_gamma, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Definition at line 266 of file impl.h.
References Window::DimX, ITensorInfo::element_size(), Window::Dimension::end(), arm_compute::quantization::epsilon, arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), ITensor::ptr_to_element(), Window::set(), Window::Dimension::start(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vinvsqrt(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vstore(), and Window::x().
void arm_compute::cpu::fused_batch_normalization_dwc_nchw_f16 | ( | const ITensor * | dwc_weights, |
const ITensor * | dwc_bias, | ||
ITensor * | fused_weights, | ||
ITensor * | fused_bias, | ||
const ITensor * | bn_mean, | ||
const ITensor * | bn_var, | ||
const ITensor * | bn_beta, | ||
const ITensor * | bn_gamma, | ||
float | epsilon, | ||
const Window & | window | ||
) |
void fused_batch_normalization_dwc_nchw_f32 | ( | const ITensor * | dwc_weights, |
const ITensor * | dwc_bias, | ||
ITensor * | fused_weights, | ||
ITensor * | fused_bias, | ||
const ITensor * | bn_mean, | ||
const ITensor * | bn_var, | ||
const ITensor * | bn_beta, | ||
const ITensor * | bn_gamma, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Definition at line 31 of file all.cpp.
References arm_compute::quantization::epsilon.
void arm_compute::cpu::fused_batch_normalization_dwc_nhwc | ( | const ITensor * | dwc_weights, |
const ITensor * | dwc_bias, | ||
ITensor * | fused_weights, | ||
ITensor * | fused_bias, | ||
const ITensor * | bn_mean, | ||
const ITensor * | bn_var, | ||
const ITensor * | bn_beta, | ||
const ITensor * | bn_gamma, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Definition at line 36 of file impl.h.
References Window::DimX, ITensorInfo::element_size(), Window::Dimension::end(), arm_compute::quantization::epsilon, arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), ITensor::ptr_to_element(), Window::set(), Window::Dimension::start(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vinvsqrt(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vstore(), arm_compute::wrapper::vsub(), and Window::x().
void arm_compute::cpu::fused_batch_normalization_dwc_nhwc_f16 | ( | const ITensor * | dwc_weights, |
const ITensor * | dwc_bias, | ||
ITensor * | fused_weights, | ||
ITensor * | fused_bias, | ||
const ITensor * | bn_mean, | ||
const ITensor * | bn_var, | ||
const ITensor * | bn_beta, | ||
const ITensor * | bn_gamma, | ||
float | epsilon, | ||
const Window & | window | ||
) |
void fused_batch_normalization_dwc_nhwc_f32 | ( | const ITensor * | dwc_weights, |
const ITensor * | dwc_bias, | ||
ITensor * | fused_weights, | ||
ITensor * | fused_bias, | ||
const ITensor * | bn_mean, | ||
const ITensor * | bn_var, | ||
const ITensor * | bn_beta, | ||
const ITensor * | bn_gamma, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Definition at line 32 of file fp32.cpp.
References arm_compute::quantization::epsilon.
T arm_compute::cpu::get_initial_min(bool use_inf_as_limit)
Definition at line 65 of file list.h.
References arm_compute::support::cpp11::lowest().
void arm_compute::cpu::in_bounds_crop_window | ( | const ITensor * | input, |
const ITensor * | output, | ||
float * | output_ptr, | ||
Coordinates | input_offset, | ||
int32_t | window_step_x, | ||
int32_t | output_width_start, | ||
int32_t | output_width_limit, | ||
bool | input_has_single_channel, | ||
bool | is_width_flipped | ||
) |
Definition at line 39 of file impl.h.
References ITensorInfo::dimension(), ITensorInfo::element_size(), ITensor::info(), arm_compute::test::validation::input, load_as_f32(), Dimensions< T >::set(), arm_compute::wrapper::vcombine(), arm_compute::wrapper::vgethigh(), arm_compute::wrapper::vgetlow(), arm_compute::wrapper::vrev64(), and arm_compute::wrapper::vstore().
void instance_normalization_nchw | ( | ITensor * | input, |
ITensor * | output, | ||
float | gamma, | ||
float | beta, | ||
float | epsilon, | ||
const Window & | window | ||
) |
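SIMD vector tag type. (NOTE(review): this brief does not describe the function itself, which returns void; it appears to be a comment on a type alias inside the function body that the documentation generator attached to this entry — confirm against impl.cpp.)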
Definition at line 49 of file impl.cpp.
References ITensorInfo::dimension(), Window::DimX, Window::DimY, Window::DimZ, Window::Dimension::end(), arm_compute::mlgo::parser::end(), arm_compute::quantization::epsilon, arm_compute::execute_window_loop(), ITensor::info(), arm_compute::test::validation::input, Iterator::ptr(), Window::set(), Window::Dimension::start(), arm_compute::wrapper::vdup_n(), vector_float_norm(), vector_float_sum(), arm_compute::wrapper::vgethigh(), arm_compute::wrapper::vgetlane(), arm_compute::wrapper::vgetlow(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vpadd(), arm_compute::wrapper::vstore(), and Window::x().
template void arm_compute::cpu::instance_normalization_nchw< float > | ( | ITensor * | input, |
ITensor * | output, | ||
float | gamma, | ||
float | beta, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Referenced by neon_fp32_instancenorm().
|
inline |
Definition at line 97 of file impl.h.
References DepthwiseConvolutionRunInfo::input_height, DepthwiseConvolutionRunInfo::input_width, arm_compute::test::validation::w, Size2D::x(), and Size2D::y().
Referenced by depthwise_loop_generic_fp(), and depthwise_loop_multiplier1_fp().
void arm_compute::cpu::l2_normalize_x | ( | const ITensor * | in, |
const ITensor * | sum, | ||
ITensor * | out, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Definition at line 40 of file impl.h.
References Window::collapse_if_possible(), arm_compute::data_size_from_type(), ITensorInfo::data_type(), Window::DimX, Window::DimZ, Window::Dimension::end(), arm_compute::quantization::epsilon, arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), Window::set(), Window::Dimension::start(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vstore(), and Window::x().
void arm_compute::cpu::l2_normalize_yz | ( | const ITensor * | in, |
const ITensor * | sum, | ||
ITensor * | out, | ||
float | epsilon, | ||
const Window & | window, | ||
size_t | axis | ||
) |
Definition at line 83 of file impl.h.
References arm_compute::data_size_from_type(), ITensorInfo::data_type(), Window::DimX, Window::Dimension::end(), arm_compute::quantization::epsilon, arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), Window::set(), Window::Dimension::start(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vinvsqrt(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmax(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vstore(), and Window::x().
|
inline |
Definition at line 49 of file crop_helper.h.
References arm_compute::wrapper::vloadq().
|
inline |
Definition at line 67 of file crop_helper.h.
References arm_compute::wrapper::vload().
|
inline |
Definition at line 55 of file crop_helper.h.
References arm_compute::wrapper::vloadq().
|
inline |
Definition at line 34 of file crop_helper.h.
References ARM_COMPUTE_ERROR, and ARM_COMPUTE_UNUSED.
Referenced by in_bounds_crop_window().
|
inline |
Definition at line 73 of file crop_helper.h.
References arm_compute::wrapper::vload().
|
inline |
Definition at line 61 of file crop_helper.h.
References arm_compute::wrapper::vloadq().
|
inline |
Definition at line 79 of file crop_helper.h.
References arm_compute::wrapper::vload().
|
inline |
Definition at line 34 of file impl.h.
References offset(), and arm_compute::test::validation::scale.
|
inline |
Definition at line 550 of file impl.h.
References offset(), and arm_compute::test::validation::scale.
Referenced by elementwise_arithm_op_quantized_broadcast_loop(), elementwise_arithm_op_quantized_loop(), elementwise_arithmetic_quantized_op(), elementwise_comp_op_quantized_broadcast_loop(), elementwise_comp_op_quantized_loop(), and elementwise_comparison_quantized_op().
|
inline |
Definition at line 48 of file impl.h.
References offset(), and arm_compute::test::validation::scale.
|
inline |
Definition at line 570 of file impl.h.
References offset(), and arm_compute::test::validation::scale.
Referenced by elementwise_arithm_op_quantized_signed_broadcast_loop(), elementwise_arithm_op_quantized_singed_loop(), elementwise_comp_op_quantized_signed_broadcast_loop(), and elementwise_comp_op_quantized_signed_loop().
|
inline |
Definition at line 45 of file impl.h.
References arm_compute::wrapper::vand().
Referenced by fp_neon_activation_impl().
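matrix_addition_f32 (signature missing from this extract; name inferred from the neon_fp32_gemm_matrix_add() cross-references)
Definition at line 33 of file impl.cpp.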
References ARM_COMPUTE_ERROR_ON_NULLPTR, Window::collapse_if_possible(), Window::DimX, Window::DimZ, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), Iterator::ptr(), Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), and Window::x().
Referenced by neon_fp32_gemm_matrix_add().
void matrix_matrix_multiply_f32 | ( | const ITensor * | lhs, |
const ITensor * | rhs, | ||
ITensor * | dst, | ||
const Window & | window, | ||
const ThreadInfo & | info, | ||
float | alpha | ||
) |
Definition at line 279 of file impl.cpp.
References ARM_COMPUTE_UNUSED, arm_compute::data_size_from_type(), ITensorInfo::data_type(), ITensorInfo::dimension(), Window::DimX, Window::DimY, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), arm_compute::test::validation::info, arm_compute::helpers::float_ops::is_one(), ITensorInfo::num_dimensions(), Iterator::ptr(), Window::set(), Window::Dimension::start(), ITensorInfo::strides_in_bytes(), Window::x(), and Window::y().
Referenced by neon_fp32_gemm_matrix_mul().
void arm_compute::cpu::max_poolingMxNxD_q8_neon_ndhwc | ( | const ITensor * | src, |
ITensor * | dst0, | ||
Pooling3dLayerInfo & | pool_info, | ||
const Window & | window_out, | ||
const int | window_step_x | ||
) |
Definition at line 232 of file quantized.h.
References Size3D::depth, arm_compute::execute_window_loop(), Padding3D::front, Size3D::height, ITensor::info(), Pooling3dLayerInfo::is_global_pooling, Padding3D::left, UniformQuantizationInfo::offset, Pooling3dLayerInfo::padding, Pooling3dLayerInfo::pool_size, Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, arm_compute::test::validation::src, Pooling3dLayerInfo::stride, Padding3D::top, QuantizationInfo::uniform(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vgethigh(), arm_compute::wrapper::vgetlow(), arm_compute::wrapper::vload(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmax(), arm_compute::wrapper::vstore(), and Size3D::width.
void arm_compute::cpu::max_unpooling | ( | const ITensor * | input, |
const ITensor * | indices, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 35 of file impl.h.
References ITensor::buffer(), arm_compute::execute_window_loop(), ITensor::info(), arm_compute::test::validation::input, Iterator::ptr(), and ITensorInfo::strides_in_bytes().
void mean_stddev_normalization | ( | ITensor * | input, |
ITensor * | output, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Definition at line 34 of file impl.cpp.
References Window::DimX, Window::Dimension::end(), arm_compute::quantization::epsilon, arm_compute::execute_window_loop(), arm_compute::test::validation::input, Iterator::ptr(), Window::set(), Window::Dimension::start(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vgethigh(), arm_compute::wrapper::vgetlane(), arm_compute::wrapper::vgetlow(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vpadd(), arm_compute::wrapper::vstore(), arm_compute::wrapper::vsub(), and Window::x().
template void arm_compute::cpu::mean_stddev_normalization< float, 4 > | ( | ITensor * | input, |
ITensor * | output, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Referenced by neon_fp32_meanstddevnorm().
void arm_compute::cpu::mul_F16_F16_F16 | ( | const ITensor * | src1, |
const ITensor * | src2, | ||
ITensor * | out, | ||
const Window & | window, | ||
float | scale | ||
) |
Referenced by CpuMulKernel::configure().
void mul_F32_F32_F32 | ( | const ITensor * | src1, |
const ITensor * | src2, | ||
ITensor * | out, | ||
const Window & | window, | ||
float | scale | ||
) |
Definition at line 36 of file fp32.cpp.
References Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), arm_compute::test::validation::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vstore(), Dimensions< T >::x(), and Window::x().
Referenced by CpuMulKernel::configure(), and CpuMulKernel::get_mws().
svbool_t arm_compute::cpu::narrow_to_byte_predicate | ( | svbool_t | pg | ) |
void arm_compute::cpu::nearest_neon_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 219 of file list.h.
References ARM_COMPUTE_UNUSED, arm_compute::scale_utils::calculate_resize_ratio(), Window::DimX, Window::DimY, Window::DimZ, arm_compute::test::validation::dst, Window::Dimension::end(), Iterator::ptr(), arm_compute::utils::rounding::round_half_away_from_zero(), arm_compute::test::validation::scale_x, arm_compute::test::validation::scale_y, Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), Window::Dimension::step(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vstore(), Window::y(), and Window::z().
void arm_compute::cpu::neon_bfloat16_to_fp32_cast | ( | const ITensor * | _src, |
ITensor * | _dst, | ||
const ThreadInfo & | tensor, | ||
ConvertPolicy | _policy, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_f16_select_not_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_f16_select_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp16_activation | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp16_boundingboxtransform | ( | const ITensor * | boxes, |
ITensor * | pred_boxes, | ||
const ITensor * | deltas, | ||
BoundingBoxTransformInfo | bbinfo, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp16_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp16_computeallanchors | ( | const ITensor * | anchors, |
ITensor * | all_anchors, | ||
ComputeAnchorsInfo | anchors_info, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp16_deptwiseconv2dnative | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | bias, | ||
ITensor * | dst, | ||
const Window & | window, | ||
bool | has_biases, | ||
const ConvolutionInfo & | info | ||
) |
void arm_compute::cpu::neon_fp16_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp16_elementwise_unary | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op, | ||
const uint8_t * | lut | ||
) |
void arm_compute::cpu::neon_fp16_gemm_matrix_add | ( | const ITensor * | src, |
ITensor * | dst, | ||
const Window & | window, | ||
float | beta | ||
) |
void arm_compute::cpu::neon_fp16_gemm_matrix_mul | ( | const ITensor * | lhs, |
const ITensor * | rhs, | ||
ITensor * | dst, | ||
const Window & | window, | ||
const ThreadInfo & | info, | ||
float | alpha, | ||
const bool | is_dst_vector | ||
) |
void arm_compute::cpu::neon_fp16_instancenorm | ( | ITensor * | input, |
ITensor * | output, | ||
float | gamma, | ||
float | beta, | ||
float | epsilon, | ||
bool | use_mixed_precision, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp16_l2_normalize_x | ( | const ITensor * | in, |
const ITensor * | sum, | ||
ITensor * | out, | ||
float | epsilon, | ||
const Window & | window, | ||
size_t | axis | ||
) |
void arm_compute::cpu::neon_fp16_l2_normalize_yz | ( | const ITensor * | in, |
const ITensor * | sum, | ||
ITensor * | out, | ||
float | epsilon, | ||
const Window & | window, | ||
size_t | axis | ||
) |
void arm_compute::cpu::neon_fp16_maxunpooling | ( | const ITensor * | input, |
const ITensor * | indices, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp16_meanstddevnorm | ( | ITensor * | input, |
ITensor * | output, | ||
float | epsilon, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp16_pool3d | ( | const ITensor * | src0, |
ITensor * | dst0, | ||
Pooling3dLayerInfo & | , | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp16_roialign | ( | const ITensor * | input, |
ITensor * | output, | ||
const ITensor * | rois, | ||
ROIPoolingLayerInfo | pool_info, | ||
const Window & | window, | ||
const ThreadInfo & | info | ||
) |
void arm_compute::cpu::neon_fp16_softmax | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
const float | beta, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp16_to_other_dt_cast | ( | const ITensor * | _src, |
ITensor * | _dst, | ||
const ThreadInfo & | tensor, | ||
ConvertPolicy | _policy, | ||
const Window & | window | ||
) |
void neon_fp32_activation | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
Definition at line 34 of file fp32.cpp.
References arm_compute::test::validation::act_info, arm_compute::test::validation::dst, and arm_compute::test::validation::src.
void neon_fp32_boundingboxtransform | ( | const ITensor * | boxes, |
ITensor * | pred_boxes, | ||
const ITensor * | deltas, | ||
BoundingBoxTransformInfo | bbinfo, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void neon_fp32_computeallanchors | ( | const ITensor * | anchors, |
ITensor * | all_anchors, | ||
ComputeAnchorsInfo | anchors_info, | ||
const Window & | window | ||
) |
void neon_fp32_deptwiseconv2dnative | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | bias, | ||
ITensor * | dst, | ||
const Window & | window, | ||
bool | has_biases, | ||
const ConvolutionInfo & | info | ||
) |
Definition at line 29 of file fp32.cpp.
References bias, arm_compute::test::validation::dst, arm_compute::test::validation::info, and arm_compute::test::validation::src.
template void arm_compute::cpu::neon_fp32_elementwise_binary< ArithmeticOperation::ADD > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_elementwise_binary< ArithmeticOperation::DIV > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_elementwise_binary< ArithmeticOperation::MAX > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_elementwise_binary< ArithmeticOperation::MIN > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_elementwise_binary< ArithmeticOperation::POWER > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_elementwise_binary< ArithmeticOperation::PRELU > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_elementwise_binary< ArithmeticOperation::SUB > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void neon_fp32_elementwise_unary | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op, | ||
const uint8_t * | lut | ||
) |
Definition at line 32 of file fp32.cpp.
References ARM_COMPUTE_UNUSED.
void neon_fp32_gemm_matrix_add | ( | const ITensor * | src, |
ITensor * | dst, | ||
const Window & | window, | ||
float | beta | ||
) |
Definition at line 31 of file fp32.cpp.
References arm_compute::test::validation::dst, matrix_addition_f32(), and arm_compute::test::validation::src.
void neon_fp32_gemm_matrix_mul | ( | const ITensor * | lhs, |
const ITensor * | rhs, | ||
ITensor * | dst, | ||
const Window & | window, | ||
const ThreadInfo & | info, | ||
float | alpha, | ||
const bool | is_dst_vector | ||
) |
Definition at line 31 of file fp32.cpp.
References arm_compute::test::validation::dst, arm_compute::test::validation::info, matrix_matrix_multiply_f32(), and vector_matrix_multiply_f32().
void neon_fp32_instancenorm | ( | ITensor * | input, |
ITensor * | output, | ||
float | gamma, | ||
float | beta, | ||
float | epsilon, | ||
bool | use_mixed_precision, | ||
const Window & | window | ||
) |
Definition at line 29 of file fp32.cpp.
References ARM_COMPUTE_UNUSED, arm_compute::quantization::epsilon, arm_compute::test::validation::input, and instance_normalization_nchw< float >().
void neon_fp32_l2_normalize_x | ( | const ITensor * | in, |
const ITensor * | sum, | ||
ITensor * | out, | ||
float | epsilon, | ||
const Window & | window, | ||
size_t | unused_axis | ||
) |
Definition at line 33 of file fp32.cpp.
References ARM_COMPUTE_UNUSED, and arm_compute::quantization::epsilon.
void neon_fp32_l2_normalize_yz | ( | const ITensor * | in, |
const ITensor * | sum, | ||
ITensor * | out, | ||
float | epsilon, | ||
const Window & | window, | ||
size_t | axis | ||
) |
Definition at line 40 of file fp32.cpp.
References arm_compute::quantization::epsilon.
void neon_fp32_maxunpooling | ( | const ITensor * | input, |
const ITensor * | indices, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 29 of file fp32.cpp.
References arm_compute::test::validation::input.
void neon_fp32_meanstddevnorm | ( | ITensor * | input, |
ITensor * | output, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Definition at line 30 of file fp32.cpp.
References arm_compute::quantization::epsilon, arm_compute::test::validation::input, and mean_stddev_normalization< float, 4 >().
void neon_fp32_pool3d | ( | const ITensor * | src0, |
ITensor * | dst0, | ||
Pooling3dLayerInfo & | pool_info, | ||
const Window & | window | ||
) |
Definition at line 29 of file fp32.cpp.
References arm_compute::test::validation::src.
void neon_fp32_roialign | ( | const ITensor * | input, |
ITensor * | output, | ||
const ITensor * | rois, | ||
ROIPoolingLayerInfo | pool_info, | ||
const Window & | window, | ||
const ThreadInfo & | info | ||
) |
Definition at line 29 of file fp32.cpp.
References arm_compute::test::validation::info, and arm_compute::test::validation::input.
template void arm_compute::cpu::neon_fp32_softmax< false > | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
const float | beta, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_fp32_softmax< true > | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
const float | beta, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp32_to_bfloat16_cast | ( | const ITensor * | _src, |
ITensor * | _dst, | ||
const ThreadInfo & | tensor, | ||
ConvertPolicy | _policy, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_fp32_to_fp16_cast | ( | const ITensor * | _src, |
ITensor * | _dst, | ||
const ThreadInfo & | tensor, | ||
ConvertPolicy | _policy, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_normalize_float16_8_0 | ( | const Window & | window, |
const ITensor * | in, | ||
const ITensor * | in_squared, | ||
ITensor * | out, | ||
NormalizationLayerInfo | ninfo | ||
) |
Referenced by NENormalizationLayerKernel::configure().
void arm_compute::cpu::neon_normalize_float16_8_0_2D | ( | const Window & | window, |
const ITensor * | in, | ||
const ITensor * | in_squared, | ||
ITensor * | out, | ||
NormalizationLayerInfo | ninfo | ||
) |
Referenced by NENormalizationLayerKernel::configure().
void arm_compute::cpu::neon_normalize_float16_8_1 | ( | const Window & | window, |
const ITensor * | in, | ||
const ITensor * | in_squared, | ||
ITensor * | out, | ||
NormalizationLayerInfo | ninfo | ||
) |
Referenced by NENormalizationLayerKernel::configure().
void arm_compute::cpu::neon_normalize_float16_8_1_2D | ( | const Window & | window, |
const ITensor * | in, | ||
const ITensor * | in_squared, | ||
ITensor * | out, | ||
NormalizationLayerInfo | ninfo | ||
) |
Referenced by NENormalizationLayerKernel::configure().
void arm_compute::cpu::neon_normalize_float16_8_2 | ( | const Window & | window, |
const ITensor * | in, | ||
const ITensor * | in_squared, | ||
ITensor * | out, | ||
NormalizationLayerInfo | ninfo | ||
) |
Referenced by NENormalizationLayerKernel::configure().
void neon_normalize_float32_4_0 | ( | const Window & | window, |
const ITensor * | in, | ||
const ITensor * | in_squared, | ||
ITensor * | out, | ||
NormalizationLayerInfo | ninfo | ||
) |
Definition at line 39 of file fp32.cpp.
Referenced by NENormalizationLayerKernel::configure().
void neon_normalize_float32_4_0_2D | ( | const Window & | window, |
const ITensor * | in, | ||
const ITensor * | in_squared, | ||
ITensor * | out, | ||
NormalizationLayerInfo | ninfo | ||
) |
Definition at line 33 of file fp32.cpp.
Referenced by NENormalizationLayerKernel::configure().
void neon_normalize_float32_4_1 | ( | const Window & | window, |
const ITensor * | in, | ||
const ITensor * | in_squared, | ||
ITensor * | out, | ||
NormalizationLayerInfo | ninfo | ||
) |
Definition at line 51 of file fp32.cpp.
Referenced by NENormalizationLayerKernel::configure().
void neon_normalize_float32_4_1_2D | ( | const Window & | window, |
const ITensor * | in, | ||
const ITensor * | in_squared, | ||
ITensor * | out, | ||
NormalizationLayerInfo | ninfo | ||
) |
Definition at line 45 of file fp32.cpp.
Referenced by NENormalizationLayerKernel::configure().
void neon_normalize_float32_4_2 | ( | const Window & | window, |
const ITensor * | in, | ||
const ITensor * | in_squared, | ||
ITensor * | out, | ||
NormalizationLayerInfo | ninfo | ||
) |
Definition at line 57 of file fp32.cpp.
Referenced by NENormalizationLayerKernel::configure().
void arm_compute::cpu::neon_q8_elementwise_unary | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op, | ||
const uint8_t * | lut | ||
) |
void neon_q8_pool3d | ( | const ITensor * | src0, |
ITensor * | dst0, | ||
Pooling3dLayerInfo & | pool_info, | ||
const Window & | window | ||
) |
Definition at line 29 of file qasymm8.cpp.
References arm_compute::test::validation::src.
void neon_q8_signed_pool3d | ( | const ITensor * | src0, |
ITensor * | dst0, | ||
Pooling3dLayerInfo & | pool_info, | ||
const Window & | window | ||
) |
Definition at line 29 of file qasymm8_signed.cpp.
References arm_compute::test::validation::src.
void neon_qasymm8_activation | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
Definition at line 42 of file qasymm8.cpp.
References arm_compute::test::validation::act_info, ARM_COMPUTE_ERROR, arm_compute::test::validation::b, Window::collapse_if_possible(), arm_compute::dequantize_qasymm8(), Window::DimX, Window::DimZ, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::input, arm_compute::support::cpp11::lround(), UniformQuantizationInfo::offset, Iterator::ptr(), arm_compute::quantize_qasymm8(), UniformQuantizationInfo::scale, Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vbsl(), arm_compute::wrapper::vcgt(), arm_compute::vdequantize(), arm_compute::wrapper::vdiv(), arm_compute::wrapper::verf(), arm_compute::wrapper::vexpq(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmax(), arm_compute::wrapper::vmin(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vneg(), arm_compute::vquantize(), arm_compute::wrapper::vstore(), arm_compute::wrapper::vtanh(), and Window::x().
void neon_qasymm8_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 71 of file qasymm8.cpp.
template void arm_compute::cpu::neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void neon_qasymm8_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 32 of file qasymm8.cpp.
template void arm_compute::cpu::neon_qasymm8_elementwise_binary< ArithmeticOperation::ADD > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_elementwise_binary< ArithmeticOperation::DIV > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_elementwise_binary< ArithmeticOperation::MAX > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_elementwise_binary< ArithmeticOperation::MIN > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_elementwise_binary< ArithmeticOperation::POWER > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_elementwise_binary< ArithmeticOperation::PRELU > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_elementwise_binary< ArithmeticOperation::SUB > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void neon_qasymm8_elementwise_unary | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op, | ||
const uint8_t * | lut | ||
) |
Definition at line 35 of file qasymm8.cpp.
References ARM_COMPUTE_UNUSED, and elementwise_op< uint8_t >().
void neon_qasymm8_meanstddevnorm | ( | ITensor * | input, |
ITensor * | output, | ||
float | epsilon, | ||
const Window & | window | ||
) |
Definition at line 52 of file qasymm8.cpp.
References Window::DimX, Window::Dimension::end(), arm_compute::quantization::epsilon, arm_compute::execute_window_loop(), ITensor::info(), arm_compute::test::validation::input, UniformQuantizationInfo::offset, Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), QuantizationInfo::uniform(), and Window::x().
void neon_qasymm8_signed_activation | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
Definition at line 40 of file qasymm8_signed.cpp.
References arm_compute::test::validation::act_info, ARM_COMPUTE_ERROR, arm_compute::test::validation::b, Window::collapse_if_possible(), arm_compute::dequantize_qasymm8_signed(), Window::DimX, Window::DimZ, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::input, arm_compute::support::cpp11::lround(), UniformQuantizationInfo::offset, Iterator::ptr(), arm_compute::quantize_qasymm8_signed(), UniformQuantizationInfo::scale, Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vbsl(), arm_compute::wrapper::vcgt(), arm_compute::vdequantize(), arm_compute::wrapper::vdiv(), arm_compute::wrapper::vexpq(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmax(), arm_compute::wrapper::vmin(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vneg(), arm_compute::vquantize_signed(), arm_compute::wrapper::vstore(), arm_compute::wrapper::vtanh(), and Window::x().
void neon_qasymm8_signed_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 72 of file qasymm8_signed.cpp.
template void arm_compute::cpu::neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void neon_qasymm8_signed_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 33 of file qasymm8_signed.cpp.
template void arm_compute::cpu::neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::ADD > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::DIV > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::MAX > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::MIN > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::POWER > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::PRELU > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_elementwise_binary< ArithmeticOperation::SUB > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void neon_qasymm8_signed_elementwise_unary | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op, | ||
const uint8_t * | lut | ||
) |
Definition at line 35 of file qasymm8_signed.cpp.
References ARM_COMPUTE_UNUSED, and elementwise_op< int8_t >().
void neon_qasymm8_signed_softmax | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
const float | beta, | ||
const Window & | window | ||
) |
Definition at line 33 of file qasymm8_signed.cpp.
template void arm_compute::cpu::neon_qasymm8_signed_softmax< false > | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
const float | beta, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_signed_softmax< true > | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
const float | beta, | ||
const Window & | window | ||
) |
void arm_compute::cpu::neon_qasymm8_signed_to_fp16_cast | ( | const ITensor * | _src, |
ITensor * | _dst, | ||
const ThreadInfo & | tensor, | ||
ConvertPolicy | _policy, | ||
const Window & | window | ||
) |
void neon_qasymm8_softmax | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
const float | beta, | ||
const Window & | window | ||
) |
Definition at line 33 of file qasymm8.cpp.
template void arm_compute::cpu::neon_qasymm8_softmax< false > | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
const float | beta, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_qasymm8_softmax< true > | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
const float | beta, | ||
const Window & | window | ||
) |
void neon_qp8_qs8_deptwiseconv2dnative | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | bias, | ||
ITensor * | dst, | ||
const Window & | window, | ||
bool | has_biases, | ||
const ConvolutionInfo & | info | ||
) |
Definition at line 40 of file qasymm8_signed.cpp.
References bias, arm_compute::test::validation::dst, arm_compute::test::validation::info, run_depthwise_quanitized8bit< int8_t, int8_t >(), and arm_compute::test::validation::src.
void neon_qp8_qu8_deptwiseconv2dnative | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | bias, | ||
ITensor * | dst, | ||
const Window & | window, | ||
bool | has_biases, | ||
const ConvolutionInfo & | info | ||
) |
Definition at line 40 of file qasymm8.cpp.
References bias, arm_compute::test::validation::dst, arm_compute::test::validation::info, run_depthwise_quanitized8bit< uint8_t, int8_t >(), and arm_compute::test::validation::src.
void neon_qs8_deptwiseconv2dnative | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | bias, | ||
ITensor * | dst, | ||
const Window & | window, | ||
bool | has_biases, | ||
const ConvolutionInfo & | info | ||
) |
Definition at line 29 of file qasymm8_signed.cpp.
References bias, arm_compute::test::validation::dst, arm_compute::test::validation::info, run_depthwise_quanitized8bit< int8_t, int8_t >(), and arm_compute::test::validation::src.
void neon_qs8_maxunpooling | ( | const ITensor * | input, |
const ITensor * | indices, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 29 of file qasymm8.cpp.
References arm_compute::test::validation::input.
void neon_qs8_roialign | ( | const ITensor * | input, |
ITensor * | output, | ||
const ITensor * | rois, | ||
ROIPoolingLayerInfo | pool_info, | ||
const Window & | window, | ||
const ThreadInfo & | info | ||
) |
Definition at line 29 of file qasymm8_signed.cpp.
References arm_compute::test::validation::info, and arm_compute::test::validation::input.
void neon_qsymm16_activation | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
Definition at line 42 of file qsymm16.cpp.
References arm_compute::test::validation::act_info, ARM_COMPUTE_ERROR, ARM_COMPUTE_UNUSED, Window::collapse_if_possible(), arm_compute::dequantize_qsymm16(), Window::DimX, Window::DimZ, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::input, Iterator::ptr(), arm_compute::quantize_qsymm16(), UniformQuantizationInfo::scale, Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), arm_compute::wrapper::vadd(), arm_compute::vdequantize_int16(), arm_compute::wrapper::vdiv(), arm_compute::wrapper::vexpq(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmax(), arm_compute::wrapper::vmin(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vneg(), arm_compute::vquantize_int16(), arm_compute::wrapper::vstore(), arm_compute::wrapper::vtanh(), and Window::x().
void neon_qu16_boundingboxtransform | ( | const ITensor * | boxes, |
ITensor * | pred_boxes, | ||
const ITensor * | deltas, | ||
BoundingBoxTransformInfo | bbinfo, | ||
const Window & | window | ||
) |
Definition at line 29 of file qsymm16.cpp.
References bounding_box_transform_qsymm16().
void neon_qu16_computeallanchors | ( | const ITensor * | anchors, |
ITensor * | all_anchors, | ||
ComputeAnchorsInfo | anchors_info, | ||
const Window & | window | ||
) |
Definition at line 29 of file qsymm16.cpp.
References compute_all_anchors_qasymm16().
void neon_qu8_deptwiseconv2dnative | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | bias, | ||
ITensor * | dst, | ||
const Window & | window, | ||
bool | has_biases, | ||
const ConvolutionInfo & | info | ||
) |
Definition at line 29 of file qasymm8.cpp.
References bias, arm_compute::test::validation::dst, arm_compute::test::validation::info, run_depthwise_quanitized8bit< uint8_t, uint8_t >(), and arm_compute::test::validation::src.
void neon_qu8_maxunpooling | ( | const ITensor * | input, |
const ITensor * | indices, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 29 of file qasymm8_signed.cpp.
References arm_compute::test::validation::input.
void neon_qu8_roialign | ( | const ITensor * | input, |
ITensor * | output, | ||
const ITensor * | rois, | ||
ROIPoolingLayerInfo | pool_info, | ||
const Window & | window, | ||
const ThreadInfo & | info | ||
) |
Definition at line 29 of file qasymm8.cpp.
References arm_compute::test::validation::info, and arm_compute::test::validation::input.
void arm_compute::cpu::neon_range_function | ( | ITensor * | output, |
float | start, | ||
float | step, | ||
const Window & | window | ||
) |
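SIMD vector tag type. (Note: this brief appears to have been picked up from a comment on an internal type alias inside the function body; it does not describe what neon_range_function itself does.)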
Definition at line 38 of file impl.h.
References Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), Iterator::ptr(), Window::set(), Window::Dimension::start(), step, arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vmla(), arm_compute::wrapper::vsetlane(), arm_compute::wrapper::vstore(), and Window::x().
void neon_s16_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 139 of file integer.cpp.
template void arm_compute::cpu::neon_s16_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void neon_s16_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 71 of file integer.cpp.
template void arm_compute::cpu::neon_s16_elementwise_binary< ArithmeticOperation::ADD > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_elementwise_binary< ArithmeticOperation::DIV > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_elementwise_binary< ArithmeticOperation::MAX > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_elementwise_binary< ArithmeticOperation::MIN > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_elementwise_binary< ArithmeticOperation::POWER > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_elementwise_binary< ArithmeticOperation::PRELU > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s16_elementwise_binary< ArithmeticOperation::SUB > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void neon_s16_select_not_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 56 of file integer.cpp.
void neon_s16_select_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 41 of file integer.cpp.
void neon_s32_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 169 of file integer.cpp.
template void arm_compute::cpu::neon_s32_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void neon_s32_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 32 of file integer.cpp.
template void arm_compute::cpu::neon_s32_elementwise_binary< ArithmeticOperation::ADD > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_elementwise_binary< ArithmeticOperation::DIV > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_elementwise_binary< ArithmeticOperation::MAX > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_elementwise_binary< ArithmeticOperation::MIN > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_elementwise_binary< ArithmeticOperation::POWER > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_elementwise_binary< ArithmeticOperation::PRELU > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_s32_elementwise_binary< ArithmeticOperation::SUB > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void neon_s32_elementwise_unary | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op, | ||
const uint8_t * | lut | ||
) |
Definition at line 32 of file integer.cpp.
References ARM_COMPUTE_UNUSED.
void neon_s32_select_not_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 61 of file integer.cpp.
void neon_s32_select_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 46 of file integer.cpp.
void arm_compute::cpu::neon_s32_to_fp16_cast | ( | const ITensor * | _src, |
ITensor * | _dst, | ||
const ThreadInfo & | tensor, | ||
ConvertPolicy | _policy, | ||
const Window & | window | ||
) |
void neon_s8_select_not_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 51 of file integer.cpp.
void neon_s8_select_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 36 of file integer.cpp.
void arm_compute::cpu::neon_softmax_float | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
float | beta, | ||
const Window & | window | ||
) |
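SIMD vector tag type. (Note: this brief appears to have been picked up from a comment on an internal type alias inside the function body; it does not describe what neon_softmax_float itself does.)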
Definition at line 65 of file impl.h.
References ARM_COMPUTE_UNUSED, arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), ValidRegion::shape, arm_compute::wrapper::vadd(), ITensorInfo::valid_region(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vexpq(), arm_compute::wrapper::vgethigh(), arm_compute::wrapper::vgetlane(), arm_compute::wrapper::vgetlow(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmax(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vpadd(), arm_compute::wrapper::vpmax(), arm_compute::wrapper::vstore(), arm_compute::wrapper::vsub(), and Dimensions< T >::x().
void neon_softmax_quantized | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
float | beta, | ||
const Window & | window | ||
) |
Definition at line 33 of file impl.cpp.
References arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, ValidRegion::shape, QuantizationInfo::uniform(), ITensorInfo::valid_region(), arm_compute::wrapper::vdup_n(), arm_compute::vexpq_f32(), arm_compute::wrapper::vgethigh(), arm_compute::wrapper::vgetlane(), arm_compute::wrapper::vgetlow(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmax(), arm_compute::wrapper::vpmax(), arm_compute::wrapper::vqsub(), arm_compute::wrapper::vstore(), arm_compute::wrapper::vsub(), and Dimensions< T >::x().
template void arm_compute::cpu::neon_softmax_quantized< qasymm8_signed_t, false > | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
float | beta, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_softmax_quantized< qasymm8_signed_t, true > | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
float | beta, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_softmax_quantized< qasymm8_t, false > | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
float | beta, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_softmax_quantized< qasymm8_t, true > | ( | const ITensor * | in, |
void *const | tmp, | ||
ITensor * | out, | ||
float | beta, | ||
const Window & | window | ||
) |
void neon_u16_select_not_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 86 of file integer.cpp.
void neon_u16_select_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 71 of file integer.cpp.
void neon_u32_select_not_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 91 of file integer.cpp.
void neon_u32_select_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 76 of file integer.cpp.
void neon_u8_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 109 of file integer.cpp.
template void arm_compute::cpu::neon_u8_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_u8_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_u8_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_u8_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_u8_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::neon_u8_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void neon_u8_select_not_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 81 of file integer.cpp.
void neon_u8_select_same_rank | ( | const ITensor * | c, |
const ITensor * | x, | ||
const ITensor * | y, | ||
ITensor * | output, | ||
const Window & | window | ||
) |
Definition at line 66 of file integer.cpp.
void arm_compute::cpu::neon_u8_to_fp16_cast | ( | const ITensor * | _src, |
ITensor * | _dst, | ||
const ThreadInfo & | tensor, | ||
ConvertPolicy | _policy, | ||
const Window & | window | ||
) |
|
inline |
Definition at line 71 of file list.h.
References data_layout, arm_compute::test::validation::info, and arm_compute::NCHW.
void arm_compute::cpu::poolingMxN_fp16_neon_nhwc | ( | const ITensor * | src0, |
ITensor * | dst0, | ||
ITensor * | dst1, | ||
PoolingLayerInfo & | , | ||
const Window & | window_src, | ||
const Window & | window | ||
) |
void poolingMxN_fp32_neon_nhwc | ( | const ITensor * | src, |
ITensor * | dst0, | ||
ITensor * | dst1, | ||
PoolingLayerInfo & | pool_info, | ||
const Window & | window_src, | ||
const Window & | window | ||
) |
Definition at line 282 of file fp32.cpp.
References Window::DimX, Window::Dimension::end(), PoolingLayerInfo::exclude_padding, arm_compute::execute_window_loop(), PadStrideInfo::has_padding(), Size2D::height, arm_compute::test::validation::idx_height, arm_compute::test::validation::idx_width, PoolingLayerInfo::is_global_pooling, arm_compute::L2, arm_compute::MAX, arm_compute::NHWC, PadStrideInfo::pad_bottom(), PadStrideInfo::pad_left(), PadStrideInfo::pad_right(), PoolingLayerInfo::pad_stride_info, PadStrideInfo::pad_top(), PoolingLayerInfo::pool_size, PoolingLayerInfo::pool_type, poolingMxN_fp32_neon_nhwc_kernel_indices(), Iterator::ptr(), arm_compute::test::validation::scale, Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), PadStrideInfo::stride(), PoolingLayerInfo::use_inf_as_limit, PoolingLayerInfo::use_kernel_indices, Size2D::width, Window::x(), Window::y(), and Window::z().
void arm_compute::cpu::poolingMxN_fp32_neon_nhwc_kernel_indices | ( | const ITensor * | src, |
ITensor * | dst0, | ||
ITensor * | dst1, | ||
const PoolingLayerInfo & | pool_info, | ||
const Window & | window | ||
) |
Definition at line 163 of file fp32.cpp.
References Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), Size2D::height, arm_compute::test::validation::idx_height, arm_compute::test::validation::idx_width, PoolingLayerInfo::is_global_pooling, PadStrideInfo::pad_left(), PoolingLayerInfo::pad_stride_info, PadStrideInfo::pad_top(), PoolingLayerInfo::pool_size, Iterator::ptr(), Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), PadStrideInfo::stride(), arm_compute::utils::cast::U, PoolingLayerInfo::use_inf_as_limit, Size2D::width, and Window::x().
Referenced by poolingMxN_fp32_neon_nhwc().
void arm_compute::cpu::poolingMxN_q8_neon_nhwc | ( | const ITensor * | src, |
ITensor * | dst0, | ||
ITensor * | dst1, | ||
PoolingLayerInfo & | pool_info, | ||
const Window & | window_src, | ||
const Window & | window | ||
) |
Definition at line 43 of file quantized.h.
References ARM_COMPUTE_UNUSED, Window::DimX, Window::Dimension::end(), PoolingLayerInfo::exclude_padding, arm_compute::execute_window_loop(), Size2D::height, arm_compute::test::validation::idx_height, arm_compute::test::validation::idx_width, ITensor::info(), PoolingLayerInfo::is_global_pooling, arm_compute::MAX, arm_compute::NHWC, UniformQuantizationInfo::offset, PadStrideInfo::pad_bottom(), PadStrideInfo::pad_left(), PadStrideInfo::pad_right(), PoolingLayerInfo::pad_stride_info, PadStrideInfo::pad_top(), PoolingLayerInfo::pool_size, PoolingLayerInfo::pool_type, Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, arm_compute::test::validation::scale, Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), PadStrideInfo::stride(), QuantizationInfo::uniform(), arm_compute::wrapper::vadd(), arm_compute::wrapper::vcombine(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vgethigh(), arm_compute::wrapper::vgetlow(), arm_compute::wrapper::vload(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmax(), arm_compute::wrapper::vmla(), arm_compute::wrapper::vmovl(), arm_compute::wrapper::vmovn(), arm_compute::wrapper::vstore(), Size2D::width, Window::x(), Window::y(), and Window::z().
void poolingMxN_qasymm8_neon_nhwc | ( | const ITensor * | src0, |
ITensor * | dst0, | ||
ITensor * | dst1, | ||
PoolingLayerInfo & | pool_info, | ||
const Window & | window_src, | ||
const Window & | window | ||
) |
Definition at line 37 of file qasymm8.cpp.
References arm_compute::test::validation::src.
void poolingMxN_qasymm8_signed_neon_nhwc | ( | const ITensor * | src0, |
ITensor * | dst0, | ||
ITensor * | dst1, | ||
PoolingLayerInfo & | pool_info, | ||
const Window & | window_src, | ||
const Window & | window | ||
) |
Definition at line 37 of file qasymm8_signed.cpp.
References arm_compute::test::validation::src.
void arm_compute::cpu::poolingMxNxD_fp_neon_ndhwc | ( | const ITensor * | src, |
ITensor * | dst0, | ||
Pooling3dLayerInfo & | pool_info, | ||
const Window & | window | ||
) |
Definition at line 432 of file impl.h.
References ARM_COMPUTE_ERROR, arm_compute::AVG, Window::DimX, Window::Dimension::end(), arm_compute::L2, arm_compute::MAX, Pooling3dLayerInfo::pool_type, Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), and Window::x().
void arm_compute::cpu::poolingMxNxD_q8_neon_ndhwc | ( | const ITensor * | src, |
ITensor * | dst0, | ||
Pooling3dLayerInfo & | pool_info, | ||
const Window & | window | ||
) |
Definition at line 462 of file impl.h.
References ARM_COMPUTE_ERROR, arm_compute::AVG, Window::DimX, arm_compute::MAX, Pooling3dLayerInfo::pool_type, Window::set(), and arm_compute::test::validation::src.
void qasymm8_neon_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 375 of file qasymm8.cpp.
References arm_compute::BILINEAR, arm_compute::test::validation::dst, arm_compute::NEAREST_NEIGHBOR, arm_compute::test::validation::src, and u8_neon_scale().
void qasymm8_signed_neon_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 362 of file qasymm8_signed.cpp.
References arm_compute::BILINEAR, arm_compute::test::validation::dst, arm_compute::NEAREST_NEIGHBOR, arm_compute::REPLICATE, s8_neon_scale(), and arm_compute::test::validation::src.
void qasymm8_signed_sve_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 97 of file qasymm8_signed.cpp.
References ARM_COMPUTE_ERROR, ARM_COMPUTE_UNUSED, arm_compute::test::validation::dst, arm_compute::NEAREST_NEIGHBOR, and arm_compute::test::validation::src.
void qasymm8_sve_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 97 of file qasymm8.cpp.
References ARM_COMPUTE_ERROR, ARM_COMPUTE_UNUSED, arm_compute::test::validation::dst, arm_compute::NEAREST_NEIGHBOR, and arm_compute::test::validation::src.
void arm_compute::cpu::roi_align | ( | const ITensor * | input, |
ITensor * | output, | ||
const ITensor * | rois, | ||
ROIPoolingLayerInfo | pool_info, | ||
const Window & | window, | ||
const ThreadInfo & | info | ||
) |
Definition at line 274 of file impl.h.
References ARM_COMPUTE_UNUSED, ITensor::buffer(), arm_compute::CHANNEL, compute_region_coordinate(), data_layout, arm_compute::test::validation::data_type, arm_compute::dequantize_qasymm16(), ITensorInfo::dimension(), Window::Dimension::end(), arm_compute::get_data_layout_dimension_index(), arm_compute::HEIGHT, arm_compute::test::validation::idx_height, arm_compute::test::validation::idx_width, ITensor::info(), arm_compute::test::validation::info, arm_compute::test::validation::input, arm_compute::is_data_type_quantized_asymmetric(), arm_compute::NCHW, ROIPoolingLayerInfo::pooled_height(), ROIPoolingLayerInfo::pooled_width(), ITensor::ptr_to_element(), ITensorInfo::quantization_info(), ROIPoolingLayerInfo::sampling_ratio(), ROIPoolingLayerInfo::spatial_scale(), Window::Dimension::start(), arm_compute::WIDTH, and Window::x().
|
inline |
Average pooling over an aligned window.
Definition at line 37 of file impl.h.
References data_layout, arm_compute::test::validation::input, and arm_compute::NCHW.
Referenced by arm_compute::test::validation::reference::roi_align_layer().
|
inline |
Average pooling over an aligned window.
Definition at line 115 of file impl.h.
References data_layout, arm_compute::dequantize_qasymm8(), arm_compute::dequantize_qasymm8_signed(), arm_compute::test::validation::input, arm_compute::is_data_type_quantized_asymmetric_signed(), arm_compute::NCHW, UniformQuantizationInfo::offset, arm_compute::quantize_qasymm8(), arm_compute::quantize_qasymm8_signed(), and QuantizationInfo::uniform().
|
inline |
|
inline |
|
inline |
void arm_compute::cpu::run_depthwise_float | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | biases, | ||
ITensor * | dst, | ||
const Window & | window, | ||
bool | has_biases, | ||
const ConvolutionInfo & | info | ||
) |
Definition at line 340 of file impl.h.
References arm_compute::test::validation::conv_info, arm_compute::test::validation::dst, arm_compute::test::validation::info, and arm_compute::test::validation::src.
void run_depthwise_quanitized8bit | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | biases, | ||
ITensor * | dst, | ||
const Window & | window, | ||
bool | has_biases, | ||
const ConvolutionInfo & | info | ||
) |
Definition at line 559 of file impl.cpp.
References arm_compute::quantization::calculate_quantized_multiplier(), channel_idx, arm_compute::test::validation::conv_info, ITensorInfo::data_type(), arm_compute::test::validation::dst, ITensor::info(), arm_compute::test::validation::info, arm_compute::is_data_type_quantized_per_channel(), ITensorInfo::quantization_info(), QuantizationInfo::scale(), and arm_compute::test::validation::src.
template void arm_compute::cpu::run_depthwise_quanitized8bit< int8_t, int8_t > | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | biases, | ||
ITensor * | dst, | ||
const Window & | window, | ||
bool | has_biases, | ||
const ConvolutionInfo & | info | ||
) |
Referenced by neon_qp8_qs8_deptwiseconv2dnative(), and neon_qs8_deptwiseconv2dnative().
template void arm_compute::cpu::run_depthwise_quanitized8bit< uint8_t, int8_t > | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | biases, | ||
ITensor * | dst, | ||
const Window & | window, | ||
bool | has_biases, | ||
const ConvolutionInfo & | info | ||
) |
Referenced by neon_qp8_qu8_deptwiseconv2dnative().
template void arm_compute::cpu::run_depthwise_quanitized8bit< uint8_t, uint8_t > | ( | const ITensor * | src, |
const ITensor * | weights, | ||
const ITensor * | biases, | ||
ITensor * | dst, | ||
const Window & | window, | ||
bool | has_biases, | ||
const ConvolutionInfo & | info | ||
) |
Referenced by neon_qu8_deptwiseconv2dnative().
void s16_in_bounds_crop_window | ( | const ITensor * | input, |
const ITensor * | output, | ||
float * | output_ptr, | ||
Coordinates | input_offset, | ||
int32_t | window_step_x, | ||
int32_t | output_width_start, | ||
int32_t | output_width_limit, | ||
bool | input_has_single_channel, | ||
bool | is_width_flipped | ||
) |
Definition at line 88 of file integer.cpp.
References arm_compute::test::validation::input.
Definition at line 53 of file integer.cpp.
References step.
void s16_neon_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 760 of file integer.cpp.
References arm_compute::BILINEAR, arm_compute::test::validation::dst, arm_compute::NEAREST_NEIGHBOR, and arm_compute::test::validation::src.
void s16_sve_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 172 of file integer.cpp.
References ARM_COMPUTE_ERROR, ARM_COMPUTE_UNUSED, arm_compute::test::validation::dst, arm_compute::NEAREST_NEIGHBOR, and arm_compute::test::validation::src.
void s32_in_bounds_crop_window | ( | const ITensor * | input, |
const ITensor * | output, | ||
float * | output_ptr, | ||
Coordinates | input_offset, | ||
int32_t | window_step_x, | ||
int32_t | output_width_start, | ||
int32_t | output_width_limit, | ||
bool | input_has_single_channel, | ||
bool | is_width_flipped | ||
) |
Definition at line 102 of file integer.cpp.
References arm_compute::test::validation::input.
Definition at line 58 of file integer.cpp.
References step.
void s8_in_bounds_crop_window | ( | const ITensor * | input, |
const ITensor * | output, | ||
float * | output_ptr, | ||
Coordinates | input_offset, | ||
int32_t | window_step_x, | ||
int32_t | output_width_start, | ||
int32_t | output_width_limit, | ||
bool | input_has_single_channel, | ||
bool | is_width_flipped | ||
) |
Definition at line 74 of file integer.cpp.
References arm_compute::test::validation::input.
Definition at line 48 of file integer.cpp.
References step.
void s8_neon_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 714 of file integer.cpp.
References ARM_COMPUTE_ERROR, arm_compute::BILINEAR, arm_compute::test::validation::dst, and arm_compute::test::validation::src.
Referenced by qasymm8_signed_neon_scale().
|
inline |
Definition at line 40 of file impl.cpp.
References arm_compute::test::validation::b.
|
inline |
Definition at line 35 of file impl.cpp.
References arm_compute::test::validation::b.
void arm_compute::cpu::select_op | ( | const ITensor * | cond, |
const ITensor * | in1, | ||
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window, | ||
const int | window_step_x, | ||
const int | window_start_x, | ||
const int | window_end_x, | ||
const int | limit, | ||
VectorType(*)(const uint8_t *) | condition_conversion | ||
) |
Definition at line 41 of file impl.h.
References arm_compute::test::validation::b, arm_compute::mlgo::parser::condition(), Window::DimX, arm_compute::execute_window_loop(), Iterator::ptr(), Window::set(), arm_compute::wrapper::vbsl(), arm_compute::wrapper::vloadq(), and arm_compute::wrapper::vstore().
void arm_compute::cpu::select_op_16 | ( | const ITensor * | cond, |
const ITensor * | in1, | ||
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 106 of file impl.h.
References Window::Dimension::end(), Window::Dimension::start(), arm_compute::wrapper::vcgt(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vload(), arm_compute::wrapper::vmovl(), and Window::x().
void arm_compute::cpu::select_op_32 | ( | const ITensor * | cond, |
const ITensor * | in1, | ||
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 123 of file impl.h.
References Window::Dimension::end(), Window::Dimension::start(), arm_compute::wrapper::vcgt(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vgetlow(), arm_compute::wrapper::vload(), arm_compute::wrapper::vmovl(), and Window::x().
void arm_compute::cpu::select_op_8 | ( | const ITensor * | cond, |
const ITensor * | in1, | ||
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 89 of file impl.h.
References Window::Dimension::end(), Window::Dimension::start(), arm_compute::wrapper::vcgt(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vloadq(), and Window::x().
void arm_compute::cpu::select_op_not_same_rank | ( | const ITensor * | cond, |
const ITensor * | in1, | ||
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 140 of file impl.h.
References ARM_COMPUTE_UNUSED, ITensor::buffer(), ITensorInfo::element_size(), ITensor::info(), offset(), step, ITensorInfo::total_size(), arm_compute::wrapper::vload(), arm_compute::wrapper::vloadq(), and arm_compute::wrapper::vstore().
|
inline |
|
inline |
|
inline |
|
inline |
Definition at line 582 of file impl.h.
Referenced by elementwise_arithm_op_quantized_broadcast_loop(), elementwise_arithm_op_quantized_loop(), elementwise_arithmetic_quantized_op(), elementwise_comp_op_quantized_broadcast_loop(), elementwise_comp_op_quantized_loop(), elementwise_comp_op_quantized_signed_broadcast_loop(), elementwise_comp_op_quantized_signed_loop(), and store_quantized().
|
inline |
|
inline |
|
inline |
Definition at line 608 of file impl.h.
Referenced by elementwise_arithm_op_quantized_signed_broadcast_loop(), elementwise_arithm_op_quantized_singed_loop(), and store_quantized_signed().
bool sub_q8_neon_fixedpoint_possible | ( | const ITensorInfo * | src0, |
const ITensorInfo * | src1, | ||
const ITensorInfo * | dst | ||
) |
Definition at line 35 of file impl.cpp.
References add_sub_q8_neon_fixedpoint_possible(), and arm_compute::test::validation::dst.
Referenced by CpuSubKernel::configure().
void sub_qasymm8_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 39 of file qasymm8.cpp.
References add_sub_qasymm8_neon(), and arm_compute::test::validation::dst.
void sub_qasymm8_neon_fixedpoint | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 33 of file qasymm8.cpp.
References add_sub_q8_neon_fixedpoint< uint8_t >(), and arm_compute::test::validation::dst.
void sub_qasymm8_signed_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 40 of file qasymm8_signed.cpp.
References add_sub_qasymm8_signed_neon(), and arm_compute::test::validation::dst.
void sub_qasymm8_signed_neon_fixedpoint | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 34 of file qasymm8_signed.cpp.
References add_sub_q8_neon_fixedpoint< int8_t >(), and arm_compute::test::validation::dst.
void sub_qsymm16_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
Definition at line 36 of file qsymm16.cpp.
References ARM_COMPUTE_UNUSED, arm_compute::test::validation::b, arm_compute::graph::bfs(), Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::for(), ITensor::info(), Iterator::ptr(), ITensorInfo::quantization_info(), arm_compute::quantize_qsymm16(), UniformQuantizationInfo::scale, Window::set(), Window::Dimension::start(), Window::Dimension::step(), ITensorInfo::tensor_shape(), QuantizationInfo::uniform(), Dimensions< T >::x(), and Window::x().
void arm_compute::cpu::sub_same_neon | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
SIMD vector tag type.
Definition at line 42 of file impl.h.
References Window::broadcast_if_dimension_le_one(), Window::DimX, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), arm_compute::SATURATE, Window::set(), Window::Dimension::start(), Window::Dimension::step(), arm_compute::wrapper::sub_sat(), ITensorInfo::tensor_shape(), arm_compute::wrapper::vdup_n(), arm_compute::wrapper::vloadq(), arm_compute::wrapper::vmul(), arm_compute::wrapper::vqsub(), arm_compute::wrapper::vstore(), arm_compute::wrapper::vsub(), Dimensions< T >::x(), and Window::x().
void arm_compute::cpu::sub_same_neon_fp16 | ( | const ITensor * | src0, |
const ITensor * | src1, | ||
ITensor * | dst, | ||
const ConvertPolicy & | policy, | ||
const Window & | window | ||
) |
void arm_compute::cpu::sve2_q8_activation_lut | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
void sve2_q8_elementwise_unary | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op, | ||
const uint8_t * | lut | ||
) |
Definition at line 33 of file q8.cpp.
References ARM_COMPUTE_UNUSED, Window::Dimension::end(), arm_compute::execute_window_loop(), Iterator::ptr(), and Window::x().
void sve2_qasymm8_activation | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
Definition at line 40 of file qasymm8.cpp.
References arm_compute::test::validation::act_info, ARM_COMPUTE_ERROR, Window::collapse_if_possible(), Window::DimX, Window::DimZ, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::input, UniformQuantizationInfo::offset, Iterator::ptr(), arm_compute::quantize_qasymm8(), arm_compute::round(), UniformQuantizationInfo::scale, Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), arm_compute::TO_NEAREST_EVEN, and Window::x().
void sve2_qasymm8_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 72 of file qasymm8.cpp.
template void arm_compute::cpu::sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void sve2_qasymm8_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 33 of file qasymm8.cpp.
template void arm_compute::cpu::sve2_qasymm8_elementwise_binary< ArithmeticOperation::ADD > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_elementwise_binary< ArithmeticOperation::DIV > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_elementwise_binary< ArithmeticOperation::MAX > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_elementwise_binary< ArithmeticOperation::MIN > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_elementwise_binary< ArithmeticOperation::POWER > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_elementwise_binary< ArithmeticOperation::PRELU > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_elementwise_binary< ArithmeticOperation::SUB > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void sve2_qasymm8_signed_activation | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
Definition at line 40 of file qasymm8_signed.cpp.
References arm_compute::test::validation::act_info, ARM_COMPUTE_ERROR, Window::collapse_if_possible(), Window::DimX, Window::DimZ, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::input, UniformQuantizationInfo::offset, Iterator::ptr(), arm_compute::quantize_qasymm8_signed(), arm_compute::round(), UniformQuantizationInfo::scale, Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), arm_compute::TO_NEAREST_EVEN, and Window::x().
void sve2_qasymm8_signed_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 72 of file qasymm8_signed.cpp.
template void arm_compute::cpu::sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void sve2_qasymm8_signed_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 33 of file qasymm8_signed.cpp.
template void arm_compute::cpu::sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::ADD > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::DIV > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::MAX > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::MIN > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::POWER > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::PRELU > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve2_qasymm8_signed_elementwise_binary< ArithmeticOperation::SUB > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void sve2_qsymm16_activation | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
Definition at line 41 of file qsymm16.cpp.
References arm_compute::test::validation::act_info, ARM_COMPUTE_ERROR, Window::collapse_if_possible(), Window::DimX, Window::DimZ, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::input, Iterator::ptr(), UniformQuantizationInfo::scale, Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), and Window::x().
void sve2_softmax_logits_1d_quantized | ( | const ITensor * | in, |
const ITensor * | max, | ||
void *const | tmp, | ||
ITensor * | out, | ||
float | beta, | ||
bool | is_log, | ||
const Window & | window | ||
) |
TODO: (COMPMID-6505) Similar to Neon(TM), this implementation should be converted to a single kernel that performs the softmax operation.
Leaving the SVE2 code here for future reference. The implementation for Neon(TM) is introduced in COMPMID-6500.
Definition at line 39 of file impl.cpp.
References ValidRegion::anchor, arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), ITensorInfo::quantization_info(), UniformQuantizationInfo::scale, ValidRegion::shape, type, QuantizationInfo::uniform(), ITensorInfo::valid_region(), and Dimensions< T >::x().
void arm_compute::cpu::sve_fp16_activation | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
void arm_compute::cpu::sve_fp16_activation_lut | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
void arm_compute::cpu::sve_fp16_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void arm_compute::cpu::sve_fp16_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void arm_compute::cpu::sve_fp16_elementwise_unary | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op, | ||
const uint8_t * | lut | ||
) |
void sve_fp32_activation | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ActivationLayerInfo & | act_info, | ||
const Window & | window | ||
) |
Definition at line 40 of file fp32.cpp.
References arm_compute::test::validation::act_info, ARM_COMPUTE_ERROR, Window::collapse_if_possible(), Window::DimX, Window::DimZ, arm_compute::test::validation::dst, Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::input, Iterator::ptr(), Window::set(), arm_compute::test::validation::src, Window::Dimension::start(), and Window::x().
template void arm_compute::cpu::sve_fp32_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void sve_fp32_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 33 of file fp32.cpp.
References elementwise_arithmetic_op< float32_t >().
template void arm_compute::cpu::sve_fp32_elementwise_binary< ArithmeticOperation::ADD > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_elementwise_binary< ArithmeticOperation::DIV > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_elementwise_binary< ArithmeticOperation::MAX > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_elementwise_binary< ArithmeticOperation::MIN > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_elementwise_binary< ArithmeticOperation::POWER > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_elementwise_binary< ArithmeticOperation::PRELU > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_fp32_elementwise_binary< ArithmeticOperation::SUB > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void sve_fp32_elementwise_unary | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op, | ||
const uint8_t * | lut | ||
) |
Definition at line 34 of file fp32.cpp.
References ARM_COMPUTE_UNUSED, and elementwise_sve_op< float32_t >().
TODO: (COMPMID-6505) Similar to Neon(TM), this implementation should be converted to a single kernel that performs the softmax operation.
Leaving the SVE code here for future reference. The implementation for Neon(TM) is introduced in COMPMID-6500.
Definition at line 37 of file impl.cpp.
References Window::DimX, Window::Dimension::end(), arm_compute::execute_window_loop(), arm_compute::test::validation::input, Iterator::ptr(), Window::set(), Window::Dimension::start(), and Window::x().
void sve_s16_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 139 of file integer.cpp.
References elementwise_comparison_op< int16_t >().
template void arm_compute::cpu::sve_s16_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void sve_s16_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 71 of file integer.cpp.
References elementwise_arithmetic_op< int16_t >().
template void arm_compute::cpu::sve_s16_elementwise_binary< ArithmeticOperation::ADD > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_elementwise_binary< ArithmeticOperation::DIV > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_elementwise_binary< ArithmeticOperation::MAX > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_elementwise_binary< ArithmeticOperation::MIN > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_elementwise_binary< ArithmeticOperation::POWER > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_elementwise_binary< ArithmeticOperation::PRELU > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s16_elementwise_binary< ArithmeticOperation::SUB > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void sve_s32_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 169 of file integer.cpp.
References elementwise_comparison_op< int32_t >().
template void arm_compute::cpu::sve_s32_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void sve_s32_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 33 of file integer.cpp.
References elementwise_arithmetic_op< int32_t >().
template void arm_compute::cpu::sve_s32_elementwise_binary< ArithmeticOperation::ADD > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_elementwise_binary< ArithmeticOperation::DIV > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_elementwise_binary< ArithmeticOperation::MAX > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_elementwise_binary< ArithmeticOperation::MIN > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_elementwise_binary< ArithmeticOperation::POWER > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_elementwise_binary< ArithmeticOperation::PRELU > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_elementwise_binary< ArithmeticOperation::SQUARED_DIFF > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_s32_elementwise_binary< ArithmeticOperation::SUB > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void sve_s32_elementwise_unary | ( | const ITensor * | in, |
ITensor * | out, | ||
const Window & | window, | ||
ElementWiseUnary | op, | ||
const uint8_t * | lut | ||
) |
Definition at line 33 of file integer.cpp.
References ARM_COMPUTE_UNUSED, and elementwise_sve_op< int32_t >().
void sve_softmax_logits_1d_float | ( | const ITensor * | in, |
const ITensor * | max, | ||
void *const | tmp, | ||
ITensor * | out, | ||
const float | beta, | ||
bool | is_log, | ||
const Window & | window | ||
) |
Definition at line 78 of file impl.cpp.
References ValidRegion::anchor, arm_compute::execute_window_loop(), ITensor::info(), Iterator::ptr(), ValidRegion::shape, ITensorInfo::valid_region(), and Dimensions< T >::x().
void sve_u8_comparison_elementwise_binary | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
Definition at line 109 of file integer.cpp.
References elementwise_comparison_op< uint8_t >().
template void arm_compute::cpu::sve_u8_comparison_elementwise_binary< ComparisonOperation::Equal > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_u8_comparison_elementwise_binary< ComparisonOperation::Greater > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_u8_comparison_elementwise_binary< ComparisonOperation::GreaterEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_u8_comparison_elementwise_binary< ComparisonOperation::Less > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_u8_comparison_elementwise_binary< ComparisonOperation::LessEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
template void arm_compute::cpu::sve_u8_comparison_elementwise_binary< ComparisonOperation::NotEqual > | ( | const ITensor * | in1, |
const ITensor * | in2, | ||
ITensor * | out, | ||
const Window & | window | ||
) |
void u16_in_bounds_crop_window | ( | const ITensor * | input, |
const ITensor * | output, | ||
float * | output_ptr, | ||
Coordinates | input_offset, | ||
int32_t | window_step_x, | ||
int32_t | output_width_start, | ||
int32_t | output_width_limit, | ||
bool | input_has_single_channel, | ||
bool | is_width_flipped | ||
) |
Definition at line 46 of file integer.cpp.
References arm_compute::test::validation::input.
Definition at line 38 of file integer.cpp.
References step.
void u32_in_bounds_crop_window | ( | const ITensor * | input, |
const ITensor * | output, | ||
float * | output_ptr, | ||
Coordinates | input_offset, | ||
int32_t | window_step_x, | ||
int32_t | output_width_start, | ||
int32_t | output_width_limit, | ||
bool | input_has_single_channel, | ||
bool | is_width_flipped | ||
) |
Definition at line 60 of file integer.cpp.
References arm_compute::test::validation::input.
Definition at line 43 of file integer.cpp.
References step.
void u8_in_bounds_crop_window | ( | const ITensor * | input, |
const ITensor * | output, | ||
float * | output_ptr, | ||
Coordinates | input_offset, | ||
int32_t | window_step_x, | ||
int32_t | output_width_start, | ||
int32_t | output_width_limit, | ||
bool | input_has_single_channel, | ||
bool | is_width_flipped | ||
) |
Definition at line 32 of file integer.cpp.
References arm_compute::test::validation::input.
Definition at line 33 of file integer.cpp.
References step.
void u8_neon_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 737 of file integer.cpp.
References arm_compute::BILINEAR, arm_compute::test::validation::dst, arm_compute::NEAREST_NEIGHBOR, and arm_compute::test::validation::src.
Referenced by qasymm8_neon_scale().
void u8_sve_scale | ( | const ITensor * | src, |
ITensor * | dst, | ||
const ITensor * | offsets, | ||
const ITensor * | dx, | ||
const ITensor * | dy, | ||
InterpolationPolicy | policy, | ||
BorderMode | border_mode, | ||
PixelValue | constant_border_value, | ||
float | sampling_offset, | ||
bool | align_corners, | ||
const Window & | window | ||
) |
Definition at line 149 of file integer.cpp.
References ARM_COMPUTE_ERROR, ARM_COMPUTE_UNUSED, arm_compute::test::validation::dst, arm_compute::NEAREST_NEIGHBOR, and arm_compute::test::validation::src.
InputType vector_float_norm | ( | const InputType & | inputs, |
const AccType & | vec_mean, | ||
const AccType & | vec_multip, | ||
const AccType & | vec_beta | ||
) |
Definition at line 43 of file impl.cpp.
References arm_compute::wrapper::vadd(), arm_compute::wrapper::vmul(), and arm_compute::wrapper::vsub().
Referenced by instance_normalization_nchw().
void vector_float_sum | ( | AccType & | result, |
AccType & | result_square, | ||
const InputType & | inputs | ||
) |
Definition at line 35 of file impl.cpp.
References arm_compute::wrapper::vadd(), and arm_compute::wrapper::vmul().
Referenced by instance_normalization_nchw().
void vector_matrix_multiply_f32 | ( | const ITensor * | lhs, |
const ITensor * | rhs, | ||
ITensor * | dst, | ||
const Window & | window, | ||
const ThreadInfo & | info, | ||
float | alpha | ||
) |
Definition at line 35 of file impl.cpp.
References arm_compute::ceil_to_multiple(), arm_compute::data_size_from_type(), ITensorInfo::data_type(), ITensorInfo::dimension(), Window::DimX, Window::DimY, arm_compute::test::validation::dst, arm_compute::execute_window_loop(), ITensor::info(), arm_compute::test::validation::info, arm_compute::helpers::float_ops::is_one(), ITensorInfo::num_dimensions(), Iterator::ptr(), Window::set(), and ITensorInfo::strides_in_bytes().
Referenced by neon_fp32_gemm_matrix_mul().
const size_t channel_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::CHANNEL) |
Definition at line 39 of file impl.h.
Referenced by arm_compute::test::colorconvert_helper::detail::colorconvert_rgb_to_rgbx(), arm_compute::test::colorconvert_helper::detail::colorconvert_rgbx_to_rgb(), arm_compute::misc::shape_calculator::compute_col2im_shape(), arm_compute::misc::shape_calculator::compute_deconvolution_output_shape(), arm_compute::misc::shape_calculator::compute_depthwise_convolution_shape(), arm_compute::misc::shape_calculator::compute_im2col_conv_shape(), arm_compute::test::colorconvert_helper::detail::compute_rgb_value(), ClTransposedConvolutionKernel::configure(), CpuConvertFullyConnectedWeightsKernel::configure(), ClConvertFullyConnectedWeightsKernel::configure(), ClIndirectConv2dKernel::configure(), CLNormalizePlanarYUVLayerKernel::configure(), ClDirectConv2dKernel::configure(), CpuIm2ColKernel::configure(), CLComputeMeanVariance::configure(), arm_compute::test::validation::reference::convert_fully_connected_weights(), ClTemplateDirectConv2d::get_build_options(), ClTemplateDirectConv2d::get_component_code(), ClTemplatePool2d::get_config_id(), arm_compute::get_normalization_dimension_index(), ClTemplateDirectConv2d::get_tag_lut(), CpuWinogradConv2d::prepare(), NESpaceToDepthLayerKernel::run(), run_depthwise_quanitized8bit(), arm_compute::cpu::kernels::run_im2col(), ClComponentDirectConv2d::validate(), ClComponentDepthwiseConv2d::validate(), NEDeconvolutionLayer::validate(), arm_compute::cpu::kernels::validate_arguments(), GpuCkwDirectConv2d::write_component_code(), and arm_compute::test::colorconvert_helper::detail::yuyv_to_rgb_calculation().
data_layout |
constexpr |
Definition at line 36 of file impl.h.
Referenced by arm_compute::calculate_same_pad(), arm_compute::calculate_valid_region_scale(), arm_compute::cl_winograd_convolution_layer_supported(), arm_compute::misc::shape_calculator::compute_col2im_shape(), arm_compute::misc::shape_calculator::compute_deconvolution_output_shape(), arm_compute::misc::shape_calculator::compute_deconvolution_padding(), arm_compute::misc::shape_calculator::compute_deconvolution_upsampled_shape(), arm_compute::misc::shape_calculator::compute_depth_to_space_shape(), arm_compute::misc::shape_calculator::compute_depthwise_convolution_shape(), arm_compute::misc::shape_calculator::compute_im2col_conv_shape(), DepthToSpaceLayerNode::compute_output_descriptor(), PoolingLayerNode::compute_output_descriptor(), ReorgLayerNode::compute_output_descriptor(), DeconvolutionLayerNode::compute_output_descriptor(), FusedConvolutionBatchNormalizationNode::compute_output_descriptor(), DepthwiseConvolutionLayerNode::compute_output_descriptor(), ConvolutionLayerNode::compute_output_descriptor(), arm_compute::misc::shape_calculator::compute_pool3d_shape(), arm_compute::misc::shape_calculator::compute_prior_box_shape(), arm_compute::misc::shape_calculator::compute_space_to_batch_shape(), arm_compute::misc::shape_calculator::compute_space_to_depth_shape(), arm_compute::misc::shape_calculator::compute_upsample_shape(), arm_compute::misc::shape_calculator::compute_vector_to_tensor_output_shape(), arm_compute::misc::shape_calculator::compute_winograd_output_transform_shape(), CpuConvertFullyConnectedWeights::configure(), ClConvertFullyConnectedWeights::configure(), CpuConvertFullyConnectedWeightsKernel::configure(), CpuPool2dKernel::configure(), ClConvertFullyConnectedWeightsKernel::configure(), CpuPool3dKernel::configure(), CLChannelShuffleLayerKernel::configure(), CLNormalizationLayerKernel::configure(), CLSpaceToBatchLayerKernel::configure(), NEConvertFullyConnectedWeights::configure(), CLNormalizePlanarYUVLayerKernel::configure(), 
CLConvertFullyConnectedWeights::configure(), NEScale::configure(), CLPriorBoxLayerKernel::configure(), NEInstanceNormalizationLayer::configure(), CLDeconvolutionReshapeOutputKernel::configure(), CpuGemmConv2d::configure(), ClGemmConv2d::configure(), CLComputeMeanVariance::configure(), NEDeconvolutionLayer::configure(), CLDirectDeconvolutionLayer::configure(), CLConvertFullyConnectedWeightsManaged::configure(), ResizeLayerNode::configure_output(), arm_compute::experimental::dynamic_fusion::convert_pool_attr_to_pool_info(), arm_compute::graph::backends::detail::create_concatenate_layer(), arm_compute::test::create_tensor(), IImageLoader::fill_planar_tensor(), ClTemplateDirectConv2d::get_config_id(), ClTemplatePool2d::get_config_id(), ClConv2d::get_convolution_method(), arm_compute::get_data_layout_dimension_index(), CLDeconvolutionLayer::get_deconvolution_method(), arm_compute::graph::get_dimension_idx(), arm_compute::get_index_data_layout_dimension(), arm_compute::graph_utils::get_npy_output_accessor(), CpuGemmConv2d::has_opt_impl(), arm_compute::cpu::kernels::internal_run_im2col_fp16_nchw_nopad(), arm_compute::cpu::kernels::internal_run_im2col_fp16_nchw_pad(), arm_compute::cpu::kernels::internal_run_im2col_fp16_nopad(), arm_compute::cpu::kernels::internal_run_im2col_fp16_pad(), arm_compute::scale_utils::is_precomputation_required(), NumPyAccessor::NumPyAccessor(), offset_no_padding(), arm_compute::operator<<(), arm_compute::operator>>(), roi_align(), roi_align_1x1(), roi_align_1x1_qasymm8(), CPPUpsampleKernel::run(), NEReorgLayerKernel::run(), NEROIAlignLayerKernel::run(), arm_compute::cpu::kernels::run_im2col(), arm_compute::cpu::kernels::run_im2col_fp16_nchw_nopad(), arm_compute::cpu::kernels::run_im2col_fp16_nchw_pad(), arm_compute::cpu::kernels::run_im2col_fp16_nopad(), arm_compute::cpu::kernels::run_im2col_fp16_pad(), arm_compute::cpu::kernels::run_im2col_fp32_nchw_nopad(), arm_compute::cpu::kernels::run_im2col_fp32_nchw_pad(), 
arm_compute::cpu::kernels::run_im2col_fp32_nopad(), arm_compute::cpu::kernels::run_im2col_fp32_pad(), arm_compute::cpu::kernels::run_im2col_int8_nopad_nhwc(), arm_compute::cpu::kernels::run_im2col_qasymm8_nchw_nopad(), arm_compute::cpu::kernels::run_im2col_qasymm8_nchw_pad(), arm_compute::cpu::kernels::run_im2col_qasymm8_nopad(), arm_compute::cpu::kernels::run_im2col_qasymm8_pad(), arm_compute::cpu::kernels::run_im2col_qasymm8_pad_nhwc(), arm_compute::cpu::kernels::run_im2col_uint8_nopad_nhwc(), arm_compute::set_data_layout_if_unknown(), TensorDescriptor::set_layout(), arm_compute::test::validation::TEST_CASE(), arm_compute::to_string(), CpuConvertFullyConnectedWeights::validate(), ClConvertFullyConnectedWeights::validate(), CpuScale::validate(), CpuPool2dKernel::validate(), CpuConvertFullyConnectedWeightsKernel::validate(), ClConvertFullyConnectedWeightsKernel::validate(), CLDeconvolutionLayerUpsampleKernel::validate(), NEConvertFullyConnectedWeights::validate(), CLConvertFullyConnectedWeights::validate(), ClComponentDirectConv2d::validate(), ClGemmConv2d::validate(), CpuGemmConv2d::validate(), ClComponentDepthwiseConv2d::validate(), CLGEMMDeconvolutionLayer::validate(), CLDirectDeconvolutionLayer::validate(), and arm_compute::cpu::kernels::validate_arguments().
|
constexpr |
Definition at line 41 of file impl.h.
Referenced by depthwise_loop_generic_fp(), and depthwise_loop_multiplier1_fp().
|
constexpr |
Definition at line 42 of file impl.h.
Referenced by depthwise_loop_multiplier1_fp().
const size_t height_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::HEIGHT) |
Definition at line 38 of file impl.h.
Referenced by arm_compute::calculate_same_pad(), arm_compute::misc::shape_calculator::compute_col2im_shape(), arm_compute::misc::shape_calculator::compute_deconvolution_output_shape(), arm_compute::misc::shape_calculator::compute_depthwise_convolution_shape(), arm_compute::misc::shape_calculator::compute_im2col_conv_shape(), ClTransposedConvolutionKernel::configure(), CpuConvertFullyConnectedWeightsKernel::configure(), ClConvertFullyConnectedWeightsKernel::configure(), ClIndirectConv2dAddressPrecalculationKernel::configure(), ClIndirectConv2dKernel::configure(), ClDirectConv2dKernel::configure(), CLPriorBoxLayerKernel::configure(), ClIm2ColKernel::configure(), CpuIm2ColKernel::configure(), NEDeconvolutionLayer::configure(), ResizeLayerNode::configure_output(), arm_compute::test::validation::reference::convert_fully_connected_weights(), ClTemplateDepthwiseConv2d::get_component_code(), ClTemplateDirectConv2d::get_config_id(), ClTemplatePool2d::get_config_id(), ClTemplateDepthwiseConv2d::get_tag_lut(), ClTemplateDirectConv2d::get_tag_lut(), ClTemplatePool2d::get_tag_lut(), CpuWinogradConv2d::prepare(), NESpaceToBatchLayerKernel::run(), arm_compute::cpu::kernels::run_im2col(), CpuWinogradConv2dTransformInputKernel::run_op(), CpuWinogradConv2dTransformOutputKernel::run_op(), NEDeconvolutionLayer::validate(), arm_compute::cpu::kernels::validate_arguments(), GpuCkwPool2d::write_component_code(), GpuCkwDepthwiseConv2d::write_component_code(), and GpuCkwDirectConv2d::write_component_code().
step |
constexpr |
Definition at line 35 of file fp32.cpp.
Referenced by arm_compute::adjust_down(), arm_compute::adjust_up(), Window::collapse_if_possible(), CLRangeKernel::configure(), NERangeKernel::configure(), CLRange::configure(), NERange::configure(), arm_compute::convert_window_coord_to_position(), arm_compute::enqueue(), arm_compute::error_on_invalid_subwindow(), arm_compute::error_on_mismatching_windows(), arm_compute::error_on_window_dimensions_gte(), arm_compute::execute_window_loop(), fp32_neon_floor(), fp32_neon_range_function(), arm_compute::experimental::dynamic_fusion::get_coordinate_from_gws(), arm_compute::experimental::dynamic_fusion::get_coordinate_from_gws_overlapping_min(), Dimensions< size_t >::increment(), arm_compute::test::framework::dataset::make(), neon_range_function(), arm_compute::num_of_elements_in_range(), arm_compute::test::validation::reference::range(), NEDepthToSpaceLayerKernel::run(), s16_neon_range_function(), s32_neon_range_function(), s8_neon_range_function(), select_op_not_same_rank(), Window::set_dimension_step(), WindowIterator< L >::set_step(), Window::shape(), TensorShape::shift_right(), Window::split_window(), u16_neon_range_function(), u32_neon_range_function(), u8_neon_range_function(), NERangeKernel::validate(), CLRangeKernel::validate(), CLRange::validate(), NERange::validate(), and Window::validate().
|
constexpr |
Definition at line 43 of file impl.h.
Referenced by CLArgMinMaxLayerKernel::configure(), CpuGemmTranspose1xWKernel::configure(), arm_compute::create_lws_hint_parallel_implementations(), depthwise_loop_multiplier1_fp(), ClTemplateLogits1DMaxShiftExpSum::get_build_options(), ClTemplateLogits1DMaxShiftExpSum::get_component_code(), ClTemplateLogits1DNorm::get_window(), CpuGemmTranspose1xWKernel::run_op(), and arm_compute::test::validation::TEST_CASE().
const size_t width_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::WIDTH) |
Definition at line 37 of file impl.h.
Referenced by arm_compute::calculate_same_pad(), arm_compute::misc::shape_calculator::compute_col2im_shape(), arm_compute::misc::shape_calculator::compute_deconvolution_output_shape(), arm_compute::misc::shape_calculator::compute_depthwise_convolution_shape(), arm_compute::misc::shape_calculator::compute_im2col_conv_shape(), ClTransposedConvolutionKernel::configure(), CpuConvertFullyConnectedWeightsKernel::configure(), ClConvertFullyConnectedWeightsKernel::configure(), ClIndirectConv2dAddressPrecalculationKernel::configure(), ClIndirectConv2dKernel::configure(), ClDirectConv2dKernel::configure(), CLPriorBoxLayerKernel::configure(), ClIm2ColKernel::configure(), CpuIm2ColKernel::configure(), NEDeconvolutionLayer::configure(), ResizeLayerNode::configure_output(), arm_compute::test::validation::reference::convert_fully_connected_weights(), ClTemplateDepthwiseConv2d::get_build_options(), ClTemplateDirectConv2d::get_config_id(), ClTemplatePool2d::get_config_id(), arm_compute::get_normalization_dimension_index(), ClTemplateDepthwiseConv2d::get_tag_lut(), ClTemplateDirectConv2d::get_tag_lut(), ClTemplatePool2d::get_tag_lut(), arm_compute::test::validation::reference::indirect_conv2d_addr_precalculation(), CpuWinogradConv2d::prepare(), NESpaceToBatchLayerKernel::run(), arm_compute::cpu::kernels::run_im2col(), CpuWinogradConv2dTransformInputKernel::run_op(), CpuWinogradConv2dTransformOutputKernel::run_op(), NEDeconvolutionLayer::validate(), arm_compute::cpu::kernels::validate_arguments(), GpuCkwPool2d::write_component_code(), GpuCkwDepthwiseConv2d::write_component_code(), and GpuCkwDirectConv2d::write_component_code().