23.11
|
Namespaces | |
depthfirst_multiplier | |
depthwise_depthfirst | |
interleaves | |
Functions | |
std::tuple< size_t, size_t, size_t, size_t, size_t > | get_reduced_view_for_dilation (size_t out_size, size_t in_size, const size_t d, const size_t dilation_factor, const size_t kernel_size, const size_t stride, const size_t orig_pad_before) |
template<> | |
const DepthwiseImplementation< float > * | depthwise_implementation_list () |
template UniqueDepthwiseCommon< float > | depthwise (const DepthwiseArgs &, const Nothing &) |
template std::vector< KernelDescription > | get_compatible_kernels< float > (const DepthwiseArgs &, const Nothing &) |
template<typename TInput , typename TWeight = TInput, typename TOutput = TInput, class OutputStage = Nothing> | |
bool | find_implementation (const DepthwiseArgs &args, const OutputStage &os, const DepthwiseImplementation< TInput, TWeight, TOutput, OutputStage > *&selected) |
template<typename TInput , typename TWeight , typename TOutput , class OutputStage > | |
std::vector< KernelDescription > | get_compatible_kernels (const DepthwiseArgs &args, const OutputStage &os) |
template<typename TInput , typename TWeight , typename TOutput , class OutputStage > | |
UniqueDepthwiseCommon< TInput, TWeight, TOutput > | depthwise (const DepthwiseArgs &args, const OutputStage &os) |
template UniqueDepthwiseCommon< int8_t, int8_t, int8_t > | depthwise (const DepthwiseArgs &, const Requantize32 &) |
template std::vector< KernelDescription > | get_compatible_kernels< int8_t, int8_t, int8_t, Requantize32 > (const DepthwiseArgs &, const Requantize32 &) |
template std::vector< KernelDescription > | get_compatible_kernels< uint8_t, uint8_t, uint8_t, Requantize32 > (const DepthwiseArgs &, const Requantize32 &) |
template std::vector< KernelDescription > | get_compatible_kernels< uint8_t, int8_t, uint8_t, Requantize32 > (const DepthwiseArgs &, const Requantize32 &) |
void | sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst_indirect_impl (const __fp16 *const *const input_ptrs, __fp16 *const *const outptrs, const void *params, unsigned int n_channels, const __fp16 activation_min, const __fp16 activation_max) |
void | sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst_direct_impl (const unsigned int n_tile_rows, const unsigned int n_tile_cols, const __fp16 *inptr, int64_t ld_input_row, int64_t ld_input_col, __fp16 *outptr, int64_t ld_output_row, int64_t ld_output_col, const void *params, unsigned int n_channels, const __fp16 activation_min, const __fp16 activation_max) |
void | sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst_indirect_impl (const __fp16 *const *const input_ptrs, __fp16 *const *const outptrs, const void *params, unsigned int n_channels, const __fp16 activation_min, const __fp16 activation_max) |
void | sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst_direct_impl (const unsigned int n_tile_rows, const unsigned int n_tile_cols, const __fp16 *inptr, int64_t ld_input_row, int64_t ld_input_col, __fp16 *outptr, int64_t ld_output_row, int64_t ld_output_col, const void *params, unsigned int n_channels, const __fp16 activation_min, const __fp16 activation_max) |
void | sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst_indirect_impl (const __fp16 *const *const input_ptrs, __fp16 *const *const outptrs, const void *params, unsigned int n_channels, const __fp16 activation_min, const __fp16 activation_max) |
void | sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst_direct_impl (const unsigned int n_tile_rows, const unsigned int n_tile_cols, const __fp16 *inptr, int64_t ld_input_row, int64_t ld_input_col, __fp16 *outptr, int64_t ld_output_row, int64_t ld_output_col, const void *params, unsigned int n_channels, const __fp16 activation_min, const __fp16 activation_max) |
void | sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst_indirect_impl (const __fp16 *const *const input_ptrs, __fp16 *const *const outptrs, const void *params, unsigned int n_channels, const __fp16 activation_min, const __fp16 activation_max) |
void | sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst_direct_impl (const unsigned int n_tile_rows, const unsigned int n_tile_cols, const __fp16 *inptr, int64_t ld_input_row, int64_t ld_input_col, __fp16 *outptr, int64_t ld_output_row, int64_t ld_output_col, const void *params, unsigned int n_channels, const __fp16 activation_min, const __fp16 activation_max) |
void | sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst_indirect_impl (const __fp16 *const *const input_ptrs, __fp16 *const *const outptrs, const void *params, unsigned int n_channels, const __fp16 activation_min, const __fp16 activation_max) |
void | sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst_direct_impl (const unsigned int n_tile_rows, const unsigned int n_tile_cols, const __fp16 *inptr, int64_t ld_input_row, int64_t ld_input_col, __fp16 *outptr, int64_t ld_output_row, int64_t ld_output_col, const void *params, unsigned int n_channels, const __fp16 activation_min, const __fp16 activation_max) |
void | sme2_fp32_planar_3x3_s1_4rows_mla_za_impl (const float *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const float *weights, const float *bias, float **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, float act_min, float act_max) |
void | sme2_fp32_planar_3x3_s2_4rows_mla_za_impl (const float *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const float *weights, const float *bias, float **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, float act_min, float act_max) |
void | sme2_fp32_planar_5x5_s1_4rows_mla_za_impl (const float *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const float *weights, const float *bias, float **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, float act_min, float act_max) |
void | sme2_fp32_planar_5x5_s2_4rows_mla_za_impl (const float *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const float *weights, const float *bias, float **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, float act_min, float act_max) |
void | sme2_fp32bf16fp32_planar_3x3_s1_4rows_dot_za_impl (const float *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const float *weights, const float *bias, float **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, float act_min, float act_max) |
void | sme2_fp32bf16fp32_planar_3x3_s2_4rows_dot_za_impl (const float *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const float *weights, const float *bias, float **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, float act_min, float act_max) |
void | sme2_fp32bf16fp32_planar_5x5_s1_4rows_dot_za_impl (const float *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const float *weights, const float *bias, float **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, float act_min, float act_max) |
void | sme2_fp32bf16fp32_planar_5x5_s2_4rows_dot_za_impl (const float *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const float *weights, const float *bias, float **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, float act_min, float act_max) |
void | sme2_s8q_planar_3x3_s1_4rows_dot_za_impl (const int8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const int8_t *weights, int8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
void | sme2_s8q_planar_3x3_s2_4rows_dot_za_impl (const int8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const int8_t *weights, int8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
void | sme2_s8q_planar_5x5_s1_4rows_dot_za_impl (const int8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const int8_t *weights, int8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
void | sme2_s8q_planar_5x5_s2_4rows_dot_za_impl (const int8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const int8_t *weights, int8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
void | sme2_u8q_planar_3x3_s1_4rows_dot_za_impl (const uint8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const uint8_t *weights, uint8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
void | sme2_u8q_planar_3x3_s2_4rows_dot_za_impl (const uint8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const uint8_t *weights, uint8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
void | sme2_u8q_planar_5x5_s1_4rows_dot_za_impl (const uint8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const uint8_t *weights, uint8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
void | sme2_u8q_planar_5x5_s2_4rows_dot_za_impl (const uint8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const uint8_t *weights, uint8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
void | sme2_u8s8u8q_planar_3x3_s1_4rows_dot_za_impl (const uint8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const int8_t *weights, uint8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
void | sme2_u8s8u8q_planar_3x3_s2_4rows_dot_za_impl (const uint8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const int8_t *weights, uint8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
void | sme2_u8s8u8q_planar_5x5_s1_4rows_dot_za_impl (const uint8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const int8_t *weights, uint8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
void | sme2_u8s8u8q_planar_5x5_s2_4rows_dot_za_impl (const uint8_t *inptr, size_t ld_in_row, size_t ld_in_col, size_t ld_in_vl, unsigned int pad_top, unsigned int valid_input_rows, unsigned int pad_left, unsigned int valid_input_cols, const int8_t *weights, uint8_t **outptrs, const size_t *outlds, const size_t *outvllds, unsigned int output_cols, unsigned int start_channel, unsigned int valid_channels, const arm_gemm::Requantize32 &qp) |
template UniqueDepthwiseCommon<float> arm_conv::depthwise::depthwise | ( | const DepthwiseArgs & | , |
const Nothing & | |||
) |
template UniqueDepthwiseCommon< uint8_t, int8_t, uint8_t > arm_conv::depthwise::depthwise | ( | const DepthwiseArgs & | , |
const Requantize32 & | |||
) |
UniqueDepthwiseCommon<TInput, TWeight, TOutput> arm_conv::depthwise::depthwise | ( | const DepthwiseArgs & | args, |
const OutputStage & | os | ||
) |
Definition at line 140 of file depthwise_implementation.hpp.
References GemmTuner::args and DepthwiseImplementation< TInput, TWeight, TOutput, OutputStage >::get_instance().
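template<> const DepthwiseImplementation< float > * arm_conv::depthwise::depthwise_implementation_list | ( | ) |
related |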
Definition at line 530 of file depthwise_fp32.cpp.
bool arm_conv::depthwise::find_implementation | ( | const DepthwiseArgs & | args, |
const OutputStage & | os, | ||
const DepthwiseImplementation< TInput, TWeight, TOutput, OutputStage > *& | selected | ||
) |
std::vector<KernelDescription> arm_conv::depthwise::get_compatible_kernels | ( | const DepthwiseArgs & | args, |
const OutputStage & | os | ||
) |
Definition at line 114 of file depthwise_implementation.hpp.
References GemmTuner::args and DepthwiseImplementation< TInput, TWeight, TOutput, OutputStage >::get_cycle_estimate().
template std::vector<KernelDescription> arm_conv::depthwise::get_compatible_kernels< float > | ( | const DepthwiseArgs & | , |
const Nothing & | |||
) |
template std::vector<KernelDescription> arm_conv::depthwise::get_compatible_kernels< int8_t, int8_t, int8_t, Requantize32 > | ( | const DepthwiseArgs & | , |
const Requantize32 & | |||
) |
template std::vector<KernelDescription> arm_conv::depthwise::get_compatible_kernels< uint8_t, int8_t, uint8_t, Requantize32 > | ( | const DepthwiseArgs & | , |
const Requantize32 & | |||
) |
template std::vector<KernelDescription> arm_conv::depthwise::get_compatible_kernels< uint8_t, uint8_t, uint8_t, Requantize32 > | ( | const DepthwiseArgs & | , |
const Requantize32 & | |||
) |
std::tuple<size_t, size_t, size_t, size_t, size_t> arm_conv::depthwise::get_reduced_view_for_dilation | ( | size_t | out_size, |
size_t | in_size, | ||
const size_t | d, | ||
const size_t | dilation_factor, | ||
const size_t | kernel_size, | ||
const size_t | stride, | ||
const size_t | orig_pad_before | ||
) |
void arm_conv::depthwise::sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst_direct_impl | ( | const unsigned int | n_tile_rows, |
const unsigned int | n_tile_cols, | ||
const __fp16 * | inptr, | ||
int64_t | ld_input_row, | ||
int64_t | ld_input_col, | ||
__fp16 * | outptr, | ||
int64_t | ld_output_row, | ||
int64_t | ld_output_col, | ||
const void * | params, | ||
unsigned int | n_channels, | ||
const __fp16 | activation_min, | ||
const __fp16 | activation_max | ||
) |
void arm_conv::depthwise::sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst_indirect_impl | ( | const __fp16 *const *const | input_ptrs, |
__fp16 *const *const | outptrs, | ||
const void * | params, | ||
unsigned int | n_channels, | ||
const __fp16 | activation_min, | ||
const __fp16 | activation_max | ||
) |
void arm_conv::depthwise::sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst_direct_impl | ( | const unsigned int | n_tile_rows, |
const unsigned int | n_tile_cols, | ||
const __fp16 * | inptr, | ||
int64_t | ld_input_row, | ||
int64_t | ld_input_col, | ||
__fp16 * | outptr, | ||
int64_t | ld_output_row, | ||
int64_t | ld_output_col, | ||
const void * | params, | ||
unsigned int | n_channels, | ||
const __fp16 | activation_min, | ||
const __fp16 | activation_max | ||
) |
void arm_conv::depthwise::sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst_indirect_impl | ( | const __fp16 *const *const | input_ptrs, |
__fp16 *const *const | outptrs, | ||
const void * | params, | ||
unsigned int | n_channels, | ||
const __fp16 | activation_min, | ||
const __fp16 | activation_max | ||
) |
void arm_conv::depthwise::sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst_direct_impl | ( | const unsigned int | n_tile_rows, |
const unsigned int | n_tile_cols, | ||
const __fp16 * | inptr, | ||
int64_t | ld_input_row, | ||
int64_t | ld_input_col, | ||
__fp16 * | outptr, | ||
int64_t | ld_output_row, | ||
int64_t | ld_output_col, | ||
const void * | params, | ||
unsigned int | n_channels, | ||
const __fp16 | activation_min, | ||
const __fp16 | activation_max | ||
) |
void arm_conv::depthwise::sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst_indirect_impl | ( | const __fp16 *const *const | input_ptrs, |
__fp16 *const *const | outptrs, | ||
const void * | params, | ||
unsigned int | n_channels, | ||
const __fp16 | activation_min, | ||
const __fp16 | activation_max | ||
) |
void arm_conv::depthwise::sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst_direct_impl | ( | const unsigned int | n_tile_rows, |
const unsigned int | n_tile_cols, | ||
const __fp16 * | inptr, | ||
int64_t | ld_input_row, | ||
int64_t | ld_input_col, | ||
__fp16 * | outptr, | ||
int64_t | ld_output_row, | ||
int64_t | ld_output_col, | ||
const void * | params, | ||
unsigned int | n_channels, | ||
const __fp16 | activation_min, | ||
const __fp16 | activation_max | ||
) |
void arm_conv::depthwise::sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst_indirect_impl | ( | const __fp16 *const *const | input_ptrs, |
__fp16 *const *const | outptrs, | ||
const void * | params, | ||
unsigned int | n_channels, | ||
const __fp16 | activation_min, | ||
const __fp16 | activation_max | ||
) |
void arm_conv::depthwise::sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst_direct_impl | ( | const unsigned int | n_tile_rows, |
const unsigned int | n_tile_cols, | ||
const __fp16 * | inptr, | ||
int64_t | ld_input_row, | ||
int64_t | ld_input_col, | ||
__fp16 * | outptr, | ||
int64_t | ld_output_row, | ||
int64_t | ld_output_col, | ||
const void * | params, | ||
unsigned int | n_channels, | ||
const __fp16 | activation_min, | ||
const __fp16 | activation_max | ||
) |
void arm_conv::depthwise::sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst_indirect_impl | ( | const __fp16 *const *const | input_ptrs, |
__fp16 *const *const | outptrs, | ||
const void * | params, | ||
unsigned int | n_channels, | ||
const __fp16 | activation_min, | ||
const __fp16 | activation_max | ||
) |
void arm_conv::depthwise::sme2_fp32_planar_3x3_s1_4rows_mla_za_impl | ( | const float * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const float * | weights, | ||
const float * | bias, | ||
float ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
float | act_min, | ||
float | act_max | ||
) |
Referenced by sme2_fp32_planar_3x3_s1_4rows_mla_za::get_kernel().
void arm_conv::depthwise::sme2_fp32_planar_3x3_s2_4rows_mla_za_impl | ( | const float * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const float * | weights, | ||
const float * | bias, | ||
float ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
float | act_min, | ||
float | act_max | ||
) |
Referenced by sme2_fp32_planar_3x3_s2_4rows_mla_za::get_kernel().
void arm_conv::depthwise::sme2_fp32_planar_5x5_s1_4rows_mla_za_impl | ( | const float * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const float * | weights, | ||
const float * | bias, | ||
float ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
float | act_min, | ||
float | act_max | ||
) |
Referenced by sme2_fp32_planar_5x5_s1_4rows_mla_za::get_kernel().
void arm_conv::depthwise::sme2_fp32_planar_5x5_s2_4rows_mla_za_impl | ( | const float * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const float * | weights, | ||
const float * | bias, | ||
float ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
float | act_min, | ||
float | act_max | ||
) |
Referenced by sme2_fp32_planar_5x5_s2_4rows_mla_za::get_kernel().
void arm_conv::depthwise::sme2_fp32bf16fp32_planar_3x3_s1_4rows_dot_za_impl | ( | const float * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const float * | weights, | ||
const float * | bias, | ||
float ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
float | act_min, | ||
float | act_max | ||
) |
Referenced by sme2_fp32bf16fp32_planar_3x3_s1_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_fp32bf16fp32_planar_3x3_s2_4rows_dot_za_impl | ( | const float * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const float * | weights, | ||
const float * | bias, | ||
float ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
float | act_min, | ||
float | act_max | ||
) |
Referenced by sme2_fp32bf16fp32_planar_3x3_s2_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_fp32bf16fp32_planar_5x5_s1_4rows_dot_za_impl | ( | const float * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const float * | weights, | ||
const float * | bias, | ||
float ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
float | act_min, | ||
float | act_max | ||
) |
Referenced by sme2_fp32bf16fp32_planar_5x5_s1_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_fp32bf16fp32_planar_5x5_s2_4rows_dot_za_impl | ( | const float * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const float * | weights, | ||
const float * | bias, | ||
float ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
float | act_min, | ||
float | act_max | ||
) |
Referenced by sme2_fp32bf16fp32_planar_5x5_s2_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_s8q_planar_3x3_s1_4rows_dot_za_impl | ( | const int8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const int8_t * | weights, | ||
int8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_s8q_planar_3x3_s1_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_s8q_planar_3x3_s2_4rows_dot_za_impl | ( | const int8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const int8_t * | weights, | ||
int8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_s8q_planar_3x3_s2_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_s8q_planar_5x5_s1_4rows_dot_za_impl | ( | const int8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const int8_t * | weights, | ||
int8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_s8q_planar_5x5_s1_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_s8q_planar_5x5_s2_4rows_dot_za_impl | ( | const int8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const int8_t * | weights, | ||
int8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_s8q_planar_5x5_s2_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_u8q_planar_3x3_s1_4rows_dot_za_impl | ( | const uint8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const uint8_t * | weights, | ||
uint8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_u8q_planar_3x3_s1_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_u8q_planar_3x3_s2_4rows_dot_za_impl | ( | const uint8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const uint8_t * | weights, | ||
uint8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_u8q_planar_3x3_s2_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_u8q_planar_5x5_s1_4rows_dot_za_impl | ( | const uint8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const uint8_t * | weights, | ||
uint8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_u8q_planar_5x5_s1_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_u8q_planar_5x5_s2_4rows_dot_za_impl | ( | const uint8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const uint8_t * | weights, | ||
uint8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_u8q_planar_5x5_s2_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_u8s8u8q_planar_3x3_s1_4rows_dot_za_impl | ( | const uint8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const int8_t * | weights, | ||
uint8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_u8s8u8q_planar_3x3_s1_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_u8s8u8q_planar_3x3_s2_4rows_dot_za_impl | ( | const uint8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const int8_t * | weights, | ||
uint8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_u8s8u8q_planar_3x3_s2_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_u8s8u8q_planar_5x5_s1_4rows_dot_za_impl | ( | const uint8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const int8_t * | weights, | ||
uint8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_u8s8u8q_planar_5x5_s1_4rows_dot_za::get_kernel().
void arm_conv::depthwise::sme2_u8s8u8q_planar_5x5_s2_4rows_dot_za_impl | ( | const uint8_t * | inptr, |
size_t | ld_in_row, | ||
size_t | ld_in_col, | ||
size_t | ld_in_vl, | ||
unsigned int | pad_top, | ||
unsigned int | valid_input_rows, | ||
unsigned int | pad_left, | ||
unsigned int | valid_input_cols, | ||
const int8_t * | weights, | ||
uint8_t ** | outptrs, | ||
const size_t * | outlds, | ||
const size_t * | outvllds, | ||
unsigned int | output_cols, | ||
unsigned int | start_channel, | ||
unsigned int | valid_channels, | ||
const arm_gemm::Requantize32 & | qp | ||
) |
Referenced by sme2_u8s8u8q_planar_5x5_s2_4rows_dot_za::get_kernel().