24.02.1
|
Namespaces | |
utils | |
Data Structures | |
struct | Activation |
class | barrier |
struct | ConvolutionParameters |
class | convolver |
struct | GemmArgs |
class | GemmCommon |
struct | GemmConfig |
class | GemmHybrid |
class | GemmHybridIndirect |
class | GemmHybridQuantized |
class | GemmHybridQuantizedInline |
struct | GemmImplementation |
struct | GemmImplementation< Top, Tret, Nothing > |
class | GemmInterleaved |
class | GemvBatched |
class | GemvPretransposed |
class | IGemmCommon |
struct | IndirectInputArg |
struct | IndirectOutputArg |
struct | is_sme |
struct | KernelDescription |
class | NDCoordinate |
NDCoordinate builds upon a range, but specifies a starting position in addition to a size which it inherits from NDRange. More... | |
class | NDRange |
struct | Nothing |
struct | PerformanceParameters |
class | QuantizeWrapper |
struct | Requantize32 |
class | StdTransformsFixed |
class | StdTransformsSME |
class | StdTransformsSVE |
Typedefs | |
using | bfloat16 = arm_compute::bfloat16 |
template<typename strategy , typename To , typename Tr , typename OutputStage = Nothing> | |
using | GemmHybridIndirectFixedFormat = GemmHybridIndirect< strategy, To, Tr, OutputStage, false, true > |
template<typename strategy , typename To , typename Tr , typename OutputStage = Nothing> | |
using | GemmInterleavedNoMerge = GemmInterleaved< strategy, To, Tr, OutputStage, false > |
template<typename strategy , typename To , typename Tr , typename OutputStage = Nothing> | |
using | GemmInterleavedFixedFormat = GemmInterleaved< strategy, To, Tr, OutputStage, true, true > |
template<typename strategy , typename To , typename Tr > | |
using | GemmInterleavedPretransposedNoMergeQuantizedInline = GemmInterleaved< strategy, To, Tr, Requantize32, false > |
template<typename strategy , typename To , typename Tr > | |
using | GemmInterleavedQuantized = GemmInterleaved< strategy, To, Tr, Requantize32 > |
template<typename Top , typename Tret > | |
using | UniqueGemmCommon = std::unique_ptr< GemmCommon< Top, Tret > > |
using | ndrange_t = NDRange< ndrange_max > |
using | ndcoord_t = NDCoordinate< ndrange_max > |
Functions | |
template<typename T > | |
void | bias_adder (T *out, unsigned int stride, const T *bias, unsigned int rows, unsigned int cols) |
template<bool DoBias, typename T > | |
void | activator (T *out, unsigned int stride, const T *bias, Activation act, unsigned int rows, unsigned int cols) |
template<> | |
const GemmImplementation< bfloat16, float > * | gemm_implementation_list< bfloat16, float > () |
template UniqueGemmCommon< bfloat16, float > | gemm< bfloat16, float, Nothing > (const GemmArgs &args, const Nothing &) |
template bool | has_opt_gemm< bfloat16, float, Nothing > (WeightFormat &weight_format, const GemmArgs &args, const Nothing &) |
template KernelDescription | get_gemm_method< bfloat16, float, Nothing > (const GemmArgs &args, const Nothing &) |
template std::vector< KernelDescription > | get_compatible_kernels< bfloat16, float, Nothing > (const GemmArgs &args, const Nothing &) |
template<> | |
const GemmImplementation< float, float > * | gemm_implementation_list< float, float > () |
template UniqueGemmCommon< float, float > | gemm< float, float, Nothing > (const GemmArgs &args, const Nothing &) |
template bool | has_opt_gemm< float, float, Nothing > (WeightFormat &weight_format, const GemmArgs &args, const Nothing &) |
template KernelDescription | get_gemm_method< float, float, Nothing > (const GemmArgs &args, const Nothing &) |
template std::vector< KernelDescription > | get_compatible_kernels< float, float, Nothing > (const GemmArgs &args, const Nothing &) |
template<typename Top , typename Tret , class OutputStage = Nothing> | |
const GemmImplementation< Top, Tret, OutputStage > * | gemm_implementation_list () |
template<typename Top , typename Tret , class OutputStage > | |
bool | find_implementation (const GemmArgs &args, const OutputStage &os, const GemmImplementation< Top, Tret, OutputStage > *&impl) |
template<typename Top , typename Tret , class OutputStage > | |
std::vector< KernelDescription > | get_compatible_kernels (const GemmArgs &args, const OutputStage &os) |
template<typename Top , typename Tret , class OutputStage > | |
bool | has_opt_gemm (WeightFormat &wf, const GemmArgs &args, const OutputStage &os) |
template<typename Top , typename Tret , class OutputStage > | |
UniqueGemmCommon< Top, Tret > | gemm (const GemmArgs &args, const OutputStage &os) |
template<typename Top , typename Tret , class OutputStage > | |
KernelDescription | get_gemm_method (const GemmArgs &args, const OutputStage &os) |
template<unsigned int height_vectors, unsigned int block, VLType vlt, bool integrate_sums, typename TIn , typename TOut > | |
void | interleave_block (TOut *&out, const TIn *const *in, size_t width, size_t height, size_t row_offset, bool first) |
template<unsigned int height_vectors, unsigned int block, VLType vlt, typename TOut > | |
void | FixupRowSums (TOut *&out, const int32_t row_sum_multiplier) |
template<unsigned int height_vectors, unsigned int block, VLType vlt, typename TIn , typename TOut > | |
void | IndirectInterleave (TOut *out, const TIn *const *const *ptr, unsigned int stringlen, unsigned int rounded_stringlen, const unsigned int y0, const unsigned int ymax, const unsigned int k0, const unsigned int kmax, bool integrate_sums, const int32_t row_sum_multiplier) |
template<unsigned int height_vectors, unsigned int block, VLType vlt, typename TIn , typename TOut > | |
void | ConvolutionInterleave (TOut *out, const TIn *in, size_t in_stride, const convolver< TIn > &conv, const unsigned int rounded_stringlen, const unsigned int y0, const unsigned int ymax, const unsigned int k0, const unsigned int kmax, bool integrate_sums, const int32_t row_sum_multiplier) |
template<unsigned int height_vectors, unsigned int block, VLType vlt, typename TIn , typename TOut > | |
void | Interleave (TOut *out, const TIn *in, size_t in_stride, const unsigned int y0, const unsigned int ymax, const unsigned int k0, const unsigned int kmax, bool integrate_sums, const int32_t row_sum_multiplier) |
WeightFormat | get_weight_format (const KernelWeightFormat, size_t) |
template<unsigned int twidth, unsigned int height, bool sve = false, typename Tin , typename Tout > | |
void | MergeResults (Tout *out, const Tin *in, int ldc, int y0, int ymax, int x0, int xmax, const Tout *bias, Activation act, bool append) |
template<typename Tin , typename Tout > | |
void | requantize_block_32 (const Requantize32 &qp, unsigned int width, unsigned int height, const Tin *input, unsigned int in_stride, Tout *output, unsigned int out_stride, const int32_t *row_bias, const int32_t *col_bias, unsigned int start_col) |
template<typename T > | |
void | compute_row_sums (const Requantize32 &qp, unsigned int width, unsigned int height, const T *input, unsigned int in_stride, int32_t *row_bias) |
template<typename T > | |
void | compute_col_sums (const Requantize32 &qp, unsigned int width, unsigned int height, const T *input, unsigned int in_stride, int32_t *col_bias, unsigned int depth, unsigned int multi, unsigned int first_col) |
template<typename T > | |
void | row_sums_indirect (size_t num_strings, const unsigned int *string_lengths, IndirectInputArg< T > A_arg, size_t M, int32_t *output_ptr, const Requantize32 *qp) |
template<unsigned int IntBy, unsigned int BlockBy, bool Transposed, VLType vlt = VLType::None, typename TOut , typename TIn > | |
void | Transform (TOut *out, const TIn *const in, const int stride, const int k0, const int kmax, const int x0, const int xmax) |
template<typename T > | |
std::string | get_type_name () |
template<typename T > | |
T | iceildiv (const T a, const T b) |
template<typename T > | |
T | roundup (const T a, const T b) |
bool | quant_no_left_shift (const Requantize32 &qp) |
bool | quant_hybrid_symmetric (const Requantize32 &qp) |
bool | quant_hybrid_asymmetric (const Requantize32 &qp) |
arm_compute::Window | to_window (const ndrange_t &ndr) |
arm_compute::Window | to_window (const ndcoord_t &ndc) |
ndrange_t | to_ndrange (const arm_compute::Window &win) |
Convert an arm_compute::Window to an arm_gemm::NDRange of the same max dimensions. More... | |
ndcoord_t | to_ndcoord (const arm_compute::Window &win) |
Convert an arm_compute::Window to an arm_gemm::NDCoordinate of the same max dimensions. More... | |
Variables | |
std::mutex | report_mutex |
constexpr std::size_t | ndrange_max = arm_compute::Dimensions<unsigned int>::num_max_dimensions |
using bfloat16 = arm_compute::bfloat16 |
Definition at line 30 of file bfloat.hpp.
using GemmHybridIndirectFixedFormat = GemmHybridIndirect<strategy, To, Tr, OutputStage, false, true> |
Definition at line 832 of file gemm_hybrid_indirect.hpp.
using GemmInterleavedFixedFormat = GemmInterleaved<strategy, To, Tr, OutputStage, true, true> |
Definition at line 1235 of file gemm_interleaved.hpp.
using GemmInterleavedNoMerge = GemmInterleaved<strategy, To, Tr, OutputStage, false> |
Definition at line 1232 of file gemm_interleaved.hpp.
using GemmInterleavedPretransposedNoMergeQuantizedInline = GemmInterleaved<strategy, To, Tr, Requantize32, false> |
Definition at line 1238 of file gemm_interleaved.hpp.
using GemmInterleavedQuantized = GemmInterleaved<strategy, To, Tr, Requantize32> |
Definition at line 1241 of file gemm_interleaved.hpp.
typedef NDCoordinate< 6 > ndcoord_t |
Definition at line 43 of file arm_gemm_compute_iface.hpp.
typedef NDRange< 6 > ndrange_t |
Definition at line 42 of file arm_gemm_compute_iface.hpp.
using UniqueGemmCommon = std::unique_ptr<GemmCommon<Top, Tret> > |
Definition at line 261 of file arm_gemm.hpp.
|
strong |
Enumerator | |
---|---|
DEFAULT | |
GEMV_BATCHED | |
GEMV_PRETRANSPOSED | |
GEMV_NATIVE_TRANSPOSED | |
GEMM_NATIVE | |
GEMM_HYBRID | |
GEMM_INTERLEAVED | |
GEMM_INTERLEAVED_2D | |
QUANTIZE_WRAPPER | |
QUANTIZE_WRAPPER_2D | |
GEMM_HYBRID_QUANTIZED |
Definition at line 34 of file arm_gemm.hpp.
enum arm_gemm::KernelWeightFormat |
strong |
Enumerator | |
---|---|
NON_FIXED | |
VL128_BL16 | |
VL128_BL32 | |
VL128_BL32_BF16 | |
VL128_BL64 | |
VL256_BL64 | |
VL256_BL64_BF16 | |
VL1VL_BL16 | |
VL1VL_BL32 | |
VL1VL_BL32_BF16 | |
VL1VL_BL64 | |
VL2VL_BL64 | |
VL2VL_BL64_BF16 |
Definition at line 42 of file kernel_weight_format.hpp.
|
strong |
|
strong |
Definition at line 49 of file arm_gemm.hpp.
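void arm_gemm::activator (T *out, unsigned int stride, const T *bias, Activation act, unsigned int rows, unsigned int cols) |
inline |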
Definition at line 40 of file bias_adder.hpp.
References bias, bias_adder(), Activation::BoundedReLU, caffe_mnist_image_extractor::cols, Activation::None, Activation::param1, Activation::ReLU, caffe_mnist_image_extractor::rows, and Activation::type.
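void arm_gemm::bias_adder (T *out, unsigned int stride, const T *bias, unsigned int rows, unsigned int cols) |
inline |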
Definition at line 31 of file bias_adder.hpp.
References bias, caffe_mnist_image_extractor::cols, and caffe_mnist_image_extractor::rows.
Referenced by activator(), and GemmHybrid< strategy, To, Tr >::execute().
void arm_gemm::compute_col_sums | ( | const Requantize32 & | qp, |
unsigned int | width, | ||
unsigned int | height, | ||
const T * | input, | ||
unsigned int | in_stride, | ||
int32_t * | col_bias, | ||
unsigned int | depth, | ||
unsigned int | multi, | ||
unsigned int | first_col | ||
) |
Referenced by GemvPretransposed< strategy, To, Tr, OutputStage >::requantize_bias(), GemmHybridQuantizedInline< strategy, To, Tr >::requantize_bias(), GemmHybridQuantized< strategy, To, Tr >::requantize_bias(), GemmHybridIndirect< strategy, To, Tr, OutputStage, SeparateQuantize, FixedFormat >::requantize_bias(), and GemmInterleaved< strategy, To, Tr, OutputStage, MergeStep, FixedFormat, ForceThreadColumns, ForceFloatAccumulate >::requantize_bias().
void arm_gemm::compute_row_sums | ( | const Requantize32 & | qp, |
unsigned int | width, | ||
unsigned int | height, | ||
const T * | input, | ||
unsigned int | in_stride, | ||
int32_t * | row_bias | ||
) |
Referenced by GemmHybridQuantized< strategy, To, Tr >::execute().
void ConvolutionInterleave | ( | TOut * | out, |
const TIn * | in, | ||
size_t | in_stride, | ||
const convolver< TIn > & | conv, | ||
const unsigned int | rounded_stringlen, | ||
const unsigned int | y0, | ||
const unsigned int | ymax, | ||
const unsigned int | k0, | ||
const unsigned int | kmax, | ||
bool | integrate_sums, | ||
const int32_t | row_sum_multiplier | ||
) |
Definition at line 226 of file interleave_indirect.cpp.
References offset(), convolver< T >::process_columns(), and SVE.
bool arm_gemm::find_implementation | ( | const GemmArgs & | args, |
const OutputStage & | os, | ||
const GemmImplementation< Top, Tret, OutputStage > *& | impl | ||
) |
Definition at line 238 of file gemm_implementation.hpp.
References GemmTuner::args, DEFAULT, GemmImplementation< Top, Tret, OutputStage >::do_cycle_estimate(), GemmConfig::filter, GemmImplementation< Top, Tret, OutputStage >::method, and GemmConfig::method.
Referenced by get_compatible_kernels().
void arm_gemm::FixupRowSums (TOut *&out, const int32_t row_sum_multiplier) |
inline |
Definition at line 125 of file interleave_indirect.cpp.
References SVE.
UniqueGemmCommon< Top, Tret > gemm | ( | const GemmArgs & | args, |
const OutputStage & | os | ||
) |
Definition at line 320 of file gemm_implementation.hpp.
References GemmTuner::args, and GemmImplementation< Top, Tret, OutputStage >::do_instantiate().
Referenced by arm_compute::test::validation::TEST_CASE().
template UniqueGemmCommon<bfloat16, float> arm_gemm::gemm< bfloat16, float, Nothing > | ( | const GemmArgs & | args, |
const Nothing & | |||
) |
template UniqueGemmCommon<float, float> arm_gemm::gemm< float, float, Nothing > | ( | const GemmArgs & | args, |
const Nothing & | |||
) |
const GemmImplementation<Top, Tret, OutputStage>* arm_gemm::gemm_implementation_list | ( | ) |
const GemmImplementation<bfloat16, float>* arm_gemm::gemm_implementation_list< bfloat16, float > | ( | ) |
Definition at line 229 of file gemm_bf16.cpp.
const GemmImplementation<float, float>* arm_gemm::gemm_implementation_list< float, float > | ( | ) |
Definition at line 393 of file gemm_fp32.cpp.
std::vector< KernelDescription > get_compatible_kernels | ( | const GemmArgs & | args, |
const OutputStage & | os | ||
) |
Definition at line 288 of file gemm_implementation.hpp.
References GemmTuner::args, DEFAULT, GemmImplementation< Top, Tret, OutputStage >::do_cycle_estimate(), find_implementation(), and GemmImplementation< Top, Tret, OutputStage >::method.
template std::vector<KernelDescription> arm_gemm::get_compatible_kernels< bfloat16, float, Nothing > | ( | const GemmArgs & | args, |
const Nothing & | |||
) |
template std::vector<KernelDescription> arm_gemm::get_compatible_kernels< float, float, Nothing > | ( | const GemmArgs & | args, |
const Nothing & | |||
) |
KernelDescription get_gemm_method | ( | const GemmArgs & | args, |
const OutputStage & | os | ||
) |
Definition at line 331 of file gemm_implementation.hpp.
References GemmTuner::args, GemmImplementation< Top, Tret, OutputStage >::method, and GemmImplementation< Top, Tret, OutputStage >::name.
template KernelDescription arm_gemm::get_gemm_method< bfloat16, float, Nothing > | ( | const GemmArgs & | args, |
const Nothing & | |||
) |
template KernelDescription arm_gemm::get_gemm_method< float, float, Nothing > | ( | const GemmArgs & | args, |
const Nothing & | |||
) |
WeightFormat get_weight_format | ( | const KernelWeightFormat | kwf, |
size_t | element_size | ||
) |
Definition at line 40 of file misc.cpp.
References NON_FIXED, and UNSPECIFIED.
Referenced by GemmImplementation< Top, Tret, OutputStage >::do_is_supported(), GemmImplementation< Top, Tret, Nothing >::do_is_supported(), GemmHybridIndirect< strategy, To, Tr, OutputStage, SeparateQuantize, FixedFormat >::get_config(), and GemmInterleaved< strategy, To, Tr, OutputStage, MergeStep, FixedFormat, ForceThreadColumns, ForceFloatAccumulate >::get_config().
bool has_opt_gemm | ( | WeightFormat & | wf, |
const GemmArgs & | args, | ||
const OutputStage & | os | ||
) |
Definition at line 311 of file gemm_implementation.hpp.
References GemmTuner::args, and GemmImplementation< Top, Tret, OutputStage >::do_instantiate().
template bool arm_gemm::has_opt_gemm< bfloat16, float, Nothing > | ( | WeightFormat & | weight_format, |
const GemmArgs & | args, | ||
const Nothing & | |||
) |
template bool arm_gemm::has_opt_gemm< float, float, Nothing > | ( | WeightFormat & | weight_format, |
const GemmArgs & | args, | ||
const Nothing & | |||
) |
T arm_gemm::iceildiv (const T a, const T b) |
inline |
Definition at line 65 of file utils.hpp.
References arm_compute::test::validation::b.
Referenced by GemmInterleaved< strategy, To, Tr, OutputStage, MergeStep, FixedFormat, ForceThreadColumns, ForceFloatAccumulate >::estimate_cycles(), GemvPretransposed< strategy, To, Tr, OutputStage >::execute(), GemmHybridIndirect< strategy, To, Tr, OutputStage, SeparateQuantize, FixedFormat >::get_B_pretranspose_window_size(), GemmInterleaved< strategy, To, Tr, OutputStage, MergeStep, FixedFormat, ForceThreadColumns, ForceFloatAccumulate >::get_B_pretranspose_window_size(), arm_conv::depthwise::get_reduced_view_for_dilation(), arm_conv::depthwise::interleaves::quantized::get_storage_size(), arm_conv::depthwise::interleaves::get_storage_size_generic(), GemvPretransposed< strategy, To, Tr, OutputStage >::get_window_size(), GemmInterleaved< strategy, To, Tr, OutputStage, MergeStep, FixedFormat, ForceThreadColumns, ForceFloatAccumulate >::get_window_size(), arm_conv::depthwise::interleaves::quantized::pack_parameters(), and GemmHybridIndirect< strategy, To, Tr, OutputStage, SeparateQuantize, FixedFormat >::pretranspose_B_array_part().
void IndirectInterleave | ( | TOut * | out, |
const TIn *const *const * | ptr, | ||
unsigned int | stringlen, | ||
unsigned int | rounded_stringlen, | ||
const unsigned int | y0, | ||
const unsigned int | ymax, | ||
const unsigned int | k0, | ||
const unsigned int | kmax, | ||
bool | integrate_sums, | ||
const int32_t | row_sum_multiplier | ||
) |
Definition at line 155 of file interleave_indirect.cpp.
References SVE.
void Interleave | ( | TOut * | out, |
const TIn * | in, | ||
size_t | in_stride, | ||
const unsigned int | y0, | ||
const unsigned int | ymax, | ||
const unsigned int | k0, | ||
const unsigned int | kmax, | ||
bool | integrate_sums, | ||
const int32_t | row_sum_multiplier | ||
) |
Definition at line 265 of file interleave_indirect.cpp.
References SVE.
void arm_gemm::interleave_block | ( | TOut *& | out, |
const TIn *const * | in, | ||
size_t | width, | ||
size_t | height, | ||
size_t | row_offset, | ||
bool | first | ||
) |
Definition at line 61 of file interleave_indirect.cpp.
References SVE.
void MergeResults | ( | Tout * | out, |
const Tin * | in, | ||
int | ldc, | ||
int | y0, | ||
int | ymax, | ||
int | x0, | ||
int | xmax, | ||
const Tout * | bias, | ||
Activation | act, | ||
bool | append | ||
) |
Definition at line 38 of file mergeresults.cpp.
References bias, Activation::BoundedReLU, Activation::None, Activation::param1, Activation::ReLU, and Activation::type.
Referenced by StdTransformsSVE< TOperand, TResult, height, width_vectors, block, mmla, integrate_sums >::Merge().
bool arm_gemm::quant_hybrid_asymmetric (const Requantize32 &qp) |
inline |
Definition at line 134 of file utils.hpp.
References Requantize32::per_channel_requant, and quant_no_left_shift().
bool arm_gemm::quant_hybrid_symmetric (const Requantize32 &qp) |
inline |
Definition at line 128 of file utils.hpp.
References Requantize32::b_offset, and quant_no_left_shift().
bool arm_gemm::quant_no_left_shift (const Requantize32 &qp) |
inline |
Definition at line 118 of file utils.hpp.
References Requantize32::per_channel_left_shifts, Requantize32::per_channel_requant, and Requantize32::per_layer_left_shift.
Referenced by quant_hybrid_asymmetric(), and quant_hybrid_symmetric().
void arm_gemm::requantize_block_32 | ( | const Requantize32 & | qp, |
unsigned int | width, | ||
unsigned int | height, | ||
const Tin * | input, | ||
unsigned int | in_stride, | ||
Tout * | output, | ||
unsigned int | out_stride, | ||
const int32_t * | row_bias, | ||
const int32_t * | col_bias, | ||
unsigned int | start_col | ||
) |
Referenced by GemmHybridQuantized< strategy, To, Tr >::execute().
T arm_gemm::roundup (const T a, const T b) |
inline |
Definition at line 70 of file utils.hpp.
References arm_compute::test::validation::b.
Referenced by GemmHybrid< strategy, To, Tr >::estimate_cycles(), GemmInterleaved< strategy, To, Tr, OutputStage, MergeStep, FixedFormat, ForceThreadColumns, ForceFloatAccumulate >::estimate_cycles(), GemvPretransposed< strategy, To, Tr, OutputStage >::execute(), GemmHybrid< strategy, To, Tr >::execute(), GemmHybridQuantizedInline< strategy, To, Tr >::execute(), GemmHybridQuantized< strategy, To, Tr >::execute(), GemmHybridIndirect< strategy, To, Tr, OutputStage, SeparateQuantize, FixedFormat >::execute(), GemmInterleaved< strategy, To, Tr, OutputStage, MergeStep, FixedFormat, ForceThreadColumns, ForceFloatAccumulate >::execute(), GemmHybridQuantizedInline< strategy, To, Tr >::get_B_pretransposed_array_size(), GemmHybrid< strategy, To, Tr >::get_B_pretransposed_array_size(), GemmHybridQuantized< strategy, To, Tr >::get_B_pretransposed_array_size(), GemmHybridIndirect< strategy, To, Tr, OutputStage, SeparateQuantize, FixedFormat >::get_B_pretransposed_array_size(), GemmInterleaved< strategy, To, Tr, OutputStage, MergeStep, FixedFormat, ForceThreadColumns, ForceFloatAccumulate >::get_B_pretransposed_array_size(), GemmHybrid< strategy, To, Tr >::pretranspose_B_array(), GemmHybridQuantizedInline< strategy, To, Tr >::pretranspose_B_array(), GemmHybridQuantized< strategy, To, Tr >::pretranspose_B_array(), GemmHybridIndirect< strategy, To, Tr, OutputStage, SeparateQuantize, FixedFormat >::pretranspose_B_array_part(), and GemmInterleaved< strategy, To, Tr, OutputStage, MergeStep, FixedFormat, ForceThreadColumns, ForceFloatAccumulate >::pretranspose_B_array_part().
void arm_gemm::row_sums_indirect | ( | size_t | num_strings, |
const unsigned int * | string_lengths, | ||
IndirectInputArg< T > | A_arg, | ||
size_t | M, | ||
int32_t * | output_ptr, | ||
const Requantize32 * | qp | ||
) |
ndcoord_t arm_gemm::to_ndcoord (const arm_compute::Window &win) |
inline |
Convert an arm_compute::Window to an arm_gemm::NDCoordinate of the same max dimensions.
[in] win | the arm_compute::Window we want to convert to arm_gemm::ndcoord_t |
Definition at line 112 of file arm_gemm_compute_iface.hpp.
References arm_compute::mlgo::parser::end().
Referenced by CpuGemmAssemblyWrapperKernel< TypeInput, TypeOutput >::run(), and CpuGemmAssemblyWrapperKernel< TypeInput, TypeOutput >::run_nd().
ndrange_t arm_gemm::to_ndrange (const arm_compute::Window &win) |
inline |
Convert an arm_compute::Window to an arm_gemm::NDRange of the same max dimensions.
It should be noted that arm_compute::Window specifies a start() and an end(), whereas arm_gemm::ndrange_t only has a size; as a result, we store the delta between the start and the end of the range.
[in] win | the arm_compute::Window we want to convert to arm_gemm::ndrange_t |
Definition at line 97 of file arm_gemm_compute_iface.hpp.
References arm_compute::mlgo::parser::end().
arm_compute::Window arm_gemm::to_window (const ndcoord_t &ndc) |
inline |
Definition at line 72 of file arm_gemm_compute_iface.hpp.
References NDCoordinate< N >::get_position(), NDRange< D >::get_size(), ndrange_max, and Window::set().
arm_compute::Window arm_gemm::to_window (const ndrange_t &ndr) |
inline |
Definition at line 53 of file arm_gemm_compute_iface.hpp.
References NDRange< D >::get_size(), ndrange_max, and Window::set().
Referenced by CpuGemmAssemblyWrapperKernel< TypeInput, TypeOutput >::configure().
void Transform | ( | TOut * | out, |
const TIn *const | in, | ||
const int | stride, | ||
const int | k0, | ||
const int | kmax, | ||
const int | x0, | ||
const int | xmax | ||
) |
Definition at line 116 of file transform.cpp.
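constexpr std::size_t arm_gemm::ndrange_max = arm_compute::Dimensions<unsigned int>::num_max_dimensions |
constexpr |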
Definition at line 40 of file arm_gemm_compute_iface.hpp.
Referenced by to_window().