25 #ifdef ARM_COMPUTE_ENABLE_SVE
27 #include "../std_transforms_sve.hpp"
28 #include "../performance_parameters.hpp"
31 unsigned int, const unsigned int *, \
32 IndirectInputArg<uint8_t>, \
35 IndirectOutputArg<uint32_t>, \
36 const uint32_t *, Activation, bool
41 void sve_hybrid_u8u32_mmla_6x4VL( ARGLIST );
43 class cls_sve_hybrid_u8u32_mmla_6x4VL
46 typedef uint8_t lhs_operand_type;
47 typedef uint8_t rhs_operand_type;
48 typedef uint32_t result_type;
50 typedef void (*kern_type)( ARGLIST );
53 static constexpr
unsigned int out_height()
58 static unsigned int out_width()
60 return get_vector_length<uint32_t>() * 4;
63 static constexpr
unsigned int k_unroll()
68 static constexpr
bool supports_accumulate()
73 StdTransformsSVE<rhs_operand_type, result_type, 6, 8, 8> transforms = {};
75 static inline PerformanceParameters get_performance_parameters(
const CPUInfo *
ci)
77 if (std::is_same<T, uint32_t>::value) {
88 if (std::is_same<T, uint8_t>::value) {
91 return { 54.90, 15.69, 0.62 };
93 return { 26.80, 3.89, 0.47 };
95 return { 75.14, 15.87, 0.83 };
103 kern_type kernel=sve_hybrid_u8u32_mmla_6x4VL;
104 cls_sve_hybrid_u8u32_mmla_6x4VL(
const CPUInfo *)
112 #endif // ARM_COMPUTE_ENABLE_SVE