25 #ifdef ARM_COMPUTE_ENABLE_SVE
27 #include "../std_transforms_sve.hpp"
28 #include "../bfloat.hpp"
29 #include "../kernel_weight_format.hpp"
30 #include "../performance_parameters.hpp"
33 unsigned int, const unsigned int *, \
34 IndirectInputArg<bfloat16>, \
38 IndirectOutputArg<float>, \
39 const float *, Activation, bool
44 void sve_ffhybrid_bf16fp32_mmla_6x4VL( ARGLIST );
46 class cls_sve_ffhybrid_bf16fp32_mmla_6x4VL
51 typedef float result_type;
53 typedef void (*kern_type)( ARGLIST );
56 static constexpr
unsigned int out_height()
60 static unsigned int stripe_width()
62 return get_vector_length<float>() * 1;
70 static unsigned int out_width()
72 return get_vector_length<float>() * 4;
75 static constexpr
unsigned int k_unroll()
80 static constexpr
bool supports_accumulate()
85 StdTransformsSVE<rhs_operand_type, result_type, 6, 8, 4> transforms = {};
87 static inline PerformanceParameters get_performance_parameters(
const CPUInfo *
ci)
89 if (std::is_same<T, bfloat16>::value) {
100 kern_type kernel=sve_ffhybrid_bf16fp32_mmla_6x4VL;
101 cls_sve_ffhybrid_bf16fp32_mmla_6x4VL(
const CPUInfo *)
109 #endif // ARM_COMPUTE_ENABLE_SVE