void do_premultiply_float_6(const float *in_ptr, const unsigned int ld_row, const unsigned int ld_col, float *out_ptr, const unsigned int out_ld_row, const unsigned int out_ld_col, const unsigned int tile_rows, const unsigned int tile_cols, const unsigned input_channels)