#include <premultiply.hpp>
Go to the source code of this file.
|
void do_premultiply_float_6 (const float *in_ptr, const unsigned int ld_row, const unsigned int ld_col, float *out_ptr, const unsigned int out_ld_row, const unsigned int out_ld_col, const unsigned int tile_rows, const unsigned int tile_cols, const unsigned input_channels)
|
◆ BLOCK_SIZE
◆ CHANNEL_MULTIPLIER
#define CHANNEL_MULTIPLIER 6
◆ do_premultiply_float_6()
void do_premultiply_float_6(
    const float *in_ptr,
    const unsigned int ld_row,
    const unsigned int ld_col,
    float *out_ptr,
    const unsigned int out_ld_row,
    const unsigned int out_ld_col,
    const unsigned int tile_rows,
    const unsigned int tile_cols,
    const unsigned input_channels
)
Definition at line 30 of file premultiply.cpp.
40 for(unsigned int i = 0; i < tile_rows; i++)
42 const float *ip2 = in_ptr + i * ld_row;
43 float *op2 = out_ptr + i * out_ld_row;
44 for(unsigned int j = 0; j < tile_cols; j++)
46 const float *ip = ip2;
49 unsigned int num_blocks = input_channels / BLOCK_SIZE;
50 for(unsigned int c = 0; c < num_blocks; c++)
69 unsigned int rem = input_channels - num_blocks * BLOCK_SIZE;
70 for(unsigned int c = 0; c < rem; c++)
References BLOCK_SIZE and CHANNEL_MULTIPLIER.