ergo
|
Generalized matrix-matrix multiplication using SSE intrinsics. More...
Go to the source code of this file.
Functions | |
template<typename real, typename regType, int m_kernel, int n_kernel, int k_kernel, int m_block, int n_block> | |
static void | gemm_sse (real const *const A, real const *const B, real *C, size_t const m, size_t const n, size_t const k, real *A_packed, real *B_packed, real *C_packed, size_t const ap_size, size_t const bp_size, size_t const cp_size) |
template<typename real> | |
static void | gemm_sse (real const *const A, real const *const B, real *C, size_t const m, size_t const n, size_t const k, real *A_packed, real *B_packed, real *C_packed, size_t const ap_size, size_t const bp_size, size_t const cp_size) |
template<> | |
void | gemm_sse (double const *const A, double const *const B, double *C, size_t const m, size_t const n, size_t const k, double *A_packed, double *B_packed, double *C_packed, size_t const ap_size, size_t const bp_size, size_t const cp_size) |
template<> | |
void | gemm_sse (float const *const A, float const *const B, float *C, size_t const m, size_t const n, size_t const k, float *A_packed, float *B_packed, float *C_packed, size_t const ap_size, size_t const bp_size, size_t const cp_size) |
Generalized matrix-matrix multiplication using SSE intrinsics.
void gemm_sse(double const *const A,
              double const *const B,
              double *C,
              size_t const m,
              size_t const n,
              size_t const k,
              double *A_packed,
              double *B_packed,
              double *C_packed,
              size_t const ap_size,
              size_t const bp_size,
              size_t const cp_size)
References A, B, and gemm_sse().
void gemm_sse(float const *const A,
              float const *const B,
              float *C,
              size_t const m,
              size_t const n,
              size_t const k,
              float *A_packed,
              float *B_packed,
              float *C_packed,
              size_t const ap_size,
              size_t const bp_size,
              size_t const cp_size)
References A, B, and gemm_sse().
|
static |
Referenced by mat::gemm(), gemm_sse(), and gemm_sse().