6 #include <hmlp_internal.hpp> 9 BLIS_GEMM_KERNEL(bli_sgemm_opt_12x32_l2,
float);
10 BLIS_GEMM_KERNEL(bli_dgemm_opt_6x32_l2,
double);
15 inline GSKS_OPERATOR(
float)
const 17 printf(
"not implemented yet\n" );
27 const size_t pack_mr = 32;
28 const size_t pack_nr = 6;
29 const size_t align_size = 64;
30 const bool row_major =
false;
48 double ctmp[ mr * nr ];
51 double beta = aux->pc ? 1.0 : 0.0;
55 for (
size_t j = 0; j < aux->jb; j ++ )
56 for (
size_t i = 0; i < aux->ib; i ++ )
58 ctmp[ j * mr + i ] = c[ j * ldc + i ];
73 for (
size_t j = 0; j < aux->jb; j ++ )
75 for (
size_t i = 0; i < aux->ib; i ++ )
77 ctmp[ j * mr + i ] *= -2.0;
78 ctmp[ j * mr + i ] += aa[ i ] + bb[ j ];
79 ctmp[ j * mr + i ] = std::max( ctmp[ j * mr + i ], (
double)0 );
83 u[ i ] += std::exp( ker->scal * ctmp[ j * mr + i ] ) * w[ j ];
GSKS_OPERATOR(double) const
Definition: gsks_d6x32.hpp:46
Definition: gsks_d6x32.hpp:23
Definition: gsks_d12x16.hpp:13