18 index_t l0, index_t k)
noexcept;
20template <
class T,
class Abi, KernelConfig Conf, StorageOrder OA, StorageOrder OB, StorageOrder OD>
27template <
class T,
class Abi, KernelConfig Conf, StorageOrder OA, StorageOrder OB, StorageOrder OD>
consteval auto make_1d_lut(F f)
Returns an array of the form:
constexpr index_t RowsReg
Register block size of the matrix-matrix multiplication micro-kernels.
const constinit auto syomv_lut
constexpr index_t RowsReg
Register block size of the matrix-matrix multiplication micro-kernels.
void syomv_microkernel(uview< const T, Abi, OA > A, uview< const T, Abi, OB > B, uview< T, Abi, OD > D, index_t l0, index_t k) noexcept
Symmetric off-diagonal block multiply, operating on a single register block.
void syomv_register(view< const T, Abi, OA > A, view< const T, Abi, OB > B, view< T, Abi, OD > D) noexcept
Generalized matrix multiplication D = C ± A⁽ᵀ⁾ B⁽ᵀ⁾, using register blocking.
simd_view_types< std::remove_const_t< T >, Abi >::template view< T, Order > view
std::integral_constant< index_t, I > index_constant