template <class T, class Abi, KernelConfig Conf, index_t RowsReg, StorageOrder OA, StorageOrder OD>
template <class T, class Abi, KernelConfig Conf, index_t RowsReg, index_t ColsReg, StorageOrder OD>
template <class T, class Abi, KernelConfig Conf, StorageOrder OA, StorageOrder OD>
template <class T, class Abi>
template <class T, class Abi, KernelConfig Conf, StorageOrder OA, StorageOrder OD>
template <class T, class Abi, KernelConfig Conf, StorageOrder OD>
consteval auto make_1d_lut(F f)
Returns an array of the form:
consteval auto make_2d_lut(F f)
Returns a 2D array of the form:
constexpr index_t RowsReg
Register block size of the matrix-matrix multiplication micro-kernels.
const constinit auto trmm_lut
constexpr index_t RowsReg
Register block size of the matrix-matrix multiplication micro-kernels.
const constinit auto trtri_copy_lut
void trmm_microkernel(uview< const T, Abi, OD > Dr, uview< T, Abi, OD > D, index_t k) noexcept
void trtri_copy_register(view< const T, Abi, OA > A, view< T, Abi, OD > D) noexcept
constexpr index_t ColsReg
void trtri_copy_microkernel(uview< const T, Abi, OA > A, uview< T, Abi, OD > D, index_t k) noexcept
simd_view_types< std::remove_const_t< T >, Abi >::template view< T, Order > view
std::integral_constant< index_t, I > index_constant