batmat 0.0.16
Batched linear algebra routines
Loading...
Searching...
No Matches
gemm-diag.tpp File Reference

Go to the source code of this file.

Namespaces

namespace  batmat
namespace  batmat::linalg
namespace  batmat::linalg::micro_kernels
namespace  batmat::linalg::micro_kernels::gemm_diag

Macros

#define UNROLL_FOR(...)

Functions

template<class T, class Abi, KernelConfig Conf, index_t RowsReg, index_t ColsReg, StorageOrder OA, StorageOrder OB, StorageOrder OC, StorageOrder OD>
std::conditional_t< Conf.track_zeros, std::pair< index_t, index_t >, void > batmat::linalg::micro_kernels::gemm_diag::gemm_diag_copy_microkernel (const uview< const T, Abi, OA > A, const uview< const T, Abi, OB > B, const std::optional< uview< const T, Abi, OC > > C, const uview< T, Abi, OD > D, const uview_vec< const T, Abi > d, const index_t k) noexcept
 Generalized matrix multiplication D = C ± A⁽ᵀ⁾ diag(d) B⁽ᵀ⁾. Single register block.
template<class T, class Abi, KernelConfig Conf, StorageOrder OA, StorageOrder OB, StorageOrder OC, StorageOrder OD>
void batmat::linalg::micro_kernels::gemm_diag::gemm_diag_copy_register (const view< const T, Abi, OA > A, const view< const T, Abi, OB > B, const std::optional< view< const T, Abi, OC > > C, const view< T, Abi, OD > D, view< const T, Abi > d) noexcept
 Generalized matrix multiplication D = C ± A⁽ᵀ⁾ diag(d) B⁽ᵀ⁾. Using register blocking.

Variables

template<MatrixStructure Struc>
constexpr auto batmat::linalg::micro_kernels::gemm_diag::first_column
template<index_t ColsReg, MatrixStructure Struc>
constexpr auto batmat::linalg::micro_kernels::gemm_diag::last_column

Macro Definition Documentation

◆ UNROLL_FOR

#define UNROLL_FOR(...)
Value:
Expands to an invocation of BATMAT_FULLY_UNROLLED_FOR(...).
BATMAT_FULLY_UNROLLED_FOR is defined at unroll.h:27.

Definition at line 9 of file gemm-diag.tpp.