batmat develop
Batched linear algebra routines
Loading...
Searching...
No Matches
trsm.hpp File Reference
#include <batmat/linalg/structure.hpp>
#include <batmat/linalg/uview.hpp>
#include <batmat/micro-kernels/trsm/export.h>
#include <batmat/platform/platform.hpp>

Go to the source code of this file.

Classes

struct  batmat::linalg::micro_kernels::trsm::KernelConfig

Namespaces

namespace  batmat
namespace  batmat::linalg
namespace  batmat::linalg::micro_kernels
namespace  batmat::linalg::micro_kernels::trsm

Functions

template<class T, class Abi, KernelConfig Conf, index_t RowsReg, index_t ColsReg, StorageOrder OA, StorageOrder OB, StorageOrder OD>
void batmat::linalg::micro_kernels::trsm::trsm_copy_microkernel (uview< const T, Abi, OA > A, uview< const T, Abi, OB > B, uview< T, Abi, OD > D, index_t k) noexcept
template<class T, class Abi, KernelConfig Conf, StorageOrder OA, StorageOrder OB, StorageOrder OD>
void batmat::linalg::micro_kernels::trsm::trsm_copy_register (const view< const T, Abi, OA > A, const view< const T, Abi, OB > B, const view< T, Abi, OD > D) noexcept
 Triangular solve D = (A⁽ᵀ⁾)⁻¹ B⁽ᵀ⁾ where A⁽ᵀ⁾ is lower triangular.

Variables

template<class T, class Abi>
constexpr index_t batmat::linalg::micro_kernels::trsm::ColsReg = RowsReg<T, Abi>
template<class T, class Abi>
constexpr index_t batmat::linalg::micro_kernels::trsm::RowsReg
 Register block size of the triangular solve (trsm) micro-kernels.

Class Documentation

◆ batmat::linalg::micro_kernels::trsm::KernelConfig

struct batmat::linalg::micro_kernels::trsm::KernelConfig
Class Members
MatrixStructure struc_A = MatrixStructure::LowerTriangular
index_t rotate_B = 0