batmat develop
Batched linear algebra routines
Loading...
Searching...
No Matches
small-potrf.tpp File Reference
#include <batmat/assume.hpp>
#include <batmat/linalg/micro-kernels/small-potrf.hpp>
#include <batmat/loop.hpp>
#include <batmat/lut.hpp>
#include <batmat/ops/rsqrt.hpp>
#include <batmat/ops/sqrt.hpp>
#include <batmat/simd.hpp>
#include <bit>

Go to the source code of this file.

Namespaces

namespace  batmat
namespace  batmat::linalg
namespace  batmat::linalg::micro_kernels
namespace  batmat::linalg::micro_kernels::small_potrf

Macros

#define UNROLL_FOR(...)

Functions

template<class T, index_t NC>
void batmat::linalg::micro_kernels::small_potrf::potrf_trsm_microkernel (index_t k, scalar_view< const T > A, scalar_view< T > L) noexcept
template<class T, index_t RowsReg, index_t ColsReg>
void batmat::linalg::micro_kernels::small_potrf::potrf_syrk_microkernel (index_t k, scalar_view< const T > L21, scalar_view< const T > A22, scalar_view< T > L22) noexcept
 Outer product for updating the bottom-right tail during Cholesky factorization.
template<class T, index_t RowsReg = 4>
void batmat::linalg::micro_kernels::small_potrf::small_potrf (view< const T, datapar::scalar_abi< T > > A, view< T, datapar::scalar_abi< T > > L, index_t n=-1) noexcept
template<class T, index_t NC, index_t NR>
void batmat::linalg::micro_kernels::small_potrf::syrk_potrf_trsm_microkernel (index_t m, index_t k, scalar_view< const T > L21, scalar_view< const T > A22, scalar_view< T > L22) noexcept
 Left-looking variant of small_potrf, which updates the current block with the outer product of the previously computed part L21.
template<class T, index_t RowsReg = 4, index_t S = 8>
void batmat::linalg::micro_kernels::small_potrf::small_potrf_left (view< const T, datapar::scalar_abi< T > > A, view< T, datapar::scalar_abi< T > > L) noexcept

Macro Definition Documentation

◆ UNROLL_FOR

#define UNROLL_FOR(...)
Value:
#define BATMAT_FULLY_UNROLLED_FOR(...)
Definition at line 27 of file unroll.h.

Definition at line 12 of file small-potrf.tpp.