batmat 0.0.17
Batched linear algebra routines
Loading...
Searching...
No Matches
generic.hpp
Go to the documentation of this file.
1#pragma once
2
3#include <batmat/config.hpp>
4
5namespace batmat {
6namespace linalg::micro_kernels::gemm {
7
8/// Register block size of the matrix-matrix multiplication micro-kernels.
9/// Assumes that the platform has at least 16 vector registers: 9 of them hold a 3×3 accumulator
10/// block of matrix C, leaving the rest for loading A and B. This generic value ignores T and Abi.
11template <class T, class Abi>
12inline constexpr index_t RowsReg = 3;
13
14} // namespace linalg::micro_kernels::gemm
15namespace ops {
16
17template <class T>
18inline constexpr index_t RowsRegTranspose = 4; ///< 4 for every T; presumably rows per transpose register tile (TODO confirm).
19template <class T>
20inline constexpr index_t ColsRegTranspose = 4; ///< 4 for every T; presumably columns per transpose register tile (TODO confirm).
21
22} // namespace ops
23} // namespace batmat
std::ptrdiff_t index_t
constexpr index_t RowsReg
Register block size of the matrix-matrix multiplication micro-kernels.
Definition avx-512.hpp:13
constexpr index_t RowsRegTranspose
Definition avx-512.hpp:23
constexpr index_t ColsRegTranspose
Definition avx-512.hpp:25