0.0.21/Doxygen/reduce_8hpp_source.html

#pragma once


#include <batmat/linalg/elementwise.hpp>

#include <batmat/linalg/norms.hpp>


namespace batmat::linalg {


/// @cond DETAIL


namespace detail {


/// Generic fold over the elements of one or more views with identical dimensions.
///
/// @param init   Starting accumulator; overwritten with the result of @p fun on every visit.
/// @param fun    Callable invoked as `fun(accumulator, elements...)`; returns the new accumulator.
/// @param reduce Callable applied once to the final accumulator to produce the return value.
/// @param x0     First view; its rows, cols, depth and batch size are the reference dimensions.
/// @param xs     Remaining views; each must match the dimensions of @p x0 (checked by assertion).
/// @return `reduce(init)` after `iter_elems` has visited all elements.
template <class T, class Abi, StorageOrder O0, class Tinit, class F, class R, class... Args>
auto reduce(Tinit init, F fun, R reduce, view<const T, Abi, O0> x0, const Args &...xs) {
    // All additional operands must have exactly the same shape as x0.
    BATMAT_ASSERT(((xs.rows() == x0.rows()) && ...));
    BATMAT_ASSERT(((xs.cols() == x0.cols()) && ...));
    BATMAT_ASSERT(((xs.depth() == x0.depth()) && ...));
    BATMAT_ASSERT(((xs.batch_size() == x0.batch_size()) && ...));
    // Fold the elements handed out by iter_elems into the running accumulator.
    auto accumulate = [&](auto... elems) { init = fun(init, elems...); };
    iter_elems<T, Abi, O0>(accumulate, x0, xs...);
    // Final step: turn the accumulator into the value returned to the caller.
    return reduce(init);
}


/// Accumulate the norms of all elements of @p A in a single pass.
///
/// A `linalg::norms<T, simd>` functor is used both for the per-element update and for the final
/// reduction of the accumulator, which starts from `zero_simd()`.
template <class T, class Abi, StorageOrder OA>
[[gnu::flatten]] linalg::norms<T>::result norms_all(view<const T, Abi, OA> A) {
    using vec_t      = datapar::simd<T, Abi>;
    using norms_simd = linalg::norms<T, vec_t>;
    auto accumulate  = norms_simd(); // per-element accumulation step
    auto finalize    = norms_simd(); // final reduction of the accumulator
    return reduce<T, Abi>(norms_simd::zero_simd(), accumulate, finalize, A);
}


/// Dot product ∑ aᵢ bᵢ of two views with identical dimensions.
///
/// Products are accumulated in a SIMD register that starts at zero; the accumulator is collapsed
/// to a scalar at the end.
template <class T, class Abi, StorageOrder OA, StorageOrder OB>
[[gnu::flatten]] T dot(view<const T, Abi, OA> a, view<const T, Abi, OB> b) {
    using vec_t = datapar::simd<T, Abi>;
    // Multiply-accumulate step applied to every pair of elements.
    auto mul_acc = [](auto acc, auto lhs, auto rhs) { return lhs * rhs + acc; };
    // Unqualified call: resolved through ADL on the accumulator type (the SIMD library's reduce).
    auto collapse = [](auto acc) { return reduce(acc); };
    return reduce<T, Abi>(vec_t{0}, mul_acc, collapse, a, b);
}


/// Squared 2-norm ∑ aᵢ² of a view.
///
/// Squares are accumulated in a SIMD register that starts at zero; the accumulator is collapsed
/// to a scalar at the end.
template <class T, class Abi, StorageOrder OA>
[[gnu::flatten]] T norm_2_sq(view<const T, Abi, OA> a) {
    using vec_t = datapar::simd<T, Abi>;
    // Square-accumulate step applied to every element.
    auto sq_acc = [](auto acc, auto elem) { return elem * elem + acc; };
    // Unqualified call: resolved through ADL on the accumulator type (the SIMD library's reduce).
    auto collapse = [](auto acc) { return reduce(acc); };
    return reduce<T, Abi>(vec_t{0}, sq_acc, collapse, a);
}


/// Weighted sum of squares ∑ wᵢ aᵢ² of two views with identical dimensions.
///
/// @param w Weights.
/// @param a Values that are squared before being weighted.
template <class T, class Abi, StorageOrder OW, StorageOrder OA>
[[gnu::flatten]] T weighted_norm_sq(view<const T, Abi, OW> w, view<const T, Abi, OA> a) {
    using vec_t = datapar::simd<T, Abi>;
    // Weighted square-accumulate step applied to every (weight, value) pair.
    auto weighted_acc = [](auto acc, auto weight, auto elem) {
        return weight * (elem * elem) + acc;
    };
    // Unqualified call: resolved through ADL on the accumulator type (the SIMD library's reduce).
    auto collapse = [](auto acc) { return reduce(acc); };
    return reduce<T, Abi>(vec_t{0}, weighted_acc, collapse, w, a);
}


/// Weighted sum of squared differences ∑ wᵢ(aᵢ - bᵢ)² of three views with identical dimensions.
///
/// @param w Weights.
/// @param a Minuend values.
/// @param b Subtrahend values.
template <class T, class Abi, StorageOrder OW, StorageOrder OA, StorageOrder OB>
[[gnu::flatten]] T weighted_norm_sq_difference(view<const T, Abi, OW> w, view<const T, Abi, OA> a,
                                               view<const T, Abi, OB> b) {
    using vec_t = datapar::simd<T, Abi>;
    // Accumulation step: square the element-wise difference, weight it, add to the accumulator.
    auto weighted_acc = [](auto acc, auto weight, auto lhs, auto rhs) {
        auto diff = lhs - rhs;
        return weight * (diff * diff) + acc;
    };
    // Unqualified call: resolved through ADL on the accumulator type (the SIMD library's reduce).
    auto collapse = [](auto acc) { return reduce(acc); };
    return reduce<T, Abi>(vec_t{0}, weighted_acc, collapse, w, a, b);
}


} // namespace detail


/// @endcond


/// @addtogroup topic-linalg

/// @{


/// @name Single-batch reduction operations

/// @{


/// Compute the norms (max, 1-norm, and 2-norm) of a single-batch vector in one pass.
///
/// @param x Vector-like argument that can be converted to a SIMD view by `simdify`.
/// @return The norms accumulator; individual norms are available through its accessors.
template <simdifiable Vx>
norms<simdified_value_t<Vx>>::result norms_all(Vx &&x) {
    using value_t = simdified_value_t<Vx>;
    using abi_t   = simdified_abi_t<Vx>;
    GUANAQO_TRACE_LINALG("norms_all", 3 * detail::num_elem(simdify(x))); // fma, add, max
    return detail::norms_all<value_t, abi_t>(simdify(x).as_const());
}


/// Compute the infinity norm of a single-batch vector.
///
/// Evaluates norms_all() and returns the infinity-norm component of its result.
template <simdifiable Vx>
simdified_value_t<Vx> norm_inf(Vx &&x) {
    auto all_norms = norms_all(std::forward<Vx>(x));
    return all_norms.norm_inf();
}


/// Compute the 1-norm of a single-batch vector.
///
/// Evaluates norms_all() and returns the 1-norm component of its result.
template <simdifiable Vx>
simdified_value_t<Vx> norm_1(Vx &&x) {
    auto all_norms = norms_all(std::forward<Vx>(x));
    return all_norms.norm_1();
}


/// Compute the squared 2-norm of a single-batch vector.
///
/// @param x Vector-like argument that can be converted to a SIMD view by `simdify`.
/// @return The result of detail::norm_2_sq on the const SIMD view of @p x.
template <simdifiable Vx>
simdified_value_t<Vx> norm_2_squared(Vx &&x) {
    using value_t = simdified_value_t<Vx>;
    using abi_t   = simdified_abi_t<Vx>;
    GUANAQO_TRACE_LINALG("norm_2_squared", detail::num_elem(simdify(x)));
    return detail::norm_2_sq<value_t, abi_t>(simdify(x).as_const());
}


/// Compute the 2-norm of a single-batch vector.
///
/// Takes the square root of norm_2_squared(); `sqrt` is looked up with `std::sqrt` as fallback.
template <simdifiable Vx>
simdified_value_t<Vx> norm_2(Vx &&x) {
    using std::sqrt;
    const simdified_value_t<Vx> sum_sq = norm_2_squared(std::forward<Vx>(x));
    return sqrt(sum_sq);
}


/// Compute the dot product of two single-batch vectors.
///
/// @param x First operand.
/// @param y Second operand; must be simdify-compatible with @p x.
/// @return The result of detail::dot on the const SIMD views of both operands.
template <simdifiable Vx, simdifiable Vy>
    requires simdify_compatible<Vx, Vy>
simdified_value_t<Vx> dot(Vx &&x, Vy &&y) {
    using value_t = simdified_value_t<Vx>;
    using abi_t   = simdified_abi_t<Vx>;
    GUANAQO_TRACE_LINALG("dot", detail::num_elem(simdify(x)));
    return detail::dot<value_t, abi_t>(simdify(x).as_const(), simdify(y).as_const());
}


/// Compute the weighted sum of squares ∑ wᵢ aᵢ² of a single-batch vector.
///
/// @param w Weights.
/// @param a Values; must be simdify-compatible with @p w.
/// @return The result of detail::weighted_norm_sq on the const SIMD views of both operands.
template <simdifiable Vw, simdifiable Va>
    requires simdify_compatible<Vw, Va>
simdified_value_t<Vw> weighted_norm_sq(Vw &&w, Va &&a) {
    using value_t = simdified_value_t<Vw>;
    using abi_t   = simdified_abi_t<Vw>;
    GUANAQO_TRACE_LINALG("weighted_norm_sq", 2 * detail::num_elem(simdify(w)));
    return detail::weighted_norm_sq<value_t, abi_t>(simdify(w).as_const(),
                                                    simdify(a).as_const());
}


/// Compute the weighted sum of squared differences ∑ wᵢ(aᵢ - bᵢ)² of single-batch vectors.
///
/// @param w Weights.
/// @param a Minuend values; must be simdify-compatible with @p w and @p b.
/// @param b Subtrahend values.
/// @return The result of detail::weighted_norm_sq_difference on the const SIMD views.
template <simdifiable Vw, simdifiable Va, simdifiable Vb>
    requires simdify_compatible<Vw, Va, Vb>
simdified_value_t<Vw> weighted_norm_sq_diff(Vw &&w, Va &&a, Vb &&b) {
    using value_t = simdified_value_t<Vw>;
    using abi_t   = simdified_abi_t<Vw>;
    GUANAQO_TRACE_LINALG("weighted_norm_sq_difference", 3 * detail::num_elem(simdify(w)));
    return detail::weighted_norm_sq_difference<value_t, abi_t>(
        simdify(w).as_const(), simdify(a).as_const(), simdify(b).as_const());
}


/// @}


/// @}


// TODO: Doxygen gets confused because the template parameters are the same as those of the
// single-batch versions, so the multi-batch versions are put in a separate (inline) namespace.

inline namespace multi {


/// @addtogroup topic-linalg

/// @{


/// @name Multi-batch reduction operations

/// @{


/// Compute the norms (max, 1-norm, and 2-norm) of a multi-batch vector.
///
/// Starts from a value-initialized accumulator and merges in the result of linalg::norms_all
/// for each batch, in batch order, using the `norms` functor.
template <simdifiable_multi Vx>
norms<simdified_value_t<Vx>>::result norms_all(Vx &&x) {
    using norms_t = norms<simdified_value_t<Vx>>;
    typename norms_t::result combined{};
    norms_t merge{};
    const auto n_batches = x.num_batches();
    for (index_t i = 0; i < n_batches; ++i)
        combined = merge(combined, linalg::norms_all(x.batch(i)));
    return combined;
}


/// Compute the infinity norm of a multi-batch vector.
///
/// Evaluates norms_all() and returns the infinity-norm component of its result.
template <simdifiable_multi Vx>
simdified_value_t<Vx> norm_inf(Vx &&x) {
    auto all_norms = norms_all(std::forward<Vx>(x));
    return all_norms.norm_inf();
}


/// Compute the 1-norm of a multi-batch vector.
///
/// Evaluates norms_all() and returns the 1-norm component of its result.
template <simdifiable_multi Vx>
simdified_value_t<Vx> norm_1(Vx &&x) {
    auto all_norms = norms_all(std::forward<Vx>(x));
    return all_norms.norm_1();
}


/// Compute the squared 2-norm of a multi-batch vector.
///
/// Sums linalg::norm_2_squared over all batches, in batch order, starting from a
/// value-initialized total.
template <simdifiable_multi Vx>
simdified_value_t<Vx> norm_2_squared(Vx &&x) {
    using value_t = simdified_value_t<Vx>;
    value_t total{};
    const auto n_batches = x.num_batches();
    for (index_t i = 0; i < n_batches; ++i)
        total += linalg::norm_2_squared(x.batch(i));
    return total;
}


/// Compute the 2-norm of a multi-batch vector.
///
/// Takes the square root of norm_2_squared(); `sqrt` is looked up with `std::sqrt` as fallback.
template <simdifiable_multi Vx>
simdified_value_t<Vx> norm_2(Vx &&x) {
    using std::sqrt;
    const simdified_value_t<Vx> sum_sq = norm_2_squared(std::forward<Vx>(x));
    return sqrt(sum_sq);
}


/// Compute the dot product of two multi-batch vectors.
///
/// Sums linalg::dot over corresponding batches, in batch order, starting from a
/// value-initialized total. Both operands must have the same number of batches (asserted).
template <simdifiable_multi Vx, simdifiable_multi Vy>
    requires simdify_compatible<Vx, Vy>
simdified_value_t<Vx> dot(Vx &&x, Vy &&y) {
    using value_t = simdified_value_t<Vx>;
    BATMAT_ASSERT(x.num_batches() == y.num_batches());
    value_t total{};
    const auto n_batches = x.num_batches();
    for (index_t i = 0; i < n_batches; ++i)
        total += linalg::dot(x.batch(i), y.batch(i));
    return total;
}


/// Compute the weighted sum of squares ∑ wᵢ xᵢ² of a multi-batch vector.
///
/// Sums linalg::weighted_norm_sq over corresponding batches, in batch order, starting from a
/// value-initialized total. Both operands must have the same number of batches (asserted).
template <simdifiable_multi Vw, simdifiable_multi Vx>
    requires simdify_compatible<Vw, Vx>
simdified_value_t<Vw> weighted_norm_sq(Vw &&w, Vx &&x) {
    using value_t = simdified_value_t<Vw>;
    BATMAT_ASSERT(w.num_batches() == x.num_batches());
    value_t total{};
    const auto n_batches = w.num_batches();
    for (index_t i = 0; i < n_batches; ++i)
        total += linalg::weighted_norm_sq(w.batch(i), x.batch(i));
    return total;
}


/// Compute the weighted sum of squared differences ∑ wᵢ(xᵢ - yᵢ)² of multi-batch vectors.
///
/// Sums linalg::weighted_norm_sq_diff over corresponding batches, in batch order, starting from
/// a value-initialized total. All operands must have the same number of batches (asserted).
template <simdifiable_multi Vw, simdifiable_multi Vx, simdifiable_multi Vy>
    requires simdify_compatible<Vw, Vx, Vy>
simdified_value_t<Vw> weighted_norm_sq_difference(Vw &&w, Vx &&x, Vy &&y) {
    using value_t = simdified_value_t<Vw>;
    BATMAT_ASSERT(w.num_batches() == x.num_batches());
    BATMAT_ASSERT(w.num_batches() == y.num_batches());
    value_t total{};
    const auto n_batches = w.num_batches();
    for (index_t i = 0; i < n_batches; ++i)
        total += linalg::weighted_norm_sq_diff(w.batch(i), x.batch(i), y.batch(i));
    return total;
}


} // namespace multi


} // namespace batmat::linalg

BATMAT_ASSERT
#define BATMAT_ASSERT(x)
Definition assume.hpp:14

elementwise.hpp

guanaqo::StorageOrder
StorageOrder

batmat::linalg::norm_inf
simdified_value_t< Vx > norm_inf(Vx &&x)
Compute the infinity norm of a vector.
Definition reduce.hpp:88

batmat::linalg::norm_2_squared
simdified_value_t< Vx > norm_2_squared(Vx &&x)
Compute the squared 2-norm of a vector.
Definition reduce.hpp:100

batmat::linalg::multi::norm_2
simdified_value_t< Vx > norm_2(Vx &&x)
Compute the 2-norm of a vector.
Definition reduce.hpp:185

batmat::linalg::norm_2
simdified_value_t< Vx > norm_2(Vx &&x)
Compute the 2-norm of a vector.
Definition reduce.hpp:107

batmat::linalg::multi::norm_2_squared
simdified_value_t< Vx > norm_2_squared(Vx &&x)
Compute the squared 2-norm of a vector.
Definition reduce.hpp:176

batmat::linalg::norm_1
simdified_value_t< Vx > norm_1(Vx &&x)
Compute the 1-norm of a vector.
Definition reduce.hpp:94

batmat::linalg::multi::weighted_norm_sq
simdified_value_t< Vw > weighted_norm_sq(Vw &&w, Vx &&x)
∑ wᵢ xᵢ².
Definition reduce.hpp:204

batmat::linalg::dot
simdified_value_t< Vx > dot(Vx &&x, Vy &&y)
Compute the dot product of two vectors.
Definition reduce.hpp:115

batmat::linalg::multi::norm_1
simdified_value_t< Vx > norm_1(Vx &&x)
Compute the 1-norm of a vector.
Definition reduce.hpp:170

batmat::linalg::norms_all
norms< simdified_value_t< Vx > >::result norms_all(Vx &&x)
Compute the norms (max, 1-norm, and 2-norm) of a vector.
Definition reduce.hpp:81

batmat::linalg::multi::weighted_norm_sq_difference
simdified_value_t< Vw > weighted_norm_sq_difference(Vw &&w, Vx &&x, Vy &&y)
∑ wᵢ(xᵢ - yᵢ)².
Definition reduce.hpp:215

batmat::linalg::multi::norm_inf
simdified_value_t< Vx > norm_inf(Vx &&x)
Compute the infinity norm of a vector.
Definition reduce.hpp:164

batmat::linalg::multi::dot
simdified_value_t< Vx > dot(Vx &&x, Vy &&y)
Compute the dot product of two vectors.
Definition reduce.hpp:193

batmat::linalg::weighted_norm_sq
simdified_value_t< Vw > weighted_norm_sq(Vw &&w, Va &&a)
∑ wᵢ aᵢ².
Definition reduce.hpp:124

batmat::linalg::weighted_norm_sq_diff
simdified_value_t< Vw > weighted_norm_sq_diff(Vw &&w, Va &&a, Vb &&b)
∑ wᵢ(aᵢ - bᵢ)².
Definition reduce.hpp:133

batmat::linalg::multi::norms_all
norms< simdified_value_t< Vx > >::result norms_all(Vx &&x)
Compute the norms (max, 1-norm, and 2-norm) of a vector.
Definition reduce.hpp:155

GUANAQO_TRACE_LINALG
#define GUANAQO_TRACE_LINALG(name, gflops)

batmat::datapar::simd
stdx::simd< Tp, Abi > simd
Definition simd.hpp:102

batmat::linalg::detail
Definition compress.hpp:14

batmat::linalg
Definition compress.hpp:12

batmat::linalg::simdified_value_t
typename detail::simdified_value< V >::type simdified_value_t
Definition simdify.hpp:206

batmat::linalg::simdified_abi_t
typename detail::simdified_abi< V >::type simdified_abi_t
Definition simdify.hpp:208

batmat::linalg::simdify_compatible
constexpr bool simdify_compatible
Definition simdify.hpp:211

batmat::linalg::simdify
constexpr auto simdify(simdifiable auto &&a) -> simdified_view_t< decltype(a)>
Definition simdify.hpp:218

batmat::linalg::view
simd_view_types< std::remove_const_t< T >, Abi >::template view< T, Order > view
Definition uview.hpp:70

batmat::index_t
int index_t
Definition config.hpp:13

norms.hpp
Vector reductions.

batmat::linalg::norms
Utilities for computing vector norms.
Definition norms.hpp:26

batmat::linalg::norms::zero_simd
static result_simd zero_simd()
Definition norms.hpp:53

batmat::linalg::norms::result
typename norms< T >::result result
Accumulator.
Definition norms.hpp:28