Krita Source Code Documentation
Loading...
Searching...
No Matches
xsimd_generic_details.hpp
Go to the documentation of this file.
1/*
2 * SPDX-FileCopyrightText: 2022 L. E. Segovia <amy@amyspark.me>
3 *
4 * SPDX-License-Identifier: BSD-3-Clause
5 */
6
7#ifndef KIS_XSIMD_GENERIC_DETAILS_DECL_HPP
8#define KIS_XSIMD_GENERIC_DETAILS_DECL_HPP
9
#include <array>
#include <cstddef>
#include <cstdint>
#include <tuple>
#include <utility>
12
13namespace xsimd
14{
15/***********************
16 * Truncate-initialize *
17 ***********************/
18
19template<typename V, typename T, typename A>
20batch<T, A> truncate_to_type(batch<T, A> const &self) noexcept;
21
22/**************************
23 * Masked initializations *
24 **************************/
25
26// Mask to 0 elements of a vector.
27template<typename T, typename A>
28inline auto set_zero(const batch<T, A> &src, const batch_bool<T, A> &mask) noexcept;
29
30// Mask to 1 elements of a vector.
31template<typename T, typename A>
32inline auto set_one(const batch<T, A> &src, const batch_bool<T, A> &mask) noexcept;
33
34/**********************************
35 * Sign-extending unaligned loads *
36 **********************************/
37
38// Load `T::size` values from the array of `T2` elements.
39template<typename T, typename T2>
40inline T load_and_extend(const T2 *src) noexcept;
41
42/*************************************************
43 * Type-inferred, auto-aligned memory allocation *
44 *************************************************/
45
46// Allocate size bytes of memory aligned to `batch<T, A>::alignment()`.
47template<typename T, typename A = xsimd::current_arch>
48inline T *aligned_malloc(size_t size) noexcept;
49
50// Allocate memory for `sz` T items, aligned to the selected architecture's
51// alignment.
52template<typename T, typename A = xsimd::current_arch>
53inline T *vector_aligned_malloc(size_t sz) noexcept;
54
55// Free allocated memory, hiding the `const_cast` if necessary.
56template<typename T>
57inline void vector_aligned_free(const T *ptr) noexcept;
58
59/****************
60 * Interleaving *
61 ****************/
62
63// Return the tuple of interleaved batches `a` and `b`.
64// First element is the low half, second is the upper half.
65template<typename V>
66inline std::pair<V, V> interleave(const V &a, const V &b) noexcept;
67
68template<typename T, typename A>
69inline xsimd::batch<T, A> pow2(xsimd::batch<T, A> const &self) noexcept;
70
71namespace kernel
72{
73namespace detail
74{
75/*****************************
76 * Helpers: unary applicator *
77 *****************************/
78
79template<class F, class A, class T>
80inline batch<T, A> apply_with_value(F &&func, batch<T, A> const &self) noexcept
81{
82 alignas(A::alignment()) std::array<T, batch<T, A>::size> self_buffer;
83 self.store_aligned(self_buffer.data());
84 for (std::size_t i = 0; i < batch<T, A>::size; ++i) {
85 self_buffer[i] = func(self_buffer[i]);
86 }
87 return batch<T, A>::load_aligned(self_buffer.data());
88}
89
90template<class F, class A, class T>
91inline batch<T, A> apply_with_index_and_value(F &&func, batch<T, A> const &self) noexcept
92{
93 alignas(A::alignment()) std::array<T, batch<T, A>::size> self_buffer;
94 self.store_aligned(self_buffer.data());
95 for (std::size_t i = 0; i < batch<T, A>::size; ++i) {
96 self_buffer[i] = func(i, self_buffer[i]);
97 }
98 return batch<T, A>::load_aligned(self_buffer.data());
99}
100} // namespace kernel
101} // namespace detail
102
103}; // namespace xsimd
104
105#endif // KIS_XSIMD_GENERIC_DETAILS_DECL_HPP
batch< T, A > apply_with_index_and_value(F &&func, batch< T, A > const &self) noexcept
batch< T, A > apply_with_value(F &&func, batch< T, A > const &self) noexcept
std::pair< V, V > interleave(const V &a, const V &b) noexcept
T * vector_aligned_malloc(size_t sz) noexcept
auto set_one(const batch< T, A > &src, const batch_bool< T, A > &mask) noexcept
batch< T, A > pow2(batch< T, A > const &self) noexcept
auto set_zero(const batch< T, A > &src, const batch_bool< T, A > &mask) noexcept
void vector_aligned_free(const T *ptr) noexcept
T * aligned_malloc(size_t size) noexcept
batch< T, A > truncate_to_type(xsimd::batch< T, A > const &self) noexcept
T load_and_extend(const T2 *src) noexcept