Grok  9.5.0
Classes | Namespaces | Macros | Typedefs | Functions
arm_neon-inl.h File Reference
#include <arm_neon.h>
#include <stddef.h>
#include <stdint.h>
#include "hwy/base.h"
#include "hwy/ops/shared-inl.h"

Go to the source code of this file.

Classes

struct  hwy::HWY_NAMESPACE::detail::Raw128< uint8_t, 16 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint16_t, 8 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint32_t, 4 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint64_t, 2 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int8_t, 16 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int16_t, 8 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int32_t, 4 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int64_t, 2 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< float16_t, 8 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< bfloat16_t, 8 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< float, 4 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint8_t, 8 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint16_t, 4 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint32_t, 2 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint64_t, 1 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int8_t, 8 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int16_t, 4 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int32_t, 2 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int64_t, 1 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< float16_t, 4 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< bfloat16_t, 4 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< float, 2 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint8_t, 4 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint16_t, 2 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint32_t, 1 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int8_t, 4 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int16_t, 2 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int32_t, 1 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< float16_t, 2 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< bfloat16_t, 2 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< float, 1 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint8_t, 2 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint16_t, 1 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int8_t, 2 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int16_t, 1 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< float16_t, 1 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< bfloat16_t, 1 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< uint8_t, 1 >
 
struct  hwy::HWY_NAMESPACE::detail::Raw128< int8_t, 1 >
 
class  hwy::HWY_NAMESPACE::Vec128< T, N >
 
struct  hwy::HWY_NAMESPACE::Mask128< T, N >
 
struct  hwy::HWY_NAMESPACE::detail::DeduceD
 
struct  hwy::HWY_NAMESPACE::detail::ShiftLeftBytesT< kBytes >
 
struct  hwy::HWY_NAMESPACE::detail::ShiftLeftBytesT< 0 >
 
struct  hwy::HWY_NAMESPACE::detail::ShiftLeftBytesT< 0xFF >
 
struct  hwy::HWY_NAMESPACE::detail::ShiftRightBytesT< kBytes >
 
struct  hwy::HWY_NAMESPACE::detail::ShiftRightBytesT< 0 >
 
struct  hwy::HWY_NAMESPACE::detail::ShiftRightBytesT< 0xFF >
 
struct  hwy::HWY_NAMESPACE::Indices128< T, N >
 

Namespaces

 hwy
 
 hwy::HWY_NAMESPACE
 
 hwy::HWY_NAMESPACE::detail
 
 hwy::HWY_NAMESPACE::internal
 

Macros

#define HWY_NEON_BUILD_TPL_1
 
#define HWY_NEON_BUILD_TPL_2
 
#define HWY_NEON_BUILD_TPL_3
 
#define HWY_NEON_BUILD_RET_1(type, size)   Vec128<type, size>
 
#define HWY_NEON_BUILD_RET_2(type, size)   Vec128<type, size>
 
#define HWY_NEON_BUILD_RET_3(type, size)   Vec128<type, size>
 
#define HWY_NEON_BUILD_PARAM_1(type, size)   const Vec128<type, size> a
 
#define HWY_NEON_BUILD_PARAM_2(type, size)    const Vec128<type, size> a, const Vec128<type, size> b
 
#define HWY_NEON_BUILD_PARAM_3(type, size)
 
#define HWY_NEON_BUILD_ARG_1   a.raw
 
#define HWY_NEON_BUILD_ARG_2   a.raw, b.raw
 
#define HWY_NEON_BUILD_ARG_3   a.raw, b.raw, c.raw
 
#define HWY_NEON_EVAL(func, ...)   func(__VA_ARGS__)
 
#define HWY_NEON_DEF_FUNCTION(type, size, name, prefix, infix, suffix, args)
 
#define HWY_NEON_DEF_FUNCTION_UINT_8(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_INT_8(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_UINT_16(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_INT_16(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_UINT_32(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_INT_32(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_UINT_64(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_INT_64(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_ALL_FLOATS(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_UINT_8_16_32(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_INT_8_16_32(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_UINTS(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_INTS(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_INTS_UINTS(name, prefix, infix, args)
 
#define HWY_NEON_DEF_FUNCTION_ALL_TYPES(name, prefix, infix, args)
 
#define HWY_NEON_BUILD_TPL_HWY_CAST_TO_U8
 
#define HWY_NEON_BUILD_RET_HWY_CAST_TO_U8(type, size)    Vec128<uint8_t, size * sizeof(type)>
 
#define HWY_NEON_BUILD_PARAM_HWY_CAST_TO_U8(type, size)   Vec128<type, size> v
 
#define HWY_NEON_BUILD_ARG_HWY_CAST_TO_U8   v.raw
 
#define HWY_NEON_BUILD_TPL_HWY_SET1
 
#define HWY_NEON_BUILD_RET_HWY_SET1(type, size)   Vec128<type, size>
 
#define HWY_NEON_BUILD_PARAM_HWY_SET1(type, size)    Simd<type, size> /* tag */, const type t
 
#define HWY_NEON_BUILD_ARG_HWY_SET1   t
 
#define HWY_NEON_DEF_FUNCTION(type, size, name, prefix, infix, suffix, args)
 
#define HWY_NATIVE_POPCNT
 
#define HWY_NEON_BUILD_TPL_HWY_IF
 
#define HWY_NEON_BUILD_RET_HWY_IF(type, size)   Vec128<type, size>
 
#define HWY_NEON_BUILD_PARAM_HWY_IF(type, size)
 
#define HWY_NEON_BUILD_ARG_HWY_IF   mask.raw, yes.raw, no.raw
 
#define HWY_NEON_BUILD_TPL_HWY_COMPARE
 
#define HWY_NEON_BUILD_RET_HWY_COMPARE(type, size)   Mask128<type, size>
 
#define HWY_NEON_BUILD_PARAM_HWY_COMPARE(type, size)    const Vec128<type, size> a, const Vec128<type, size> b
 
#define HWY_NEON_BUILD_ARG_HWY_COMPARE   a.raw, b.raw
 
#define HWY_NEON_BUILD_TPL_HWY_TESTBIT
 
#define HWY_NEON_BUILD_RET_HWY_TESTBIT(type, size)   Mask128<type, size>
 
#define HWY_NEON_BUILD_PARAM_HWY_TESTBIT(type, size)    Vec128<type, size> v, Vec128<type, size> bit
 
#define HWY_NEON_BUILD_ARG_HWY_TESTBIT   v.raw, bit.raw
 

Typedefs

template<typename T >
using hwy::HWY_NAMESPACE::Full128 = Simd< T, 16/sizeof(T)>
 
template<class V >
using hwy::HWY_NAMESPACE::DFromV = decltype(detail::DeduceD()(V()))
 
template<class V >
using hwy::HWY_NAMESPACE::TFromV = TFromD< DFromV< V > >
 
template<class D >
using hwy::HWY_NAMESPACE::VFromD = decltype(Zero(D()))
 

Functions

 HWY_BEFORE_NAMESPACE ()
 
template<size_t N>
HWY_INLINE Vec128< uint8_t, N > hwy::HWY_NAMESPACE::detail::BitCastToByte (Vec128< uint8_t, N > v)
 
 hwy::HWY_NAMESPACE::detail::HWY_NEON_DEF_FUNCTION_ALL_FLOATS (BitCastToByte, vreinterpret, _u8_, HWY_CAST_TO_U8) template< size_t N > HWY_INLINE Vec128< uint8_t
 
N * hwy::HWY_NAMESPACE::detail::BitCastToByte (Vec128< float16_t, N > v)
 
template<size_t N>
HWY_INLINE Vec128< uint8_t, N *2 > hwy::HWY_NAMESPACE::detail::BitCastToByte (Vec128< bfloat16_t, N > v)
 
template<size_t N>
HWY_INLINE Vec128< uint8_t, N > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Simd< uint8_t, N >, Vec128< uint8_t, N > v)
 
template<size_t N, HWY_IF_LE64(int8_t, N) >
HWY_INLINE Vec128< int8_t, N > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Simd< int8_t, N >, Vec128< uint8_t, N > v)
 
template<size_t N, HWY_IF_LE64(uint16_t, N) >
HWY_INLINE Vec128< uint16_t, N > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Simd< uint16_t, N >, Vec128< uint8_t, N *2 > v)
 
template<size_t N, HWY_IF_LE64(int16_t, N) >
HWY_INLINE Vec128< int16_t, N > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Simd< int16_t, N >, Vec128< uint8_t, N *2 > v)
 
template<size_t N, HWY_IF_LE64(uint32_t, N) >
HWY_INLINE Vec128< uint32_t, N > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Simd< uint32_t, N >, Vec128< uint8_t, N *4 > v)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_INLINE Vec128< int32_t, N > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Simd< int32_t, N >, Vec128< uint8_t, N *4 > v)
 
template<size_t N, HWY_IF_LE64(float, N) >
HWY_INLINE Vec128< float, N > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Simd< float, N >, Vec128< uint8_t, N *4 > v)
 
HWY_INLINE Vec128< uint64_t, 1 > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Simd< uint64_t, 1 >, Vec128< uint8_t, 1 *8 > v)
 
HWY_INLINE Vec128< int64_t, 1 > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Simd< int64_t, 1 >, Vec128< uint8_t, 1 *8 > v)
 
HWY_INLINE Vec128< int8_t > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Full128< int8_t >, Vec128< uint8_t > v)
 
HWY_INLINE Vec128< uint16_t > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Full128< uint16_t >, Vec128< uint8_t > v)
 
HWY_INLINE Vec128< int16_t > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Full128< int16_t >, Vec128< uint8_t > v)
 
HWY_INLINE Vec128< uint32_t > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Full128< uint32_t >, Vec128< uint8_t > v)
 
HWY_INLINE Vec128< int32_t > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Full128< int32_t >, Vec128< uint8_t > v)
 
HWY_INLINE Vec128< float > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Full128< float >, Vec128< uint8_t > v)
 
HWY_INLINE Vec128< uint64_t > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Full128< uint64_t >, Vec128< uint8_t > v)
 
HWY_INLINE Vec128< int64_t > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Full128< int64_t >, Vec128< uint8_t > v)
 
template<size_t N>
HWY_INLINE Vec128< float16_t, N > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Simd< float16_t, N >, Vec128< uint8_t, N *2 > v)
 
template<size_t N>
HWY_INLINE Vec128< bfloat16_t, N > hwy::HWY_NAMESPACE::detail::BitCastFromByte (Simd< bfloat16_t, N >, Vec128< uint8_t, N *2 > v)
 
template<typename T , size_t N, typename FromT >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::BitCast (Simd< T, N > d, Vec128< FromT, N *sizeof(T)/sizeof(FromT)> v)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::Zero (Simd< T, N > d)
 
template<size_t N>
HWY_API Vec128< bfloat16_t, N > hwy::HWY_NAMESPACE::Zero (Simd< bfloat16_t, N > d)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::Undefined (Simd< T, N >)
 
template<typename T , size_t N, typename T2 >
Vec128< T, N > hwy::HWY_NAMESPACE::Iota (const Simd< T, N > d, const T2 first)
 
HWY_API uint8_t hwy::HWY_NAMESPACE::GetLane (const Vec128< uint8_t, 16 > v)
 
template<size_t N>
HWY_API uint8_t hwy::HWY_NAMESPACE::GetLane (const Vec128< uint8_t, N > v)
 
HWY_API int8_t hwy::HWY_NAMESPACE::GetLane (const Vec128< int8_t, 16 > v)
 
template<size_t N>
HWY_API int8_t hwy::HWY_NAMESPACE::GetLane (const Vec128< int8_t, N > v)
 
HWY_API uint16_t hwy::HWY_NAMESPACE::GetLane (const Vec128< uint16_t, 8 > v)
 
template<size_t N>
HWY_API uint16_t hwy::HWY_NAMESPACE::GetLane (const Vec128< uint16_t, N > v)
 
HWY_API int16_t hwy::HWY_NAMESPACE::GetLane (const Vec128< int16_t, 8 > v)
 
template<size_t N>
HWY_API int16_t hwy::HWY_NAMESPACE::GetLane (const Vec128< int16_t, N > v)
 
HWY_API uint32_t hwy::HWY_NAMESPACE::GetLane (const Vec128< uint32_t, 4 > v)
 
template<size_t N>
HWY_API uint32_t hwy::HWY_NAMESPACE::GetLane (const Vec128< uint32_t, N > v)
 
HWY_API int32_t hwy::HWY_NAMESPACE::GetLane (const Vec128< int32_t, 4 > v)
 
template<size_t N>
HWY_API int32_t hwy::HWY_NAMESPACE::GetLane (const Vec128< int32_t, N > v)
 
HWY_API uint64_t hwy::HWY_NAMESPACE::GetLane (const Vec128< uint64_t, 2 > v)
 
HWY_API uint64_t hwy::HWY_NAMESPACE::GetLane (const Vec128< uint64_t, 1 > v)
 
HWY_API int64_t hwy::HWY_NAMESPACE::GetLane (const Vec128< int64_t, 2 > v)
 
HWY_API int64_t hwy::HWY_NAMESPACE::GetLane (const Vec128< int64_t, 1 > v)
 
HWY_API float hwy::HWY_NAMESPACE::GetLane (const Vec128< float, 4 > v)
 
HWY_API float hwy::HWY_NAMESPACE::GetLane (const Vec128< float, 2 > v)
 
HWY_API float hwy::HWY_NAMESPACE::GetLane (const Vec128< float, 1 > v)
 
 hwy::HWY_NAMESPACE::HWY_NEON_DEF_FUNCTION_INT_8_16_32 (Neg, vneg, _, 1) HWY_API Vec128< int64_t
 
 hwy::HWY_NAMESPACE::Neg (const Vec128< int64_t, 1 > v)
 
HWY_API Vec128< int64_t > hwy::HWY_NAMESPACE::Neg (const Vec128< int64_t > v)
 
HWY_API Vec128< uint8_t > hwy::HWY_NAMESPACE::operator<< (const Vec128< uint8_t > v, const Vec128< uint8_t > bits)
 
template<size_t N, HWY_IF_LE64(uint8_t, N) >
HWY_API Vec128< uint8_t, N > hwy::HWY_NAMESPACE::operator<< (const Vec128< uint8_t, N > v, const Vec128< uint8_t, N > bits)
 
HWY_API Vec128< uint16_t > hwy::HWY_NAMESPACE::operator<< (const Vec128< uint16_t > v, const Vec128< uint16_t > bits)
 
template<size_t N, HWY_IF_LE64(uint16_t, N) >
HWY_API Vec128< uint16_t, N > hwy::HWY_NAMESPACE::operator<< (const Vec128< uint16_t, N > v, const Vec128< uint16_t, N > bits)
 
HWY_API Vec128< uint32_t > hwy::HWY_NAMESPACE::operator<< (const Vec128< uint32_t > v, const Vec128< uint32_t > bits)
 
template<size_t N, HWY_IF_LE64(uint32_t, N) >
HWY_API Vec128< uint32_t, N > hwy::HWY_NAMESPACE::operator<< (const Vec128< uint32_t, N > v, const Vec128< uint32_t, N > bits)
 
HWY_API Vec128< uint64_t > hwy::HWY_NAMESPACE::operator<< (const Vec128< uint64_t > v, const Vec128< uint64_t > bits)
 
HWY_API Vec128< uint64_t, 1 > hwy::HWY_NAMESPACE::operator<< (const Vec128< uint64_t, 1 > v, const Vec128< uint64_t, 1 > bits)
 
HWY_API Vec128< int8_t > hwy::HWY_NAMESPACE::operator<< (const Vec128< int8_t > v, const Vec128< int8_t > bits)
 
template<size_t N, HWY_IF_LE64(int8_t, N) >
HWY_API Vec128< int8_t, N > hwy::HWY_NAMESPACE::operator<< (const Vec128< int8_t, N > v, const Vec128< int8_t, N > bits)
 
HWY_API Vec128< int16_t > hwy::HWY_NAMESPACE::operator<< (const Vec128< int16_t > v, const Vec128< int16_t > bits)
 
template<size_t N, HWY_IF_LE64(int16_t, N) >
HWY_API Vec128< int16_t, N > hwy::HWY_NAMESPACE::operator<< (const Vec128< int16_t, N > v, const Vec128< int16_t, N > bits)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::operator<< (const Vec128< int32_t > v, const Vec128< int32_t > bits)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::operator<< (const Vec128< int32_t, N > v, const Vec128< int32_t, N > bits)
 
HWY_API Vec128< int64_t > hwy::HWY_NAMESPACE::operator<< (const Vec128< int64_t > v, const Vec128< int64_t > bits)
 
HWY_API Vec128< int64_t, 1 > hwy::HWY_NAMESPACE::operator<< (const Vec128< int64_t, 1 > v, const Vec128< int64_t, 1 > bits)
 
HWY_API Vec128< uint8_t > hwy::HWY_NAMESPACE::operator>> (const Vec128< uint8_t > v, const Vec128< uint8_t > bits)
 
template<size_t N, HWY_IF_LE64(uint8_t, N) >
HWY_API Vec128< uint8_t, N > hwy::HWY_NAMESPACE::operator>> (const Vec128< uint8_t, N > v, const Vec128< uint8_t, N > bits)
 
HWY_API Vec128< uint16_t > hwy::HWY_NAMESPACE::operator>> (const Vec128< uint16_t > v, const Vec128< uint16_t > bits)
 
template<size_t N, HWY_IF_LE64(uint16_t, N) >
HWY_API Vec128< uint16_t, N > hwy::HWY_NAMESPACE::operator>> (const Vec128< uint16_t, N > v, const Vec128< uint16_t, N > bits)
 
HWY_API Vec128< uint32_t > hwy::HWY_NAMESPACE::operator>> (const Vec128< uint32_t > v, const Vec128< uint32_t > bits)
 
template<size_t N, HWY_IF_LE64(uint32_t, N) >
HWY_API Vec128< uint32_t, N > hwy::HWY_NAMESPACE::operator>> (const Vec128< uint32_t, N > v, const Vec128< uint32_t, N > bits)
 
HWY_API Vec128< uint64_t > hwy::HWY_NAMESPACE::operator>> (const Vec128< uint64_t > v, const Vec128< uint64_t > bits)
 
HWY_API Vec128< uint64_t, 1 > hwy::HWY_NAMESPACE::operator>> (const Vec128< uint64_t, 1 > v, const Vec128< uint64_t, 1 > bits)
 
HWY_API Vec128< int8_t > hwy::HWY_NAMESPACE::operator>> (const Vec128< int8_t > v, const Vec128< int8_t > bits)
 
template<size_t N, HWY_IF_LE64(int8_t, N) >
HWY_API Vec128< int8_t, N > hwy::HWY_NAMESPACE::operator>> (const Vec128< int8_t, N > v, const Vec128< int8_t, N > bits)
 
HWY_API Vec128< int16_t > hwy::HWY_NAMESPACE::operator>> (const Vec128< int16_t > v, const Vec128< int16_t > bits)
 
template<size_t N, HWY_IF_LE64(int16_t, N) >
HWY_API Vec128< int16_t, N > hwy::HWY_NAMESPACE::operator>> (const Vec128< int16_t, N > v, const Vec128< int16_t, N > bits)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::operator>> (const Vec128< int32_t > v, const Vec128< int32_t > bits)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::operator>> (const Vec128< int32_t, N > v, const Vec128< int32_t, N > bits)
 
HWY_API Vec128< int64_t > hwy::HWY_NAMESPACE::operator>> (const Vec128< int64_t > v, const Vec128< int64_t > bits)
 
HWY_API Vec128< int64_t, 1 > hwy::HWY_NAMESPACE::operator>> (const Vec128< int64_t, 1 > v, const Vec128< int64_t, 1 > bits)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ShiftLeftSame (const Vec128< T, N > v, int bits)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ShiftRightSame (const Vec128< T, N > v, int bits)
 
HWY_API Vec128< uint16_t > hwy::HWY_NAMESPACE::operator* (const Vec128< uint16_t > a, const Vec128< uint16_t > b)
 
HWY_API Vec128< uint32_t > hwy::HWY_NAMESPACE::operator* (const Vec128< uint32_t > a, const Vec128< uint32_t > b)
 
template<size_t N, HWY_IF_LE64(uint16_t, N) >
HWY_API Vec128< uint16_t, N > hwy::HWY_NAMESPACE::operator* (const Vec128< uint16_t, N > a, const Vec128< uint16_t, N > b)
 
template<size_t N, HWY_IF_LE64(uint32_t, N) >
HWY_API Vec128< uint32_t, N > hwy::HWY_NAMESPACE::operator* (const Vec128< uint32_t, N > a, const Vec128< uint32_t, N > b)
 
HWY_API Vec128< int16_t > hwy::HWY_NAMESPACE::operator* (const Vec128< int16_t > a, const Vec128< int16_t > b)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::operator* (const Vec128< int32_t > a, const Vec128< int32_t > b)
 
template<size_t N, HWY_IF_LE64(uint16_t, N) >
HWY_API Vec128< int16_t, N > hwy::HWY_NAMESPACE::operator* (const Vec128< int16_t, N > a, const Vec128< int16_t, N > b)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::operator* (const Vec128< int32_t, N > a, const Vec128< int32_t, N > b)
 
HWY_API Vec128< int16_t > hwy::HWY_NAMESPACE::MulHigh (const Vec128< int16_t > a, const Vec128< int16_t > b)
 
HWY_API Vec128< uint16_t > hwy::HWY_NAMESPACE::MulHigh (const Vec128< uint16_t > a, const Vec128< uint16_t > b)
 
template<size_t N, HWY_IF_LE64(int16_t, N) >
HWY_API Vec128< int16_t, N > hwy::HWY_NAMESPACE::MulHigh (const Vec128< int16_t, N > a, const Vec128< int16_t, N > b)
 
template<size_t N, HWY_IF_LE64(uint16_t, N) >
HWY_API Vec128< uint16_t, N > hwy::HWY_NAMESPACE::MulHigh (const Vec128< uint16_t, N > a, const Vec128< uint16_t, N > b)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::ApproximateReciprocal (const Vec128< float > v)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::ApproximateReciprocal (const Vec128< float, N > v)
 
HWY_INLINE Vec128< float > hwy::HWY_NAMESPACE::detail::ReciprocalNewtonRaphsonStep (const Vec128< float > recip, const Vec128< float > divisor)
 
template<size_t N>
HWY_INLINE Vec128< float, N > hwy::HWY_NAMESPACE::detail::ReciprocalNewtonRaphsonStep (const Vec128< float, N > recip, Vec128< float, N > divisor)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::operator/ (const Vec128< float, N > a, const Vec128< float, N > b)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::AbsDiff (const Vec128< float > a, const Vec128< float > b)
 
template<size_t N, HWY_IF_LE64(float, N) >
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::AbsDiff (const Vec128< float, N > a, const Vec128< float, N > b)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::MulAdd (const Vec128< float, N > mul, const Vec128< float, N > x, const Vec128< float, N > add)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::NegMulAdd (const Vec128< float, N > mul, const Vec128< float, N > x, const Vec128< float, N > add)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::MulSub (const Vec128< float, N > mul, const Vec128< float, N > x, const Vec128< float, N > sub)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::NegMulSub (const Vec128< float, N > mul, const Vec128< float, N > x, const Vec128< float, N > sub)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::ApproximateReciprocalSqrt (const Vec128< float > v)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::ApproximateReciprocalSqrt (const Vec128< float, N > v)
 
HWY_INLINE Vec128< float > hwy::HWY_NAMESPACE::detail::ReciprocalSqrtStep (const Vec128< float > root, const Vec128< float > recip)
 
template<size_t N>
HWY_INLINE Vec128< float, N > hwy::HWY_NAMESPACE::detail::ReciprocalSqrtStep (const Vec128< float, N > root, Vec128< float, N > recip)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::Sqrt (const Vec128< float, N > v)
 
template<typename T >
HWY_API Vec128< T > hwy::HWY_NAMESPACE::Not (const Vec128< T > v)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::Not (const Vec128< T, N > v)
 
template<typename T , size_t N, HWY_IF_FLOAT(T) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::And (const Vec128< T, N > a, const Vec128< T, N > b)
 
template<typename T , size_t N, HWY_IF_NOT_FLOAT(T) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::AndNot (const Vec128< T, N > not_mask, const Vec128< T, N > mask)
 
template<typename T , size_t N, HWY_IF_FLOAT(T) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::Or (const Vec128< T, N > a, const Vec128< T, N > b)
 
template<typename T , size_t N, HWY_IF_FLOAT(T) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::Xor (const Vec128< T, N > a, const Vec128< T, N > b)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::operator& (const Vec128< T, N > a, const Vec128< T, N > b)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::operator| (const Vec128< T, N > a, const Vec128< T, N > b)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::operator^ (const Vec128< T, N > a, const Vec128< T, N > b)
 
template<typename T >
HWY_INLINE Vec128< T > hwy::HWY_NAMESPACE::detail::PopulationCount (hwy::SizeTag< 1 >, Vec128< T > v)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_INLINE Vec128< T, N > hwy::HWY_NAMESPACE::detail::PopulationCount (hwy::SizeTag< 1 >, Vec128< T, N > v)
 
template<typename T >
HWY_INLINE Vec128< T > hwy::HWY_NAMESPACE::detail::PopulationCount (hwy::SizeTag< 2 >, Vec128< T > v)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_INLINE Vec128< T, N > hwy::HWY_NAMESPACE::detail::PopulationCount (hwy::SizeTag< 2 >, Vec128< T, N > v)
 
template<typename T >
HWY_INLINE Vec128< T > hwy::HWY_NAMESPACE::detail::PopulationCount (hwy::SizeTag< 4 >, Vec128< T > v)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_INLINE Vec128< T, N > hwy::HWY_NAMESPACE::detail::PopulationCount (hwy::SizeTag< 4 >, Vec128< T, N > v)
 
template<typename T >
HWY_INLINE Vec128< T > hwy::HWY_NAMESPACE::detail::PopulationCount (hwy::SizeTag< 8 >, Vec128< T > v)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_INLINE Vec128< T, N > hwy::HWY_NAMESPACE::detail::PopulationCount (hwy::SizeTag< 8 >, Vec128< T, N > v)
 
template<typename T , size_t N, HWY_IF_NOT_FLOAT(T) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::PopulationCount (Vec128< T, N > v)
 
HWY_API Vec128< int8_t > hwy::HWY_NAMESPACE::Abs (const Vec128< int8_t > v)
 
HWY_API Vec128< int16_t > hwy::HWY_NAMESPACE::Abs (const Vec128< int16_t > v)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::Abs (const Vec128< int32_t > v)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::Abs (const Vec128< float > v)
 
template<size_t N, HWY_IF_LE64(int8_t, N) >
HWY_API Vec128< int8_t, N > hwy::HWY_NAMESPACE::Abs (const Vec128< int8_t, N > v)
 
template<size_t N, HWY_IF_LE64(int16_t, N) >
HWY_API Vec128< int16_t, N > hwy::HWY_NAMESPACE::Abs (const Vec128< int16_t, N > v)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::Abs (const Vec128< int32_t, N > v)
 
template<size_t N, HWY_IF_LE64(float, N) >
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::Abs (const Vec128< float, N > v)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::CopySign (const Vec128< T, N > magn, const Vec128< T, N > sign)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::CopySignToAbs (const Vec128< T, N > abs, const Vec128< T, N > sign)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::BroadcastSignBit (const Vec128< T, N > v)
 
template<typename T , size_t N>
HWY_API Mask128< T, N > hwy::HWY_NAMESPACE::MaskFromVec (const Vec128< T, N > v)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::VecFromMask (const Mask128< T, N > v)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::VecFromMask (Simd< T, N > d, const Mask128< T, N > v)
 
template<typename TFrom , typename TTo , size_t N>
HWY_API Mask128< TTo, N > hwy::HWY_NAMESPACE::RebindMask (Simd< TTo, N > dto, Mask128< TFrom, N > m)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::IfThenElseZero (const Mask128< T, N > mask, const Vec128< T, N > yes)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::IfThenZeroElse (const Mask128< T, N > mask, const Vec128< T, N > no)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ZeroIfNegative (Vec128< T, N > v)
 
template<typename T , size_t N>
HWY_API Mask128< T, N > hwy::HWY_NAMESPACE::Not (const Mask128< T, N > m)
 
template<typename T , size_t N>
HWY_API Mask128< T, N > hwy::HWY_NAMESPACE::And (const Mask128< T, N > a, Mask128< T, N > b)
 
template<typename T , size_t N>
HWY_API Mask128< T, N > hwy::HWY_NAMESPACE::AndNot (const Mask128< T, N > a, Mask128< T, N > b)
 
template<typename T , size_t N>
HWY_API Mask128< T, N > hwy::HWY_NAMESPACE::Or (const Mask128< T, N > a, Mask128< T, N > b)
 
template<typename T , size_t N>
HWY_API Mask128< T, N > hwy::HWY_NAMESPACE::Xor (const Mask128< T, N > a, Mask128< T, N > b)
 
HWY_API Vec128< uint32_t, 2 > hwy::HWY_NAMESPACE::Shuffle2301 (const Vec128< uint32_t, 2 > v)
 
HWY_API Vec128< int32_t, 2 > hwy::HWY_NAMESPACE::Shuffle2301 (const Vec128< int32_t, 2 > v)
 
HWY_API Vec128< float, 2 > hwy::HWY_NAMESPACE::Shuffle2301 (const Vec128< float, 2 > v)
 
HWY_API Vec128< uint32_t > hwy::HWY_NAMESPACE::Shuffle2301 (const Vec128< uint32_t > v)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::Shuffle2301 (const Vec128< int32_t > v)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::Shuffle2301 (const Vec128< float > v)
 
template<typename T , size_t N>
HWY_API Mask128< T, N > hwy::HWY_NAMESPACE::operator!= (const Vec128< T, N > a, const Vec128< T, N > b)
 
template<typename T , size_t N>
HWY_API Mask128< T, N > hwy::HWY_NAMESPACE::operator> (Vec128< T, N > a, Vec128< T, N > b)
 
template<typename T , size_t N>
HWY_API Mask128< T, N > hwy::HWY_NAMESPACE::operator>= (Vec128< T, N > a, Vec128< T, N > b)
 
template<typename T , size_t N>
HWY_API Mask128< T, N > hwy::HWY_NAMESPACE::FirstN (const Simd< T, N > d, size_t num)
 
template<size_t N>
HWY_API Mask128< uint64_t, N > hwy::HWY_NAMESPACE::TestBit (Vec128< uint64_t, N > v, Vec128< uint64_t, N > bit)
 
template<size_t N>
HWY_API Mask128< int64_t, N > hwy::HWY_NAMESPACE::TestBit (Vec128< int64_t, N > v, Vec128< int64_t, N > bit)
 
HWY_API Vec128< int64_t > hwy::HWY_NAMESPACE::Abs (const Vec128< int64_t > v)
 
HWY_API Vec128< int64_t, 1 > hwy::HWY_NAMESPACE::Abs (const Vec128< int64_t, 1 > v)
 
template<size_t N>
HWY_API Vec128< uint64_t, N > hwy::HWY_NAMESPACE::Min (const Vec128< uint64_t, N > a, const Vec128< uint64_t, N > b)
 
template<size_t N>
HWY_API Vec128< int64_t, N > hwy::HWY_NAMESPACE::Min (const Vec128< int64_t, N > a, const Vec128< int64_t, N > b)
 
template<size_t N>
HWY_API Vec128< uint64_t, N > hwy::HWY_NAMESPACE::Max (const Vec128< uint64_t, N > a, const Vec128< uint64_t, N > b)
 
template<size_t N>
HWY_API Vec128< int64_t, N > hwy::HWY_NAMESPACE::Max (const Vec128< int64_t, N > a, const Vec128< int64_t, N > b)
 
HWY_API Vec128< uint8_t > hwy::HWY_NAMESPACE::LoadU (Full128< uint8_t >, const uint8_t *HWY_RESTRICT unaligned)
 
HWY_API Vec128< uint16_t > hwy::HWY_NAMESPACE::LoadU (Full128< uint16_t >, const uint16_t *HWY_RESTRICT unaligned)
 
HWY_API Vec128< uint32_t > hwy::HWY_NAMESPACE::LoadU (Full128< uint32_t >, const uint32_t *HWY_RESTRICT unaligned)
 
HWY_API Vec128< uint64_t > hwy::HWY_NAMESPACE::LoadU (Full128< uint64_t >, const uint64_t *HWY_RESTRICT unaligned)
 
HWY_API Vec128< int8_t > hwy::HWY_NAMESPACE::LoadU (Full128< int8_t >, const int8_t *HWY_RESTRICT unaligned)
 
HWY_API Vec128< int16_t > hwy::HWY_NAMESPACE::LoadU (Full128< int16_t >, const int16_t *HWY_RESTRICT unaligned)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::LoadU (Full128< int32_t >, const int32_t *HWY_RESTRICT unaligned)
 
HWY_API Vec128< int64_t > hwy::HWY_NAMESPACE::LoadU (Full128< int64_t >, const int64_t *HWY_RESTRICT unaligned)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::LoadU (Full128< float >, const float *HWY_RESTRICT unaligned)
 
HWY_API Vec128< uint8_t, 8 > hwy::HWY_NAMESPACE::LoadU (Simd< uint8_t, 8 >, const uint8_t *HWY_RESTRICT p)
 
HWY_API Vec128< uint16_t, 4 > hwy::HWY_NAMESPACE::LoadU (Simd< uint16_t, 4 >, const uint16_t *HWY_RESTRICT p)
 
HWY_API Vec128< uint32_t, 2 > hwy::HWY_NAMESPACE::LoadU (Simd< uint32_t, 2 >, const uint32_t *HWY_RESTRICT p)
 
HWY_API Vec128< uint64_t, 1 > hwy::HWY_NAMESPACE::LoadU (Simd< uint64_t, 1 >, const uint64_t *HWY_RESTRICT p)
 
HWY_API Vec128< int8_t, 8 > hwy::HWY_NAMESPACE::LoadU (Simd< int8_t, 8 >, const int8_t *HWY_RESTRICT p)
 
HWY_API Vec128< int16_t, 4 > hwy::HWY_NAMESPACE::LoadU (Simd< int16_t, 4 >, const int16_t *HWY_RESTRICT p)
 
HWY_API Vec128< int32_t, 2 > hwy::HWY_NAMESPACE::LoadU (Simd< int32_t, 2 >, const int32_t *HWY_RESTRICT p)
 
HWY_API Vec128< int64_t, 1 > hwy::HWY_NAMESPACE::LoadU (Simd< int64_t, 1 >, const int64_t *HWY_RESTRICT p)
 
HWY_API Vec128< float, 2 > hwy::HWY_NAMESPACE::LoadU (Simd< float, 2 >, const float *HWY_RESTRICT p)
 
HWY_API Vec128< uint8_t, 4 > hwy::HWY_NAMESPACE::LoadU (Simd< uint8_t, 4 >, const uint8_t *HWY_RESTRICT p)
 
HWY_API Vec128< uint16_t, 2 > hwy::HWY_NAMESPACE::LoadU (Simd< uint16_t, 2 >, const uint16_t *HWY_RESTRICT p)
 
HWY_API Vec128< uint32_t, 1 > hwy::HWY_NAMESPACE::LoadU (Simd< uint32_t, 1 >, const uint32_t *HWY_RESTRICT p)
 
HWY_API Vec128< int8_t, 4 > hwy::HWY_NAMESPACE::LoadU (Simd< int8_t, 4 >, const int8_t *HWY_RESTRICT p)
 
HWY_API Vec128< int16_t, 2 > hwy::HWY_NAMESPACE::LoadU (Simd< int16_t, 2 >, const int16_t *HWY_RESTRICT p)
 
HWY_API Vec128< int32_t, 1 > hwy::HWY_NAMESPACE::LoadU (Simd< int32_t, 1 >, const int32_t *HWY_RESTRICT p)
 
HWY_API Vec128< float, 1 > hwy::HWY_NAMESPACE::LoadU (Simd< float, 1 >, const float *HWY_RESTRICT p)
 
HWY_API Vec128< uint8_t, 2 > hwy::HWY_NAMESPACE::LoadU (Simd< uint8_t, 2 >, const uint8_t *HWY_RESTRICT p)
 
HWY_API Vec128< uint16_t, 1 > hwy::HWY_NAMESPACE::LoadU (Simd< uint16_t, 1 >, const uint16_t *HWY_RESTRICT p)
 
HWY_API Vec128< int8_t, 2 > hwy::HWY_NAMESPACE::LoadU (Simd< int8_t, 2 >, const int8_t *HWY_RESTRICT p)
 
HWY_API Vec128< int16_t, 1 > hwy::HWY_NAMESPACE::LoadU (Simd< int16_t, 1 >, const int16_t *HWY_RESTRICT p)
 
HWY_API Vec128< uint8_t, 1 > hwy::HWY_NAMESPACE::LoadU (Simd< uint8_t, 1 > d, const uint8_t *HWY_RESTRICT p)
 
HWY_API Vec128< int8_t, 1 > hwy::HWY_NAMESPACE::LoadU (Simd< int8_t, 1 > d, const int8_t *HWY_RESTRICT p)
 
template<size_t N>
HWY_API Vec128< float16_t, N > hwy::HWY_NAMESPACE::LoadU (Simd< float16_t, N >, const float16_t *HWY_RESTRICT p)
 
template<size_t N>
HWY_API Vec128< bfloat16_t, N > hwy::HWY_NAMESPACE::LoadU (Simd< bfloat16_t, N >, const bfloat16_t *HWY_RESTRICT p)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::Load (Simd< T, N > d, const T *HWY_RESTRICT p)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::MaskedLoad (Mask128< T, N > m, Simd< T, N > d, const T *HWY_RESTRICT aligned)
 
template<typename T , size_t N, HWY_IF_LE128(T, N) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::LoadDup128 (Simd< T, N > d, const T *const HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint8_t > v, Full128< uint8_t >, uint8_t *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint16_t > v, Full128< uint16_t >, uint16_t *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint32_t > v, Full128< uint32_t >, uint32_t *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint64_t > v, Full128< uint64_t >, uint64_t *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int8_t > v, Full128< int8_t >, int8_t *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int16_t > v, Full128< int16_t >, int16_t *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int32_t > v, Full128< int32_t >, int32_t *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int64_t > v, Full128< int64_t >, int64_t *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< float > v, Full128< float >, float *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint8_t, 8 > v, Simd< uint8_t, 8 >, uint8_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint16_t, 4 > v, Simd< uint16_t, 4 >, uint16_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint32_t, 2 > v, Simd< uint32_t, 2 >, uint32_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint64_t, 1 > v, Simd< uint64_t, 1 >, uint64_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int8_t, 8 > v, Simd< int8_t, 8 >, int8_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int16_t, 4 > v, Simd< int16_t, 4 >, int16_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int32_t, 2 > v, Simd< int32_t, 2 >, int32_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int64_t, 1 > v, Simd< int64_t, 1 >, int64_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< float, 2 > v, Simd< float, 2 >, float *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint8_t, 4 > v, Simd< uint8_t, 4 >, uint8_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint16_t, 2 > v, Simd< uint16_t, 2 >, uint16_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint32_t, 1 > v, Simd< uint32_t, 1 >, uint32_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int8_t, 4 > v, Simd< int8_t, 4 >, int8_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int16_t, 2 > v, Simd< int16_t, 2 >, int16_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int32_t, 1 > v, Simd< int32_t, 1 >, int32_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< float, 1 > v, Simd< float, 1 >, float *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint8_t, 2 > v, Simd< uint8_t, 2 >, uint8_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint16_t, 1 > v, Simd< uint16_t, 1 >, uint16_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int8_t, 2 > v, Simd< int8_t, 2 >, int8_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int16_t, 1 > v, Simd< int16_t, 1 >, int16_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< uint8_t, 1 > v, Simd< uint8_t, 1 >, uint8_t *HWY_RESTRICT p)
 
HWY_API void hwy::HWY_NAMESPACE::StoreU (const Vec128< int8_t, 1 > v, Simd< int8_t, 1 >, int8_t *HWY_RESTRICT p)
 
template<size_t N>
HWY_API void hwy::HWY_NAMESPACE::StoreU (Vec128< float16_t, N > v, Simd< float16_t, N >, float16_t *HWY_RESTRICT p)
 
template<size_t N>
HWY_API void hwy::HWY_NAMESPACE::StoreU (Vec128< bfloat16_t, N > v, Simd< bfloat16_t, N >, bfloat16_t *HWY_RESTRICT p)
 
template<typename T , size_t N>
HWY_API void hwy::HWY_NAMESPACE::Store (Vec128< T, N > v, Simd< T, N > d, T *HWY_RESTRICT aligned)
 
template<typename T , size_t N>
HWY_API void hwy::HWY_NAMESPACE::Stream (const Vec128< T, N > v, Simd< T, N > d, T *HWY_RESTRICT aligned)
 
HWY_API Vec128< uint16_t > hwy::HWY_NAMESPACE::PromoteTo (Full128< uint16_t >, const Vec128< uint8_t, 8 > v)
 
HWY_API Vec128< uint32_t > hwy::HWY_NAMESPACE::PromoteTo (Full128< uint32_t >, const Vec128< uint8_t, 4 > v)
 
HWY_API Vec128< uint32_t > hwy::HWY_NAMESPACE::PromoteTo (Full128< uint32_t >, const Vec128< uint16_t, 4 > v)
 
HWY_API Vec128< uint64_t > hwy::HWY_NAMESPACE::PromoteTo (Full128< uint64_t >, const Vec128< uint32_t, 2 > v)
 
HWY_API Vec128< int16_t > hwy::HWY_NAMESPACE::PromoteTo (Full128< int16_t > d, const Vec128< uint8_t, 8 > v)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::PromoteTo (Full128< int32_t > d, const Vec128< uint8_t, 4 > v)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::PromoteTo (Full128< int32_t > d, const Vec128< uint16_t, 4 > v)
 
template<size_t N, HWY_IF_LE64(uint16_t, N) >
HWY_API Vec128< uint16_t, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< uint16_t, N >, const Vec128< uint8_t, N > v)
 
template<size_t N, HWY_IF_LE64(uint32_t, N) >
HWY_API Vec128< uint32_t, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< uint32_t, N >, const Vec128< uint8_t, N > v)
 
template<size_t N>
HWY_API Vec128< uint32_t, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< uint32_t, N >, const Vec128< uint16_t, N > v)
 
template<size_t N, HWY_IF_LE64(uint64_t, N) >
HWY_API Vec128< uint64_t, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< uint64_t, N >, const Vec128< uint32_t, N > v)
 
template<size_t N, HWY_IF_LE64(int16_t, N) >
HWY_API Vec128< int16_t, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< int16_t, N > d, const Vec128< uint8_t, N > v)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< int32_t, N >, const Vec128< uint8_t, N > v)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< int32_t, N >, const Vec128< uint16_t, N > v)
 
HWY_API Vec128< int16_t > hwy::HWY_NAMESPACE::PromoteTo (Full128< int16_t >, const Vec128< int8_t, 8 > v)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::PromoteTo (Full128< int32_t >, const Vec128< int8_t, 4 > v)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::PromoteTo (Full128< int32_t >, const Vec128< int16_t, 4 > v)
 
HWY_API Vec128< int64_t > hwy::HWY_NAMESPACE::PromoteTo (Full128< int64_t >, const Vec128< int32_t, 2 > v)
 
template<size_t N>
HWY_API Vec128< int16_t, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< int16_t, N >, const Vec128< int8_t, N > v)
 
template<size_t N>
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< int32_t, N >, const Vec128< int8_t, N > v)
 
template<size_t N>
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< int32_t, N >, const Vec128< int16_t, N > v)
 
template<size_t N>
HWY_API Vec128< int64_t, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< int64_t, N >, const Vec128< int32_t, N > v)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< float, N >, const Vec128< float16_t, N > v)
 
HWY_API Vec128< uint16_t, 4 > hwy::HWY_NAMESPACE::DemoteTo (Simd< uint16_t, 4 >, const Vec128< int32_t > v)
 
HWY_API Vec128< int16_t, 4 > hwy::HWY_NAMESPACE::DemoteTo (Simd< int16_t, 4 >, const Vec128< int32_t > v)
 
HWY_API Vec128< uint8_t, 4 > hwy::HWY_NAMESPACE::DemoteTo (Simd< uint8_t, 4 >, const Vec128< int32_t > v)
 
HWY_API Vec128< uint8_t, 8 > hwy::HWY_NAMESPACE::DemoteTo (Simd< uint8_t, 8 >, const Vec128< int16_t > v)
 
HWY_API Vec128< int8_t, 4 > hwy::HWY_NAMESPACE::DemoteTo (Simd< int8_t, 4 >, const Vec128< int32_t > v)
 
HWY_API Vec128< int8_t, 8 > hwy::HWY_NAMESPACE::DemoteTo (Simd< int8_t, 8 >, const Vec128< int16_t > v)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< uint16_t, N > hwy::HWY_NAMESPACE::DemoteTo (Simd< uint16_t, N >, const Vec128< int32_t, N > v)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< int16_t, N > hwy::HWY_NAMESPACE::DemoteTo (Simd< int16_t, N >, const Vec128< int32_t, N > v)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< uint8_t, N > hwy::HWY_NAMESPACE::DemoteTo (Simd< uint8_t, N >, const Vec128< int32_t, N > v)
 
template<size_t N, HWY_IF_LE64(int16_t, N) >
HWY_API Vec128< uint8_t, N > hwy::HWY_NAMESPACE::DemoteTo (Simd< uint8_t, N >, const Vec128< int16_t, N > v)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< int8_t, N > hwy::HWY_NAMESPACE::DemoteTo (Simd< int8_t, N >, const Vec128< int32_t, N > v)
 
template<size_t N, HWY_IF_LE64(int16_t, N) >
HWY_API Vec128< int8_t, N > hwy::HWY_NAMESPACE::DemoteTo (Simd< int8_t, N >, const Vec128< int16_t, N > v)
 
template<size_t N>
HWY_API Vec128< float16_t, N > hwy::HWY_NAMESPACE::DemoteTo (Simd< float16_t, N >, const Vec128< float, N > v)
 
template<size_t N>
HWY_API Vec128< bfloat16_t, N > hwy::HWY_NAMESPACE::DemoteTo (Simd< bfloat16_t, N > dbf16, const Vec128< float, N > v)
 
template<size_t N>
HWY_API Vec128< bfloat16_t, 2 *N > hwy::HWY_NAMESPACE::ReorderDemote2To (Simd< bfloat16_t, 2 *N > dbf16, Vec128< float, N > a, Vec128< float, N > b)
 
HWY_API Vec128< uint8_t, 4 > hwy::HWY_NAMESPACE::U8FromU32 (const Vec128< uint32_t > v)
 
template<size_t N, HWY_IF_LE64(uint32_t, N) >
HWY_API Vec128< uint8_t, N > hwy::HWY_NAMESPACE::U8FromU32 (const Vec128< uint32_t, N > v)
 
template<size_t N>
HWY_API Vec128< uint8_t, N > hwy::HWY_NAMESPACE::DemoteTo (Simd< uint8_t, N >, const Vec128< int32_t > v)
 
template<size_t N>
HWY_API Vec128< int8_t, N > hwy::HWY_NAMESPACE::DemoteTo (Simd< int8_t, N >, const Vec128< int32_t > v)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::ConvertTo (Full128< float >, const Vec128< int32_t > v)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::ConvertTo (Simd< float, N >, const Vec128< int32_t, N > v)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::ConvertTo (Full128< int32_t >, const Vec128< float > v)
 
template<size_t N, HWY_IF_LE64(float, N) >
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::ConvertTo (Simd< int32_t, N >, const Vec128< float, N > v)
 
template<size_t N>
HWY_INLINE Mask128< float, N > hwy::HWY_NAMESPACE::detail::UseInt (const Vec128< float, N > v)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::Trunc (const Vec128< float, N > v)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::Round (const Vec128< float, N > v)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::Ceil (const Vec128< float, N > v)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::Floor (const Vec128< float, N > v)
 
template<size_t N>
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::NearestInt (const Vec128< float, N > v)
 
template<typename T , size_t N, HWY_IF_LE64(uint8_t, N) >
HWY_API Vec128< T, N/2 > hwy::HWY_NAMESPACE::LowerHalf (const Vec128< T, N > v)
 
HWY_API Vec128< uint8_t, 8 > hwy::HWY_NAMESPACE::LowerHalf (const Vec128< uint8_t > v)
 
HWY_API Vec128< uint16_t, 4 > hwy::HWY_NAMESPACE::LowerHalf (const Vec128< uint16_t > v)
 
HWY_API Vec128< uint32_t, 2 > hwy::HWY_NAMESPACE::LowerHalf (const Vec128< uint32_t > v)
 
HWY_API Vec128< uint64_t, 1 > hwy::HWY_NAMESPACE::LowerHalf (const Vec128< uint64_t > v)
 
HWY_API Vec128< int8_t, 8 > hwy::HWY_NAMESPACE::LowerHalf (const Vec128< int8_t > v)
 
HWY_API Vec128< int16_t, 4 > hwy::HWY_NAMESPACE::LowerHalf (const Vec128< int16_t > v)
 
HWY_API Vec128< int32_t, 2 > hwy::HWY_NAMESPACE::LowerHalf (const Vec128< int32_t > v)
 
HWY_API Vec128< int64_t, 1 > hwy::HWY_NAMESPACE::LowerHalf (const Vec128< int64_t > v)
 
HWY_API Vec128< float, 2 > hwy::HWY_NAMESPACE::LowerHalf (const Vec128< float > v)
 
template<typename T , size_t N>
HWY_API Vec128< T, N/2 > hwy::HWY_NAMESPACE::LowerHalf (Simd< T, N/2 >, Vec128< T, N > v)
 
template<int kBytes, typename T , class V128 = Vec128<T>>
HWY_API V128 hwy::HWY_NAMESPACE::CombineShiftRightBytes (Full128< T > d, V128 hi, V128 lo)
 
template<int kBytes, typename T , class V64 = Vec128<T, 8 / sizeof(T)>>
HWY_API V64 hwy::HWY_NAMESPACE::CombineShiftRightBytes (Simd< T, 8/sizeof(T)> d, V64 hi, V64 lo)
 
template<int kBytes, typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ShiftLeftBytes (Simd< T, N >, Vec128< T, N > v)
 
template<int kBytes, typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ShiftLeftBytes (const Vec128< T, N > v)
 
template<int kLanes, typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ShiftLeftLanes (Simd< T, N > d, const Vec128< T, N > v)
 
template<int kLanes, typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ShiftLeftLanes (const Vec128< T, N > v)
 
template<int kBytes, typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ShiftRightBytes (Simd< T, N >, Vec128< T, N > v)
 
template<int kLanes, typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ShiftRightLanes (Simd< T, N > d, const Vec128< T, N > v)
 
template<int kBytes, typename T , size_t N, HWY_IF_LE32(T, N) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::CombineShiftRightBytes (Simd< T, N > d, Vec128< T, N > hi, Vec128< T, N > lo)
 
HWY_API Vec128< uint8_t, 8 > hwy::HWY_NAMESPACE::UpperHalf (Simd< uint8_t, 8 >, const Vec128< uint8_t > v)
 
HWY_API Vec128< uint16_t, 4 > hwy::HWY_NAMESPACE::UpperHalf (Simd< uint16_t, 4 >, const Vec128< uint16_t > v)
 
HWY_API Vec128< uint32_t, 2 > hwy::HWY_NAMESPACE::UpperHalf (Simd< uint32_t, 2 >, const Vec128< uint32_t > v)
 
HWY_API Vec128< uint64_t, 1 > hwy::HWY_NAMESPACE::UpperHalf (Simd< uint64_t, 1 >, const Vec128< uint64_t > v)
 
HWY_API Vec128< int8_t, 8 > hwy::HWY_NAMESPACE::UpperHalf (Simd< int8_t, 8 >, const Vec128< int8_t > v)
 
HWY_API Vec128< int16_t, 4 > hwy::HWY_NAMESPACE::UpperHalf (Simd< int16_t, 4 >, const Vec128< int16_t > v)
 
HWY_API Vec128< int32_t, 2 > hwy::HWY_NAMESPACE::UpperHalf (Simd< int32_t, 2 >, const Vec128< int32_t > v)
 
HWY_API Vec128< int64_t, 1 > hwy::HWY_NAMESPACE::UpperHalf (Simd< int64_t, 1 >, const Vec128< int64_t > v)
 
HWY_API Vec128< float, 2 > hwy::HWY_NAMESPACE::UpperHalf (Simd< float, 2 >, const Vec128< float > v)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_API Vec128< T,(N+1)/2 > hwy::HWY_NAMESPACE::UpperHalf (Half< Simd< T, N >>, Vec128< T, N > v)
 
template<int kLane>
HWY_API Vec128< uint16_t > hwy::HWY_NAMESPACE::Broadcast (const Vec128< uint16_t > v)
 
template<int kLane, size_t N, HWY_IF_LE64(uint16_t, N) >
HWY_API Vec128< uint16_t, N > hwy::HWY_NAMESPACE::Broadcast (const Vec128< uint16_t, N > v)
 
template<int kLane>
HWY_API Vec128< uint32_t > hwy::HWY_NAMESPACE::Broadcast (const Vec128< uint32_t > v)
 
template<int kLane, size_t N, HWY_IF_LE64(uint32_t, N) >
HWY_API Vec128< uint32_t, N > hwy::HWY_NAMESPACE::Broadcast (const Vec128< uint32_t, N > v)
 
template<int kLane>
HWY_API Vec128< uint64_t > hwy::HWY_NAMESPACE::Broadcast (const Vec128< uint64_t > v)
 
template<int kLane>
HWY_API Vec128< int16_t > hwy::HWY_NAMESPACE::Broadcast (const Vec128< int16_t > v)
 
template<int kLane, size_t N, HWY_IF_LE64(int16_t, N) >
HWY_API Vec128< int16_t, N > hwy::HWY_NAMESPACE::Broadcast (const Vec128< int16_t, N > v)
 
template<int kLane>
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::Broadcast (const Vec128< int32_t > v)
 
template<int kLane, size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::Broadcast (const Vec128< int32_t, N > v)
 
template<int kLane>
HWY_API Vec128< int64_t > hwy::HWY_NAMESPACE::Broadcast (const Vec128< int64_t > v)
 
template<int kLane>
HWY_API Vec128< float > hwy::HWY_NAMESPACE::Broadcast (const Vec128< float > v)
 
template<int kLane, size_t N, HWY_IF_LE64(float, N) >
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::Broadcast (const Vec128< float, N > v)
 
template<int kLane>
HWY_API Vec128< uint64_t, 1 > hwy::HWY_NAMESPACE::Broadcast (const Vec128< uint64_t, 1 > v)
 
template<int kLane>
HWY_API Vec128< int64_t, 1 > hwy::HWY_NAMESPACE::Broadcast (const Vec128< int64_t, 1 > v)
 
template<typename T , size_t N, HWY_IF_LE128(T, N) >
HWY_API Indices128< T, N > hwy::HWY_NAMESPACE::SetTableIndices (Simd< T, N > d, const int32_t *idx)
 
template<size_t N>
HWY_API Vec128< uint32_t, N > hwy::HWY_NAMESPACE::TableLookupLanes (const Vec128< uint32_t, N > v, const Indices128< uint32_t, N > idx)
 
template<size_t N>
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::TableLookupLanes (const Vec128< int32_t, N > v, const Indices128< int32_t, N > idx)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::TableLookupLanes (const Vec128< float, N > v, const Indices128< float, N > idx)
 
template<typename T >
HWY_API Vec128< T > hwy::HWY_NAMESPACE::Reverse (Full128< T >, const Vec128< T > v)
 
template<typename T >
HWY_API Vec128< T, 2 > hwy::HWY_NAMESPACE::Reverse (Simd< T, 2 >, const Vec128< T, 2 > v)
 
template<typename T >
HWY_API Vec128< T, 1 > hwy::HWY_NAMESPACE::Reverse (Simd< T, 1 >, const Vec128< T, 1 > v)
 
template<typename T >
HWY_API Vec128< T > hwy::HWY_NAMESPACE::Shuffle1032 (const Vec128< T > v)
 
template<typename T >
HWY_API Vec128< T > hwy::HWY_NAMESPACE::Shuffle01 (const Vec128< T > v)
 
template<typename T >
HWY_API Vec128< T > hwy::HWY_NAMESPACE::Shuffle0321 (const Vec128< T > v)
 
template<typename T >
HWY_API Vec128< T > hwy::HWY_NAMESPACE::Shuffle2103 (const Vec128< T > v)
 
template<typename T >
HWY_API Vec128< T > hwy::HWY_NAMESPACE::Shuffle0123 (const Vec128< T > v)
 
HWY_API Vec128< uint64_t > hwy::HWY_NAMESPACE::InterleaveLower (const Vec128< uint64_t > a, const Vec128< uint64_t > b)
 
HWY_API Vec128< int64_t > hwy::HWY_NAMESPACE::InterleaveLower (const Vec128< int64_t > a, const Vec128< int64_t > b)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::InterleaveLower (const Vec128< float > a, const Vec128< float > b)
 
template<size_t N, HWY_IF_LE64(float, N) >
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::InterleaveLower (const Vec128< float, N > a, const Vec128< float, N > b)
 
template<typename T , size_t N, HWY_IF_LE32(T, N) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::InterleaveLower (Vec128< T, N > a, Vec128< T, N > b)
 
template<typename T , size_t N, class V = Vec128<T, N>>
HWY_APIhwy::HWY_NAMESPACE::InterleaveLower (Simd< T, N >, V a, V b)
 
HWY_API Vec128< uint64_t > hwy::HWY_NAMESPACE::detail::InterleaveUpper (const Vec128< uint64_t > a, const Vec128< uint64_t > b)
 
HWY_API Vec128< int64_t > hwy::HWY_NAMESPACE::detail::InterleaveUpper (Vec128< int64_t > a, Vec128< int64_t > b)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::detail::InterleaveUpper (Vec128< float > a, Vec128< float > b)
 
HWY_API Vec128< float, 2 > hwy::HWY_NAMESPACE::detail::InterleaveUpper (const Vec128< float, 2 > a, const Vec128< float, 2 > b)
 
template<typename T , size_t N, HWY_IF_GE64(T, N) , class V = Vec128<T, N>>
HWY_APIhwy::HWY_NAMESPACE::InterleaveUpper (Simd< T, N >, V a, V b)
 
template<typename T , size_t N, class DW = RepartitionToWide<Simd<T, N>>>
HWY_API VFromD< DW > hwy::HWY_NAMESPACE::ZipLower (Vec128< T, N > a, Vec128< T, N > b)
 
template<typename T , size_t N, class D = Simd<T, N>, class DW = RepartitionToWide<D>>
HWY_API VFromD< DW > hwy::HWY_NAMESPACE::ZipLower (DW dw, Vec128< T, N > a, Vec128< T, N > b)
 
template<typename T , size_t N, class D = Simd<T, N>, class DW = RepartitionToWide<D>>
HWY_API VFromD< DW > hwy::HWY_NAMESPACE::ZipUpper (DW dw, Vec128< T, N > a, Vec128< T, N > b)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::ReorderWidenMulAccumulate (Simd< float, N > df32, Vec128< bfloat16_t, 2 *N > a, Vec128< bfloat16_t, 2 *N > b, const Vec128< float, N > sum0, Vec128< float, N > &sum1)
 
HWY_API Vec128< uint8_t > hwy::HWY_NAMESPACE::Combine (Full128< uint8_t >, Vec128< uint8_t, 8 > hi, Vec128< uint8_t, 8 > lo)
 
HWY_API Vec128< uint16_t > hwy::HWY_NAMESPACE::Combine (Full128< uint16_t >, Vec128< uint16_t, 4 > hi, Vec128< uint16_t, 4 > lo)
 
HWY_API Vec128< uint32_t > hwy::HWY_NAMESPACE::Combine (Full128< uint32_t >, Vec128< uint32_t, 2 > hi, Vec128< uint32_t, 2 > lo)
 
HWY_API Vec128< uint64_t > hwy::HWY_NAMESPACE::Combine (Full128< uint64_t >, Vec128< uint64_t, 1 > hi, Vec128< uint64_t, 1 > lo)
 
HWY_API Vec128< int8_t > hwy::HWY_NAMESPACE::Combine (Full128< int8_t >, Vec128< int8_t, 8 > hi, Vec128< int8_t, 8 > lo)
 
HWY_API Vec128< int16_t > hwy::HWY_NAMESPACE::Combine (Full128< int16_t >, Vec128< int16_t, 4 > hi, Vec128< int16_t, 4 > lo)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::Combine (Full128< int32_t >, Vec128< int32_t, 2 > hi, Vec128< int32_t, 2 > lo)
 
HWY_API Vec128< int64_t > hwy::HWY_NAMESPACE::Combine (Full128< int64_t >, Vec128< int64_t, 1 > hi, Vec128< int64_t, 1 > lo)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::Combine (Full128< float >, Vec128< float, 2 > hi, Vec128< float, 2 > lo)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::Combine (Simd< T, N > d, Vec128< T, N/2 > hi, Vec128< T, N/2 > lo)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ZeroExtendVector (Simd< T, N > d, Vec128< T, N/2 > lo)
 
template<typename T , size_t N, HWY_IF_GE64(T, N) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ConcatLowerLower (const Simd< T, N > d, Vec128< T, N > hi, Vec128< T, N > lo)
 
template<typename T , size_t N, HWY_IF_GE64(T, N) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ConcatUpperUpper (const Simd< T, N > d, Vec128< T, N > hi, Vec128< T, N > lo)
 
template<typename T , size_t N, HWY_IF_GE64(T, N) >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ConcatLowerUpper (const Simd< T, N > d, Vec128< T, N > hi, Vec128< T, N > lo)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ConcatUpperLower (Simd< T, N > d, Vec128< T, N > hi, Vec128< T, N > lo)
 
HWY_API Vec128< uint32_t > hwy::HWY_NAMESPACE::ConcatOdd (Full128< uint32_t >, Vec128< uint32_t > hi, Vec128< uint32_t > lo)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::ConcatOdd (Full128< int32_t >, Vec128< int32_t > hi, Vec128< int32_t > lo)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::ConcatOdd (Full128< float >, Vec128< float > hi, Vec128< float > lo)
 
template<size_t N, HWY_IF_LE64(uint32_t, N) >
HWY_API Vec128< uint32_t, N > hwy::HWY_NAMESPACE::ConcatOdd (Simd< uint32_t, N >, Vec128< uint32_t, N > hi, Vec128< uint32_t, N > lo)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::ConcatOdd (Simd< int32_t, N >, Vec128< int32_t, N > hi, Vec128< int32_t, N > lo)
 
template<size_t N, HWY_IF_LE64(float, N) >
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::ConcatOdd (Simd< float, N >, Vec128< float, N > hi, Vec128< float, N > lo)
 
template<typename T , HWY_IF_LANE_SIZE(T, 8) >
HWY_API Vec128< T > hwy::HWY_NAMESPACE::ConcatOdd (Full128< T > d, Vec128< T > hi, Vec128< T > lo)
 
HWY_API Vec128< uint32_t > hwy::HWY_NAMESPACE::ConcatEven (Full128< uint32_t >, Vec128< uint32_t > hi, Vec128< uint32_t > lo)
 
HWY_API Vec128< int32_t > hwy::HWY_NAMESPACE::ConcatEven (Full128< int32_t >, Vec128< int32_t > hi, Vec128< int32_t > lo)
 
HWY_API Vec128< float > hwy::HWY_NAMESPACE::ConcatEven (Full128< float >, Vec128< float > hi, Vec128< float > lo)
 
template<size_t N, HWY_IF_LE64(uint32_t, N) >
HWY_API Vec128< uint32_t, N > hwy::HWY_NAMESPACE::ConcatEven (Simd< uint32_t, N >, Vec128< uint32_t, N > hi, Vec128< uint32_t, N > lo)
 
template<size_t N, HWY_IF_LE64(int32_t, N) >
HWY_API Vec128< int32_t, N > hwy::HWY_NAMESPACE::ConcatEven (Simd< int32_t, N >, Vec128< int32_t, N > hi, Vec128< int32_t, N > lo)
 
template<size_t N, HWY_IF_LE64(float, N) >
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::ConcatEven (Simd< float, N >, Vec128< float, N > hi, Vec128< float, N > lo)
 
template<typename T , HWY_IF_LANE_SIZE(T, 8) >
HWY_API Vec128< T > hwy::HWY_NAMESPACE::ConcatEven (Full128< T > d, Vec128< T > hi, Vec128< T > lo)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::OddEven (const Vec128< T, N > a, const Vec128< T, N > b)
 
template<size_t N>
HWY_API Vec128< float, N > hwy::HWY_NAMESPACE::PromoteTo (Simd< float, N > df32, const Vec128< bfloat16_t, N > v)
 
HWY_API Vec128< int64_t > hwy::HWY_NAMESPACE::MulEven (Vec128< int32_t > a, Vec128< int32_t > b)
 
HWY_API Vec128< uint64_t > hwy::HWY_NAMESPACE::MulEven (Vec128< uint32_t > a, Vec128< uint32_t > b)
 
template<size_t N>
HWY_API Vec128< int64_t,(N+1)/2 > hwy::HWY_NAMESPACE::MulEven (const Vec128< int32_t, N > a, const Vec128< int32_t, N > b)
 
template<size_t N>
HWY_API Vec128< uint64_t,(N+1)/2 > hwy::HWY_NAMESPACE::MulEven (const Vec128< uint32_t, N > a, const Vec128< uint32_t, N > b)
 
HWY_INLINE Vec128< uint64_t > hwy::HWY_NAMESPACE::MulEven (Vec128< uint64_t > a, Vec128< uint64_t > b)
 
HWY_INLINE Vec128< uint64_t > hwy::HWY_NAMESPACE::MulOdd (Vec128< uint64_t > a, Vec128< uint64_t > b)
 
template<typename T , typename TI >
HWY_API Vec128< TI > hwy::HWY_NAMESPACE::TableLookupBytes (const Vec128< T > bytes, const Vec128< TI > from)
 
template<typename T , typename TI , size_t NI, HWY_IF_LE64(TI, NI) >
HWY_API Vec128< TI, NI > hwy::HWY_NAMESPACE::TableLookupBytes (const Vec128< T > bytes, const Vec128< TI, NI > from)
 
template<typename T , size_t N, typename TI , HWY_IF_LE64(T, N) >
HWY_API Vec128< TI > hwy::HWY_NAMESPACE::TableLookupBytes (const Vec128< T, N > bytes, const Vec128< TI > from)
 
template<typename T , size_t N, typename TI , size_t NI, HWY_IF_LE64(T, N) , HWY_IF_LE64(TI, NI) >
HWY_API VFromD< Repartition< T, Simd< TI, NI > > > hwy::HWY_NAMESPACE::TableLookupBytes (Vec128< T, N > bytes, Vec128< TI, NI > from)
 
template<class V , class VI >
HWY_API VI hwy::HWY_NAMESPACE::TableLookupBytesOr0 (const V bytes, const VI from)
 
template<typename T , size_t N, typename Offset , HWY_IF_LE128(T, N) >
HWY_API void hwy::HWY_NAMESPACE::ScatterOffset (Vec128< T, N > v, Simd< T, N > d, T *HWY_RESTRICT base, const Vec128< Offset, N > offset)
 
template<typename T , size_t N, typename Index , HWY_IF_LE128(T, N) >
HWY_API void hwy::HWY_NAMESPACE::ScatterIndex (Vec128< T, N > v, Simd< T, N > d, T *HWY_RESTRICT base, const Vec128< Index, N > index)
 
template<typename T , size_t N, typename Offset >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::GatherOffset (const Simd< T, N > d, const T *HWY_RESTRICT base, const Vec128< Offset, N > offset)
 
template<typename T , size_t N, typename Index >
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::GatherIndex (const Simd< T, N > d, const T *HWY_RESTRICT base, const Vec128< Index, N > index)
 
template<typename T >
HWY_INLINE Vec128< T, 1 > hwy::HWY_NAMESPACE::detail::SumOfLanes (const Vec128< T, 1 > v)
 
template<typename T >
HWY_INLINE Vec128< T, 1 > hwy::HWY_NAMESPACE::detail::MinOfLanes (hwy::SizeTag< sizeof(T)>, const Vec128< T, 1 > v)
 
template<typename T >
HWY_INLINE Vec128< T, 1 > hwy::HWY_NAMESPACE::detail::MaxOfLanes (hwy::SizeTag< sizeof(T)>, const Vec128< T, 1 > v)
 
template<typename T , HWY_IF_LANE_SIZE(T, 4) >
HWY_INLINE Vec128< T, 2 > hwy::HWY_NAMESPACE::detail::SumOfLanes (const Vec128< T, 2 > v10)
 
template<typename T >
HWY_INLINE Vec128< T, 2 > hwy::HWY_NAMESPACE::detail::MinOfLanes (hwy::SizeTag< 4 >, const Vec128< T, 2 > v10)
 
template<typename T >
HWY_INLINE Vec128< T, 2 > hwy::HWY_NAMESPACE::detail::MaxOfLanes (hwy::SizeTag< 4 >, const Vec128< T, 2 > v10)
 
HWY_INLINE Vec128< uint32_t > hwy::HWY_NAMESPACE::detail::SumOfLanes (const Vec128< uint32_t > v)
 
HWY_INLINE Vec128< int32_t > hwy::HWY_NAMESPACE::detail::SumOfLanes (const Vec128< int32_t > v)
 
HWY_INLINE Vec128< float > hwy::HWY_NAMESPACE::detail::SumOfLanes (const Vec128< float > v)
 
HWY_INLINE Vec128< uint64_t > hwy::HWY_NAMESPACE::detail::SumOfLanes (const Vec128< uint64_t > v)
 
HWY_INLINE Vec128< int64_t > hwy::HWY_NAMESPACE::detail::SumOfLanes (const Vec128< int64_t > v)
 
template<typename T >
HWY_INLINE Vec128< T > hwy::HWY_NAMESPACE::detail::MinOfLanes (hwy::SizeTag< 4 >, const Vec128< T > v3210)
 
template<typename T >
HWY_INLINE Vec128< T > hwy::HWY_NAMESPACE::detail::MaxOfLanes (hwy::SizeTag< 4 >, const Vec128< T > v3210)
 
template<typename T >
HWY_INLINE Vec128< T > hwy::HWY_NAMESPACE::detail::MinOfLanes (hwy::SizeTag< 8 >, const Vec128< T > v10)
 
template<typename T >
HWY_INLINE Vec128< T > hwy::HWY_NAMESPACE::detail::MaxOfLanes (hwy::SizeTag< 8 >, const Vec128< T > v10)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::SumOfLanes (Simd< T, N >, const Vec128< T, N > v)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::MinOfLanes (Simd< T, N >, const Vec128< T, N > v)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::MaxOfLanes (Simd< T, N >, const Vec128< T, N > v)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_INLINE Vec128< T, N > hwy::HWY_NAMESPACE::detail::Set64 (Simd< T, N >, uint64_t mask_bits)
 
template<typename T >
HWY_INLINE Vec128< T > hwy::HWY_NAMESPACE::detail::Set64 (Full128< T > d, uint64_t mask_bits)
 
template<typename T , size_t N, HWY_IF_LANE_SIZE(T, 1) >
HWY_INLINE Mask128< T, N > hwy::HWY_NAMESPACE::detail::LoadMaskBits (Simd< T, N > d, uint64_t mask_bits)
 
template<typename T , size_t N, HWY_IF_LE128(T, N) >
HWY_API Mask128< T, N > hwy::HWY_NAMESPACE::LoadMaskBits (Simd< T, N > d, const uint8_t *HWY_RESTRICT bits)
 
template<typename T >
HWY_INLINE uint64_t hwy::HWY_NAMESPACE::detail::BitsFromMask (hwy::SizeTag< 1 >, const Mask128< T > mask)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_INLINE uint64_t hwy::HWY_NAMESPACE::detail::BitsFromMask (hwy::SizeTag< 1 >, const Mask128< T, N > mask)
 
template<typename T >
HWY_INLINE uint64_t hwy::HWY_NAMESPACE::detail::BitsFromMask (hwy::SizeTag< 2 >, const Mask128< T > mask)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_INLINE uint64_t hwy::HWY_NAMESPACE::detail::BitsFromMask (hwy::SizeTag< 2 >, const Mask128< T, N > mask)
 
template<typename T >
HWY_INLINE uint64_t hwy::HWY_NAMESPACE::detail::BitsFromMask (hwy::SizeTag< 4 >, const Mask128< T > mask)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_INLINE uint64_t hwy::HWY_NAMESPACE::detail::BitsFromMask (hwy::SizeTag< 4 >, const Mask128< T, N > mask)
 
template<typename T >
HWY_INLINE uint64_t hwy::HWY_NAMESPACE::detail::BitsFromMask (hwy::SizeTag< 8 >, const Mask128< T > m)
 
template<typename T >
HWY_INLINE uint64_t hwy::HWY_NAMESPACE::detail::BitsFromMask (hwy::SizeTag< 8 >, const Mask128< T, 1 > m)
 
template<typename T , size_t N>
constexpr uint64_t hwy::HWY_NAMESPACE::detail::OnlyActive (uint64_t bits)
 
template<typename T , size_t N>
HWY_INLINE uint64_t hwy::HWY_NAMESPACE::detail::BitsFromMask (const Mask128< T, N > mask)
 
template<typename T >
HWY_INLINE size_t hwy::HWY_NAMESPACE::detail::CountTrue (hwy::SizeTag< 1 >, const Mask128< T > mask)
 
template<typename T >
HWY_INLINE size_t hwy::HWY_NAMESPACE::detail::CountTrue (hwy::SizeTag< 2 >, const Mask128< T > mask)
 
template<typename T >
HWY_INLINE size_t hwy::HWY_NAMESPACE::detail::CountTrue (hwy::SizeTag< 4 >, const Mask128< T > mask)
 
template<typename T >
HWY_INLINE size_t hwy::HWY_NAMESPACE::detail::CountTrue (hwy::SizeTag< 8 >, const Mask128< T > mask)
 
template<typename T >
HWY_API size_t hwy::HWY_NAMESPACE::CountTrue (Full128< T >, const Mask128< T > mask)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_API size_t hwy::HWY_NAMESPACE::CountTrue (Simd< T, N >, const Mask128< T, N > mask)
 
template<typename T , size_t N>
HWY_API intptr_t hwy::HWY_NAMESPACE::FindFirstTrue (const Simd< T, N >, const Mask128< T, N > mask)
 
template<typename T , size_t N>
HWY_API size_t hwy::HWY_NAMESPACE::StoreMaskBits (Simd< T, N >, const Mask128< T, N > mask, uint8_t *bits)
 
template<typename T >
HWY_API bool hwy::HWY_NAMESPACE::AllFalse (const Full128< T > d, const Mask128< T > m)
 
template<typename T , size_t N, HWY_IF_LE64(T, N) >
HWY_API bool hwy::HWY_NAMESPACE::AllFalse (const Simd< T, N >, const Mask128< T, N > m)
 
template<typename T , size_t N>
HWY_API bool hwy::HWY_NAMESPACE::AllTrue (const Simd< T, N > d, const Mask128< T, N > m)
 
HWY_INLINE Vec128< uint8_t > hwy::HWY_NAMESPACE::detail::Load8Bytes (Full128< uint8_t >, const uint8_t *bytes)
 
template<size_t N, HWY_IF_LE64(uint8_t, N) >
HWY_INLINE Vec128< uint8_t, N > hwy::HWY_NAMESPACE::detail::Load8Bytes (Simd< uint8_t, N > d, const uint8_t *bytes)
 
template<typename T , size_t N>
HWY_INLINE Vec128< T, N > hwy::HWY_NAMESPACE::detail::IdxFromBits (hwy::SizeTag< 2 >, const uint64_t mask_bits)
 
template<typename T , size_t N>
HWY_INLINE Vec128< T, N > hwy::HWY_NAMESPACE::detail::IdxFromBits (hwy::SizeTag< 4 >, const uint64_t mask_bits)
 
template<typename T , size_t N>
HWY_INLINE Vec128< T, N > hwy::HWY_NAMESPACE::detail::Compress (Vec128< T, N > v, const uint64_t mask_bits)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::Compress (Vec128< T, N > v, const Mask128< T, N > mask)
 
template<typename T , size_t N>
HWY_INLINE Vec128< T, N > hwy::HWY_NAMESPACE::CompressBits (Vec128< T, N > v, const uint8_t *HWY_RESTRICT bits)
 
template<typename T , size_t N>
HWY_API size_t hwy::HWY_NAMESPACE::CompressStore (Vec128< T, N > v, const Mask128< T, N > mask, Simd< T, N > d, T *HWY_RESTRICT unaligned)
 
template<typename T , size_t N>
HWY_API size_t hwy::HWY_NAMESPACE::CompressBitsStore (Vec128< T, N > v, const uint8_t *HWY_RESTRICT bits, Simd< T, N > d, T *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreInterleaved3 (const Vec128< uint8_t > v0, const Vec128< uint8_t > v1, const Vec128< uint8_t > v2, Full128< uint8_t >, uint8_t *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreInterleaved3 (const Vec128< uint8_t, 8 > v0, const Vec128< uint8_t, 8 > v1, const Vec128< uint8_t, 8 > v2, Simd< uint8_t, 8 >, uint8_t *HWY_RESTRICT unaligned)
 
template<size_t N, HWY_IF_LE32(uint8_t, N) >
HWY_API void hwy::HWY_NAMESPACE::StoreInterleaved3 (const Vec128< uint8_t, N > v0, const Vec128< uint8_t, N > v1, const Vec128< uint8_t, N > v2, Simd< uint8_t, N >, uint8_t *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreInterleaved4 (const Vec128< uint8_t > v0, const Vec128< uint8_t > v1, const Vec128< uint8_t > v2, const Vec128< uint8_t > v3, Full128< uint8_t >, uint8_t *HWY_RESTRICT unaligned)
 
HWY_API void hwy::HWY_NAMESPACE::StoreInterleaved4 (const Vec128< uint8_t, 8 > v0, const Vec128< uint8_t, 8 > v1, const Vec128< uint8_t, 8 > v2, const Vec128< uint8_t, 8 > v3, Simd< uint8_t, 8 >, uint8_t *HWY_RESTRICT unaligned)
 
template<size_t N, HWY_IF_LE32(uint8_t, N) >
HWY_API void hwy::HWY_NAMESPACE::StoreInterleaved4 (const Vec128< uint8_t, N > v0, const Vec128< uint8_t, N > v1, const Vec128< uint8_t, N > v2, const Vec128< uint8_t, N > v3, Simd< uint8_t, N >, uint8_t *HWY_RESTRICT unaligned)
 
template<typename T , size_t N>
HWY_API size_t hwy::HWY_NAMESPACE::StoreMaskBits (const Mask128< T, N > mask, uint8_t *bits)
 
template<typename T , size_t N>
HWY_API bool hwy::HWY_NAMESPACE::AllTrue (const Mask128< T, N > mask)
 
template<typename T , size_t N>
HWY_API bool hwy::HWY_NAMESPACE::AllFalse (const Mask128< T, N > mask)
 
template<typename T , size_t N>
HWY_API size_t hwy::HWY_NAMESPACE::CountTrue (const Mask128< T, N > mask)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::SumOfLanes (const Vec128< T, N > v)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::MinOfLanes (const Vec128< T, N > v)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::MaxOfLanes (const Vec128< T, N > v)
 
template<typename T , size_t N>
HWY_API Vec128< T,(N+1)/2 > hwy::HWY_NAMESPACE::UpperHalf (Vec128< T, N > v)
 
template<int kBytes, typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ShiftRightBytes (const Vec128< T, N > v)
 
template<int kLanes, typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ShiftRightLanes (const Vec128< T, N > v)
 
template<size_t kBytes, typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::CombineShiftRightBytes (Vec128< T, N > hi, Vec128< T, N > lo)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::InterleaveUpper (Vec128< T, N > a, Vec128< T, N > b)
 
template<typename T , size_t N, class D = Simd<T, N>>
HWY_API VFromD< RepartitionToWide< D > > hwy::HWY_NAMESPACE::ZipUpper (Vec128< T, N > a, Vec128< T, N > b)
 
template<typename T , size_t N2>
HWY_API Vec128< T, N2 *2 > hwy::HWY_NAMESPACE::Combine (Vec128< T, N2 > hi2, Vec128< T, N2 > lo2)
 
template<typename T , size_t N2, HWY_IF_LE64(T, N2) >
HWY_API Vec128< T, N2 *2 > hwy::HWY_NAMESPACE::ZeroExtendVector (Vec128< T, N2 > lo)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ConcatLowerLower (Vec128< T, N > hi, Vec128< T, N > lo)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ConcatUpperUpper (Vec128< T, N > hi, Vec128< T, N > lo)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ConcatLowerUpper (const Vec128< T, N > hi, const Vec128< T, N > lo)
 
template<typename T , size_t N>
HWY_API Vec128< T, N > hwy::HWY_NAMESPACE::ConcatUpperLower (Vec128< T, N > hi, Vec128< T, N > lo)
 
template<class V >
HWY_APIhwy::HWY_NAMESPACE::Add (V a, V b)
 
template<class V >
HWY_APIhwy::HWY_NAMESPACE::Sub (V a, V b)
 
template<class V >
HWY_APIhwy::HWY_NAMESPACE::Mul (V a, V b)
 
template<class V >
HWY_APIhwy::HWY_NAMESPACE::Div (V a, V b)
 
template<class V >
hwy::HWY_NAMESPACE::Shl (V a, V b)
 
template<class V >
hwy::HWY_NAMESPACE::Shr (V a, V b)
 
template<class V >
HWY_API auto hwy::HWY_NAMESPACE::Eq (V a, V b) -> decltype(a==b)
 
template<class V >
HWY_API auto hwy::HWY_NAMESPACE::Ne (V a, V b) -> decltype(a==b)
 
template<class V >
HWY_API auto hwy::HWY_NAMESPACE::Lt (V a, V b) -> decltype(a==b)
 
template<class V >
HWY_API auto hwy::HWY_NAMESPACE::Gt (V a, V b) -> decltype(a==b)
 
template<class V >
HWY_API auto hwy::HWY_NAMESPACE::Ge (V a, V b) -> decltype(a==b)
 
template<class V >
HWY_API auto hwy::HWY_NAMESPACE::Le (V a, V b) -> decltype(a==b)
 
 HWY_AFTER_NAMESPACE ()
 

Macro Definition Documentation

◆ HWY_NATIVE_POPCNT

#define HWY_NATIVE_POPCNT

◆ HWY_NEON_BUILD_ARG_1

#define HWY_NEON_BUILD_ARG_1   a.raw

◆ HWY_NEON_BUILD_ARG_2

#define HWY_NEON_BUILD_ARG_2   a.raw, b.raw

◆ HWY_NEON_BUILD_ARG_3

#define HWY_NEON_BUILD_ARG_3   a.raw, b.raw, c.raw

◆ HWY_NEON_BUILD_ARG_HWY_CAST_TO_U8

#define HWY_NEON_BUILD_ARG_HWY_CAST_TO_U8   v.raw

◆ HWY_NEON_BUILD_ARG_HWY_COMPARE

#define HWY_NEON_BUILD_ARG_HWY_COMPARE   a.raw, b.raw

◆ HWY_NEON_BUILD_ARG_HWY_IF

#define HWY_NEON_BUILD_ARG_HWY_IF   mask.raw, yes.raw, no.raw

◆ HWY_NEON_BUILD_ARG_HWY_SET1

#define HWY_NEON_BUILD_ARG_HWY_SET1   t

◆ HWY_NEON_BUILD_ARG_HWY_TESTBIT

#define HWY_NEON_BUILD_ARG_HWY_TESTBIT   v.raw, bit.raw

◆ HWY_NEON_BUILD_PARAM_1

#define HWY_NEON_BUILD_PARAM_1 (   type,
  size 
)    const Vec128<type, size> a

◆ HWY_NEON_BUILD_PARAM_2

#define HWY_NEON_BUILD_PARAM_2 (   type,
  size 
)     const Vec128<type, size> a, const Vec128<type, size> b

◆ HWY_NEON_BUILD_PARAM_3

#define HWY_NEON_BUILD_PARAM_3 (   type,
  size 
)
Value:
const Vec128<type, size> a, const Vec128<type, size> b, \
const Vec128<type, size> c

◆ HWY_NEON_BUILD_PARAM_HWY_CAST_TO_U8

#define HWY_NEON_BUILD_PARAM_HWY_CAST_TO_U8 (   type,
  size 
)    Vec128<type, size> v

◆ HWY_NEON_BUILD_PARAM_HWY_COMPARE

#define HWY_NEON_BUILD_PARAM_HWY_COMPARE (   type,
  size 
)     const Vec128<type, size> a, const Vec128<type, size> b

◆ HWY_NEON_BUILD_PARAM_HWY_IF

#define HWY_NEON_BUILD_PARAM_HWY_IF (   type,
  size 
)
Value:
const Mask128<type, size> mask, const Vec128<type, size> yes, \
const Vec128<type, size> no

◆ HWY_NEON_BUILD_PARAM_HWY_SET1

#define HWY_NEON_BUILD_PARAM_HWY_SET1 (   type,
  size 
)     Simd<type, size> /* tag */, const type t

◆ HWY_NEON_BUILD_PARAM_HWY_TESTBIT

#define HWY_NEON_BUILD_PARAM_HWY_TESTBIT (   type,
  size 
)     Vec128<type, size> v, Vec128<type, size> bit

◆ HWY_NEON_BUILD_RET_1

#define HWY_NEON_BUILD_RET_1 (   type,
  size 
)    Vec128<type, size>

◆ HWY_NEON_BUILD_RET_2

#define HWY_NEON_BUILD_RET_2 (   type,
  size 
)    Vec128<type, size>

◆ HWY_NEON_BUILD_RET_3

#define HWY_NEON_BUILD_RET_3 (   type,
  size 
)    Vec128<type, size>

◆ HWY_NEON_BUILD_RET_HWY_CAST_TO_U8

#define HWY_NEON_BUILD_RET_HWY_CAST_TO_U8 (   type,
  size 
)     Vec128<uint8_t, size * sizeof(type)>

◆ HWY_NEON_BUILD_RET_HWY_COMPARE

#define HWY_NEON_BUILD_RET_HWY_COMPARE (   type,
  size 
)    Mask128<type, size>

◆ HWY_NEON_BUILD_RET_HWY_IF

#define HWY_NEON_BUILD_RET_HWY_IF (   type,
  size 
)    Vec128<type, size>

◆ HWY_NEON_BUILD_RET_HWY_SET1

#define HWY_NEON_BUILD_RET_HWY_SET1 (   type,
  size 
)    Vec128<type, size>

◆ HWY_NEON_BUILD_RET_HWY_TESTBIT

#define HWY_NEON_BUILD_RET_HWY_TESTBIT (   type,
  size 
)    Mask128<type, size>

◆ HWY_NEON_BUILD_TPL_1

#define HWY_NEON_BUILD_TPL_1

◆ HWY_NEON_BUILD_TPL_2

#define HWY_NEON_BUILD_TPL_2

◆ HWY_NEON_BUILD_TPL_3

#define HWY_NEON_BUILD_TPL_3

◆ HWY_NEON_BUILD_TPL_HWY_CAST_TO_U8

#define HWY_NEON_BUILD_TPL_HWY_CAST_TO_U8

◆ HWY_NEON_BUILD_TPL_HWY_COMPARE

#define HWY_NEON_BUILD_TPL_HWY_COMPARE

◆ HWY_NEON_BUILD_TPL_HWY_IF

#define HWY_NEON_BUILD_TPL_HWY_IF

◆ HWY_NEON_BUILD_TPL_HWY_SET1

#define HWY_NEON_BUILD_TPL_HWY_SET1

◆ HWY_NEON_BUILD_TPL_HWY_TESTBIT

#define HWY_NEON_BUILD_TPL_HWY_TESTBIT

◆ HWY_NEON_DEF_FUNCTION [1/2]

#define HWY_NEON_DEF_FUNCTION (   type,
  size,
  name,
  prefix,
  infix,
  suffix,
  args 
)
Value:
HWY_CONCAT(HWY_NEON_BUILD_TPL_, args) \
HWY_API HWY_CONCAT(HWY_NEON_BUILD_RET_, args)(type, size) \
name(HWY_CONCAT(HWY_NEON_BUILD_PARAM_, args)(type, size)) { \
return HWY_CONCAT(HWY_NEON_BUILD_RET_, args)(type, size)( \
HWY_NEON_EVAL(prefix##infix##suffix, HWY_NEON_BUILD_ARG_##args)); \
}
#define HWY_NEON_EVAL(func,...)
Definition: arm_neon-inl.h:68
#define HWY_CONCAT(a, b)
Definition: base.h:120

◆ HWY_NEON_DEF_FUNCTION [2/2]

#define HWY_NEON_DEF_FUNCTION (   type,
  size,
  name,
  prefix,
  infix,
  suffix,
  args 
)
Value:
template <int kBits> \
HWY_API Vec128<type, size> name(const Vec128<type, size> v) { \
return kBits == 0 ? v \
: Vec128<type, size>(HWY_NEON_EVAL( \
prefix##infix##suffix, v.raw, HWY_MAX(1, kBits))); \
}
#define HWY_MAX(a, b)
Definition: base.h:123

◆ HWY_NEON_DEF_FUNCTION_ALL_FLOATS

#define HWY_NEON_DEF_FUNCTION_ALL_FLOATS (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION(float, 4, name, prefix##q, infix, f32, args) \
HWY_NEON_DEF_FUNCTION(float, 2, name, prefix, infix, f32, args) \
HWY_NEON_DEF_FUNCTION(float, 1, name, prefix, infix, f32, args)
#define HWY_NEON_DEF_FUNCTION(type, size, name, prefix, infix, suffix, args)
Definition: arm_neon-inl.h:887

◆ HWY_NEON_DEF_FUNCTION_ALL_TYPES

#define HWY_NEON_DEF_FUNCTION_ALL_TYPES (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION_INTS_UINTS(name, prefix, infix, args) \
HWY_NEON_DEF_FUNCTION_ALL_FLOATS(name, prefix, infix, args)
#define HWY_NEON_DEF_FUNCTION_INTS_UINTS(name, prefix, infix, args)
Definition: arm_neon-inl.h:179

◆ HWY_NEON_DEF_FUNCTION_INT_16

#define HWY_NEON_DEF_FUNCTION_INT_16 (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION(int16_t, 8, name, prefix##q, infix, s16, args) \
HWY_NEON_DEF_FUNCTION(int16_t, 4, name, prefix, infix, s16, args) \
HWY_NEON_DEF_FUNCTION(int16_t, 2, name, prefix, infix, s16, args) \
HWY_NEON_DEF_FUNCTION(int16_t, 1, name, prefix, infix, s16, args)

◆ HWY_NEON_DEF_FUNCTION_INT_32

#define HWY_NEON_DEF_FUNCTION_INT_32 (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION(int32_t, 4, name, prefix##q, infix, s32, args) \
HWY_NEON_DEF_FUNCTION(int32_t, 2, name, prefix, infix, s32, args) \
HWY_NEON_DEF_FUNCTION(int32_t, 1, name, prefix, infix, s32, args)

◆ HWY_NEON_DEF_FUNCTION_INT_64

#define HWY_NEON_DEF_FUNCTION_INT_64 (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION(int64_t, 2, name, prefix##q, infix, s64, args) \
HWY_NEON_DEF_FUNCTION(int64_t, 1, name, prefix, infix, s64, args)

◆ HWY_NEON_DEF_FUNCTION_INT_8

#define HWY_NEON_DEF_FUNCTION_INT_8 (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION(int8_t, 16, name, prefix##q, infix, s8, args) \
HWY_NEON_DEF_FUNCTION(int8_t, 8, name, prefix, infix, s8, args) \
HWY_NEON_DEF_FUNCTION(int8_t, 4, name, prefix, infix, s8, args) \
HWY_NEON_DEF_FUNCTION(int8_t, 2, name, prefix, infix, s8, args) \
HWY_NEON_DEF_FUNCTION(int8_t, 1, name, prefix, infix, s8, args)

◆ HWY_NEON_DEF_FUNCTION_INT_8_16_32

#define HWY_NEON_DEF_FUNCTION_INT_8_16_32 (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION_INT_8(name, prefix, infix, args) \
HWY_NEON_DEF_FUNCTION_INT_16(name, prefix, infix, args) \
HWY_NEON_DEF_FUNCTION_INT_32(name, prefix, infix, args)
#define HWY_NEON_DEF_FUNCTION_INT_8(name, prefix, infix, args)
Definition: arm_neon-inl.h:97

◆ HWY_NEON_DEF_FUNCTION_INTS

#define HWY_NEON_DEF_FUNCTION_INTS (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION_INT_8_16_32(name, prefix, infix, args) \
HWY_NEON_DEF_FUNCTION_INT_64(name, prefix, infix, args)
#define HWY_NEON_DEF_FUNCTION_INT_8_16_32(name, prefix, infix, args)
Definition: arm_neon-inl.h:163

◆ HWY_NEON_DEF_FUNCTION_INTS_UINTS

#define HWY_NEON_DEF_FUNCTION_INTS_UINTS (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION_INTS(name, prefix, infix, args) \
HWY_NEON_DEF_FUNCTION_UINTS(name, prefix, infix, args)
#define HWY_NEON_DEF_FUNCTION_INTS(name, prefix, infix, args)
Definition: arm_neon-inl.h:174

◆ HWY_NEON_DEF_FUNCTION_UINT_16

#define HWY_NEON_DEF_FUNCTION_UINT_16 (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION(uint16_t, 8, name, prefix##q, infix, u16, args) \
HWY_NEON_DEF_FUNCTION(uint16_t, 4, name, prefix, infix, u16, args) \
HWY_NEON_DEF_FUNCTION(uint16_t, 2, name, prefix, infix, u16, args) \
HWY_NEON_DEF_FUNCTION(uint16_t, 1, name, prefix, infix, u16, args)

◆ HWY_NEON_DEF_FUNCTION_UINT_32

#define HWY_NEON_DEF_FUNCTION_UINT_32 (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION(uint32_t, 4, name, prefix##q, infix, u32, args) \
HWY_NEON_DEF_FUNCTION(uint32_t, 2, name, prefix, infix, u32, args) \
HWY_NEON_DEF_FUNCTION(uint32_t, 1, name, prefix, infix, u32, args)

◆ HWY_NEON_DEF_FUNCTION_UINT_64

#define HWY_NEON_DEF_FUNCTION_UINT_64 (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION(uint64_t, 2, name, prefix##q, infix, u64, args) \
HWY_NEON_DEF_FUNCTION(uint64_t, 1, name, prefix, infix, u64, args)

◆ HWY_NEON_DEF_FUNCTION_UINT_8

#define HWY_NEON_DEF_FUNCTION_UINT_8 (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION(uint8_t, 16, name, prefix##q, infix, u8, args) \
HWY_NEON_DEF_FUNCTION(uint8_t, 8, name, prefix, infix, u8, args) \
HWY_NEON_DEF_FUNCTION(uint8_t, 4, name, prefix, infix, u8, args) \
HWY_NEON_DEF_FUNCTION(uint8_t, 2, name, prefix, infix, u8, args) \
HWY_NEON_DEF_FUNCTION(uint8_t, 1, name, prefix, infix, u8, args)

◆ HWY_NEON_DEF_FUNCTION_UINT_8_16_32

#define HWY_NEON_DEF_FUNCTION_UINT_8_16_32 (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION_UINT_8(name, prefix, infix, args) \
HWY_NEON_DEF_FUNCTION_UINT_16(name, prefix, infix, args) \
HWY_NEON_DEF_FUNCTION_UINT_32(name, prefix, infix, args)
#define HWY_NEON_DEF_FUNCTION_UINT_8(name, prefix, infix, args)
Definition: arm_neon-inl.h:89

◆ HWY_NEON_DEF_FUNCTION_UINTS

#define HWY_NEON_DEF_FUNCTION_UINTS (   name,
  prefix,
  infix,
  args 
)
Value:
HWY_NEON_DEF_FUNCTION_UINT_8_16_32(name, prefix, infix, args) \
HWY_NEON_DEF_FUNCTION_UINT_64(name, prefix, infix, args)
#define HWY_NEON_DEF_FUNCTION_UINT_8_16_32(name, prefix, infix, args)
Definition: arm_neon-inl.h:157

◆ HWY_NEON_EVAL

#define HWY_NEON_EVAL (   func,
  ... 
)    func(__VA_ARGS__)

Function Documentation

◆ HWY_AFTER_NAMESPACE()

HWY_AFTER_NAMESPACE ( )

◆ HWY_BEFORE_NAMESPACE()

HWY_BEFORE_NAMESPACE ( )