Classes
struct	Mask

struct	Mask< double >

struct	Mask< float >

class	ScaledDividerU32

struct	Vec

struct	Vec< 1, T >

struct	Vec< 2, T >

struct	Vec< 4, T >

Typedefs
template<typename T >
using	M = typename Mask< T >::type

using	float2 = Vec< 2, float >

using	float4 = Vec< 4, float >

using	float8 = Vec< 8, float >

using	double2 = Vec< 2, double >

using	double4 = Vec< 4, double >

using	double8 = Vec< 8, double >

using	byte2 = Vec< 2, uint8_t >

using	byte4 = Vec< 4, uint8_t >

using	byte8 = Vec< 8, uint8_t >

using	byte16 = Vec< 16, uint8_t >

using	int2 = Vec< 2, int32_t >

using	int4 = Vec< 4, int32_t >

using	int8 = Vec< 8, int32_t >

using	ushort2 = Vec< 2, uint16_t >

using	ushort4 = Vec< 4, uint16_t >

using	ushort8 = Vec< 8, uint16_t >

using	uint2 = Vec< 2, uint32_t >

using	uint4 = Vec< 4, uint32_t >

using	uint8 = Vec< 8, uint32_t >

using	long2 = Vec< 2, int64_t >

using	long4 = Vec< 4, int64_t >

using	long8 = Vec< 8, int64_t >

using	half2 = Vec< 2, uint16_t >

using	half4 = Vec< 4, uint16_t >

using	half8 = Vec< 8, uint16_t >

Functions
template<int... Ix, int N, typename T >
SI Vec< sizeof...(Ix), T >	shuffle (const Vec< N, T > &)

SINT Vec< 2 *N, T >	join (const Vec< N, T > &lo, const Vec< N, T > &hi)

SIT Vec< 1, T >	operator+ (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, T >	operator- (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, T >	operator* (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, T >	operator/ (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, T >	operator^ (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, T >	operator& (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, T >	operator| (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, T >	operator! (const Vec< 1, T > &x)

SIT Vec< 1, T >	operator- (const Vec< 1, T > &x)

SIT Vec< 1, T >	operator~ (const Vec< 1, T > &x)

SIT Vec< 1, T >	operator<< (const Vec< 1, T > &x, int k)

SIT Vec< 1, T >	operator>> (const Vec< 1, T > &x, int k)

SIT Vec< 1, M< T > >	operator== (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, M< T > >	operator!= (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, M< T > >	operator<= (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, M< T > >	operator>= (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, M< T > >	operator< (const Vec< 1, T > &x, const Vec< 1, T > &y)

SIT Vec< 1, M< T > >	operator> (const Vec< 1, T > &x, const Vec< 1, T > &y)

SINT Vec< N, T >	operator+ (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T >	operator- (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T >	operator* (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T >	operator/ (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T >	operator^ (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T >	operator& (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T >	operator| (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T >	operator! (const Vec< N, T > &x)

SINT Vec< N, T >	operator- (const Vec< N, T > &x)

SINT Vec< N, T >	operator~ (const Vec< N, T > &x)

SINT Vec< N, T >	operator<< (const Vec< N, T > &x, int k)

SINT Vec< N, T >	operator>> (const Vec< N, T > &x, int k)

SINT Vec< N, M< T > >	operator== (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, M< T > >	operator!= (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, M< T > >	operator<= (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, M< T > >	operator>= (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, M< T > >	operator< (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, M< T > >	operator> (const Vec< N, T > &x, const Vec< N, T > &y)

SINTU Vec< N, T >	operator+ (U x, const Vec< N, T > &y)

SINTU Vec< N, T >	operator- (U x, const Vec< N, T > &y)

SINTU Vec< N, T >	operator* (U x, const Vec< N, T > &y)

SINTU Vec< N, T >	operator/ (U x, const Vec< N, T > &y)

SINTU Vec< N, T >	operator^ (U x, const Vec< N, T > &y)

SINTU Vec< N, T >	operator& (U x, const Vec< N, T > &y)

SINTU Vec< N, T >	operator| (U x, const Vec< N, T > &y)

SINTU Vec< N, M< T > >	operator== (U x, const Vec< N, T > &y)

SINTU Vec< N, M< T > >	operator!= (U x, const Vec< N, T > &y)

SINTU Vec< N, M< T > >	operator<= (U x, const Vec< N, T > &y)

SINTU Vec< N, M< T > >	operator>= (U x, const Vec< N, T > &y)

SINTU Vec< N, M< T > >	operator< (U x, const Vec< N, T > &y)

SINTU Vec< N, M< T > >	operator> (U x, const Vec< N, T > &y)

SINTU Vec< N, T >	operator+ (const Vec< N, T > &x, U y)

SINTU Vec< N, T >	operator- (const Vec< N, T > &x, U y)

SINTU Vec< N, T >	operator* (const Vec< N, T > &x, U y)

SINTU Vec< N, T >	operator/ (const Vec< N, T > &x, U y)

SINTU Vec< N, T >	operator^ (const Vec< N, T > &x, U y)

SINTU Vec< N, T >	operator& (const Vec< N, T > &x, U y)

SINTU Vec< N, T >	operator| (const Vec< N, T > &x, U y)

SINTU Vec< N, M< T > >	operator== (const Vec< N, T > &x, U y)

SINTU Vec< N, M< T > >	operator!= (const Vec< N, T > &x, U y)

SINTU Vec< N, M< T > >	operator<= (const Vec< N, T > &x, U y)

SINTU Vec< N, M< T > >	operator>= (const Vec< N, T > &x, U y)

SINTU Vec< N, M< T > >	operator< (const Vec< N, T > &x, U y)

SINTU Vec< N, M< T > >	operator> (const Vec< N, T > &x, U y)

SINT Vec< N, T > &	operator+= (Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T > &	operator-= (Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T > &	operator*= (Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T > &	operator/= (Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T > &	operator^= (Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T > &	operator&= (Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T > &	operator|= (Vec< N, T > &x, const Vec< N, T > &y)

SINTU Vec< N, T > &	operator+= (Vec< N, T > &x, U y)

SINTU Vec< N, T > &	operator-= (Vec< N, T > &x, U y)

SINTU Vec< N, T > &	operator*= (Vec< N, T > &x, U y)

SINTU Vec< N, T > &	operator/= (Vec< N, T > &x, U y)

SINTU Vec< N, T > &	operator^= (Vec< N, T > &x, U y)

SINTU Vec< N, T > &	operator&= (Vec< N, T > &x, U y)

SINTU Vec< N, T > &	operator|= (Vec< N, T > &x, U y)

SINT Vec< N, T > &	operator<<= (Vec< N, T > &x, int bits)

SINT Vec< N, T > &	operator>>= (Vec< N, T > &x, int bits)

SINT Vec< N, T >	naive_if_then_else (const Vec< N, M< T > > &cond, const Vec< N, T > &t, const Vec< N, T > &e)

SIT Vec< 1, T >	if_then_else (const Vec< 1, M< T > > &cond, const Vec< 1, T > &t, const Vec< 1, T > &e)

SINT Vec< N, T >	if_then_else (const Vec< N, M< T > > &cond, const Vec< N, T > &t, const Vec< N, T > &e)

SIT bool	any (const Vec< 1, T > &x)

SINT bool	any (const Vec< N, T > &x)

SIT bool	all (const Vec< 1, T > &x)

SINT bool	all (const Vec< N, T > &x)

template<typename D , typename S >
SI Vec< 1, D >	cast (const Vec< 1, S > &src)

template<typename D , int N, typename S >
SI Vec< N, D >	cast (const Vec< N, S > &src)

SIT T	min (const Vec< 1, T > &x)

SIT T	max (const Vec< 1, T > &x)

SINT T	min (const Vec< N, T > &x)

SINT T	max (const Vec< N, T > &x)

SINT Vec< N, T >	min (const Vec< N, T > &x, const Vec< N, T > &y)

SINT Vec< N, T >	max (const Vec< N, T > &x, const Vec< N, T > &y)

SINTU Vec< N, T >	min (const Vec< N, T > &x, U y)

SINTU Vec< N, T >	max (const Vec< N, T > &x, U y)

SINTU Vec< N, T >	min (U x, const Vec< N, T > &y)

SINTU Vec< N, T >	max (U x, const Vec< N, T > &y)

SINT Vec< N, T >	pin (const Vec< N, T > &x, const Vec< N, T > &lo, const Vec< N, T > &hi)

template<typename Fn , typename... Args, size_t... I>
SI auto	map (std::index_sequence< I... >, Fn &&fn, const Args &... args) -> skvx::Vec< sizeof...(I), decltype(fn(args[0]...))>

template<typename Fn , int N, typename T , typename... Rest>
auto	map (Fn &&fn, const Vec< N, T > &first, const Rest &... rest)

SIN Vec< N, float >	ceil (const Vec< N, float > &x)

SIN Vec< N, float >	floor (const Vec< N, float > &x)

SIN Vec< N, float >	trunc (const Vec< N, float > &x)

SIN Vec< N, float >	round (const Vec< N, float > &x)

SIN Vec< N, float >	sqrt (const Vec< N, float > &x)

SIN Vec< N, float >	abs (const Vec< N, float > &x)

SIN Vec< N, float >	fma (const Vec< N, float > &x, const Vec< N, float > &y, const Vec< N, float > &z)

SI Vec< 1, int >	lrint (const Vec< 1, float > &x)

SIN Vec< N, int >	lrint (const Vec< N, float > &x)

SIN Vec< N, float >	fract (const Vec< N, float > &x)

SIN Vec< N, uint16_t >	to_half (const Vec< N, float > &x)

SIN Vec< N, float >	from_half (const Vec< N, uint16_t > &x)

SIN Vec< N, uint8_t >	div255 (const Vec< N, uint16_t > &x)

SIN Vec< N, uint8_t >	approx_scale (const Vec< N, uint8_t > &x, const Vec< N, uint8_t > &y)

SINT std::enable_if_t< std::is_unsigned_v< T >, Vec< N, T > >	saturated_add (const Vec< N, T > &x, const Vec< N, T > &y)

SIN Vec< N, uint16_t >	mull (const Vec< N, uint8_t > &x, const Vec< N, uint8_t > &y)

SIN Vec< N, uint32_t >	mull (const Vec< N, uint16_t > &x, const Vec< N, uint16_t > &y)

SIN Vec< N, uint16_t >	mulhi (const Vec< N, uint16_t > &x, const Vec< N, uint16_t > &y)

SINT T	dot (const Vec< N, T > &a, const Vec< N, T > &b)

SIT T	cross (const Vec< 2, T > &a, const Vec< 2, T > &b)

SIN float	length (const Vec< N, float > &v)

SIN double	length (const Vec< N, double > &v)

SIN Vec< N, float >	normalize (const Vec< N, float > &v)

SIN Vec< N, double >	normalize (const Vec< N, double > &v)

SINT bool	isfinite (const Vec< N, T > &v)

SIT void	strided_load4 (const T *v, Vec< 1, T > &a, Vec< 1, T > &b, Vec< 1, T > &c, Vec< 1, T > &d)

SINT void	strided_load4 (const T *v, Vec< N, T > &a, Vec< N, T > &b, Vec< N, T > &c, Vec< N, T > &d)

SI void	strided_load4 (const float *v, Vec< 4, float > &a, Vec< 4, float > &b, Vec< 4, float > &c, Vec< 4, float > &d)

SIT void	strided_load2 (const T *v, Vec< 1, T > &a, Vec< 1, T > &b)

SINT void	strided_load2 (const T *v, Vec< N, T > &a, Vec< N, T > &b)

	DEF_TEST (SkVx, r)

	DEF_TEST (SkVx_xy, r)

	DEF_TEST (SkVx_xyzw, r)

	DEF_TEST (SkVx_cross_dot, r)

template<int N, typename T >
void	check_strided_loads (skiatest::Reporter *r)

template<typename T >
void	check_strided_loads (skiatest::Reporter *r)

	DEF_TEST (SkVx_strided_loads, r)

	DEF_TEST (SkVx_ScaledDividerU32, r)

	DEF_TEST (SkVx_saturated_add, r)

	DEF_TEST (SkVx_length, r)

	DEF_TEST (SkVx_normalize, r)

	DEF_TEST (SkVx_normalize_infinity_and_nan, r)

	DEF_TEST (SkVx_isfinite, r)

Typedef Documentation

◆ byte16

using skvx::byte16 = Vec<16, uint8_t>

Definition at line 1156 of file SkVx.h.

◆ byte2

using skvx::byte2 = Vec< 2, uint8_t>

Definition at line 1153 of file SkVx.h.

◆ byte4

using skvx::byte4 = Vec< 4, uint8_t>

Definition at line 1154 of file SkVx.h.

◆ byte8

using skvx::byte8 = Vec< 8, uint8_t>

Definition at line 1155 of file SkVx.h.

◆ double2

using skvx::double2 = Vec< 2, double>

Definition at line 1149 of file SkVx.h.

◆ double4

using skvx::double4 = Vec< 4, double>

Definition at line 1150 of file SkVx.h.

◆ double8

using skvx::double8 = Vec< 8, double>

Definition at line 1151 of file SkVx.h.

◆ float2

using skvx::float2 = Vec< 2, float>

Definition at line 1145 of file SkVx.h.

◆ float4

using skvx::float4 = Vec< 4, float>

Definition at line 1146 of file SkVx.h.

◆ float8

using skvx::float8 = Vec< 8, float>

Definition at line 1147 of file SkVx.h.

◆ half2

using skvx::half2 = Vec< 2, uint16_t>

Definition at line 1175 of file SkVx.h.

◆ half4

using skvx::half4 = Vec< 4, uint16_t>

Definition at line 1176 of file SkVx.h.

◆ half8

using skvx::half8 = Vec< 8, uint16_t>

Definition at line 1177 of file SkVx.h.

◆ int2

using skvx::int2 = Vec< 2, int32_t>

Definition at line 1158 of file SkVx.h.

◆ int4

using skvx::int4 = Vec< 4, int32_t>

Definition at line 1159 of file SkVx.h.

◆ int8

using skvx::int8 = Vec< 8, int32_t>

Definition at line 1160 of file SkVx.h.

◆ long2

using skvx::long2 = Vec< 2, int64_t>

Definition at line 1170 of file SkVx.h.

◆ long4

using skvx::long4 = Vec< 4, int64_t>

Definition at line 1171 of file SkVx.h.

◆ long8

using skvx::long8 = Vec< 8, int64_t>

Definition at line 1172 of file SkVx.h.

◆ M

template<typename T >

using skvx::M = typename Mask<T>::type

Definition at line 239 of file SkVx.h.

◆ uint2

using skvx::uint2 = Vec< 2, uint32_t>

Definition at line 1166 of file SkVx.h.

◆ uint4

using skvx::uint4 = Vec< 4, uint32_t>

Definition at line 1167 of file SkVx.h.

◆ uint8

using skvx::uint8 = Vec< 8, uint32_t>

Definition at line 1168 of file SkVx.h.

◆ ushort2

using skvx::ushort2 = Vec< 2, uint16_t>

Definition at line 1162 of file SkVx.h.

◆ ushort4

using skvx::ushort4 = Vec< 4, uint16_t>

Definition at line 1163 of file SkVx.h.

◆ ushort8

using skvx::ushort8 = Vec< 8, uint16_t>

Definition at line 1164 of file SkVx.h.

Function Documentation

◆ abs()

SIN Vec< N, float > skvx::abs ( const Vec< N, float > & x )

Definition at line 707 of file SkVx.h.

707  { return map( fabsf, x); }

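References:

x — the parameter of this function. (The auto-generated link to `double x`, Definition: mouse-input-test.cc:82, points at an unrelated symbol of the same name.)

skvx::map

auto map(Fn &&fn, const Vec< N, T > &first, const Rest &... rest)

Definition: SkVx.h:697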

◆ all() [1/2]

SIT bool skvx::all ( const Vec< 1, T > & x )

Definition at line 582 of file SkVx.h.

582  { return x.val != 0; }

◆ all() [2/2]

SINT bool skvx::all ( const Vec< N, T > & x )

Definition at line 583 of file SkVx.h.

                                 {
    // Reports whether every lane of x is non-zero. Each SIMD fast path below is compiled in only
    // when its preprocessor guard holds, and is selected with `if constexpr` on the lane count and
    // lane size; shapes with no fast path fall through to the recursive split at the bottom.
// Unlike any(), we have to respect the lane layout, or we'll miss cases where a
// true lane has a mix of 0 and 1 bits.
#if SKVX_USE_SIMD && SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE1
    // Unfortunately, the _mm_testc intrinsics don't let us avoid the comparison to 0 for all()'s
    // correctness, so always just use the plain SSE version.
    if constexpr (N == 4 && sizeof(T) == 4) {
        // One mask bit per lane after the != 0 comparison; 0b1111 means all four lanes passed.
        return _mm_movemask_ps(_mm_cmpneq_ps(sk_bit_cast<__m128>(x), _mm_set1_ps(0))) == 0b1111;
    }
#endif
#if SKVX_USE_SIMD && defined(__aarch64__)
    // On 64-bit NEON, take the min across the lanes, which will be non-zero if all lanes are != 0.
    // The intrinsic is chosen to match the lane width (sizeof(T)) and lane count (N).
    if constexpr (sizeof(T)==1 && N==8)  {return vminv_u8  (sk_bit_cast<uint8x8_t> (x)) > 0;}
    if constexpr (sizeof(T)==1 && N==16) {return vminvq_u8 (sk_bit_cast<uint8x16_t>(x)) > 0;}
    if constexpr (sizeof(T)==2 && N==4)  {return vminv_u16 (sk_bit_cast<uint16x4_t>(x)) > 0;}
    if constexpr (sizeof(T)==2 && N==8)  {return vminvq_u16(sk_bit_cast<uint16x8_t>(x)) > 0;}
    if constexpr (sizeof(T)==4 && N==2)  {return vminv_u32 (sk_bit_cast<uint32x2_t>(x)) > 0;}
    if constexpr (sizeof(T)==4 && N==4)  {return vminvq_u32(sk_bit_cast<uint32x4_t>(x)) > 0;}
#endif
#if SKVX_USE_SIMD && defined(__wasm_simd128__)
    if constexpr (N == 4 && sizeof(T) == 4) {
        return wasm_i32x4_all_true(sk_bit_cast<VExt<4,int>>(x));
    }
#endif
#if SKVX_USE_SIMD && SK_CPU_LSX_LEVEL >= SK_CPU_LSX_LEVEL_LASX
    if constexpr (N == 8 && sizeof(T) == 4) {
        // Unsigned "0 < x" per lane, then a per-lane mask extraction.
        // NOTE(review): retv[0] and retv[4] presumably hold the 4-bit masks of the low and high
        // 128-bit halves -- confirm against the LASX intrinsic reference.
        v8i32 retv = (v8i32)__lasx_xvmskltz_w(__lasx_xvslt_wu(__lasx_xvldi(0),
                                                              sk_bit_cast<__m256i>(x)));
        return (retv[0] & retv[4]) == 0b1111;
    }
#endif
#if SKVX_USE_SIMD && SK_CPU_LSX_LEVEL >= SK_CPU_LSX_LEVEL_LSX
    if constexpr (N == 4 && sizeof(T) == 4) {
        // Same scheme as the LASX path above, for a single 128-bit vector.
        v4i32 retv = (v4i32)__lsx_vmskltz_w(__lsx_vslt_wu(__lsx_vldi(0),
                                                          sk_bit_cast<__m128i>(x)));
        return retv[0] == 0b1111;
    }
#endif
    // Generic fallback: both halves must pass. The recursion ends at the Vec<1,T> overload,
    // which tests x.val != 0.
    return all(x.lo)
        && all(x.hi);
}

◆ any() [1/2]

SIT bool skvx::any ( const Vec< 1, T > & x )

Definition at line 530 of file SkVx.h.

530  { return x.val != 0; }

◆ any() [2/2]

SINT bool skvx::any ( const Vec< N, T > & x )

Definition at line 531 of file SkVx.h.

                                 {
    // Reports whether at least one lane of x is non-zero. Fast paths are keyed on the total vector
    // size in bytes (N*sizeof(T)) rather than on the lane layout; shapes with no fast path fall
    // through to the recursive split at the bottom.
    // For any(), the _mm_testz intrinsics are correct and don't require comparing 'x' to 0, so it's
    // lower latency compared to _mm_movemask + _mm_compneq on plain SSE.
#if SKVX_USE_SIMD && SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_AVX2
    if constexpr (N*sizeof(T) == 32) {
        return !_mm256_testz_si256(sk_bit_cast<__m256i>(x), _mm256_set1_epi32(-1));
    }
#endif
#if SKVX_USE_SIMD && SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE41
    if constexpr (N*sizeof(T) == 16) {
        return !_mm_testz_si128(sk_bit_cast<__m128i>(x), _mm_set1_epi32(-1));
    }
#endif
#if SKVX_USE_SIMD && SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE1
    // When the SSE4.1 block above is also compiled in, it has already returned for this size,
    // so this block only takes effect when that one is not compiled in.
    if constexpr (N*sizeof(T) == 16) {
        // On SSE, movemask checks only the MSB in each lane, which is fine if the lanes were set
        // directly from a comparison op (which sets all bits to 1 when true), but skvx::Vec<>
        // treats any non-zero value as true, so we have to compare 'x' to 0 before calling movemask
        return _mm_movemask_ps(_mm_cmpneq_ps(sk_bit_cast<__m128>(x), _mm_set1_ps(0))) != 0b0000;
    }
#endif
#if SKVX_USE_SIMD && defined(__aarch64__)
    // On 64-bit NEON, take the max across lanes, which will be non-zero if any lane was true.
    // The specific lane-size doesn't really matter in this case since it's really any set bit
    // that we're looking for.
    if constexpr (N*sizeof(T) == 8 ) { return vmaxv_u8 (sk_bit_cast<uint8x8_t> (x)) > 0; }
    if constexpr (N*sizeof(T) == 16) { return vmaxvq_u8(sk_bit_cast<uint8x16_t>(x)) > 0; }
#endif
#if SKVX_USE_SIMD && defined(__wasm_simd128__)
    if constexpr (N == 4 && sizeof(T) == 4) {
        return wasm_i32x4_any_true(sk_bit_cast<VExt<4,int>>(x));
    }
#endif
#if SKVX_USE_SIMD && SK_CPU_LSX_LEVEL >= SK_CPU_LSX_LEVEL_LASX
    if constexpr (N*sizeof(T) == 32) {
        // Unsigned "0 < x" per 32-bit lane, then a per-lane mask extraction.
        // NOTE(review): retv[0] and retv[4] presumably hold the masks of the low and high
        // 128-bit halves -- confirm against the LASX intrinsic reference.
        v8i32 retv = (v8i32)__lasx_xvmskltz_w(__lasx_xvslt_wu(__lasx_xvldi(0),
                                                              sk_bit_cast<__m256i>(x)));
        return (retv[0] | retv[4]) != 0b0000;
    }
#endif
#if SKVX_USE_SIMD && SK_CPU_LSX_LEVEL >= SK_CPU_LSX_LEVEL_LSX
    if constexpr (N*sizeof(T) == 16) {
        // Same scheme as the LASX path above, for a single 128-bit vector.
        v4i32 retv = (v4i32)__lsx_vmskltz_w(__lsx_vslt_wu(__lsx_vldi(0),
                                                          sk_bit_cast<__m128i>(x)));
        return retv[0] != 0b0000;
    }
#endif
    // Generic fallback: either half may satisfy the test. The recursion ends at the Vec<1,T>
    // overload, which tests x.val != 0.
    return any(x.lo)
        || any(x.hi);
}

◆ approx_scale()

SIN Vec< N, uint8_t > skvx::approx_scale	(	const Vec< N, uint8_t > &	x,
		const Vec< N, uint8_t > &	y
	)

Definition at line 824 of file SkVx.h.

                                                                                  {
    // Approximates x*y/255 per lane, computed as (x*y + x) / 256.
    // All of (x*y+x)/256, (x*y+y)/256, and (x*y+255)/256 meet the criteria above.
    // We happen to have historically picked (x*y+x)/256.
    // Widen to 16 bits first: the largest intermediate, 255*255 + 255 = 65280, still fits.
    auto X = cast<uint16_t>(x),
         Y = cast<uint16_t>(y);
    return cast<uint8_t>( (X*Y+X)/256 );
}

◆ cast() [1/2]

template<typename D , typename S >

SI Vec< 1, D > skvx::cast ( const Vec< 1, S > & src )

Definition at line 628 of file SkVx.h.

628  { return (D)src.val; }

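References:

D — the destination lane type, a template parameter of this function. (The auto-generated link, Definition: GrMemoryPoolTest.cpp:109, points at an unrelated symbol of the same name.)

src — the parameter of this function. (The auto-generated link to mskp_parser.src, Definition: mskp_parser.py:22, points at an unrelated symbol of the same name.)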

◆ cast() [2/2]

template<typename D , int N, typename S >

SI Vec< N, D > skvx::cast ( const Vec< N, S > & src )

Definition at line 631 of file SkVx.h.

                                      {
    // Converts every lane of src from S to D, keeping the lane count N.
#if SKVX_USE_SIMD && defined(__clang__)
    // With Clang and SIMD enabled, convert the whole vector in one builtin call.
    return to_vec(__builtin_convertvector(to_vext(src), VExt<N,D>));
#else
    // Otherwise convert each half recursively and glue the results back together; the
    // recursion ends at the Vec<1,S> overload, which does a plain (D) cast of src.val.
    return join(cast<D>(src.lo), cast<D>(src.hi));
#endif
}

◆ ceil()

SIN Vec< N, float > skvx::ceil ( const Vec< N, float > & x )

Definition at line 702 of file SkVx.h.

702  { return map( ceilf, x); }

◆ check_strided_loads() [1/2]

template<int N, typename T >

void skvx::check_strided_loads ( skiatest::Reporter * r )

Definition at line 278 of file SkVxTest.cpp.

                                                                             {
    // Checks strided_load2 and strided_load4 for one lane count N and lane type T.
    using Vec = Vec<N,T>;
    // Source data is 0, 1, 2, ..., N*4-1, so each element's value equals its index.
    T values[N*4];
    std::iota(values, values + N*4, 0);
    Vec a, b, c, d;
    // Stride 2: lane i of a and b must come from elements 2i and 2i+1 (only the first
    // 2*N elements are compared).
    strided_load2(values, a, b);
    for (int i = 0; i < N; ++i) {
        REPORTER_ASSERT(r, a[i] == values[i*2]);
        REPORTER_ASSERT(r, b[i] == values[i*2 + 1]);
    }
    // Stride 4: lane i of a, b, c, d must come from elements 4i .. 4i+3.
    strided_load4(values, a, b, c, d);
    for (int i = 0; i < N; ++i) {
        REPORTER_ASSERT(r, a[i] == values[i*4]);
        REPORTER_ASSERT(r, b[i] == values[i*4 + 1]);
        REPORTER_ASSERT(r, c[i] == values[i*4 + 2]);
        REPORTER_ASSERT(r, d[i] == values[i*4 + 3]);
    }
}

◆ check_strided_loads() [2/2]

template<typename T >

void skvx::check_strided_loads ( skiatest::Reporter * r )

Definition at line 297 of file SkVxTest.cpp.

                                                                      {
    // Runs the <N,T> overload of check_strided_loads for every power-of-two lane count
    // from 1 through 32.
    check_strided_loads<1,T>(r);
    check_strided_loads<2,T>(r);
    check_strided_loads<4,T>(r);
    check_strided_loads<8,T>(r);
    check_strided_loads<16,T>(r);
    check_strided_loads<32,T>(r);
}

◆ cross()

SIT T skvx::cross	(	const Vec< 2, T > &	a,
		const Vec< 2, T > &	b
	)

Definition at line 982 of file SkVx.h.

                                                    {
    // 2D cross product a[0]*b[1] - a[1]*b[0].
    // shuffle<1,0>(b) swaps b's two lanes, so x = { a[0]*b[1], a[1]*b[0] }.
    auto x = a * shuffle<1,0>(b);
    return x[0] - x[1];
}

◆ DEF_TEST() [1/11]

skvx::DEF_TEST	(	SkVx	,
		r
	)

Definition at line 18 of file SkVxTest.cpp.

                  {
    // General smoke test for skvx::Vec: type sizes, comparison masks, any()/all(), min/max,
    // construction, rounding helpers, load/store, shuffle, mixed scalar operands, 8-bit scaling,
    // widening multiply, and half-float conversion.

    // Each alias must occupy exactly (lane count) * sizeof(lane) bytes.
    static_assert(sizeof(float2) ==  8, "");
    static_assert(sizeof(float4) == 16, "");
    static_assert(sizeof(float8) == 32, "");
 
    static_assert(sizeof(byte2) == 2, "");
    static_assert(sizeof(byte4) == 4, "");
    static_assert(sizeof(byte8) == 8, "");
 
    {
        // Comparing float lanes yields an int32 mask: 0 where false, -1 where true.
        int4 mask = float4{1,2,3,4} < float4{1,2,4,8};
        REPORTER_ASSERT(r, mask[0] == int32_t( 0));
        REPORTER_ASSERT(r, mask[1] == int32_t( 0));
        REPORTER_ASSERT(r, mask[2] == int32_t(-1));
        REPORTER_ASSERT(r, mask[3] == int32_t(-1));
 
        REPORTER_ASSERT(r,  any(mask));
        REPORTER_ASSERT(r, !all(mask));
    }
 
    {
        // Same check for double lanes, which yield an int64 mask.
        long4 mask = double4{1,2,3,4} < double4{1,2,4,8};
        REPORTER_ASSERT(r, mask[0] == int64_t( 0));
        REPORTER_ASSERT(r, mask[1] == int64_t( 0));
        REPORTER_ASSERT(r, mask[2] == int64_t(-1));
        REPORTER_ASSERT(r, mask[3] == int64_t(-1));
 
        REPORTER_ASSERT(r,  any(mask));
        REPORTER_ASSERT(r, !all(mask));
    }
 
    {
        // Tests that any/all work with non-zero values, not just full bit lanes.
        // Lanes left out of a braced initializer are zero (checked explicitly further down).
        REPORTER_ASSERT(r,  all(int4{1,2,3,4}));
        REPORTER_ASSERT(r, !all(int4{1,2,3}));
        REPORTER_ASSERT(r,  any(int4{1,2}));
        REPORTER_ASSERT(r, !any(int4{}));
    }
 
    // Single-argument min/max reduce across the lanes to a scalar.
    REPORTER_ASSERT(r, min(float4{1,2,3,4}) == 1);
    REPORTER_ASSERT(r, max(float4{1,2,3,4}) == 4);
 
    // Construction: braces fill lanes in order and zero the rest; int4(1) puts 1 in every lane.
    REPORTER_ASSERT(r, all(int4{1,2,3,4}   == int4{1,2,3,4}));
    REPORTER_ASSERT(r, all(int4{1,2,3}     == int4{1,2,3,0}));
    REPORTER_ASSERT(r, all(int4{1,2}       == int4{1,2,0,0}));
    REPORTER_ASSERT(r, all(int4{1}         == int4{1,0,0,0}));
    REPORTER_ASSERT(r, all(int4(1)         == int4{1,1,1,1}));
    REPORTER_ASSERT(r, all(int4{}          == int4{0,0,0,0}));
    REPORTER_ASSERT(r, all(int4()          == int4{0,0,0,0}));
 
    // Two-argument min/max work lane by lane.
    REPORTER_ASSERT(r, all(int4{1,2,2,1} == min(int4{1,2,3,4}, int4{4,3,2,1})));
    REPORTER_ASSERT(r, all(int4{4,3,3,4} == max(int4{1,2,3,4}, int4{4,3,2,1})));
 
    // if_then_else picks the second argument where the mask is true, the third elsewhere.
    REPORTER_ASSERT(r, all(if_then_else(float4{1,2,3,2} <= float4{2,2,2,2}, float4(42), float4(47))
                           == float4{42,42,47,42}));
 
    // Rounding helpers, checked on values with a .5 fraction and on exact integers.
    REPORTER_ASSERT(r, all(floor(float4{-1.5f,1.5f,1.0f,-1.0f}) == float4{-2.0f,1.0f,1.0f,-1.0f}));
    REPORTER_ASSERT(r, all( ceil(float4{-1.5f,1.5f,1.0f,-1.0f}) == float4{-1.0f,2.0f,1.0f,-1.0f}));
    REPORTER_ASSERT(r, all(trunc(float4{-1.5f,1.5f,1.0f,-1.0f}) == float4{-1.0f,1.0f,1.0f,-1.0f}));
    REPORTER_ASSERT(r, all(round(float4{-1.5f,1.5f,1.0f,-1.0f}) == float4{-2.0f,2.0f,1.0f,-1.0f}));
 
 
    REPORTER_ASSERT(r, all(abs(float4{-2,-1,0,1}) == float4{2,1,0,1}));
 
    // TODO(mtklein): these tests could be made less loose.
    REPORTER_ASSERT(r, all( sqrt(float4{2,3,4,5}) < float4{2,2,3,3}));
    REPORTER_ASSERT(r, all( sqrt(float2{2,3}) < float2{2,2}));
 
    // Float -> int cast is expected to drop the fraction (-1.5 -> -1, 1.5 -> 1).
    REPORTER_ASSERT(r, all(cast<int>(float4{-1.5f,0.5f,1.0f,1.5f}) == int4{-1,0,1,1}));
 
    // Load/store round trip. store() writes four floats, so buf[4] and buf[5] must keep
    // their original values.
    float buf[] = {1,2,3,4,5,6};
    REPORTER_ASSERT(r, all(float4::Load(buf) == float4{1,2,3,4}));
    float4{2,3,4,5}.store(buf);
    REPORTER_ASSERT(r, buf[0] == 2
                    && buf[1] == 3
                    && buf[2] == 4
                    && buf[3] == 5
                    && buf[4] == 5
                    && buf[5] == 6);
    REPORTER_ASSERT(r, all(float4::Load(buf+0) == float4{2,3,4,5}));
    REPORTER_ASSERT(r, all(float4::Load(buf+2) == float4{4,5,5,6}));
 
    // shuffle<Ix...> selects source lanes by index; the result can be narrower or wider
    // than the input, and an index may repeat.
    REPORTER_ASSERT(r, all(shuffle<2,1,0,3>        (float4{1,2,3,4}) == float4{3,2,1,4}));
    REPORTER_ASSERT(r, all(shuffle<2,1>            (float4{1,2,3,4}) == float2{3,2}));
    REPORTER_ASSERT(r, all(shuffle<3,3,3,3>        (float4{1,2,3,4}) == float4{4,4,4,4}));
    REPORTER_ASSERT(r, all(shuffle<2,1,2,1,2,1,2,1>(float4{1,2,3,4})
                           == float8{3,2,3,2,3,2,3,2}));
 
    // Test that mixed types can be used where they make sense.  Mostly about ergonomics.
    REPORTER_ASSERT(r, all(float4{1,2,3,4} < 5));
    REPORTER_ASSERT(r, all( byte4{1,2,3,4} < 5));
    REPORTER_ASSERT(r, all(  int4{1,2,3,4} < 5.0f));
    float4 five = 5;
    REPORTER_ASSERT(r, all(five == 5.0f));
    REPORTER_ASSERT(r, all(five == 5));
 
    REPORTER_ASSERT(r, all(max(2, min(float4{1,2,3,4}, 3)) == float4{2,2,3,3}));
 
    // Exhaustive check of 8-bit scaling over every (x, y) pair in [0, 255] x [0, 255].
    for (int x = 0; x < 256; x++)
    for (int y = 0; y < 256; y++) {
        // Reference result: x*y/255 computed in floating point and rounded to nearest.
        uint8_t want = (uint8_t)( 255*(x/255.0 * y/255.0) + 0.5 );
 
        {
            // div255 must match the rounded reference exactly.
            uint8_t got = div255(Vec<8, uint16_t>(x) * Vec<8, uint16_t>(y) )[0];
            REPORTER_ASSERT(r, got == want);
        }
 
        {
            uint8_t got = approx_scale(Vec<8,uint8_t>(x), Vec<8,uint8_t>(y))[0];
 
            // approx_scale may be off by one, except when either input is 0 or 255,
            // where it must be exact.
            REPORTER_ASSERT(r, got == want-1 ||
                               got == want   ||
                               got == want+1);
            if (x == 0 || y == 0 || x == 255 || y == 255) {
                REPORTER_ASSERT(r, got == want);
            }
        }
    }
 
    // Exhaustive check of the 8-bit -> 16-bit widening multiply.
    for (int x = 0; x < 256; x++)
    for (int y = 0; y < 256; y++) {
        // The largest product, 255*255 = 65025, fits in 16 bits.
        uint16_t xy = x*y;
 
        // Make sure to cover implementation cases N=8, N<8, and N>8.
        REPORTER_ASSERT(r, all(mull(byte2 (x), byte2 (y)) == xy));
        REPORTER_ASSERT(r, all(mull(byte4 (x), byte4 (y)) == xy));
        REPORTER_ASSERT(r, all(mull(byte8 (x), byte8 (y)) == xy));
        REPORTER_ASSERT(r, all(mull(byte16(x), byte16(y)) == xy));
    }
 
    {
        // Half-float round trip: hs[i] is the expected 16-bit encoding of fs[i].
        // Intentionally not testing -0, as we don't care if it's 0x0000 or 0x8000.
        float8 fs = {+0.0f,+0.5f,+1.0f,+2.0f,
                     -4.0f,-0.5f,-1.0f,-2.0f};
        Vec<8,uint16_t> hs = {0x0000,0x3800,0x3c00,0x4000,
                              0xc400,0xb800,0xbc00,0xc000};
        REPORTER_ASSERT(r, all(  to_half(fs) == hs));
        REPORTER_ASSERT(r, all(from_half(hs) == fs));
    }
}

◆ DEF_TEST() [2/11]

skvx::DEF_TEST	(	SkVx_cross_dot	,
		r
	)

Definition at line 246 of file SkVxTest.cpp.

                            {
    // Exercises cross() and dot() on integer, float and double 2-vectors.

    // Integer cases with exact expected values. A vector crossed with itself gives 0.
    REPORTER_ASSERT(r, cross(int2{0,1}, int2{0,1}) == 0);
    REPORTER_ASSERT(r, cross(int2{1,0}, int2{1,0}) == 0);
    REPORTER_ASSERT(r, cross(int2{1,1}, int2{1,1}) == 0);
    REPORTER_ASSERT(r, cross(int2{1,1}, int2{1,-1}) == -2);
    REPORTER_ASSERT(r, cross(int2{1,1}, int2{-1,1}) == 2);
 
    // Perpendicular inputs give a dot product of 0.
    REPORTER_ASSERT(r, dot(int2{0,1}, int2{1,0}) == 0);
    REPORTER_ASSERT(r, dot(int2{1,0}, int2{0,1}) == 0);
    REPORTER_ASSERT(r, dot(int2{1,1}, int2{1,-1}) == 0);
    REPORTER_ASSERT(r, dot(int2{1,1}, int2{1,1}) == 2);
    REPORTER_ASSERT(r, dot(int2{1,1}, int2{-1,-1}) == -2);
 
    // 100 random float pairs with components in [-1, 1], compared against the SkPoint
    // reference implementations within a tolerance of 2^-20.
    SkRandom rand;
    for (int i = 0; i < 100; ++i) {
        float a=rand.nextRangeF(-1,1), b=rand.nextRangeF(-1,1), c=rand.nextRangeF(-1,1),
              d=rand.nextRangeF(-1,1);
        constexpr static float kTolerance = 1.f / (1 << 20);
        REPORTER_ASSERT(r, SkScalarNearlyEqual(
                cross(float2{a,b}, float2{c,d}), SkPoint::CrossProduct({a,b}, {c,d}), kTolerance));
        REPORTER_ASSERT(r, SkScalarNearlyEqual(
                dot(float2{a,b}, float2{c,d}), SkPoint::DotProduct({a,b}, {c,d}), kTolerance));
    }
 
    // Double-precision cases against precomputed values; on failure both numbers are printed.
    auto assertDoublesEqual = [&](double left, double right) {
        REPORTER_ASSERT(r, SkScalarNearlyEqual(left, right), "%f != %f", left, right);
    };
    assertDoublesEqual(cross(double2{1.2, 3.4}, double2{3.4, -1.2}),          -13.000000);
    assertDoublesEqual(cross(double2{12.34, 5.6}, double2{7.8, -9.0}),       -154.740000);
    assertDoublesEqual(cross(double2{12.34, 5.6}, double2{7.8, 9.012345678}),  67.532346);
}

◆ DEF_TEST() [3/11]

skvx::DEF_TEST	(	SkVx_isfinite	,
		r
	)

Definition at line 425 of file SkVxTest.cpp.

                           {
    // isfinite() must be true only when no lane is infinite or NaN.

    // All-finite inputs of several widths and lane types.
    REPORTER_ASSERT(r, isfinite(skvx::float2{0, 0}));
    REPORTER_ASSERT(r, isfinite(skvx::double4{1.2, 3.4, 5.6, 7.8}));
    REPORTER_ASSERT(r, isfinite(skvx::float8{8, 7, 6, 5, 4, 3, 2, 1}));
 
    // A single bad lane, or a mix of NaN and infinity, makes the whole vector non-finite.
    REPORTER_ASSERT(r, !isfinite(skvx::float2{0, NAN}));
    REPORTER_ASSERT(r, !isfinite(skvx::float2{INFINITY, 10}));
    REPORTER_ASSERT(r, !isfinite(skvx::float2{NAN, INFINITY}));
 
    // Poison each lane position in turn so that no lane index is overlooked.
    for (int i = 0; i < 4; i++) {
        auto v = skvx::double4{4, 3, 2, 1};
        v[i] = INFINITY;
        REPORTER_ASSERT(r, !isfinite(v), "index %d INFINITY", i);
        v[i] = NAN;
        REPORTER_ASSERT(r, !isfinite(v), "index %d NAN", i);
    }
 
    // Same sweep for an 8-lane float vector.
    for (int i = 0; i < 8; i++) {
        auto v = skvx::float8{8, 7, 6, 5, 4, 3, 2, 1};
        v[i] = INFINITY;
        REPORTER_ASSERT(r, !isfinite(v), "index %d INFINITY", i);
        v[i] = NAN;
        REPORTER_ASSERT(r, !isfinite(v), "index %d NAN", i);
    }
}

◆ DEF_TEST() [4/11]

skvx::DEF_TEST	(	SkVx_length	,
		r
	)

Definition at line 366 of file SkVxTest.cpp.

                         {
    // Checks length() for float and double vectors against precomputed values.

    // Helpers that compare with SkScalarNearlyEqual and print both values on failure.
    auto assertFloatsEqual = [&](float left, float right) {
        REPORTER_ASSERT(r, SkScalarNearlyEqual(left, right), "%f != %f", left, right);
    };
    auto assertDoublesEqual = [&](double left, double right) {
        REPORTER_ASSERT(r, SkScalarNearlyEqual(left, right), "%f != %f", left, right);
    };
 
    // Axis-aligned, 3-4-5, and diagonal cases, then a 4-lane vector.
    assertFloatsEqual(length(float2{0, 1}),       1.000000f);
    assertFloatsEqual(length(float2{2, 0}),       2.000000f);
    assertFloatsEqual(length(float2{3, 4}),       5.000000f);
    assertFloatsEqual(length(float2{1, 1}),       1.414214f);
    assertFloatsEqual(length(float2{2.5f, 2.5f}), 3.535534f);
    assertFloatsEqual(length(float4{1, 2, 3, 4}), 5.477226f);
 
    // Double-precision overload.
    assertDoublesEqual(length(double2{2.5, 2.5}),           3.535534);
    assertDoublesEqual(length(double4{1.5, 2.5, 3.5, 4.5}), 6.403124);
}

◆ DEF_TEST() [5/11]

skvx::DEF_TEST	(	SkVx_normalize	,
		r
	)

Definition at line 385 of file SkVxTest.cpp.

                            {
    // Checks normalize() for float and double vectors against precomputed components.

    // Helpers that compare with SkScalarNearlyEqual and print both values on failure.
    auto assertFloatsEqual = [&](float left, float right) {
        REPORTER_ASSERT(r, SkScalarNearlyEqual(left, right), "%f != %f", left, right);
    };
    auto assertDoublesEqual = [&](double left, double right) {
        REPORTER_ASSERT(r, SkScalarNearlyEqual(left, right), "%f != %f", left, right);
    };
 
    // Two float lanes.
    skvx::float2 twoFloats = normalize(skvx::float2{1.2f, 3.4f});
    assertFloatsEqual(twoFloats[0], 0.332820f);
    assertFloatsEqual(twoFloats[1], 0.942990f);
 
    // Two double lanes; the negative component must keep its sign.
    skvx::double2 twoDoubles = normalize(skvx::double2{2.3, -4.5});
    assertDoublesEqual(twoDoubles[0],  0.455111);
    assertDoublesEqual(twoDoubles[1], -0.890435);
 
    // Four double lanes.
    skvx::double4 fourDoubles = normalize(skvx::double4{1.2, 3.4, 5.6, 7.8});
    assertDoublesEqual(fourDoubles[0],  0.116997);
    assertDoublesEqual(fourDoubles[1],  0.331490);
    assertDoublesEqual(fourDoubles[2],  0.545984);
    assertDoublesEqual(fourDoubles[3],  0.760478);
}

◆ DEF_TEST() [6/11]

skvx::DEF_TEST	(	SkVx_normalize_infinity_and_nan	,
		r
	)

Definition at line 408 of file SkVxTest.cpp.

                                             {
    // Pins down normalize()'s results for degenerate inputs.

    // A zero-length vector is expected to normalize to NaN in every lane.
    skvx::float2 zeroLenVec = normalize(skvx::float2{0, 0});
    REPORTER_ASSERT(r, std::isnan(zeroLenVec[0]), "%f is not nan", zeroLenVec[0]);
    REPORTER_ASSERT(r, std::isnan(zeroLenVec[1]), "%f is not nan", zeroLenVec[1]);
    REPORTER_ASSERT(r, !isfinite(zeroLenVec));
 
    // A vector of maximal floats is expected to normalize to 0 in every lane.
    // NOTE(review): presumably because the computed length overflows to infinity -- confirm
    // against normalize()'s implementation.
    skvx::float2 tooBigVec = normalize(skvx::float2{std::numeric_limits<float>::max(),
                                                    std::numeric_limits<float>::max()});
    REPORTER_ASSERT(r, tooBigVec[0] == 0, "%f != 0", tooBigVec[0]);
    REPORTER_ASSERT(r, tooBigVec[1] == 0, "%f != 0", tooBigVec[1]);
 
    // Same expectation for doubles.
    skvx::double2 tooBigVecD = normalize(skvx::double2{std::numeric_limits<double>::max(),
                                                       std::numeric_limits<double>::max()});
    REPORTER_ASSERT(r, tooBigVecD[0] == 0, "%f != 0", tooBigVecD[0]);
    REPORTER_ASSERT(r, tooBigVecD[1] == 0, "%f != 0", tooBigVecD[1]);
}

◆ DEF_TEST() [7/11]

skvx::DEF_TEST	(	SkVx_saturated_add	,
		r
	)

Definition at line 354 of file SkVxTest.cpp.

                                {
    // Exhaustively compares saturated_add() against a scalar reference for every pair of
    // byte values.
    for (int a = 0; a < (1<<8); a++) {
        for (int b = 0; b < (1<<8); b++) {
            // a and b are both in [0, 255], so the sum can only leave the byte range at the
            // top; a lower clamp would be unreachable.
            const int exact = (a+b > 255) ? 255 : a+b;
 
            // Both operands are built from a single scalar; only lane 0 is inspected.
            REPORTER_ASSERT(r, saturated_add(skvx::byte16(a), skvx::byte16(b))[0] == exact);
        }
    }
}

◆ DEF_TEST() [8/11]

skvx::DEF_TEST	(	SkVx_ScaledDividerU32	,
		r
	)

Definition at line 316 of file SkVxTest.cpp.

                                   {
    static constexpr uint32_t kMax = std::numeric_limits<uint32_t>::max();
 
    // True when `actual` is within +/-1 of `expected`.  The limits are pinned at 0 and kMax
    // so that computing them cannot wrap around.
    auto errorBounds = [&](uint32_t actual, uint32_t expected) {
        uint32_t lowerLimit = expected == 0 ? 0 : expected - 1,
                 upperLimit = expected == kMax ? kMax : expected + 1;
        return lowerLimit <= actual && actual <= upperLimit;
    };
 
    // Checks one denominator: divide(n) is expected to land within 1 of
    // floor((n - half()) / denom + 0.5), with the reference computed in double precision.
    auto test = [&](uint32_t denom) {
        ScaledDividerU32 d(denom);
        // Largest input: kMax itself, i.e. (kMax - half()) once the bias is removed.
        uint32_t maxCheck = static_cast<uint32_t>(
                std::floor((double)(kMax - d.half()) / denom + 0.5));
        REPORTER_ASSERT(r, errorBounds(d.divide((kMax))[0], maxCheck));
        // Sample the rest of the range in steps of 65535 rather than exhaustively.  The loop
        // bound keeps i + half() from overflowing uint32_t.
        for (uint32_t i = 0; i < kMax - d.half(); i += 65535) {
            uint32_t expected = static_cast<uint32_t>(std::floor((double)i / denom + 0.5));
            auto actual = d.divide(i + d.half());
            // Report an out-of-bounds quotient as a test failure instead of only logging it,
            // so a regression in the sampled range cannot pass silently.
            REPORTER_ASSERT(r, errorBounds(actual[0], expected),
                            "i: %u expected: %u actual: %u", i, expected, actual[0]);
            // Make sure all the lanes are the same.  This goes through the reporter as well
            // so the check does not depend on SkASSERT being enabled in the build.
            for (int e = 1; e < 4; e++) {
                REPORTER_ASSERT(r, actual[0] == actual[e]);
            }
        }
    };
 
    test(2);
    test(3);
    test(5);
    test(7);
    test(27);
    test(65'535);
    test(15'485'863);
    test(512'927'377);
}

◆ DEF_TEST() [9/11]

skvx::DEF_TEST	(	SkVx_strided_loads	,
		r
	)

Definition at line 306 of file SkVxTest.cpp.

                                {
    // Runs the shared check_strided_loads<T>() helper once per lane type: unsigned and signed
    // 32/16/8-bit integers, plus float.
    check_strided_loads<uint32_t>(r);
    check_strided_loads<uint16_t>(r);
    check_strided_loads<uint8_t>(r);
    check_strided_loads<int32_t>(r);
    check_strided_loads<int16_t>(r);
    check_strided_loads<int8_t>(r);
    check_strided_loads<float>(r);
}

◆ DEF_TEST() [10/11]

skvx::DEF_TEST	(	SkVx_xy	,
		r
	)

Definition at line 159 of file SkVxTest.cpp.

                     {
    // Exercises the two-lane accessors: x()/y(), operator[], the yx()/xyxy() swizzles,
    // store(), and the mixed scalar/vector float4 constructors.

    // Construction with () and {} must agree, and x()/y() read lanes 0 and 1.
    float2 f = float2(1,2);
    REPORTER_ASSERT(r, all(f == float2{1,2}));
    REPORTER_ASSERT(r, f.x() == 1);
    REPORTER_ASSERT(r, f.y() == 2);
    // x()/y() and operator[] are writable and alias the same lanes.
    f.y() = 9;
    REPORTER_ASSERT(r, all(f == float2{1,9}));
    f.x() = 0;
    REPORTER_ASSERT(r, all(f == float2(0,9)));
    f[0] = 8;
    REPORTER_ASSERT(r, f.x() == 8);
    f[1] = 6;
    REPORTER_ASSERT(r, f.y() == 6);
    REPORTER_ASSERT(r, all(f == float2(8,6)));
    // yx() swaps the two lanes.
    f = f.yx();
    REPORTER_ASSERT(r, all(f == float2(6,8)));
    // A float2 bit-casts to, and stores into, an SkPoint with x in lane 0 and y in lane 1.
    REPORTER_ASSERT(r, sk_bit_cast<SkPoint>(f) == SkPoint::Make(6,8));
    SkPoint p;
    f.store(&p);
    REPORTER_ASSERT(r, p == SkPoint::Make(6,8));
    f.yx().store(&p);
    REPORTER_ASSERT(r, p == SkPoint::Make(8,6));
    // xyxy(), join() and the float4 constructors taking float2 and/or scalars must all
    // build the same four-lane vectors.
    REPORTER_ASSERT(r, all(f.xyxy() == float4(6,8,6,8)));
    REPORTER_ASSERT(r, all(f.xyxy() == float4(f,f)));
    REPORTER_ASSERT(r, all(join(f,f) == f.xyxy()));
    REPORTER_ASSERT(r, all(join(f.yx(),f) == float4(f.y(),f.x(),f)));
    REPORTER_ASSERT(r, all(join(f.yx(),f) == float4(f.yx(),f.x(),f.y())));
    REPORTER_ASSERT(r, all(join(f,f.yx()) == float4(f.x(),f.y(),f.yx())));
    REPORTER_ASSERT(r, all(join(f.yx(),f.yx()) == float4(f.yx(),f.yx())));
}

◆ DEF_TEST() [11/11]

skvx::DEF_TEST	(	SkVx_xyzw	,
		r
	)

Definition at line 190 of file SkVxTest.cpp.

                       {
    // Exercises the four-lane accessors and swizzles, then if_then_else / naive_if_then_else
    // and pin() on swizzled operands.

    // All float4 constructor spellings (scalars, float2 halves, mixtures) must agree.
    float4 f = float4{1,2,3,4};
    REPORTER_ASSERT(r, all(f == float4(1,2,3,4)));
    REPORTER_ASSERT(r, all(f == float4(1,2,float2(3,4))));
    REPORTER_ASSERT(r, all(f == float4(float2(1,2),3,4)));
    REPORTER_ASSERT(r, all(f == float4(float2(1,2),float2(3,4))));
    // xy()/zw() are writable views of the low and high halves.
    f.xy() = float2(9,8);
    REPORTER_ASSERT(r, all(f == float4(9,8,3,4)));
    f.zw().x() = 7;
    f.zw().y() = 6;
    REPORTER_ASSERT(r, all(f == float4(9,8,7,6)));
    // Per-lane accessors are writable.
    f.x() = 5;
    f.y() = 4;
    f.z() = 3;
    f.w() = 2;
    REPORTER_ASSERT(r, all(f == float4(5,4,3,2)));
    // operator[] writes show up through the named accessors.
    f[0] = 0;
    REPORTER_ASSERT(r, f.x() == 0);
    f[1] = 1;
    REPORTER_ASSERT(r, f.y() == 1);
    f[2] = 2;
    REPORTER_ASSERT(r, f.z() == 2);
    f[3] = 3;
    REPORTER_ASSERT(r, f.w() == 3);
    REPORTER_ASSERT(r, all(f.xy() == float2(0,1)));
    REPORTER_ASSERT(r, all(f.zw() == float2{2,3}));
    REPORTER_ASSERT(r, all(f == float4(0,1,2,3)));
    // yxwz()/zwxy() results are checked half by half (lo/hi), down to single lanes (.val).
    REPORTER_ASSERT(r, all(f.yxwz().lo == shuffle<1,0>(f)));
    REPORTER_ASSERT(r, all(f.yxwz().hi == shuffle<3,2>(f)));
    REPORTER_ASSERT(r, all(f.zwxy().lo.lo == f.z()));
    REPORTER_ASSERT(r, all(f.zwxy().lo.hi == f.w()));
    REPORTER_ASSERT(r, all(f.zwxy().hi.lo == f.x()));
    REPORTER_ASSERT(r, all(f.zwxy().hi.hi == f.y()));
    REPORTER_ASSERT(r, f.yxwz().lo.lo.val == f.y());
    REPORTER_ASSERT(r, f.yxwz().lo.hi.val == f.x());
    REPORTER_ASSERT(r, f.yxwz().hi.lo.val == f.w());
    REPORTER_ASSERT(r, f.yxwz().hi.hi.val == f.z());
 
    // Selection: a 0 mask lane takes the "else" operand, a ~0 lane takes the "then" operand.
    // The naive and the specialized implementation must give the same answer.
    REPORTER_ASSERT(r, all(naive_if_then_else(int2(0,~0),
                                              shuffle<3,2>(float4(0,1,2,3)),
                                              float4(4,5,6,7).xy()) == float2(4,2)));
    REPORTER_ASSERT(r, all(if_then_else(int2(0,~0),
                                        shuffle<3,2>(float4(0,1,2,3)),
                                        float4(4,5,6,7).xy()) == float2(4,2)));
    REPORTER_ASSERT(r, all(naive_if_then_else(int2(0,~0).xyxy(),
                                              float4(0,1,2,3).zwxy(),
                                              float4(4,5,6,7)) == float4(4,3,6,1)));
    REPORTER_ASSERT(r, all(if_then_else(int2(0,~0).xyxy(),
                                        float4(0,1,2,3).zwxy(),
                                        float4(4,5,6,7)) == float4(4,3,6,1)));
 
    // pin() of (1,0,3,2) between 1 and 2 is expected to give (1,1,2,2).
    REPORTER_ASSERT(r, all(pin(float4(0,1,2,3).yxwz(),
                               float2(1).xyxy(),
                               float2(2).xyxy()) == float4(1,1,2,2)));
}

◆ div255()

SIN Vec< N, uint8_t > skvx::div255 ( const Vec< N, uint16_t > & x )

Definition at line 818 of file SkVx.h.

                                                    {
    // Add a bias of 127 to every 16-bit lane, integer-divide by 255, then narrow the
    // quotient lanes to bytes.
    const auto biased = x + 127;
    return cast<uint8_t>(biased / 255);
}

◆ dot()

SINT T skvx::dot	(	const Vec< N, T > &	a,
		const Vec< N, T > &	b
	)

Definition at line 964 of file SkVx.h.

                                                   {
    // dot() is a "horizontal" reduction (like any/all) but must stay in floating point, and
    // there is no SIMD instruction that makes it meaningfully faster.  The constexpr branches
    // unroll the two sizes that are realistically used; other sizes take the generic loop.
    const auto prod = a*b;
    if constexpr (N == 2) {
        return prod[0] + prod[1];
    } else if constexpr (N == 4) {
        return prod[0] + prod[1] + prod[2] + prod[3];
    } else {
        // Accumulate the remaining lanes left to right, starting from lane 0.
        T acc = prod[0];
        for (int lane = 1; lane < N; ++lane) {
            acc += prod[lane];
        }
        return acc;
    }
}

◆ floor()

SIN Vec< N, float > skvx::floor ( const Vec< N, float > & x )

Definition at line 703 of file SkVx.h.

703{ return map(floorf, x); }

◆ fma()

SIN Vec< N, float > skvx::fma	(	const Vec< N, float > &	x,
		const Vec< N, float > &	y,
		const Vec< N, float > &	z
	)

Definition at line 708 of file SkVx.h.

                                              {
    // Lane-wise fused multiply-add: applies fmaf(x, y, z) to each lane via map().
    // I don't understand why Clang's codegen is terrible if we write map(fmaf, x,y,z) directly.
    // Wrapping the call in a lambda is the workaround, so keep the indirection.
    auto fn = [](float x, float y, float z) { return fmaf(x,y,z); };
    return map(fn, x,y,z);
}

◆ fract()

SIN Vec< N, float > skvx::fract ( const Vec< N, float > & x )

Definition at line 744 of file SkVx.h.

744{ return x - floor(x); }

◆ from_half()

SIN Vec< N, float > skvx::from_half ( const Vec< N, uint16_t > & x )

Definition at line 790 of file SkVx.h.

                                                     {
    // Converts half-precision values, passed as raw 16-bit patterns, to float lanes.
    // Vectors wider than four lanes are split in half and converted recursively.
    if constexpr (N > 4) {
        return join(from_half(x.lo),
                    from_half(x.hi));
    }
 
#if SKVX_USE_SIMD && defined(__aarch64__)
    // On AArch64 a four-lane vector is converted with a single NEON intrinsic.
    if constexpr (N == 4) {
        return sk_bit_cast<Vec<N,float>>(vcvt_f32_f16(sk_bit_cast<float16x4_t>(x)));
    }
#endif
 
    // Portable path: assemble the f32 bit pattern with 32-bit integer operations.
    //   s          - the sign bit (bit 15 of the half)
    //   em         - exponent and mantissa with the sign cleared
    //   is_norm    - lane mask, set when em exceeds the largest pure-mantissa value (0x3ff),
    //                i.e. when the exponent field is non-zero
    //   finite     - per lane, either the normal or the subnormal reconstruction
    Vec<N,int32_t> wide = cast<int32_t>(x),
                      s  = wide & 0x8000,
                      em = wide ^ s,
              inf_or_nan =  (em >= (31 << 10)) & (255 << 23),  // Expands exponent to fill 8 bits
                 is_norm =   em > 0x3ff,
                     // subnormal f16's are 2^-14*0.[m0:9] == 2^-24*[m0:9].0
                     sub = sk_bit_cast<Vec<N,int32_t>>((cast<float>(em) * (1.f/(1<<24)))),
                    norm = ((em<<13) + ((127-15)<<23)), // Shifts mantissa, shifts + re-biases exp
                  finite = (is_norm & norm) | (~is_norm & sub);
    // If 'x' is f16 +/- infinity, inf_or_nan will be the filled 8-bit exponent and the mantissa
    // bits of 'norm' will be all 0s since 'x's mantissa is 0 (the exponent bits of 'norm' are
    // absorbed by the OR). Thus norm | inf_or_nan becomes f32 infinity. However, if 'x' is an
    // f16 NaN, some mantissa bits of 'norm' will be non-zero, so it stays an f32 NaN after the
    // OR.  (s<<16) moves the sign from bit 15 to bit 31.
    return sk_bit_cast<Vec<N,float>>((s<<16) | finite | inf_or_nan);
}

◆ if_then_else() [1/2]

SIT Vec< 1, T > skvx::if_then_else	(	const Vec< 1, M< T > > &	cond,
		const Vec< 1, T > &	t,
		const Vec< 1, T > &	e
	)

Definition at line 479 of file SkVx.h.

                                                                                         {
    // Single-lane select, done bitwise: keep the bits of 't' where the mask is set and the
    // bits of 'e' where it is clear.  In practice this scalar version is unlikely to be used;
    // see the N-lane if_then_else().
    const auto thenBits = sk_bit_cast<Vec<1, M<T>>>(t);
    const auto elseBits = sk_bit_cast<Vec<1, M<T>>>(e);
    return sk_bit_cast<Vec<1,T>>((cond & thenBits) | (~cond & elseBits));
}

◆ if_then_else() [2/2]

SINT Vec< N, T > skvx::if_then_else	(	const Vec< N, M< T > > &	cond,
		const Vec< N, T > &	t,
		const Vec< N, T > &	e
	)

Definition at line 484 of file SkVx.h.

                                                                                          {
    // Lane-wise select between 't' and 'e' under the mask 'cond'.  Dispatch is on the total
    // vector size in bytes (N*sizeof(T)), so one intrinsic serves every lane type of that size.
    // Specializations inline here so they can generalize what types they apply to.
    // Note the operand order differs per instruction set: the x86 blendv and LoongArch bitsel
    // calls take (e, t, cond), while NEON's vbslq_u8 takes (cond, t, e).
#if SKVX_USE_SIMD && SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_AVX2
    // 32-byte vectors on AVX2.
    if constexpr (N*sizeof(T) == 32) {
        return sk_bit_cast<Vec<N,T>>(_mm256_blendv_epi8(sk_bit_cast<__m256i>(e),
                                                        sk_bit_cast<__m256i>(t),
                                                        sk_bit_cast<__m256i>(cond)));
    }
#endif
#if SKVX_USE_SIMD && SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE41
    // 16-byte vectors on SSE4.1.
    if constexpr (N*sizeof(T) == 16) {
        return sk_bit_cast<Vec<N,T>>(_mm_blendv_epi8(sk_bit_cast<__m128i>(e),
                                                     sk_bit_cast<__m128i>(t),
                                                     sk_bit_cast<__m128i>(cond)));
    }
#endif
#if SKVX_USE_SIMD && defined(SK_ARM_HAS_NEON)
    // 16-byte vectors on NEON.
    if constexpr (N*sizeof(T) == 16) {
        return sk_bit_cast<Vec<N,T>>(vbslq_u8(sk_bit_cast<uint8x16_t>(cond),
                                              sk_bit_cast<uint8x16_t>(t),
                                              sk_bit_cast<uint8x16_t>(e)));
    }
#endif
#if SKVX_USE_SIMD && SK_CPU_LSX_LEVEL >= SK_CPU_LSX_LEVEL_LASX
    // 32-byte vectors on LoongArch LASX.
    if constexpr (N*sizeof(T) == 32) {
        return sk_bit_cast<Vec<N,T>>(__lasx_xvbitsel_v(sk_bit_cast<__m256i>(e),
                                                       sk_bit_cast<__m256i>(t),
                                                       sk_bit_cast<__m256i>(cond)));
    }
#endif
#if SKVX_USE_SIMD && SK_CPU_LSX_LEVEL >= SK_CPU_LSX_LEVEL_LSX
    // 16-byte vectors on LoongArch LSX.
    if constexpr (N*sizeof(T) == 16) {
        return sk_bit_cast<Vec<N,T>>(__lsx_vbitsel_v(sk_bit_cast<__m128i>(e),
                                                     sk_bit_cast<__m128i>(t),
                                                     sk_bit_cast<__m128i>(cond)));
    }
#endif
    // Recurse for large vectors to try to hit the specializations above.
    if constexpr (N*sizeof(T) > 16) {
        return join(if_then_else(cond.lo, t.lo, e.lo),
                    if_then_else(cond.hi, t.hi, e.hi));
    }
    // This default can lead to better code than the recursing onto scalars.
    return naive_if_then_else(cond, t, e);
}

◆ isfinite()

SINT bool skvx::isfinite ( const Vec< N, T > & v )

Definition at line 1003 of file SkVx.h.

                                       {
    // Take the dot product of v with an all-zero vector.  When every lane is finite each
    // product is 0 and so is the sum; a non-finite lane turns the sum into NaN, which
    // SkIsFinite rejects.
    const Vec<N, T> zeros(0);
    return SkIsFinite(dot(v, zeros));
}

◆ join()

SINT Vec< 2 *N, T > skvx::join	(	const Vec< N, T > &	lo,
		const Vec< N, T > &	hi
	)

Definition at line 242 of file SkVx.h.

                                                             {
    // Build the double-width vector by filling in its two halves.
    Vec<2*N,T> joined;
    joined.hi = hi;
    joined.lo = lo;
    return joined;
}

◆ length() [1/2]

SIN double skvx::length ( const Vec< N, double > & v )

Definition at line 991 of file SkVx.h.

                                           {
    // Euclidean length: square root of the vector's dot product with itself.
    const double squared = dot(v, v);
    return std::sqrt(squared);
}

◆ length() [2/2]

SIN float skvx::length ( const Vec< N, float > & v )

Definition at line 987 of file SkVx.h.

                                         {
    // Euclidean length: square root of the vector's dot product with itself.
    const float squared = dot(v, v);
    return std::sqrt(squared);
}

◆ lrint() [1/2]

SI Vec< 1, int > skvx::lrint ( const Vec< 1, float > & x )

Definition at line 716 of file SkVx.h.

                                           {
    // Single-lane case: round with lrintf() and narrow the result to int.
    const long rounded = lrintf(x.val);
    return static_cast<int>(rounded);
}

◆ lrint() [2/2]

SIN Vec< N, int > skvx::lrint ( const Vec< N, float > & x )

Definition at line 719 of file SkVx.h.

                                            {
    // Rounds each float lane to an int.  8- and 4-lane vectors map onto one conversion
    // intrinsic when the matching SIMD level is enabled; every other size is split in half
    // and handled recursively, bottoming out at the Vec<1,float> overload.
#if SKVX_USE_SIMD && SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_AVX
    if constexpr (N == 8) {
        return sk_bit_cast<Vec<N,int>>(_mm256_cvtps_epi32(sk_bit_cast<__m256>(x)));
    }
#endif
    // NOTE(review): _mm_cvtps_epi32 is documented as an SSE2 intrinsic while the guard below
    // tests for SSE1 -- presumably harmless if the build always has at least SSE2; confirm.
#if SKVX_USE_SIMD && SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE1
    if constexpr (N == 4) {
        return sk_bit_cast<Vec<N,int>>(_mm_cvtps_epi32(sk_bit_cast<__m128>(x)));
    }
#endif
#if SKVX_USE_SIMD && SK_CPU_LSX_LEVEL >= SK_CPU_LSX_LEVEL_LASX
    if constexpr (N == 8) {
        return sk_bit_cast<Vec<N,int>>(__lasx_xvftint_w_s(sk_bit_cast<__m256>(x)));
    }
#endif
#if SKVX_USE_SIMD && SK_CPU_LSX_LEVEL >= SK_CPU_LSX_LEVEL_LSX
    if constexpr (N == 4) {
        return sk_bit_cast<Vec<N,int>>(__lsx_vftint_w_s(sk_bit_cast<__m128>(x)));
    }
#endif
    // No intrinsic applied: convert the two halves separately and rejoin them.
    return join(lrint(x.lo),
                lrint(x.hi));
}

◆ map() [1/2]

template<typename Fn , int N, typename T , typename... Rest>

auto skvx::map	(	Fn &&	fn,
		const Vec< N, T > &	first,
		const Rest &...	rest
	)

Definition at line 697 of file SkVx.h.

                                                              {
    // Public entry point: applies fn lane by lane to `first` (and the matching lanes of any
    // further arguments) by forwarding to the index_sequence overload of map().
    // Derive an {0...N-1} index_sequence from the size of the first arg: N lanes in, N lanes out.
    return map(std::make_index_sequence<N>{}, fn, first,rest...);
}

◆ map() [2/2]

template<typename Fn , typename... Args, size_t... I>

SI auto skvx::map	(	std::index_sequence< I... >	,
		Fn &&	fn,
		const Args &...	args
	)		-> skvx::Vec<sizeof...(I), decltype(fn(args[0]...))>

Definition at line 680 of file SkVx.h.

                                                                                             {
    // Implementation overload: I... enumerates the lane indices.  `lane(i)` calls fn with
    // lane i of every argument, and the results are brace-initialized into the output vector,
    // one element per index.
    auto lane = [&](size_t i)
#if defined(__clang__)
    // CFI, specifically -fsanitize=cfi-icall, seems to give a false positive here,
    // with errors like "control flow integrity check for type 'float (float)
    // noexcept' failed during indirect function call... note: sqrtf.cfi_jt defined
    // here".  But we can be quite sure fn is the right type: it's all inferred!
    // So, stifle CFI in this function.
    __attribute__((no_sanitize("cfi")))
#endif
    { return fn(args[static_cast<int>(i)]...); };
 
    return { lane(I)... };
}

◆ max() [1/5]

SIT T skvx::max ( const Vec< 1, T > & x )

Definition at line 641 of file SkVx.h.

641{ return x.val; }

◆ max() [2/5]

SINT T skvx::max ( const Vec< N, T > & x )

Definition at line 643 of file SkVx.h.

643{ return std::max(max(x.lo), max(x.hi)); }

◆ max() [3/5]

SINT Vec< N, T > skvx::max	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 646 of file SkVx.h.

646{ return naive_if_then_else(x < y, y, x); }

◆ max() [4/5]

SINTU Vec< N, T > skvx::max	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 649 of file SkVx.h.

649{ return max(x, Vec<N,T>(y)); }

◆ max() [5/5]

SINTU Vec< N, T > skvx::max	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 651 of file SkVx.h.

651{ return max(Vec<N,T>(x), y); }

◆ min() [1/5]

SIT T skvx::min ( const Vec< 1, T > & x )

Definition at line 640 of file SkVx.h.

640{ return x.val; }

◆ min() [2/5]

SINT T skvx::min ( const Vec< N, T > & x )

Definition at line 642 of file SkVx.h.

642{ return std::min(min(x.lo), min(x.hi)); }

◆ min() [3/5]

SINT Vec< N, T > skvx::min	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 645 of file SkVx.h.

645{ return naive_if_then_else(y < x, y, x); }

◆ min() [4/5]

SINTU Vec< N, T > skvx::min	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 648 of file SkVx.h.

648{ return min(x, Vec<N,T>(y)); }

◆ min() [5/5]

SINTU Vec< N, T > skvx::min	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 650 of file SkVx.h.

650{ return min(Vec<N,T>(x), y); }

◆ mulhi()

SIN Vec< N, uint16_t > skvx::mulhi	(	const Vec< N, uint16_t > &	x,
		const Vec< N, uint16_t > &	y
	)

Definition at line 938 of file SkVx.h.

                                                    {
    // Returns, per lane, the upper 16 bits of the 16x16-bit unsigned product (the portable
    // fallback at the bottom spells this out as a widening multiply shifted right by 16).
    // On the SIMD paths only the 8-lane case has a native instruction: narrower vectors are
    // padded by joining them with themselves and keeping the low half of the result, wider
    // ones are split in half and processed recursively.
    // NOTE(review): _mm_mulhi_epu16 on __m128i is documented as an SSE2 intrinsic while the
    // guard tests for SSE1 -- presumably the build always has at least SSE2; confirm.
#if SKVX_USE_SIMD && SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE1
    // Use _mm_mulhi_epu16 for 8xuint16_t and join or split to get there.
    if constexpr (N == 8) {
        return sk_bit_cast<Vec<8,uint16_t>>(_mm_mulhi_epu16(sk_bit_cast<__m128i>(x),
                                                            sk_bit_cast<__m128i>(y)));
    } else if constexpr (N < 8) {
        return mulhi(join(x,x), join(y,y)).lo;
    } else { // N > 8
        return join(mulhi(x.lo, y.lo), mulhi(x.hi, y.hi));
    }
#elif SKVX_USE_SIMD && SK_CPU_LSX_LEVEL >= SK_CPU_LSX_LEVEL_LSX
    // Same structure as the SSE path, using the LSX intrinsic for the 8-lane case.
    if constexpr (N == 8) {
        return sk_bit_cast<Vec<8,uint16_t>>(__lsx_vmuh_hu(sk_bit_cast<__m128i>(x),
                                                          sk_bit_cast<__m128i>(y)));
    } else if constexpr (N < 8) {
        return mulhi(join(x,x), join(y,y)).lo;
    } else { // N > 8
        return join(mulhi(x.lo, y.lo), mulhi(x.hi, y.hi));
    }
#else
    // Portable fallback: widen to 32 bits, multiply, keep the top half.
    return skvx::cast<uint16_t>(mull(x, y) >> 16);
#endif
}

◆ mull() [1/2]

SIN Vec< N, uint32_t > skvx::mull	(	const Vec< N, uint16_t > &	x,
		const Vec< N, uint16_t > &	y
	)

Definition at line 922 of file SkVx.h.

                                                   {
    // Widening multiply: 16-bit lanes in, full 32-bit products out.
#if SKVX_USE_SIMD && defined(SK_ARM_HAS_NEON)
    // NEON can do four u16*u16 -> u32 in one instruction, vmull_u16
    // Narrower vectors are padded by joining them with themselves (low half of the result is
    // kept); wider ones are split in half and processed recursively.
    if constexpr (N == 4) {
        return to_vec<4,uint32_t>(vmull_u16(to_vext(x), to_vext(y)));
    } else if constexpr (N < 4) {
        return mull(join(x,x), join(y,y)).lo;
    } else { // N > 4
        return join(mull(x.lo, y.lo), mull(x.hi, y.hi));
    }
#else
    // Without NEON: widen both operands to 32 bits first, then multiply lane-wise.
    return cast<uint32_t>(x) * cast<uint32_t>(y);
#endif
}

◆ mull() [2/2]

SIN Vec< N, uint16_t > skvx::mull	(	const Vec< N, uint8_t > &	x,
		const Vec< N, uint8_t > &	y
	)

Definition at line 906 of file SkVx.h.

                                                  {
    // Widening multiply: 8-bit lanes in, full 16-bit products out.
#if SKVX_USE_SIMD && defined(SK_ARM_HAS_NEON)
    // With NEON we can do eight u8*u8 -> u16 in one instruction, vmull_u8 (read, mul-long).
    // Narrower vectors are padded by joining them with themselves (low half of the result is
    // kept); wider ones are split in half and processed recursively.
    if constexpr (N == 8) {
        return to_vec<8,uint16_t>(vmull_u8(to_vext(x), to_vext(y)));
    } else if constexpr (N < 8) {
        return mull(join(x,x), join(y,y)).lo;
    } else { // N > 8
        return join(mull(x.lo, y.lo), mull(x.hi, y.hi));
    }
#else
    // Without NEON: widen both operands to 16 bits first, then multiply lane-wise.
    return cast<uint16_t>(x) * cast<uint16_t>(y);
#endif
}

◆ naive_if_then_else()

SINT Vec< N, T > skvx::naive_if_then_else	(	const Vec< N, M< T > > &	cond,
		const Vec< N, T > &	t,
		const Vec< N, T > &	e
	)

Definition at line 474 of file SkVx.h.

                                                                                                {
    // Bitwise select with plain vector operators: reinterpret both operands as mask-typed
    // vectors, keep the bits of 't' where 'cond' is set and the bits of 'e' where it is
    // clear, then reinterpret the combination as Vec<N,T>.
    const auto thenBits = sk_bit_cast<Vec<N, M<T>>>(t);
    const auto elseBits = sk_bit_cast<Vec<N, M<T>>>(e);
    return sk_bit_cast<Vec<N,T>>((cond & thenBits) | (~cond & elseBits));
}

◆ normalize() [1/2]

SIN Vec< N, double > skvx::normalize ( const Vec< N, double > & v )

Definition at line 999 of file SkVx.h.

                                                      {
    // Divide every lane by the vector's length.  The length is not checked, so a zero or
    // non-finite length flows straight into the division.
    const double len = length(v);
    return v / len;
}

◆ normalize() [2/2]

SIN Vec< N, float > skvx::normalize ( const Vec< N, float > & v )

Definition at line 995 of file SkVx.h.

                                                    {
    // Divide every lane by the vector's length.  The length is not checked, so a zero or
    // non-finite length flows straight into the division.
    const float len = length(v);
    return v / len;
}

◆ operator!() [1/2]

SIT Vec< 1, T > skvx::operator! ( const Vec< 1, T > & x )

Definition at line 344 of file SkVx.h.

344{ return !x.val; }

◆ operator!() [2/2]

SINT Vec< N, T > skvx::operator! ( const Vec< N, T > & x )

Definition at line 394 of file SkVx.h.

394{ return join(!x.lo, !x.hi); }

◆ operator!=() [1/4]

SIT Vec< 1, M< T > > skvx::operator!=	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 354 of file SkVx.h.

                                                                     {
        // Single-lane compare: yields a mask value, all bits set (~0) when the lanes differ
        // and 0 when they are equal.
        return x.val != y.val ? ~0 : 0;
    }

◆ operator!=() [2/4]

SINT Vec< N, M< T > > skvx::operator!=	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 404 of file SkVx.h.

                                                                      {
        // Compare the low and high halves independently and join the two half-width masks.
        return join(x.lo != y.lo, x.hi != y.hi);
    }

◆ operator!=() [3/4]

SINTU Vec< N, M< T > > skvx::operator!=	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 444 of file SkVx.h.

444{ return x != Vec<N,T>(y); }

◆ operator!=() [4/4]

SINTU Vec< N, M< T > > skvx::operator!=	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 430 of file SkVx.h.

430{ return Vec<N,T>(x) != y; }

◆ operator&() [1/4]

SIT Vec< 1, T > skvx::operator&	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 341 of file SkVx.h.

341{ return x.val & y.val; }

◆ operator&() [2/4]

SINT Vec< N, T > skvx::operator&	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 387 of file SkVx.h.

                                                                  {
        // Bitwise AND of the low and high halves independently, then join the results.
        return join(x.lo & y.lo, x.hi & y.hi);
    }

◆ operator&() [3/4]

SINTU Vec< N, T > skvx::operator&	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 441 of file SkVx.h.

441{ return x & Vec<N,T>(y); }

◆ operator&() [4/4]

SINTU Vec< N, T > skvx::operator&	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 427 of file SkVx.h.

427{ return Vec<N,T>(x) & y; }

◆ operator&=() [1/2]

SINT Vec< N, T > & skvx::operator&=	(	Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 455 of file SkVx.h.

455{ return (x = x & y); }

◆ operator&=() [2/2]

SINTU Vec< N, T > & skvx::operator&=	(	Vec< N, T > &	x,
		U	y
	)

Definition at line 463 of file SkVx.h.

463{ return (x = x & Vec<N,T>(y)); }

◆ operator*() [1/4]

SIT Vec< 1, T > skvx::operator*	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 337 of file SkVx.h.

337{ return x.val * y.val; }

◆ operator*() [2/4]

SINT Vec< N, T > skvx::operator*	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 377 of file SkVx.h.

                                                                  {
        // Multiply the low and high halves independently, then join the results.
        return join(x.lo * y.lo, x.hi * y.hi);
    }

◆ operator*() [3/4]

SINTU Vec< N, T > skvx::operator*	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 438 of file SkVx.h.

438{ return x * Vec<N,T>(y); }

◆ operator*() [4/4]

SINTU Vec< N, T > skvx::operator*	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 424 of file SkVx.h.

424{ return Vec<N,T>(x) * y; }

◆ operator*=() [1/2]

SINT Vec< N, T > & skvx::operator*=	(	Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 452 of file SkVx.h.

452{ return (x = x * y); }

◆ operator*=() [2/2]

SINTU Vec< N, T > & skvx::operator*=	(	Vec< N, T > &	x,
		U	y
	)

Definition at line 460 of file SkVx.h.

460{ return (x = x * Vec<N,T>(y)); }

◆ operator+() [1/4]

SIT Vec< 1, T > skvx::operator+	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 335 of file SkVx.h.

335{ return x.val + y.val; }

◆ operator+() [2/4]

SINT Vec< N, T > skvx::operator+	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 371 of file SkVx.h.

                                                                  {
        // Add the low and high halves independently, then join the results.
        return join(x.lo + y.lo, x.hi + y.hi);
    }

◆ operator+() [3/4]

SINTU Vec< N, T > skvx::operator+	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 436 of file SkVx.h.

436{ return x + Vec<N,T>(y); }

◆ operator+() [4/4]

SINTU Vec< N, T > skvx::operator+	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 422 of file SkVx.h.

422{ return Vec<N,T>(x) + y; }

◆ operator+=() [1/2]

SINT Vec< N, T > & skvx::operator+=	(	Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 450 of file SkVx.h.

450{ return (x = x + y); }

◆ operator+=() [2/2]

SINTU Vec< N, T > & skvx::operator+=	(	Vec< N, T > &	x,
		U	y
	)

Definition at line 458 of file SkVx.h.

458{ return (x = x + Vec<N,T>(y)); }

◆ operator-() [1/6]

SIT Vec< 1, T > skvx::operator- ( const Vec< 1, T > & x )

Definition at line 345 of file SkVx.h.

345{ return -x.val; }

◆ operator-() [2/6]

SIT Vec< 1, T > skvx::operator-	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 336 of file SkVx.h.

336{ return x.val - y.val; }

◆ operator-() [3/6]

SINT Vec< N, T > skvx::operator- ( const Vec< N, T > & x )

Definition at line 395 of file SkVx.h.

395{ return join(-x.lo, -x.hi); }

◆ operator-() [4/6]

SINT Vec< N, T > skvx::operator-	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 374 of file SkVx.h.

                                                                  {
        // Subtract the low and high halves independently, then join the results.
        return join(x.lo - y.lo, x.hi - y.hi);
    }

◆ operator-() [5/6]

SINTU Vec< N, T > skvx::operator-	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 437 of file SkVx.h.

437{ return x - Vec<N,T>(y); }

◆ operator-() [6/6]

SINTU Vec< N, T > skvx::operator-	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 423 of file SkVx.h.

423{ return Vec<N,T>(x) - y; }

◆ operator-=() [1/2]

SINT Vec< N, T > & skvx::operator-=	(	Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 451 of file SkVx.h.

451{ return (x = x - y); }

◆ operator-=() [2/2]

SINTU Vec< N, T > & skvx::operator-=	(	Vec< N, T > &	x,
		U	y
	)

Definition at line 459 of file SkVx.h.

459{ return (x = x - Vec<N,T>(y)); }

◆ operator/() [1/4]

SIT Vec< 1, T > skvx::operator/	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 338 of file SkVx.h.

338{ return x.val / y.val; }

◆ operator/() [2/4]

SINT Vec< N, T > skvx::operator/	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 380 of file SkVx.h.

                                                                  {
        // Divide the low and high halves independently, then join the results.
        return join(x.lo / y.lo, x.hi / y.hi);
    }

◆ operator/() [3/4]

SINTU Vec< N, T > skvx::operator/	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 439 of file SkVx.h.

439{ return x / Vec<N,T>(y); }

◆ operator/() [4/4]

SINTU Vec< N, T > skvx::operator/	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 425 of file SkVx.h.

425{ return Vec<N,T>(x) / y; }

◆ operator/=() [1/2]

SINT Vec< N, T > & skvx::operator/=	(	Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 453 of file SkVx.h.

453{ return (x = x / y); }

◆ operator/=() [2/2]

SINTU Vec< N, T > & skvx::operator/=	(	Vec< N, T > &	x,
		U	y
	)

Definition at line 461 of file SkVx.h.

461{ return (x = x / Vec<N,T>(y)); }

◆ operator<() [1/4]

SIT Vec< 1, M< T > > skvx::operator<	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 363 of file SkVx.h.

                                                                     {
        // Single-lane compare: yields a mask value, all bits set (~0) when x is less than y
        // and 0 otherwise.
        return x.val <  y.val ? ~0 : 0;
    }

◆ operator<() [2/4]

SINT Vec< N, M< T > > skvx::operator<	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 413 of file SkVx.h.

                                                                      {
        // Compare the low and high halves independently and join the two half-width masks.
        return join(x.lo <  y.lo, x.hi <  y.hi);
    }

◆ operator<() [3/4]

SINTU Vec< N, M< T > > skvx::operator<	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 447 of file SkVx.h.

447{ return x < Vec<N,T>(y); }

◆ operator<() [4/4]

SINTU Vec< N, M< T > > skvx::operator<	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 433 of file SkVx.h.

433{ return Vec<N,T>(x) < y; }

◆ operator<<() [1/2]

SIT Vec< 1, T > skvx::operator<<	(	const Vec< 1, T > &	x,
		int	k
	)

Definition at line 348 of file SkVx.h.

348{ return x.val << k; }

◆ operator<<() [2/2]

SINT Vec< N, T > skvx::operator<<	(	const Vec< N, T > &	x,
		int	k
	)

Definition at line 398 of file SkVx.h.

398{ return join(x.lo << k, x.hi << k); }

◆ operator<<=()

SINT Vec< N, T > & skvx::operator<<=	(	Vec< N, T > &	x,
		int	bits
	)

Definition at line 466 of file SkVx.h.

466{ return (x = x << bits); }

skcms_private::bits

uint32_t bits

Definition: skcms_Transform.h:120

◆ operator<=() [1/4]

SIT Vec< 1, M< T > > skvx::operator<=	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 357 of file SkVx.h.

                                                                     {
        // Single-lane compare: yields a mask value, all bits set (~0) when x is less than or
        // equal to y and 0 otherwise.
        return x.val <= y.val ? ~0 : 0;
    }

◆ operator<=() [2/4]

SINT Vec< N, M< T > > skvx::operator<=	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 407 of file SkVx.h.

                                                                      {
        // Compare the low and high halves independently and join the two half-width masks.
        return join(x.lo <= y.lo, x.hi <= y.hi);
    }

◆ operator<=() [3/4]

SINTU Vec< N, M< T > > skvx::operator<=	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 445 of file SkVx.h.

445{ return x <= Vec<N,T>(y); }

◆ operator<=() [4/4]

SINTU Vec< N, M< T > > skvx::operator<=	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 431 of file SkVx.h.

431{ return Vec<N,T>(x) <= y; }

◆ operator==() [1/4]

SIT Vec< 1, M< T > > skvx::operator==	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 351 of file SkVx.h.

                                                                     {
        // Single-lane compare: yields a mask value, all bits set (~0) when the lanes are equal
        // and 0 otherwise.
        return x.val == y.val ? ~0 : 0;
    }

◆ operator==() [2/4]

SINT Vec< N, M< T > > skvx::operator==	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 401 of file SkVx.h.

                                                                      {
        // Compare the low and high halves independently and join the two half-width masks.
        return join(x.lo == y.lo, x.hi == y.hi);
    }

◆ operator==() [3/4]

SINTU Vec< N, M< T > > skvx::operator==	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 443 of file SkVx.h.

443{ return x == Vec<N,T>(y); }

◆ operator==() [4/4]

SINTU Vec< N, M< T > > skvx::operator==	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 429 of file SkVx.h.

429{ return Vec<N,T>(x) == y; }

◆ operator>() [1/4]

SIT Vec< 1, M< T > > skvx::operator>	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 366 of file SkVx.h.

                                                                     {
        // Single-lane compare: yields a mask value, all bits set (~0) when x is greater than y
        // and 0 otherwise.
        return x.val >  y.val ? ~0 : 0;
    }

◆ operator>() [2/4]

SINT Vec< N, M< T > > skvx::operator>	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 416 of file SkVx.h.

                                                                      {
        // Compare the lo and hi halves independently, then join the two half-width results.
        return join(x.lo >  y.lo, x.hi >  y.hi);
    }

◆ operator>() [3/4]

SINTU Vec< N, M< T > > skvx::operator>	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 448 of file SkVx.h.

// Constructs a Vec<N,T> from the scalar y, then compares x against it with >.
448{ return x > Vec<N,T>(y); }

◆ operator>() [4/4]

SINTU Vec< N, M< T > > skvx::operator>	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 434 of file SkVx.h.

// Constructs a Vec<N,T> from the scalar x, then compares it against y with >.
434{ return Vec<N,T>(x) > y; }

◆ operator>=() [1/4]

SIT Vec< 1, M< T > > skvx::operator>=	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 360 of file SkVx.h.

                                                                     {
        // Single-lane case: yields ~0 when x's value is at least y's, otherwise 0.
        return x.val >= y.val ? ~0 : 0;
    }

◆ operator>=() [2/4]

SINT Vec< N, M< T > > skvx::operator>=	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 410 of file SkVx.h.

                                                                      {
        // Compare the lo and hi halves independently, then join the two half-width results.
        return join(x.lo >= y.lo, x.hi >= y.hi);
    }

◆ operator>=() [3/4]

SINTU Vec< N, M< T > > skvx::operator>=	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 446 of file SkVx.h.

// Constructs a Vec<N,T> from the scalar y, then compares x against it with >=.
446{ return x >= Vec<N,T>(y); }

◆ operator>=() [4/4]

SINTU Vec< N, M< T > > skvx::operator>=	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 432 of file SkVx.h.

// Constructs a Vec<N,T> from the scalar x, then compares it against y with >=.
432{ return Vec<N,T>(x) >= y; }

◆ operator>>() [1/2]

SIT Vec< 1, T > skvx::operator>>	(	const Vec< 1, T > &	x,
		int	k
	)

Definition at line 349 of file SkVx.h.

// Single-lane case: shifts the stored value right by k.
349{ return x.val >> k; }

◆ operator>>() [2/2]

SINT Vec< N, T > skvx::operator>>	(	const Vec< N, T > &	x,
		int	k
	)

Definition at line 399 of file SkVx.h.

// Shifts the lo and hi halves right by the same k, then joins the results.
399{ return join(x.lo >> k, x.hi >> k); }

◆ operator>>=()

SINT Vec< N, T > & skvx::operator>>=	(	Vec< N, T > &	x,
		int	bits
	)

Definition at line 467 of file SkVx.h.

// Computes x >> bits, assigns the result back to x, and returns x.
467{ return (x = x >> bits); }

◆ operator^() [1/4]

SIT Vec< 1, T > skvx::operator^	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 340 of file SkVx.h.

// Single-lane case: bitwise XOR of the two stored values.
340{ return x.val ^ y.val; }

◆ operator^() [2/4]

SINT Vec< N, T > skvx::operator^	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 384 of file SkVx.h.

                                                                  {
        // XOR the lo and hi halves independently, then join the two half-width results.
        return join(x.lo ^ y.lo, x.hi ^ y.hi);
    }

◆ operator^() [3/4]

SINTU Vec< N, T > skvx::operator^	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 440 of file SkVx.h.

// Constructs a Vec<N,T> from the scalar y, then XORs x with it.
440{ return x ^ Vec<N,T>(y); }

◆ operator^() [4/4]

SINTU Vec< N, T > skvx::operator^	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 426 of file SkVx.h.

// Constructs a Vec<N,T> from the scalar x, then XORs it with y.
426{ return Vec<N,T>(x) ^ y; }

◆ operator^=() [1/2]

SINT Vec< N, T > & skvx::operator^=	(	Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 454 of file SkVx.h.

// Computes x ^ y, assigns the result back to x, and returns x.
454{ return (x = x ^ y); }

◆ operator^=() [2/2]

SINTU Vec< N, T > & skvx::operator^=	(	Vec< N, T > &	x,
		U	y
	)

Definition at line 462 of file SkVx.h.

// Constructs a Vec<N,T> from the scalar y, XORs it into x, and returns x.
462{ return (x = x ^ Vec<N,T>(y)); }

◆ operator|() [1/4]

SIT Vec< 1, T > skvx::operator\|	(	const Vec< 1, T > &	x,
		const Vec< 1, T > &	y
	)

Definition at line 342 of file SkVx.h.

// Single-lane case: bitwise OR of the two stored values.
342{ return x.val | y.val; }

◆ operator|() [2/4]

SINT Vec< N, T > skvx::operator\|	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 390 of file SkVx.h.

                                                                  {
        // OR the lo and hi halves independently, then join the two half-width results.
        return join(x.lo | y.lo, x.hi | y.hi);
    }

◆ operator|() [3/4]

SINTU Vec< N, T > skvx::operator\|	(	const Vec< N, T > &	x,
		U	y
	)

Definition at line 442 of file SkVx.h.

// Constructs a Vec<N,T> from the scalar y, then ORs x with it.
442{ return x | Vec<N,T>(y); }

◆ operator|() [4/4]

SINTU Vec< N, T > skvx::operator\|	(	U	x,
		const Vec< N, T > &	y
	)

Definition at line 428 of file SkVx.h.

// Constructs a Vec<N,T> from the scalar x, then ORs it with y.
428{ return Vec<N,T>(x) | y; }

◆ operator|=() [1/2]

SINT Vec< N, T > & skvx::operator\|=	(	Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 456 of file SkVx.h.

// Computes x | y, assigns the result back to x, and returns x.
456{ return (x = x | y); }

◆ operator|=() [2/2]

SINTU Vec< N, T > & skvx::operator\|=	(	Vec< N, T > &	x,
		U	y
	)

Definition at line 464 of file SkVx.h.

// Constructs a Vec<N,T> from the scalar y, ORs it into x, and returns x.
464{ return (x = x | Vec<N,T>(y)); }

◆ operator~() [1/2]

SIT Vec< 1, T > skvx::operator~ ( const Vec< 1, T > & x )

Definition at line 346 of file SkVx.h.

// Single-lane case: bitwise complement of the stored value.
346{ return ~x.val; }

◆ operator~() [2/2]

SINT Vec< N, T > skvx::operator~ ( const Vec< N, T > & x )

Definition at line 396 of file SkVx.h.

// Complements the lo and hi halves independently, then joins the results.
396{ return join(~x.lo, ~x.hi); }

◆ pin()

SINT Vec< N, T > skvx::pin	(	const Vec< N, T > &	x,
		const Vec< N, T > &	lo,
		const Vec< N, T > &	hi
	)

Definition at line 655 of file SkVx.h.

                                                                             {
    // Limit x from above by hi via min(), then from below by lo via max().
    // Because max() is applied last, lo wins if lo exceeds hi.
    return max(lo, min(x, hi));
}

◆ round()

SIN Vec< N, float > skvx::round ( const Vec< N, float > & x )

Definition at line 705 of file SkVx.h.

// Delegates to map() with the C library roundf; map is defined elsewhere
// (presumably it applies the function to each lane -- confirm against its definition).
705{ return map(roundf, x); }

◆ saturated_add()

SINT std::enable_if_t< std::is_unsigned_v< T >, Vec< N, T > > skvx::saturated_add	(	const Vec< N, T > &	x,
		const Vec< N, T > &	y
	)

Definition at line 833 of file SkVx.h.

                                                                                        {
    // Adds x and y for unsigned lane types; a sum that would wrap around is replaced by
    // std::numeric_limits<T>::max(). Byte-sized lanes take the intrinsic paths below when a
    // supported SIMD target is enabled; every other case uses the manual fallback at the bottom.
#if SKVX_USE_SIMD && (SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE1 || defined(SK_ARM_HAS_NEON) || \
        SK_CPU_LSX_LEVEL >= SK_CPU_LSX_LEVEL_LSX)
    // Both SSE and ARM have 16-lane saturated adds, so use intrinsics for those and recurse down
    // or join up to take advantage.
    if constexpr (N == 16 && sizeof(T) == 1) {
        #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE1
        return sk_bit_cast<Vec<N,T>>(_mm_adds_epu8(sk_bit_cast<__m128i>(x),
                                                   sk_bit_cast<__m128i>(y)));
        #elif SK_CPU_LSX_LEVEL >= SK_CPU_LSX_LEVEL_LSX
        return sk_bit_cast<Vec<N,T>>(__lsx_vsadd_bu(sk_bit_cast<__m128i>(x),
                                                    sk_bit_cast<__m128i>(y)));
        #else  // SK_ARM_HAS_NEON
        return sk_bit_cast<Vec<N,T>>(vqaddq_u8(sk_bit_cast<uint8x16_t>(x),
                                               sk_bit_cast<uint8x16_t>(y)));
        #endif
    } else if constexpr (N < 16 && sizeof(T) == 1) {
        // Fewer than 16 byte lanes: double the width by joining each input with itself,
        // recurse, and keep only the lo half of the result.
        return saturated_add(join(x,x), join(y,y)).lo;
    } else if constexpr (sizeof(T) == 1) {
        // Remaining byte-lane case (N > 16): recurse on each half and join the results.
        return join(saturated_add(x.lo, y.lo), saturated_add(x.hi, y.hi));
    }
#endif
    // Otherwise saturate manually
    auto sum = x + y;
    // For unsigned lanes, a sum smaller than an operand means the addition wrapped around.
    return if_then_else(sum < x, Vec<N,T>(std::numeric_limits<T>::max()), sum);
}

◆ shuffle()

template<int... Ix, int N, typename T >

SI Vec< sizeof...(Ix), T > skvx::shuffle ( const Vec< N, T > & x )

Definition at line 667 of file SkVx.h.

                                                   {
    // Builds a sizeof...(Ix)-lane vector whose lanes are x[Ix]..., in the order of the Ix pack.
#if SKVX_USE_SIMD && defined(__clang__)
    // Clang path: __builtin_shufflevector receives x as both inputs, with Ix as the indices.
    // TODO: can we just always use { x[Ix]... }?
    return to_vec<sizeof...(Ix),T>(__builtin_shufflevector(to_vext(x), to_vext(x), Ix...));
#else
    // Portable path: index x directly for every requested lane.
    return { x[Ix]... };
#endif
}

◆ sqrt()

SIN Vec< N, float > skvx::sqrt ( const Vec< N, float > & x )

Definition at line 706 of file SkVx.h.

// Delegates to map() with the C library sqrtf; map is defined elsewhere
// (presumably it applies the function to each lane -- confirm against its definition).
706{ return map( sqrtf, x); }

◆ strided_load2() [1/2]

SIT void skvx::strided_load2	(	const T *	v,
		Vec< 1, T > &	a,
		Vec< 1, T > &	b
	)

Definition at line 1112 of file SkVx.h.

                                                             {
    // Single-lane case: the first of two consecutive values goes to a, the second to b.
    a.val = v[0];
    b.val = v[1];
}

◆ strided_load2() [2/2]

SINT void skvx::strided_load2	(	const T *	v,
		Vec< N, T > &	a,
		Vec< N, T > &	b
	)

Definition at line 1116 of file SkVx.h.

                                                              {
    // Recursive case: fill the lo halves from the start of v...
    strided_load2(v, a.lo, b.lo);
    // ...then the hi halves from v + 2*(N/2), i.e. past the 2 values per lane that the
    // N/2 lo lanes read.
    strided_load2(v + 2*(N/2), a.hi, b.hi);
}

◆ strided_load4() [1/3]

SI void skvx::strided_load4	(	const float *	v,
		Vec< 4, float > &	a,
		Vec< 4, float > &	b,
		Vec< 4, float > &	c,
		Vec< 4, float > &	d
	)

Definition at line 1062 of file SkVx.h.

                                       {
    // SSE specialization: load 16 consecutive floats as four unaligned 4-float rows.
    __m128 a_ = _mm_loadu_ps(v);
    __m128 b_ = _mm_loadu_ps(v+4);
    __m128 c_ = _mm_loadu_ps(v+8);
    __m128 d_ = _mm_loadu_ps(v+12);
    // Transpose the 4x4 block in place so that a_ holds v[0],v[4],v[8],v[12], b_ holds
    // v[1],v[5],v[9],v[13], and so on.
    _MM_TRANSPOSE4_PS(a_, b_, c_, d_);
    // Reinterpret the SSE registers as Vec<4,float> outputs.
    a = sk_bit_cast<Vec<4,float>>(a_);
    b = sk_bit_cast<Vec<4,float>>(b_);
    c = sk_bit_cast<Vec<4,float>>(c_);
    d = sk_bit_cast<Vec<4,float>>(d_);
}

◆ strided_load4() [2/3]

SIT void skvx::strided_load4	(	const T *	v,
		Vec< 1, T > &	a,
		Vec< 1, T > &	b,
		Vec< 1, T > &	c,
		Vec< 1, T > &	d
	)

Definition at line 1013 of file SkVx.h.

                                    {
    // Single-lane case: four consecutive values v[0..3] go to a, b, c and d in that order.
    a.val = v[0];
    b.val = v[1];
    c.val = v[2];
    d.val = v[3];
}

◆ strided_load4() [3/3]

SINT void skvx::strided_load4	(	const T *	v,
		Vec< N, T > &	a,
		Vec< N, T > &	b,
		Vec< N, T > &	c,
		Vec< N, T > &	d
	)

Definition at line 1023 of file SkVx.h.

                                     {
    // Recursive case: fill the lo halves from the start of v...
    strided_load4(v, a.lo, b.lo, c.lo, d.lo);
    // ...then the hi halves from v + 4*(N/2), i.e. past the 4 values per lane that the
    // N/2 lo lanes read.
    strided_load4(v + 4*(N/2), a.hi, b.hi, c.hi, d.hi);
}

◆ to_half()

SIN Vec< N, uint16_t > skvx::to_half ( const Vec< N, float > & x )

Definition at line 750 of file SkVx.h.

                                                   {
    // Converts each float lane of x to a 16-bit half-float bit pattern held in a uint16_t lane.
    // NaN inputs are not supported; the assert below rejects them (x == x is false for NaN).
    assert(all(x == x)); // No NaNs should reach this function
 
    // Intrinsics for float->half tend to operate on 4 lanes, and the default implementation has
    // enough instructions that it's better to split and join on 128 bits groups vs.
    // recursing for each min/max/shift/etc.
    if constexpr (N > 4) {
        return join(to_half(x.lo),
                    to_half(x.hi));
    }
 
#if SKVX_USE_SIMD && defined(__aarch64__)
    // On AArch64 with SIMD enabled, a 4-lane conversion maps directly onto vcvt_f16_f32.
    if constexpr (N == 4) {
        return sk_bit_cast<Vec<N,uint16_t>>(vcvt_f16_f32(sk_bit_cast<float32x4_t>(x)));
 
    }
#endif
 
// Local shorthands for bit-casting to int32 lanes (I) and back to float lanes (F);
// both are #undef'd before the function ends.
#define I(x) sk_bit_cast<Vec<N,int32_t>>(x)
#define F(x) sk_bit_cast<Vec<N,float>>(x)
    Vec<N,int32_t> sem = I(x),                 // raw float bits of every lane
                   s   = sem & 0x8000'0000,    // bit 31 only (the float sign bit)
                    em = min(sem ^ s, 0x4780'0000), // |x| clamped to f16 infinity
                 // F(em)*8192 increases the exponent by 13, which when added back to em will shift
                 // the mantissa bits 13 to the right. We clamp to 1/2 for subnormal values, which
                 // automatically shifts the mantissa to match 2^-14 expected for a subnorm f16.
                 magic = I(max(F(em) * 8192.f, 0.5f)) & (255 << 23),
               rounded = I((F(em) + F(magic))), // shift mantissa with automatic round-to-even
                   // Subtract 127 for f32 bias, subtract 13 to undo the *8192, subtract 1 to remove
                   // the implicit leading 1., and add 15 to get the f16 biased exponent.
                   exp = ((magic >> 13) - ((127-15+13+1)<<10)), // shift and re-bias exponent
                   f16 = rounded + exp; // use + if 'rounded' rolled over into first exponent bit
    // s>>16 moves the sign from bit 31 down to bit 15; OR it into the half bits and narrow
    // every lane to uint16_t.
    return cast<uint16_t>((s>>16) | f16);
#undef I
#undef F
}

◆ trunc()

SIN Vec< N, float > skvx::trunc ( const Vec< N, float > & x )

Definition at line 704 of file SkVx.h.

// Delegates to map() with the C library truncf; map is defined elsewhere
// (presumably it applies the function to each lane -- confirm against its definition).
704{ return map(truncf, x); }

Classes

Typedefs

Functions