24 #if defined (_M_IX86) || defined (_M_X64)
38 #if defined (_M_ARM64)
39 #include <arm64intr.h>
40 #include <arm64_neon.h>
44 #if defined (__cplusplus)
49 __MACHINE(
void * _AddressOfReturnAddress(
void))
51 __MACHINEX64(
unsigned char _BitScanForward64(
unsigned long * _Index,
unsigned __int64 _Mask))
52 __MACHINEARM64(
unsigned char _BitScanForward64(
unsigned long * _Index,
unsigned __int64 _Mask))
53 __MACHINE(
unsigned char _BitScanReverse(
unsigned long * _Index,
unsigned long _Mask))
54 __MACHINEX64(
unsigned char _BitScanReverse64(
unsigned long * _Index,
unsigned __int64 _Mask))
55 __MACHINEARM64(
unsigned char _BitScanReverse64(
unsigned long * _Index,
unsigned __int64 _Mask))
67 __MACHINEARM(
unsigned int _CountOneBits64(
unsigned __int64))
71 __MACHINEARM_ARM64(__int64 _InterlockedAdd64(__int64
volatile * _Addend, __int64 _Value))
72 __MACHINEARM_ARM64(__int64 _InterlockedAdd64_acq(__int64
volatile * _Addend, __int64 _Value))
73 __MACHINEARM_ARM64(__int64 _InterlockedAdd64_nf(__int64
volatile * _Addend, __int64 _Value))
74 __MACHINEARM_ARM64(__int64 _InterlockedAdd64_rel(__int64
volatile * _Addend, __int64 _Value))
75 __MACHINEX86(
long _InterlockedAddLargeStatistic(__int64
volatile * _Addend,
long _Value))
79 __MACHINEX64(
short _InterlockedAnd16_np(
short volatile * _Value,
short _Mask))
80 __MACHINEX64(__int64 _InterlockedAnd64_np(__int64
volatile * _Value, __int64 _Mask))
81 __MACHINEX64(
char _InterlockedAnd8_np(
char volatile * _Value,
char _Mask))
82 __MACHINEX64(
long _InterlockedAnd_np(
long volatile * _Value,
long _Mask))
83 __MACHINEARM64_X64(
unsigned char _InterlockedCompareExchange128(__int64
volatile *
_Destination, __int64 _ExchangeHigh, __int64 _ExchangeLow, __int64 * _ComparandResult))
84 __MACHINEARM64(
unsigned char _InterlockedCompareExchange128_acq(__int64
volatile * _Destination, __int64 _ExchangeHigh, __int64 _ExchangeLow, __int64 * _ComparandResult))
85 __MACHINEARM64(
unsigned char _InterlockedCompareExchange128_nf(__int64
volatile * _Destination, __int64 _ExchangeHigh, __int64 _ExchangeLow, __int64 * _ComparandResult))
86 __MACHINEX64(
unsigned char _InterlockedCompareExchange128_np(__int64
volatile * _Destination, __int64 _ExchangeHigh, __int64 _ExchangeLow, __int64 * _ComparandResult))
87 __MACHINEARM64(
unsigned char _InterlockedCompareExchange128_rel(__int64
volatile * _Destination, __int64 _ExchangeHigh, __int64 _ExchangeLow, __int64 * _ComparandResult))
88 __MACHINEX64(
short _InterlockedCompareExchange16_np(
short volatile * _Destination,
short _Exchange,
short _Comparand))
89 __MACHINEX64(__int64 _InterlockedCompareExchange64_np(__int64
volatile * _Destination, __int64 _Exchange, __int64 _Comparand))
91 __MACHINEARM_ARM64(
void * _InterlockedCompareExchangePointer_acq(
void *
volatile * _Destination,
void * _Exchange,
void * _Comparand))
92 __MACHINEARM_ARM64(
void * _InterlockedCompareExchangePointer_nf(
void *
volatile * _Destination,
void * _Exchange,
void * _Comparand))
93 __MACHINEX64(
void * _InterlockedCompareExchangePointer_np(
void *
volatile * _Destination,
void * _Exchange,
void * _Comparand))
94 __MACHINEARM_ARM64(
void * _InterlockedCompareExchangePointer_rel(
void *
volatile * _Destination,
void * _Exchange,
void * _Comparand))
95 __MACHINEX64(
long _InterlockedCompareExchange_np(
long volatile * _Destination,
long _Exchange,
long _Comparand))
96 __MACHINE(
short _InterlockedDecrement16(
short volatile * _Addend))
107 __MACHINE(
void * _InterlockedExchangePointer(
void *
volatile *
_Target,
void * _Value))
108 __MACHINEARM_ARM64(
void * _InterlockedExchangePointer_acq(
void *
volatile * _Target,
void * _Value))
109 __MACHINEARM_ARM64(
void * _InterlockedExchangePointer_nf(
void *
volatile * _Target,
void * _Value))
110 __MACHINEARM_ARM64(
void * _InterlockedExchangePointer_rel(
void *
volatile * _Target,
void * _Value))
111 __MACHINE(
short _InterlockedIncrement16(
short volatile * _Addend))
122 __MACHINEX64(
short _InterlockedOr16_np(
short volatile * _Value,
short _Mask))
123 __MACHINEX64(__int64 _InterlockedOr64_np(__int64
volatile * _Value, __int64 _Mask))
124 __MACHINEX64(
char _InterlockedOr8_np(
char volatile * _Value,
char _Mask))
125 __MACHINEX64(
long _InterlockedOr_np(
long volatile * _Value,
long _Mask))
126 __MACHINEX64(
short _InterlockedXor16_np(
short volatile * _Value,
short _Mask))
127 __MACHINEX64(__int64 _InterlockedXor64_np(__int64
volatile * _Value, __int64 _Mask))
128 __MACHINEX64(
char _InterlockedXor8_np(
char volatile * _Value,
char _Mask))
129 __MACHINEX64(
long _InterlockedXor_np(
long volatile * _Value,
long _Mask))
130 __MACHINEARM(
unsigned int _MoveFromCoprocessor(
unsigned int,
unsigned int,
unsigned int,
unsigned int,
unsigned int))
131 __MACHINEARM(
unsigned int _MoveFromCoprocessor2(
unsigned int,
unsigned int,
unsigned int,
unsigned int,
unsigned int))
132 __MACHINEARM(
unsigned __int64 _MoveFromCoprocessor64(
unsigned int,
unsigned int,
unsigned int))
133 __MACHINEARM(
void _MoveToCoprocessor(
unsigned int,
unsigned int,
unsigned int,
unsigned int,
unsigned int,
unsigned int))
134 __MACHINEARM(
void _MoveToCoprocessor2(
unsigned int,
unsigned int,
unsigned int,
unsigned int,
unsigned int,
unsigned int))
135 __MACHINEARM(
void _MoveToCoprocessor64(
unsigned __int64,
unsigned int,
unsigned int,
unsigned int))
137 __MACHINEARM(
unsigned long _MulUnsignedHigh(
unsigned long,
unsigned long))
154 __MACHINEX86(
void __addfsbyte(
unsigned long,
unsigned char))
155 __MACHINEX86(
void __addfsdword(
unsigned long,
unsigned long))
156 __MACHINEX86(
void __addfsword(
unsigned long,
unsigned short))
157 __MACHINEX64(
void __addgsbyte(
unsigned long,
unsigned char))
158 __MACHINEX64(
void __addgsdword(
unsigned long,
unsigned long))
159 __MACHINEX64(
void __addgsqword(
unsigned long,
unsigned __int64))
160 __MACHINEX64(
void __addgsword(
unsigned long,
unsigned short))
163 __MACHINEARM64(
void __addx18qword(
unsigned long,
unsigned __int64))
169 __MACHINE(
void __cdecl __debugbreak(
void))
180 __MACHINEX86_X64(
void __inbytestring(
unsigned short,
unsigned char *,
unsigned long))
193 __MACHINEX86_X64(
void __indwordstring(
unsigned short,
unsigned long *,
unsigned long))
197 __MACHINEX86_X64(
void __inwordstring(
unsigned short,
unsigned short *,
unsigned long))
203 __MACHINEX64(
unsigned __int64 __lzcnt64(
unsigned __int64))
204 __MACHINEX86_X64(
void __movsb(
unsigned char *,
unsigned char const *,
size_t))
205 __MACHINEX86_X64(
void __movsd(
unsigned long *,
unsigned long const *,
size_t))
206 __MACHINEX64(
void __movsq(
unsigned long long *,
unsigned long long const *,
size_t))
207 __MACHINEX86_X64(
void __movsw(
unsigned short *,
unsigned short const *,
size_t))
213 __MACHINEX86_X64(
void __outbytestring(
unsigned short,
unsigned char *,
unsigned long))
215 __MACHINEX86_X64(
void __outdwordstring(
unsigned short,
unsigned long *,
unsigned long))
217 __MACHINEX86_X64(
void __outwordstring(
unsigned short,
unsigned short *,
unsigned long))
220 __MACHINEX64(
unsigned __int64 __popcnt64(
unsigned __int64))
241 __MACHINEX86(
unsigned long __readfsdword(
unsigned long))
242 __MACHINEX86(
unsigned __int64 __readfsqword(
unsigned long))
243 __MACHINEX86(
unsigned short __readfsword(
unsigned long))
245 __MACHINEX64(
unsigned long __readgsdword(
unsigned long))
246 __MACHINEX64(
unsigned __int64 __readgsqword(
unsigned long))
247 __MACHINEX64(
unsigned short __readgsword(
unsigned long))
256 __MACHINEX64(
unsigned __int64 __shiftleft128(
unsigned __int64 _LowPart,
unsigned __int64 _HighPart,
unsigned char _Shift))
257 __MACHINEX64(
unsigned __int64 __shiftright128(
unsigned __int64 _LowPart,
unsigned __int64 _HighPart,
unsigned char _Shift))
262 __MACHINEX64(
void __stosq(
unsigned __int64 *,
unsigned __int64,
size_t))
280 __MACHINEX64(
unsigned char __vmx_on(
unsigned __int64 *))
281 __MACHINEX64(
unsigned char __vmx_vmclear(
unsigned __int64 *))
283 __MACHINEX64(
unsigned char __vmx_vmptrld(
unsigned __int64 *))
285 __MACHINEX64(
unsigned char __vmx_vmread(
size_t,
size_t *))
287 __MACHINEX64(
unsigned char __vmx_vmwrite(
size_t,
size_t))
301 __MACHINEX64(
void __writedr(
unsigned int,
unsigned __int64))
302 __MACHINEX86(
void __writedr(
unsigned int,
unsigned int))
305 __MACHINEX86(
void __writefsbyte(
unsigned long,
unsigned char))
306 __MACHINEX86(
void __writefsdword(
unsigned long,
unsigned long))
307 __MACHINEX86(
void __writefsqword(
unsigned long,
unsigned __int64))
308 __MACHINEX86(
void __writefsword(
unsigned long,
unsigned short))
309 __MACHINEX64(
void __writegsbyte(
unsigned long,
unsigned char))
310 __MACHINEX64(
void __writegsdword(
unsigned long,
unsigned long))
311 __MACHINEX64(
void __writegsqword(
unsigned long,
unsigned __int64))
312 __MACHINEX64(
void __writegsword(
unsigned long,
unsigned short))
315 __MACHINEARM64(
void __writex18dword(
unsigned long,
unsigned long))
316 __MACHINEARM64(
void __writex18qword(
unsigned long,
unsigned __int64))
317 __MACHINEARM64(
void __writex18word(
unsigned long,
unsigned short))
318 __MACHINE(
unsigned char _bittest(
long const *,
long))
320 __MACHINE(
unsigned char _bittestandcomplement(
long *,
long))
322 __MACHINE(
unsigned char _bittestandreset(
long *,
long))
324 __MACHINE(
unsigned char _bittestandset(
long *,
long))
331 __MACHINE(
unsigned char _interlockedbittestandreset(
long volatile *,
long))
332 __MACHINEARM64_X64(
unsigned char _interlockedbittestandreset64(__int64
volatile *, __int64))
333 __MACHINEARM_ARM64(
unsigned char _interlockedbittestandreset_acq(
long volatile *,
long))
334 __MACHINEARM_ARM64(
unsigned char _interlockedbittestandreset_nf(
long volatile *,
long))
335 __MACHINEARM_ARM64(
unsigned char _interlockedbittestandreset_rel(
long volatile *,
long))
336 __MACHINEARM64(
unsigned char _interlockedbittestandreset64_acq(__int64
volatile *, __int64))
337 __MACHINEARM64(
unsigned char _interlockedbittestandreset64_rel(__int64
volatile *, __int64))
338 __MACHINEARM64(
unsigned char _interlockedbittestandreset64_nf(__int64
volatile *, __int64))
339 __MACHINEARM64_X64(
unsigned char _interlockedbittestandset64(__int64
volatile *, __int64))
340 __MACHINEARM64(
unsigned char _interlockedbittestandset64_acq(__int64
volatile *, __int64))
341 __MACHINEARM64(
unsigned char _interlockedbittestandset64_rel(__int64
volatile *, __int64))
342 __MACHINEARM64(
unsigned char _interlockedbittestandset64_nf(__int64
volatile *, __int64))
343 __MACHINEARM64(
unsigned __int32 __crc32b(
unsigned __int32,
unsigned __int32))
344 __MACHINEARM64(
unsigned __int32 __crc32h(
unsigned __int32,
unsigned __int32))
345 __MACHINEARM64(
unsigned __int32 __crc32w(
unsigned __int32,
unsigned __int32))
346 __MACHINEARM64(
unsigned __int32 __crc32d(
unsigned __int32,
unsigned __int64))
347 __MACHINEARM64(
unsigned __int32 __crc32cb(
unsigned __int32,
unsigned __int32))
348 __MACHINEARM64(
unsigned __int32 __crc32ch(
unsigned __int32,
unsigned __int32))
349 __MACHINEARM64(
unsigned __int32 __crc32cw(
unsigned __int32,
unsigned __int32))
350 __MACHINEARM64(
unsigned __int32 __crc32cd(
unsigned __int32,
unsigned __int64))
580 __MACHINEX64(
unsigned __int64 _mm_crc32_u64(
unsigned __int64,
unsigned __int64))
779 __MACHINEX86_X64(
__m128i _mm_set_epi8(
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char))
794 __MACHINEX86_X64(
__m128i _mm_setr_epi8(
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char,
char))
909 __MACHINEX64(__int64 _mul128(__int64 _Multiplier, __int64 _Multiplicand, __int64 * _HighProduct))
911 __MACHINE(
unsigned short __cdecl _rotl16(
unsigned short _Value,
unsigned char _Shift))
913 __MACHINE(
unsigned char __cdecl _rotl8(
unsigned char _Value,
unsigned char _Shift))
915 __MACHINE(
unsigned short __cdecl _rotr16(
unsigned short _Value,
unsigned char _Shift))
917 __MACHINE(
unsigned char __cdecl _rotr8(
unsigned char _Value,
unsigned char _Shift))
920 __MACHINEX64(
unsigned __int64 _umul128(
unsigned __int64 _Multiplier,
unsigned __int64 _Multiplicand,
unsigned __int64 * _HighProduct))
926 __MACHINEX86_X64(
unsigned char __cdecl _addcarry_u8(
unsigned char,
unsigned char,
unsigned char,
unsigned char *))
927 __MACHINEX86_X64(
unsigned char __cdecl _subborrow_u8(
unsigned char,
unsigned char,
unsigned char,
unsigned char *))
928 __MACHINEX86_X64(
unsigned char __cdecl _addcarry_u16(
unsigned char,
unsigned short,
unsigned short,
unsigned short *))
929 __MACHINEX86_X64(
unsigned char __cdecl _subborrow_u16(
unsigned char,
unsigned short,
unsigned short,
unsigned short *))
930 __MACHINEX86_X64(
unsigned char __cdecl _addcarry_u32(
unsigned char,
unsigned int,
unsigned int,
unsigned int *))
931 __MACHINEX86_X64(
unsigned char __cdecl _subborrow_u32(
unsigned char,
unsigned int,
unsigned int,
unsigned int *))
932 __MACHINEX64(
unsigned char __cdecl _addcarry_u64(
unsigned char,
unsigned __int64,
unsigned __int64,
unsigned __int64 *))
933 __MACHINEX64(
unsigned char __cdecl _subborrow_u64(
unsigned char,
unsigned __int64,
unsigned __int64,
unsigned __int64 *))
937 #if defined (__cplusplus)
__m128i _mm_sub_epi32(__m128i _A, __m128i _B)
__m128i _mm_adds_epi8(__m128i _A, __m128i _B)
__m128i _mm_cvttps_epi32(__m128 _A)
void _mm_clzero(void const *)
__m128 _mm_set_ps(float _A, float _B, float _C, float _D)
int _mm_movemask_epi8(__m128i _A)
void _mm_store_sd(double *_Dp, __m128d _A)
__m128i _mm_sign_epi32(__m128i, __m128i)
__m128i _mm_mulhi_epi16(__m128i _A, __m128i _B)
#define __MACHINEX86
Definition: intrin0.h:58
#define __MACHINEX86_X64
Definition: intrin0.h:68
__m128d _mm_cmpngt_pd(__m128d _A, __m128d _B)
int _mm_comineq_sd(__m128d _A, __m128d _B)
int _mm_extract_epi16(__m128i _A, int _Imm)
__m128i _mm_xor_si128(__m128i _A, __m128i _B)
__m128 _mm_and_ps(__m128 _A, __m128 _B)
__m128d _mm_move_sd(__m128d _A, __m128d _B)
void _mm_store_ps1(float *_V, __m128 _A)
__m128 _mm_setr_ps(float _A, float _B, float _C, float _D)
__m128i _mm_loadu_si128(__m128i const *_P)
__m128i _mm_cvtepu16_epi64(__m128i)
__m128d _mm_load_sd(double const *_Dp)
__m128i _mm_max_epi32(__m128i, __m128i)
int _mm_ucomilt_ss(__m128 _A, __m128 _B)
__m128i _mm_srai_epi32(__m128i _A, int _Count)
__m128d _mm_cmpord_sd(__m128d _A, __m128d _B)
__m128 _mm_movehl_ps(__m128, __m128)
__m128i _mm_blendv_epi8(__m128i, __m128i, __m128i mask)
__m128 _mm_rsqrt_ss(__m128 _A)
__m128 _mm_sqrt_ps(__m128 _A)
__m128 _mm_max_ps(__m128 _A, __m128 _B)
__m128i _mm_packs_epi32(__m128i _A, __m128i _B)
__m128d _mm_min_pd(__m128d _A, __m128d _B)
__m128d _mm_cmpeq_pd(__m128d _A, __m128d _B)
_SourceSize void *const _Destination
Definition: corecrt_memcpy_s.h:36
__m128i _mm_sra_epi16(__m128i _A, __m128i _Count)
int _mm_cmpestrc(__m128i, int, __m128i, int, const int)
__m128 _mm_cmpgt_ss(__m128 _A, __m128 _B)
__m128 _mm_cmpngt_ps(__m128 _A, __m128 _B)
int _mm_ucomilt_sd(__m128d _A, __m128d _B)
__m128i _mm_cvtepu16_epi32(__m128i)
__m128d _mm_cmpneq_sd(__m128d _A, __m128d _B)
int _mm_comieq_sd(__m128d _A, __m128d _B)
#define __MACHINEARM64
Definition: intrin0.h:85
__m128 _mm_blend_ps(__m128, __m128, const int)
int _mm_comigt_ss(__m128 _A, __m128 _B)
__m128d _mm_loadu_pd(double const *_Dp)
__m128i _mm_cvtepi8_epi16(__m128i)
__m128i _mm_abs_epi16(__m128i)
void _mm_storeu_ps(float *_V, __m128 _A)
__m128i _mm_blend_epi16(__m128i, __m128i, const int)
int _mm_ucomigt_sd(__m128d _A, __m128d _B)
_Check_return_ unsigned long __cdecl _lrotl(_In_ unsigned long _Value, _In_ int _Shift)
__m128d _mm_cvtsi32_sd(__m128d _A, int _B)
int _mm_ucomigt_ss(__m128 _A, __m128 _B)
__m128 _mm_cmpord_ss(__m128 _A, __m128 _B)
__m128d _mm_cmplt_pd(__m128d _A, __m128d _B)
__m128i _mm_move_epi64(__m128i _Q)
__m128i _mm_cmpgt_epi32(__m128i _A, __m128i _B)
__m128d _mm_cmpgt_sd(__m128d _A, __m128d _B)
__m64 _m_pfpnacc(__m64, __m64)
int _mm_cmpestrz(__m128i, int, __m128i, int, const int)
__m128 _mm_cmpord_ps(__m128 _A, __m128 _B)
__m128d _mm_set1_pd(double _A)
__m128i _mm_cvtepu8_epi64(__m128i)
__m128d _mm_unpacklo_pd(__m128d _A, __m128d _B)
_Check_return_ unsigned short __cdecl _byteswap_ushort(_In_ unsigned short _Number)
__m128i _mm_lddqu_si128(__m128i const *)
int _mm_cmpestrs(__m128i, int, __m128i, int, const int)
#define __MACHINE(X)
Definition: intrin0.h:50
void _m_prefetchw(volatile const void *_Source)
__m64 _m_pfmin(__m64, __m64)
int _mm_ucomieq_sd(__m128d _A, __m128d _B)
void _mm_store1_pd(double *_Dp, __m128d _A)
_JBTYPE jmp_buf[_JBLEN]
Definition: setjmp.h:145
__m128i _mm_packus_epi32(__m128i, __m128i)
__m128d _mm_cmple_pd(__m128d _A, __m128d _B)
__m128i _mm_max_epi16(__m128i _A, __m128i _B)
__m128d _mm_cmpunord_sd(__m128d _A, __m128d _B)
__m128d _mm_cmpge_sd(__m128d _A, __m128d _B)
unsigned int _mm_crc32_u32(unsigned int, unsigned int)
__m128d
Definition: emmintrin.h:57
__m128i _mm_unpacklo_epi16(__m128i _A, __m128i _B)
__m128 _mm_sqrt_ss(__m128 _A)
int _mm_comige_sd(__m128d _A, __m128d _B)
__m128 _mm_movehdup_ps(__m128)
__m128i _mm_add_epi64(__m128i _A, __m128i _B)
__m128i _mm_set1_epi16(short _W)
int _mm_comigt_sd(__m128d _A, __m128d _B)
__m128i _mm_set1_epi8(char _B)
__m128d _mm_hsub_pd(__m128d, __m128d)
__m128i _mm_abs_epi8(__m128i)
__m128d _mm_loaddup_pd(double const *)
__m128i _mm_setl_epi64(__m128i _Q)
__m128i _mm_set1_epi64x(__int64 i)
int _mm_extract_epi8(__m128i, const int)
__m128i _mm_srli_epi16(__m128i _A, int _Count)
__m128d _mm_loadh_pd(__m128d _A, double const *_Dp)
__m64 _m_pfnacc(__m64, __m64)
__m128d _mm_shuffle_pd(__m128d _A, __m128d _B, int _I)
__m128i _mm_mpsadbw_epu8(__m128i, __m128i, const int)
__m64 _m_pfadd(__m64, __m64)
__m128i _mm_cmplt_epi8(__m128i _A, __m128i _B)
int _mm_cvtsd_si32(__m128d _A)
__m128i _mm_set_epi16(short _W7, short _W6, short _W5, short _W4, short _W3, short _W2, short _W1, short _W0)
__m128i _mm_packs_epi16(__m128i _A, __m128i _B)
__m64 _m_pavgusb(__m64, __m64)
int _mm_popcnt_u32(unsigned int)
__m128i _mm_cvtepi16_epi32(__m128i)
__m128 _mm_shuffle_ps(__m128 _A, __m128 _B, unsigned int _Imm8)
__m128i _mm_cmpeq_epi64(__m128i, __m128i)
__m128i _mm_add_epi8(__m128i _A, __m128i _B)
void _mm_storeh_pi(__m64 *, __m128)
__m128i _mm_setr_epi8(char _B15, char _B14, char _B13, char _B12, char _B11, char _B10, char _B9, char _B8, char _B7, char _B6, char _B5, char _B4, char _B3, char _B2, char _B1, char _B0)
__m128i _mm_hsub_epi32(__m128i, __m128i)
__m128d _mm_set_pd(double _Z, double _Y)
int _mm_comile_ss(__m128 _A, __m128 _B)
__m64 _m_pfrsqit1(__m64, __m64)
int _mm_cmpistrs(__m128i, __m128i, const int)
__m128i _mm_srl_epi32(__m128i _A, __m128i _Count)
int _mm_comige_ss(__m128 _A, __m128 _B)
__m128i _mm_set1_epi32(int _I)
__m128 _mm_cmpngt_ss(__m128 _A, __m128 _B)
__m128i _mm_cvtepi32_epi64(__m128i)
int _mm_cmpestri(__m128i, int, __m128i, int, const int)
__m128 _mm_loadu_ps(float const *_A)
__m128d _mm_hadd_pd(__m128d, __m128d)
__m128i _mm_hadds_epi16(__m128i, __m128i)
__m128i _mm_sra_epi32(__m128i _A, __m128i _Count)
__m128i _mm_setzero_si128(void)
int _mm_ucomineq_ss(__m128 _A, __m128 _B)
int _mm_comineq_ss(__m128 _A, __m128 _B)
__m128i _mm_srli_epi32(__m128i _A, int _Count)
__m128d _mm_cmpnge_sd(__m128d _A, __m128d _B)
__m128d _mm_cmplt_sd(__m128d _A, __m128d _B)
int _mm_testnzc_si128(__m128i, __m128i)
__m128i _mm_set_epi32(int _I3, int _I2, int _I1, int _I0)
__m128i _mm_sll_epi16(__m128i _A, __m128i _Count)
__m128i _mm_minpos_epu16(__m128i)
__m128 _mm_cmple_ps(__m128 _A, __m128 _B)
__m128i _mm_avg_epu16(__m128i _A, __m128i _B)
__m64 _m_pfrcpit1(__m64, __m64)
__m128i _mm_insert_epi32(__m128i, int, const int)
int _mm_cmpistro(__m128i, __m128i, const int)
__m128i _mm_insert_epi16(__m128i _A, int _B, int _Imm)
__m128d _mm_load_pd(double const *_Dp)
__m128i _mm_min_epi16(__m128i _A, __m128i _B)
int _mm_testz_si128(__m128i, __m128i)
__m128i _mm_min_epi8(__m128i, __m128i)
_In_ size_t _In_ int _Index
Definition: time.h:102
__m128 _mm_add_ps(__m128 _A, __m128 _B)
__m64 _m_pfsub(__m64, __m64)
__m128i _mm_unpacklo_epi32(__m128i _A, __m128i _B)
__m128 _mm_addsub_ps(__m128, __m128)
__m128d _mm_movedup_pd(__m128d)
_Check_return_ unsigned __int64 __cdecl _byteswap_uint64(_In_ unsigned __int64 _Number)
__m128i _mm_adds_epu8(__m128i _A, __m128i _B)
__m64 _m_pfrcpit2(__m64, __m64)
__m128d _mm_sqrt_sd(__m128d _A, __m128d _B)
unsigned int __cdecl _rotr(_In_ unsigned int _Value, _In_ int _Shift)
__m128i _mm_cvtepu8_epi16(__m128i)
unsigned int _mm_crc32_u16(unsigned int, unsigned short)
__m128 _mm_cvtpd_ps(__m128d _A)
int _mm_cmpistra(__m128i, __m128i, const int)
int _mm_ucomile_sd(__m128d _A, __m128d _B)
__m128i _mm_sll_epi32(__m128i _A, __m128i _Count)
void _mm_store_ss(float *_V, __m128 _A)
__m128i _mm_unpackhi_epi16(__m128i _A, __m128i _B)
__m128 _mm_sub_ps(__m128 _A, __m128 _B)
__m128 _mm_div_ps(__m128 _A, __m128 _B)
__m128d _mm_cmpnle_pd(__m128d _A, __m128d _B)
__m128 _mm_set_ss(float _A)
__m128i _mm_slli_epi16(__m128i _A, int _Count)
__m128 _mm_moveldup_ps(__m128)
int _mm_movemask_pd(__m128d _A)
__m128d _mm_cmpngt_sd(__m128d _A, __m128d _B)
int _mm_cvttsd_si32(__m128d _A)
__m128i _mm_sad_epu8(__m128i _A, __m128i _B)
__m128i _mm_setr_epi16(short _W0, short _W1, short _W2, short _W3, short _W4, short _W5, short _W6, short _W7)
__m128i _mm_cvtpd_epi32(__m128d _A)
__m128i _mm_cvtepu32_epi64(__m128i)
__m128 _mm_cmplt_ss(__m128 _A, __m128 _B)
__m128i _mm_max_epu8(__m128i _A, __m128i _B)
__m128d _mm_cmpneq_pd(__m128d _A, __m128d _B)
_Check_return_ unsigned long __cdecl _byteswap_ulong(_In_ unsigned long _Number)
__m128i _mm_maddubs_epi16(__m128i, __m128i)
int _mm_ucomile_ss(__m128 _A, __m128 _B)
int _mm_cmpistrc(__m128i, __m128i, const int)
__m64 _m_pmulhrw(__m64, __m64)
__m128 _mm_round_ss(__m128, __m128, int)
unsigned int __cdecl _rotl(_In_ unsigned int _Value, _In_ int _Shift)
#define _Check_return_
Definition: sal.h:554
int _mm_comile_sd(__m128d _A, __m128d _B)
__m128i _mm_cvtepi8_epi32(__m128i)
__m128d _mm_cmpnlt_sd(__m128d _A, __m128d _B)
void _mm_mwait(unsigned, unsigned)
#define _In_
Definition: sal.h:305
__m128d _mm_cmpnge_pd(__m128d _A, __m128d _B)
__m128d _mm_add_pd(__m128d _A, __m128d _B)
__m128d _mm_or_pd(__m128d _A, __m128d _B)
__m128 _mm_rcp_ps(__m128 _A)
__m128i _mm_mul_epu32(__m128i _A, __m128i _B)
__m128i _mm_min_epu8(__m128i _A, __m128i _B)
__m128 _mm_cmpeq_ps(__m128 _A, __m128 _B)
__m128d _mm_cmpord_pd(__m128d _A, __m128d _B)
__m128i _mm_cmplt_epi32(__m128i _A, __m128i _B)
__m128d _mm_div_pd(__m128d _A, __m128d _B)
void _mm_setcsr(unsigned int)
#define __MACHINEX64
Definition: intrin0.h:63
__m128i _mm_cmpistrm(__m128i, __m128i, const int)
void _mm_storel_pd(double *_Dp, __m128d _A)
__m128d _mm_cvtepi32_pd(__m128i _A)
int _mm_comilt_sd(__m128d _A, __m128d _B)
__m128i _mm_slli_si128(__m128i _A, int _Imm)
__m128 _mm_cmpneq_ps(__m128 _A, __m128 _B)
__m64
Definition: mmintrin.h:45
__m128i _mm_srli_si128(__m128i _A, int _Imm)
__m128d _mm_and_pd(__m128d _A, __m128d _B)
__m128i _mm_srl_epi16(__m128i _A, __m128i _Count)
__m128i _mm_min_epi32(__m128i, __m128i)
__m128i _mm_cmpestrm(__m128i, int, __m128i, int, const int)
void _mm_stream_ps(float *, __m128)
void _mm_store_pd(double *_Dp, __m128d _A)
__m128i _mm_hsubs_epi16(__m128i, __m128i)
__m128i _mm_slli_epi64(__m128i _A, int _Count)
__m128i _mm_cmpgt_epi8(__m128i _A, __m128i _B)
void _mm_clflush(void const *_P)
int _mm_ucomige_sd(__m128d _A, __m128d _B)
__m64 _m_pfacc(__m64, __m64)
__m128 _mm_hadd_ps(__m128, __m128)
__m128 _mm_insert_ps(__m128, __m128, const int)
__m128i _mm_shuffle_epi8(__m128i, __m128i)
__m128i _mm_unpackhi_epi32(__m128i _A, __m128i _B)
__m64 _m_pfcmpeq(__m64, __m64)
__m128 _mm_andnot_ps(__m128 _A, __m128 _B)
__m128d _mm_cmpgt_pd(__m128d _A, __m128d _B)
__m128d _mm_max_pd(__m128d _A, __m128d _B)
__m128 _mm_cvtepi32_ps(__m128i _A)
__m128 _mm_cmpnlt_ps(__m128 _A, __m128 _B)
__m128i _mm_cvttpd_epi32(__m128d _A)
unsigned __int64 __cdecl _rotl64(_In_ unsigned __int64 _Value, _In_ int _Shift)
__m128i
Definition: emmintrin.h:53
__interface __declspec(uuid("00000035-0000-0000-C000-000000000046")) __abi_IActivationFactory
Definition: vccorlib.h:286
void _mm_store_si128(__m128i *_P, __m128i _B)
__m128d _mm_cmpnlt_pd(__m128d _A, __m128d _B)
__m128d _mm_blendv_pd(__m128d, __m128d, __m128d)
__m128i _mm_srli_epi64(__m128i _A, int _Count)
__m128i _mm_set_epi64x(__int64 _I1, __int64 _I0)
__m128 _mm_cmpnlt_ss(__m128 _A, __m128 _B)
__m128 _mm_xor_ps(__m128 _A, __m128 _B)
__m128i _mm_unpackhi_epi64(__m128i _A, __m128i _B)
__m128i _mm_sign_epi16(__m128i, __m128i)
int _mm_comieq_ss(__m128 _A, __m128 _B)
__m128d _mm_addsub_pd(__m128d, __m128d)
void _mm_monitorx(void const *, unsigned int, unsigned int)
int _mm_cvtsi128_si32(__m128i _A)
__m128d _mm_unpackhi_pd(__m128d _A, __m128d _B)
int _mm_extract_epi32(__m128i, const int)
void * _InterlockedCompareExchangePointer(void *volatile *, void *, void *)
__m128 _mm_round_ps(__m128, int)
__m128
Definition: xmmintrin.h:75
__m128 _mm_load_ps1(float const *_A)
void _mm_storeu_pd(double *_Dp, __m128d _A)
__m128i _mm_cmpgt_epi16(__m128i _A, __m128i _B)
void _mm_storeh_pd(double *_Dp, __m128d _A)
int _mm_testc_si128(__m128i, __m128i)
__m128d _mm_load1_pd(double const *_Dp)
__m128d _mm_xor_pd(__m128d _A, __m128d _B)
int _mm_cvt_ss2si(__m128 _A)
__m128 _mm_mul_ps(__m128 _A, __m128 _B)
__m128d _mm_loadr_pd(double const *_Dp)
__m64 _m_from_float(float)
int _mm_ucomige_ss(__m128 _A, __m128 _B)
__m128i _mm_shufflelo_epi16(__m128i _A, int _Imm)
__m128d _mm_loadl_pd(__m128d _A, double const *_Dp)
__m128i _mm_cmplt_epi16(__m128i _A, __m128i _B)
__m128i _mm_avg_epu8(__m128i _A, __m128i _B)
__m128i _mm_cvtsi32_si128(int _A)
__m128i _mm_mullo_epi16(__m128i _A, __m128i _B)
int _mm_cmpistri(__m128i, __m128i, const int)
__m128 _mm_set_ps1(float _A)
__m128d _mm_setzero_pd(void)
__m128i _mm_subs_epu8(__m128i _A, __m128i _B)
void _mm_storer_pd(double *_Dp, __m128d _A)
__m128 _mm_cmpneq_ss(__m128 _A, __m128 _B)
__m128d _mm_round_pd(__m128d, int)
#define __MACHINEARM_ARM64
Definition: intrin0.h:90
__m128 _mm_cvt_si2ss(__m128, int)
__m128i _mm_cmpeq_epi16(__m128i _A, __m128i _B)
__m128i _mm_or_si128(__m128i _A, __m128i _B)
__m128i _mm_shufflehi_epi16(__m128i _A, int _Imm)
__m128i _mm_mulhrs_epi16(__m128i, __m128i)
__m128i _mm_sll_epi64(__m128i _A, __m128i _Count)
__m128i _mm_hadd_epi16(__m128i, __m128i)
__m128i _mm_cmpeq_epi32(__m128i _A, __m128i _B)
__m128i _mm_load_si128(__m128i const *_P)
__m128 _mm_add_ss(__m128 _A, __m128 _B)
int _mm_extract_ps(__m128, const int)
__m128i _mm_adds_epu16(__m128i _A, __m128i _B)
__m128i _mm_setr_epi32(int _I0, int _I1, int _I2, int _I3)
__m128i _mm_cvtepi8_epi64(__m128i)
_In_ _Value
Definition: corecrt_wstdlib.h:65
__m128 _mm_min_ss(__m128 _A, __m128 _B)
__m128i _mm_add_epi32(__m128i _A, __m128i _B)
__m128i _mm_hsub_epi16(__m128i, __m128i)
__m128d _mm_dp_pd(__m128d, __m128d, const int)
__m128d _mm_cmpnle_sd(__m128d _A, __m128d _B)
__m128 _mm_min_ps(__m128 _A, __m128 _B)
__m128i _mm_unpacklo_epi8(__m128i _A, __m128i _B)
int _mm_ucomieq_ss(__m128 _A, __m128 _B)
void _mm_storel_epi64(__m128i *_P, __m128i _Q)
int _mm_cmpestro(__m128i, int, __m128i, int, const int)
int _mm_comilt_ss(__m128 _A, __m128 _B)
__m128i _mm_max_epi8(__m128i, __m128i)
__m128 _mm_cmpnle_ss(__m128 _A, __m128 _B)
__m128 _mm_cmpgt_ps(__m128 _A, __m128 _B)
void _mm_store_ps(float *_V, __m128 _A)
_Check_return_ unsigned long __cdecl _lrotr(_In_ unsigned long _Value, _In_ int _Shift)
int _mm_movemask_ps(__m128 _A)
__m128i _mm_stream_load_si128(const __m128i *)
__m128 _mm_setzero_ps(void)
__m128d _mm_blend_pd(__m128d, __m128d, const int)
#define __MACHINEARM_ARM64_X64
Definition: intrin0.h:95
__m128d _mm_round_sd(__m128d, __m128d, int)
int _mm_cmpistrz(__m128i, __m128i, const int)
__m128i _mm_max_epu32(__m128i, __m128i)
__m128d _mm_sub_pd(__m128d _A, __m128d _B)
__m128i _mm_cvtepi16_epi64(__m128i)
__m128 _mm_rcp_ss(__m128 _A)
__m128i _mm_min_epu16(__m128i, __m128i)
__m128 _mm_cmplt_ps(__m128 _A, __m128 _B)
__m128i _mm_alignr_epi8(__m128i, __m128i, int)
__m128d _mm_sub_sd(__m128d _A, __m128d _B)
__m128d _mm_cvtss_sd(__m128d _A, __m128 _B)
__m128 _mm_move_ss(__m128 _A, __m128 _B)
__m128i _mm_slli_epi32(__m128i _A, int _Count)
unsigned int _mm_crc32_u8(unsigned int, unsigned char)
__m128 _mm_sub_ss(__m128 _A, __m128 _B)
__m128i _mm_sub_epi16(__m128i _A, __m128i _B)
void _mm_stream_pd(double *_Dp, __m128d _A)
__m128d _mm_cmple_sd(__m128d _A, __m128d _B)
__m128 _mm_loadr_ps(float const *_A)
__m64 _m_pfmul(__m64, __m64)
__m128 _mm_cmpnle_ps(__m128 _A, __m128 _B)
void _mm_monitor(void const *, unsigned, unsigned)
__m128 _mm_cmpnge_ps(__m128 _A, __m128 _B)
__m128d _mm_mul_sd(__m128d _A, __m128d _B)
__m128 _mm_cmpeq_ss(__m128 _A, __m128 _B)
__m128i _mm_abs_epi32(__m128i)
__m128 _mm_unpackhi_ps(__m128 _A, __m128 _B)
void _mm_mwaitx(unsigned int, unsigned int, unsigned int)
int _mm_ucomineq_sd(__m128d _A, __m128d _B)
__m128 _mm_unpacklo_ps(__m128 _A, __m128 _B)
__m128i _mm_subs_epu16(__m128i _A, __m128i _B)
__m128 _mm_div_ss(__m128 _A, __m128 _B)
__m128i _mm_sub_epi8(__m128i _A, __m128i _B)
void _mm_storel_pi(__m64 *, __m128)
__m128i _mm_shuffle_epi32(__m128i _A, int _Imm)
__m64 _m_pfcmpgt(__m64, __m64)
__m128 _mm_rsqrt_ps(__m128 _A)
unsigned __int64 __cdecl _rotr64(_In_ unsigned __int64 _Value, _In_ int _Shift)
void _mm_storeu_si128(__m128i *_P, __m128i _B)
__m128i _mm_unpacklo_epi64(__m128i _A, __m128i _B)
__m128 _mm_max_ss(__m128 _A, __m128 _B)
_CRT_MANAGED_FP_DEPRECATE _In_ unsigned int _Mask
Definition: float.h:235
void _mm_stream_si32(int *_P, int _I)
__m128 _mm_or_ps(__m128 _A, __m128 _B)
__m128 _mm_cmple_ss(__m128 _A, __m128 _B)
__m128i _mm_andnot_si128(__m128i _A, __m128i _B)
__m128d _mm_max_sd(__m128d _A, __m128d _B)
void _mm_prefetch(char const *_A, int _Sel)
__m128i _mm_min_epu32(__m128i, __m128i)
__m128d _mm_div_sd(__m128d _A, __m128d _B)
__m128i _mm_sign_epi8(__m128i, __m128i)
const void * _Target(const type_info &_Info) const _NOEXCEPT
Definition: functional:408
__m128 _mm_loadh_pi(__m128, __m64 const *)
__m128i _mm_loadl_epi64(__m128i const *_P)
__m128d _mm_set_sd(double _W)
void _mm_storer_ps(float *_V, __m128 _A)
__m128i _mm_srai_epi16(__m128i _A, int _Count)
__m128i _mm_cvtps_epi32(__m128 _A)
__m64 _m_pfcmpge(__m64, __m64)
__m128i _mm_subs_epi8(__m128i _A, __m128i _B)
__m128 _mm_cmpunord_ps(__m128 _A, __m128 _B)
__m128 _mm_mul_ss(__m128 _A, __m128 _B)
__m128i _mm_insert_epi8(__m128i, int, const int)
__m128 _mm_loadl_pi(__m128, __m64 const *)
__m128i _mm_max_epu16(__m128i, __m128i)
__m128 _mm_load_ps(float const *_A)
__m128d _mm_mul_pd(__m128d _A, __m128d _B)
__m128d _mm_min_sd(__m128d _A, __m128d _B)
__m128i _mm_add_epi16(__m128i _A, __m128i _B)
void _mm_maskmoveu_si128(__m128i _D, __m128i _N, char *_P)
__m64 _m_pfmax(__m64, __m64)
__m128i _mm_cmpgt_epi64(__m128i, __m128i)
__m128i _mm_set_epi8(char _B15, char _B14, char _B13, char _B12, char _B11, char _B10, char _B9, char _B8, char _B7, char _B6, char _B5, char _B4, char _B3, char _B2, char _B1, char _B0)
__m128 _mm_cmpunord_ss(__m128 _A, __m128 _B)
__m128i _mm_mul_epi32(__m128i, __m128i)
__m128i _mm_cmpeq_epi8(__m128i _A, __m128i _B)
int _mm_cvtt_ss2si(__m128 _A)
__m128 _mm_hsub_ps(__m128, __m128)
__m128i _mm_unpackhi_epi8(__m128i _A, __m128i _B)
__m128i _mm_adds_epi16(__m128i _A, __m128i _B)
__m128d _mm_cvtps_pd(__m128 _A)
__m64 _m_pfsubr(__m64, __m64)
__m128d _mm_andnot_pd(__m128d _A, __m128d _B)
__m128i _mm_sub_epi64(__m128i _A, __m128i _B)
__m128 _mm_cvtsd_ss(__m128 _A, __m128d _B)
int _mm_cmpestra(__m128i, int, __m128i, int, const int)
__m128d _mm_cmpeq_sd(__m128d _A, __m128d _B)
__m128i _mm_mullo_epi32(__m128i, __m128i)
__m128 _mm_load_ss(float const *_A)
__m128 _mm_cmpnge_ss(__m128 _A, __m128 _B)
__m128i _mm_packus_epi16(__m128i _A, __m128i _B)
__m128 _mm_blendv_ps(__m128, __m128, __m128)
__m128i _mm_hadd_epi32(__m128i, __m128i)
__m128 _mm_movelh_ps(__m128, __m128)
unsigned int _mm_getcsr(void)
__m128i _mm_mulhi_epu16(__m128i _A, __m128i _B)
__m128i _mm_cvtepu8_epi32(__m128i)
__m128d _mm_cmpge_pd(__m128d _A, __m128d _B)
#define __MACHINEARM
Definition: intrin0.h:73
__m128 _mm_dp_ps(__m128, __m128, const int)
__m128 _mm_cmpge_ps(__m128 _A, __m128 _B)
#define __MACHINEARM64_X64
Definition: intrin0.h:100
__m128i _mm_srl_epi64(__m128i _A, __m128i _Count)
__m128d _mm_setr_pd(double _Y, double _Z)
__m128d _mm_add_sd(__m128d _A, __m128d _B)
__m128i _mm_and_si128(__m128i _A, __m128i _B)
__m128i _mm_madd_epi16(__m128i _A, __m128i _B)
void _mm_stream_si128(__m128i *_P, __m128i _A)
__m128d _mm_sqrt_pd(__m128d _A)
__m128i _mm_subs_epi16(__m128i _A, __m128i _B)
__m128 _mm_cmpge_ss(__m128 _A, __m128 _B)
__m128d _mm_cmpunord_pd(__m128d _A, __m128d _B)