STLdoc
STLdocumentation
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros
intrin.h
Go to the documentation of this file.
1 /***
2 * intrin.h - declarations/definitions for platform specific intrinsic functions.
3 *
4 * Copyright (c) Microsoft Corporation. All rights reserved.
5 *Purpose:
6 * This include file contains the declarations for platform-specific intrinsic
7 * functions, or includes other files that declare intrinsic functions. It
8 * also defines some platform-specific macros to be used with intrinsic
9 * functions.
10 *
11 ****/
12 
13 #pragma once
14 #define __INTRIN_H_
15 #ifndef RC_INVOKED
16 #ifndef __midl
17 
18 #include <crtdefs.h>
19 #include <setjmp.h>
20 #include <stddef.h>
21 
22 #if !defined (_M_CEE_PURE)
23 #if defined (_M_IX86) || defined (_M_X64) || defined (_M_ARM)
24 
25 #if defined (_M_IX86) || defined (_M_X64)
26 #include <immintrin.h>
27 #include <ammintrin.h>
28 #endif /* defined (_M_IX86) || defined (_M_X64) */
29 
30 #if defined (_M_IX86)
31 #include <mm3dnow.h>
32 #endif /* defined (_M_IX86) */
33 
34 #if defined (_M_ARM)
35 #include <armintr.h>
36 #endif /* defined (_M_ARM) */
37 
38 #endif /* defined (_M_IX86) || defined (_M_X64) || defined (_M_ARM) */
39 
40 #endif /* !defined (_M_CEE_PURE) */
41 
42 #if defined (__cplusplus)
43 extern "C" {
44 #endif /* defined (__cplusplus) */
45 
46 /*
47 ** __MACHINE : everything
48 ** __MACHINEX86 : x86 only
49 ** __MACHINEX64 : x64 only
50 ** __MACHINEX86_X64 : x86 and x64 only
51 ** __MACHINEARM : ARM only
52 ** __MACHINEARM_X64 : ARM and x64 only
53 ** __MACHINEWVMPURE : /clr:pure only
54 ** __MACHINEZ : nothing
55 */
56 
/*
** Every target-specific wrapper starts out as an alias for __MACHINE, so a
** wrapped prototype is initially treated exactly like an "everything"
** prototype. The #if blocks further down re-point each wrapper that does not
** match the current target at __MACHINEZ, which discards its argument.
*/
57 #define __MACHINEX86 __MACHINE
58 #define __MACHINEX64 __MACHINE
59 #define __MACHINEX86_X64 __MACHINE
60 #define __MACHINEARM __MACHINE
61 #define __MACHINEARM_X64 __MACHINE
62 
63 /* Most intrinsics not available to pure managed code */
/*
** With _M_CEE_PURE defined, __MACHINE(X) expands to nothing and only
** __MACHINEWVMPURE(X) emits "X;". Without it the roles are swapped:
** __MACHINE(X) emits "X;" and __MACHINEWVMPURE(X) expands to nothing.
** The trailing semicolon is supplied by the macro, which is why the
** prototype lines that use these wrappers do not end in ';'.
*/
64 #if defined (_M_CEE_PURE)
65 #define __MACHINE(X) __MACHINEZ(X)
66 #define __MACHINEWVMPURE(X) X;
67 #else /* defined (_M_CEE_PURE) */
68 #define __MACHINE(X) X;
69 #define __MACHINEWVMPURE(X) __MACHINEZ(X)
70 #endif /* defined (_M_CEE_PURE) */
71 
/*
** __MACHINEZ swallows its argument. It is named in the definitions above
** before it is defined here; that is fine because a macro body is only
** expanded at the point where the macro is invoked.
*/
72 #define __MACHINEZ(X) /* NOTHING */
73 
/* Disable the x86-only wrapper when not targeting x86. */
74 #if !defined (_M_IX86)
75 #undef __MACHINEX86
76 #define __MACHINEX86 __MACHINEZ
77 #endif /* !defined (_M_IX86) */
78 
/* Disable the x64-only wrapper when not targeting x64. */
79 #if !defined (_M_X64)
80 #undef __MACHINEX64
81 #define __MACHINEX64 __MACHINEZ
82 #endif /* !defined (_M_X64) */
83 
/* Disable the shared x86/x64 wrapper when targeting neither of them. */
84 #if !(defined (_M_IX86) || defined (_M_X64))
85 #undef __MACHINEX86_X64
86 #define __MACHINEX86_X64 __MACHINEZ
87 #endif /* !(defined (_M_IX86) || defined (_M_X64)) */
88 
/* Disable the shared ARM/x64 wrapper when targeting neither of them. */
89 #if !(defined (_M_ARM) || defined (_M_X64))
90 #undef __MACHINEARM_X64
91 #define __MACHINEARM_X64 __MACHINEZ
92 #endif /* !(defined (_M_ARM) || defined (_M_X64)) */
93 
/* Disable the ARM-only wrapper when not targeting ARM. */
94 #if !defined (_M_ARM)
95 #undef __MACHINEARM
96 #define __MACHINEARM __MACHINEZ
97 #endif /* !defined (_M_ARM) */
98 
99 /* For compatibility with <winnt.h>, some intrinsics are __cdecl except on x64 */
/*
** Expands to nothing when _M_X64 is defined (the default calling convention
** is used) and to __cdecl on every other target.
*/
100 #if defined (_M_X64)
101 #define __MACHINECALL_CDECL_OR_DEFAULT
102 #else
103 #define __MACHINECALL_CDECL_OR_DEFAULT __cdecl
104 #endif
105 
106 __MACHINEARM(int _AddSatInt(int, int))
107 __MACHINE(void * _AddressOfReturnAddress(void))
108 __MACHINE(unsigned char _BitScanForward(unsigned long * _Index, unsigned long _Mask))
109 __MACHINEX64(unsigned char _BitScanForward64(unsigned long * _Index, unsigned __int64 _Mask))
110 __MACHINE(unsigned char _BitScanReverse(unsigned long * _Index, unsigned long _Mask))
111 __MACHINEX64(unsigned char _BitScanReverse64(unsigned long * _Index, unsigned __int64 _Mask))
112 __MACHINEARM(double _CopyDoubleFromInt64(__int64))
113 __MACHINEARM(float _CopyFloatFromInt32(__int32))
114 __MACHINEARM(__int32 _CopyInt32FromFloat(float))
115 __MACHINEARM(__int64 _CopyInt64FromDouble(double))
116 __MACHINEARM(unsigned int _CountLeadingOnes(unsigned long))
117 __MACHINEARM(unsigned int _CountLeadingOnes64(unsigned __int64))
118 __MACHINEARM(unsigned int _CountLeadingSigns(long))
119 __MACHINEARM(unsigned int _CountLeadingSigns64(__int64))
120 __MACHINEARM(unsigned int _CountLeadingZeros(unsigned long))
121 __MACHINEARM(unsigned int _CountLeadingZeros64(unsigned __int64))
122 __MACHINEARM(unsigned int _CountOneBits(unsigned long))
123 __MACHINEARM(unsigned int _CountOneBits64(unsigned __int64))
124 __MACHINEARM(int _DAddSatInt(int, int))
125 __MACHINEARM(int _DSubSatInt(int, int))
126 __MACHINEARM(long _InterlockedAdd(long volatile * _Addend, long _Value))
127 __MACHINEARM(__int64 _InterlockedAdd64(__int64 volatile * _Addend, __int64 _Value))
128 __MACHINEARM(__int64 _InterlockedAdd64_acq(__int64 volatile * _Addend, __int64 _Value))
129 __MACHINEARM(__int64 _InterlockedAdd64_nf(__int64 volatile * _Addend, __int64 _Value))
130 __MACHINEARM(__int64 _InterlockedAdd64_rel(__int64 volatile * _Addend, __int64 _Value))
131 __MACHINEX86(long _InterlockedAddLargeStatistic(__int64 volatile * _Addend, long _Value))
132 __MACHINEARM(long _InterlockedAdd_acq(long volatile * _Addend, long _Value))
133 __MACHINEARM(long _InterlockedAdd_nf(long volatile * _Addend, long _Value))
134 __MACHINEARM(long _InterlockedAdd_rel(long volatile * _Addend, long _Value))
135 __MACHINE(long _InterlockedAnd(long volatile * _Value, long _Mask))
136 __MACHINE(short _InterlockedAnd16(short volatile * _Value, short _Mask))
137 __MACHINEARM(short _InterlockedAnd16_acq(short volatile * _Value, short _Mask))
138 __MACHINEARM(short _InterlockedAnd16_nf(short volatile * _Value, short _Mask))
139 __MACHINEX64(short _InterlockedAnd16_np(short volatile * _Value, short _Mask))
140 __MACHINEARM(short _InterlockedAnd16_rel(short volatile * _Value, short _Mask))
141 __MACHINEARM_X64(__int64 _InterlockedAnd64(__int64 volatile * _Value, __int64 _Mask))
142 __MACHINEARM(__int64 _InterlockedAnd64_acq(__int64 volatile * _Value, __int64 _Mask))
143 __MACHINEARM(__int64 _InterlockedAnd64_nf(__int64 volatile * _Value, __int64 _Mask))
144 __MACHINEX64(__int64 _InterlockedAnd64_np(__int64 volatile * _Value, __int64 _Mask))
145 __MACHINEARM(__int64 _InterlockedAnd64_rel(__int64 volatile * _Value, __int64 _Mask))
146 __MACHINE(char _InterlockedAnd8(char volatile * _Value, char _Mask))
147 __MACHINEARM(char _InterlockedAnd8_acq(char volatile * _Value, char _Mask))
148 __MACHINEARM(char _InterlockedAnd8_nf(char volatile * _Value, char _Mask))
149 __MACHINEX64(char _InterlockedAnd8_np(char volatile * _Value, char _Mask))
150 __MACHINEARM(char _InterlockedAnd8_rel(char volatile * _Value, char _Mask))
151 __MACHINEARM(long _InterlockedAnd_acq(long volatile * _Value, long _Mask))
152 __MACHINEARM(long _InterlockedAnd_nf(long volatile * _Value, long _Mask))
153 __MACHINEX64(long _InterlockedAnd_np(long volatile * _Value, long _Mask))
154 __MACHINEARM(long _InterlockedAnd_rel(long volatile * _Value, long _Mask))
155 __MACHINE(long __MACHINECALL_CDECL_OR_DEFAULT _InterlockedCompareExchange(long volatile * _Destination, long _Exchange, long _Comparand))
156 __MACHINEWVMPURE(long _InterlockedCompareExchange(long volatile * _Destination, long _Exchange, long _Comparand))
157 __MACHINEX64(unsigned char _InterlockedCompareExchange128(__int64 volatile * _Destination, __int64 _ExchangeHigh, __int64 _ExchangeLow, __int64 * _ComparandResult))
158 __MACHINEX64(unsigned char _InterlockedCompareExchange128_np(__int64 volatile * _Destination, __int64 _ExchangeHigh, __int64 _ExchangeLow, __int64 * _ComparandResult))
159 __MACHINE(short _InterlockedCompareExchange16(short volatile * _Destination, short _Exchange, short _Comparand))
160 __MACHINEARM(short _InterlockedCompareExchange16_acq(short volatile * _Destination, short _Exchange, short _Comparand))
161 __MACHINEARM(short _InterlockedCompareExchange16_nf(short volatile * _Destination, short _Exchange, short _Comparand))
162 __MACHINEX64(short _InterlockedCompareExchange16_np(short volatile * _Destination, short _Exchange, short _Comparand))
163 __MACHINEARM(short _InterlockedCompareExchange16_rel(short volatile * _Destination, short _Exchange, short _Comparand))
164 __MACHINE(__int64 _InterlockedCompareExchange64(__int64 volatile * _Destination, __int64 _Exchange, __int64 _Comparand))
165 __MACHINEARM(__int64 _InterlockedCompareExchange64_acq(__int64 volatile * _Destination, __int64 _Exchange, __int64 _Comparand))
166 __MACHINEARM(__int64 _InterlockedCompareExchange64_nf(__int64 volatile * _Destination, __int64 _Exchange, __int64 _Comparand))
167 __MACHINEX64(__int64 _InterlockedCompareExchange64_np(__int64 volatile * _Destination, __int64 _Exchange, __int64 _Comparand))
168 __MACHINEARM(__int64 _InterlockedCompareExchange64_rel(__int64 volatile * _Destination, __int64 _Exchange, __int64 _Comparand))
169 __MACHINE(char _InterlockedCompareExchange8(char volatile * _Destination, char _Exchange, char _Comparand))
170 __MACHINEARM(char _InterlockedCompareExchange8_acq(char volatile * _Destination, char _Exchange, char _Comparand))
171 __MACHINEARM(char _InterlockedCompareExchange8_nf(char volatile * _Destination, char _Exchange, char _Comparand))
172 __MACHINEARM(char _InterlockedCompareExchange8_rel(char volatile * _Destination, char _Exchange, char _Comparand))
173 __MACHINE(void * _InterlockedCompareExchangePointer(void * volatile * _Destination, void * _Exchange, void * _Comparand))
174 __MACHINEARM(void * _InterlockedCompareExchangePointer_acq(void * volatile * _Destination, void * _Exchange, void * _Comparand))
175 __MACHINEARM(void * _InterlockedCompareExchangePointer_nf(void * volatile * _Destination, void * _Exchange, void * _Comparand))
176 __MACHINEX64(void * _InterlockedCompareExchangePointer_np(void * volatile * _Destination, void * _Exchange, void * _Comparand))
177 __MACHINEARM(void * _InterlockedCompareExchangePointer_rel(void * volatile * _Destination, void * _Exchange, void * _Comparand))
178 __MACHINEARM(long _InterlockedCompareExchange_acq(long volatile * _Destination, long _Exchange, long _Comparand))
179 __MACHINEARM(long _InterlockedCompareExchange_nf(long volatile * _Destination, long _Exchange, long _Comparand))
180 __MACHINEX64(long _InterlockedCompareExchange_np(long volatile * _Destination, long _Exchange, long _Comparand))
181 __MACHINEARM(long _InterlockedCompareExchange_rel(long volatile * _Destination, long _Exchange, long _Comparand))
/* _InterlockedDecrement: non-pure builds get the __MACHINE form with the <winnt.h>-compatible calling convention; /clr:pure builds get the __MACHINEWVMPURE form. */
182 __MACHINE(long __MACHINECALL_CDECL_OR_DEFAULT _InterlockedDecrement(long volatile * _Addend))
183 __MACHINEWVMPURE(long _InterlockedDecrement(long volatile * _Addend))
184 __MACHINE(short _InterlockedDecrement16(short volatile * _Addend))
185 __MACHINEARM(short _InterlockedDecrement16_acq(short volatile * _Addend))
186 __MACHINEARM(short _InterlockedDecrement16_nf(short volatile * _Addend))
187 __MACHINEARM(short _InterlockedDecrement16_rel(short volatile * _Addend))
188 __MACHINEARM_X64(__int64 _InterlockedDecrement64(__int64 volatile * _Addend))
189 __MACHINEARM(__int64 _InterlockedDecrement64_acq(__int64 volatile * _Addend))
190 __MACHINEARM(__int64 _InterlockedDecrement64_nf(__int64 volatile * _Addend))
191 __MACHINEARM(__int64 _InterlockedDecrement64_rel(__int64 volatile * _Addend))
192 __MACHINEARM(long _InterlockedDecrement_acq(long volatile * _Addend))
193 __MACHINEARM(long _InterlockedDecrement_nf(long volatile * _Addend))
194 __MACHINEARM(long _InterlockedDecrement_rel(long volatile * _Addend))
195 __MACHINE(long __MACHINECALL_CDECL_OR_DEFAULT _InterlockedExchange(long volatile * _Target, long _Value))
196 __MACHINEWVMPURE(long __MACHINECALL_CDECL_OR_DEFAULT _InterlockedExchange(long volatile * _Target, long _Value))
197 __MACHINE(short _InterlockedExchange16(short volatile * _Target, short _Value))
198 __MACHINEARM(short _InterlockedExchange16_acq(short volatile * _Target, short _Value))
199 __MACHINEARM(short _InterlockedExchange16_nf(short volatile * _Target, short _Value))
200 __MACHINEARM(short _InterlockedExchange16_rel(short volatile * _Target, short _Value))
201 __MACHINEARM_X64(__int64 _InterlockedExchange64(__int64 volatile * _Target, __int64 _Value))
202 __MACHINEARM(__int64 _InterlockedExchange64_acq(__int64 volatile * _Target, __int64 _Value))
203 __MACHINEARM(__int64 _InterlockedExchange64_nf(__int64 volatile * _Target, __int64 _Value))
204 __MACHINEARM(__int64 _InterlockedExchange64_rel(__int64 volatile * _Target, __int64 _Value))
205 __MACHINE(char _InterlockedExchange8(char volatile * _Target, char _Value))
206 __MACHINEARM(char _InterlockedExchange8_acq(char volatile * _Target, char _Value))
207 __MACHINEARM(char _InterlockedExchange8_nf(char volatile * _Target, char _Value))
208 __MACHINEARM(char _InterlockedExchange8_rel(char volatile * _Target, char _Value))
209 __MACHINE(long __MACHINECALL_CDECL_OR_DEFAULT _InterlockedExchangeAdd(long volatile * _Addend, long _Value))
210 __MACHINE(short _InterlockedExchangeAdd16(short volatile * _Addend, short _Value))
211 __MACHINEARM(short _InterlockedExchangeAdd16_acq(short volatile * _Addend, short _Value))
212 __MACHINEARM(short _InterlockedExchangeAdd16_nf(short volatile * _Addend, short _Value))
213 __MACHINEARM(short _InterlockedExchangeAdd16_rel(short volatile * _Addend, short _Value))
214 __MACHINEARM_X64(__int64 _InterlockedExchangeAdd64(__int64 volatile * _Addend, __int64 _Value))
215 __MACHINEARM(__int64 _InterlockedExchangeAdd64_acq(__int64 volatile * _Addend, __int64 _Value))
216 __MACHINEARM(__int64 _InterlockedExchangeAdd64_nf(__int64 volatile * _Addend, __int64 _Value))
217 __MACHINEARM(__int64 _InterlockedExchangeAdd64_rel(__int64 volatile * _Addend, __int64 _Value))
218 __MACHINE(char _InterlockedExchangeAdd8(char volatile * _Addend, char _Value))
219 __MACHINEARM(char _InterlockedExchangeAdd8_acq(char volatile * _Addend, char _Value))
220 __MACHINEARM(char _InterlockedExchangeAdd8_nf(char volatile * _Addend, char _Value))
221 __MACHINEARM(char _InterlockedExchangeAdd8_rel(char volatile * _Addend, char _Value))
222 __MACHINEARM(long _InterlockedExchangeAdd_acq(long volatile * _Addend, long _Value))
223 __MACHINEARM(long _InterlockedExchangeAdd_nf(long volatile * _Addend, long _Value))
224 __MACHINEARM(long _InterlockedExchangeAdd_rel(long volatile * _Addend, long _Value))
225  // Temporarily use macro for x86 due to conflict with inline function in 8.1 SDK winnt.h header
/*
** When _M_IX86 is defined, _M_CEE_PURE is not, and FIXED_592562 is not
** defined, any existing _InterlockedExchangePointer macro is removed and the
** name is redefined as a function-like macro that forwards to the static
** inline helper below. Every other configuration declares
** _InterlockedExchangePointer through __MACHINE instead.
*/
226 #if !defined(FIXED_592562) && defined (_M_IX86) && !defined (_M_CEE_PURE)
227 #undef _InterlockedExchangePointer
/*
** Exchanges a pointer value by casting the target to long volatile * and the
** new value to long, calling _InterlockedExchange, and casting the result
** back to void *.
** NOTE(review): the casts rely on void * and long having the same size;
** presumably that is what the _M_IX86 guard above ensures - confirm.
*/
228 __forceinline static void * _Intrin_h_InterlockedExchangePointer(void * volatile * _Target, void * _Value)
229 {
230  return (void *)_InterlockedExchange((long volatile *) _Target, (long) _Value);
231 }
/* Route calls written as _InterlockedExchangePointer(p, v) to the helper above. */
232 #define _InterlockedExchangePointer(p,v) _Intrin_h_InterlockedExchangePointer(p,v)
233 #else
234 __MACHINE(void * _InterlockedExchangePointer(void * volatile * _Target, void * _Value))
235 #endif
236 __MACHINEARM(void * _InterlockedExchangePointer_acq(void * volatile * _Target, void * _Value))
237 __MACHINEARM(void * _InterlockedExchangePointer_nf(void * volatile * _Target, void * _Value))
238 __MACHINEARM(void * _InterlockedExchangePointer_rel(void * volatile * _Target, void * _Value))
239 __MACHINEARM(long _InterlockedExchange_acq(long volatile * _Target, long _Value))
240 __MACHINEARM(long _InterlockedExchange_nf(long volatile * _Target, long _Value))
241 __MACHINEARM(long _InterlockedExchange_rel(long volatile * _Target, long _Value))
/* _InterlockedIncrement: non-pure builds get the __MACHINE form with the <winnt.h>-compatible calling convention; /clr:pure builds get the __MACHINEWVMPURE form. */
242 __MACHINE(long __MACHINECALL_CDECL_OR_DEFAULT _InterlockedIncrement(long volatile * _Addend))
243 __MACHINEWVMPURE(long _InterlockedIncrement(long volatile * _Addend))
244 __MACHINE(short _InterlockedIncrement16(short volatile * _Addend))
245 __MACHINEARM(short _InterlockedIncrement16_acq(short volatile * _Addend))
246 __MACHINEARM(short _InterlockedIncrement16_nf(short volatile * _Addend))
247 __MACHINEARM(short _InterlockedIncrement16_rel(short volatile * _Addend))
248 __MACHINEARM_X64(__int64 _InterlockedIncrement64(__int64 volatile * _Addend))
249 __MACHINEARM(__int64 _InterlockedIncrement64_acq(__int64 volatile * _Addend))
250 __MACHINEARM(__int64 _InterlockedIncrement64_nf(__int64 volatile * _Addend))
251 __MACHINEARM(__int64 _InterlockedIncrement64_rel(__int64 volatile * _Addend))
252 __MACHINEARM(long _InterlockedIncrement_acq(long volatile * _Addend))
253 __MACHINEARM(long _InterlockedIncrement_nf(long volatile * _Addend))
254 __MACHINEARM(long _InterlockedIncrement_rel(long volatile * _Addend))
255 __MACHINE(long _InterlockedOr(long volatile * _Value, long _Mask))
256 __MACHINE(short _InterlockedOr16(short volatile * _Value, short _Mask))
257 __MACHINEARM(short _InterlockedOr16_acq(short volatile * _Value, short _Mask))
258 __MACHINEARM(short _InterlockedOr16_nf(short volatile * _Value, short _Mask))
259 __MACHINEX64(short _InterlockedOr16_np(short volatile * _Value, short _Mask))
260 __MACHINEARM(short _InterlockedOr16_rel(short volatile * _Value, short _Mask))
261 __MACHINEARM_X64(__int64 _InterlockedOr64(__int64 volatile * _Value, __int64 _Mask))
262 __MACHINEARM(__int64 _InterlockedOr64_acq(__int64 volatile * _Value, __int64 _Mask))
263 __MACHINEARM(__int64 _InterlockedOr64_nf(__int64 volatile * _Value, __int64 _Mask))
264 __MACHINEX64(__int64 _InterlockedOr64_np(__int64 volatile * _Value, __int64 _Mask))
265 __MACHINEARM(__int64 _InterlockedOr64_rel(__int64 volatile * _Value, __int64 _Mask))
266 __MACHINE(char _InterlockedOr8(char volatile * _Value, char _Mask))
267 __MACHINEARM(char _InterlockedOr8_acq(char volatile * _Value, char _Mask))
268 __MACHINEARM(char _InterlockedOr8_nf(char volatile * _Value, char _Mask))
269 __MACHINEX64(char _InterlockedOr8_np(char volatile * _Value, char _Mask))
270 __MACHINEARM(char _InterlockedOr8_rel(char volatile * _Value, char _Mask))
271 __MACHINEARM(long _InterlockedOr_acq(long volatile * _Value, long _Mask))
272 __MACHINEARM(long _InterlockedOr_nf(long volatile * _Value, long _Mask))
273 __MACHINEX64(long _InterlockedOr_np(long volatile * _Value, long _Mask))
274 __MACHINEARM(long _InterlockedOr_rel(long volatile * _Value, long _Mask))
275 __MACHINE(long _InterlockedXor(long volatile * _Value, long _Mask))
276 __MACHINE(short _InterlockedXor16(short volatile * _Value, short _Mask))
277 __MACHINEARM(short _InterlockedXor16_acq(short volatile * _Value, short _Mask))
278 __MACHINEARM(short _InterlockedXor16_nf(short volatile * _Value, short _Mask))
279 __MACHINEX64(short _InterlockedXor16_np(short volatile * _Value, short _Mask))
280 __MACHINEARM(short _InterlockedXor16_rel(short volatile * _Value, short _Mask))
281 __MACHINEARM_X64(__int64 _InterlockedXor64(__int64 volatile * _Value, __int64 _Mask))
282 __MACHINEARM(__int64 _InterlockedXor64_acq(__int64 volatile * _Value, __int64 _Mask))
283 __MACHINEARM(__int64 _InterlockedXor64_nf(__int64 volatile * _Value, __int64 _Mask))
284 __MACHINEX64(__int64 _InterlockedXor64_np(__int64 volatile * _Value, __int64 _Mask))
285 __MACHINEARM(__int64 _InterlockedXor64_rel(__int64 volatile * _Value, __int64 _Mask))
286 __MACHINE(char _InterlockedXor8(char volatile * _Value, char _Mask))
287 __MACHINEARM(char _InterlockedXor8_acq(char volatile * _Value, char _Mask))
288 __MACHINEARM(char _InterlockedXor8_nf(char volatile * _Value, char _Mask))
289 __MACHINEX64(char _InterlockedXor8_np(char volatile * _Value, char _Mask))
290 __MACHINEARM(char _InterlockedXor8_rel(char volatile * _Value, char _Mask))
291 __MACHINEARM(long _InterlockedXor_acq(long volatile * _Value, long _Mask))
292 __MACHINEARM(long _InterlockedXor_nf(long volatile * _Value, long _Mask))
293 __MACHINEX64(long _InterlockedXor_np(long volatile * _Value, long _Mask))
294 __MACHINEARM(long _InterlockedXor_rel(long volatile * _Value, long _Mask))
295 __MACHINEARM(unsigned int _MoveFromCoprocessor(unsigned int, unsigned int, unsigned int, unsigned int, unsigned int))
296 __MACHINEARM(unsigned int _MoveFromCoprocessor2(unsigned int, unsigned int, unsigned int, unsigned int, unsigned int))
297 __MACHINEARM(unsigned __int64 _MoveFromCoprocessor64(unsigned int, unsigned int, unsigned int))
298 __MACHINEARM(void _MoveToCoprocessor(unsigned int, unsigned int, unsigned int, unsigned int, unsigned int, unsigned int))
299 __MACHINEARM(void _MoveToCoprocessor2(unsigned int, unsigned int, unsigned int, unsigned int, unsigned int, unsigned int))
300 __MACHINEARM(void _MoveToCoprocessor64(unsigned __int64, unsigned int, unsigned int, unsigned int))
301 __MACHINEARM(long _MulHigh(long, long))
302 __MACHINEARM(unsigned long _MulUnsignedHigh(unsigned long, unsigned long))
303 __MACHINE(void _ReadBarrier(void))
304 __MACHINEARM(int _ReadStatusReg(int))
305 __MACHINE(void _ReadWriteBarrier(void))
306 __MACHINE(void * _ReturnAddress(void))
307 __MACHINEARM(int _SubSatInt(int, int))
308 __MACHINE(void _WriteBarrier(void))
309 __MACHINEARM(void _WriteStatusReg(int, int, int))
310 __MACHINEX86(void __addfsbyte(unsigned long, unsigned char))
311 __MACHINEX86(void __addfsdword(unsigned long, unsigned long))
312 __MACHINEX86(void __addfsword(unsigned long, unsigned short))
313 __MACHINEX64(void __addgsbyte(unsigned long, unsigned char))
314 __MACHINEX64(void __addgsdword(unsigned long, unsigned long))
315 __MACHINEX64(void __addgsqword(unsigned long, unsigned __int64))
316 __MACHINEX64(void __addgsword(unsigned long, unsigned short))
317 __MACHINE(void __code_seg(const char *))
318 __MACHINEX86_X64(void __cpuid(int[4], int))
319 __MACHINEX86_X64(void __cpuidex(int[4], int, int))
320 __MACHINE(void __cdecl __debugbreak(void))
321 __MACHINEARM(void __emit(unsigned __int32))
322 __MACHINEX86_X64(__int64 __emul(int, int))
323 __MACHINEX86_X64(unsigned __int64 __emulu(unsigned int, unsigned int))
324 __MACHINE(__declspec(noreturn) void __fastfail(unsigned int))
325 __MACHINEX64(void __faststorefence(void))
326 __MACHINEX86_X64(unsigned int __getcallerseflags(void))
327 __MACHINEX86_X64(void __halt(void))
328 __MACHINEARM(unsigned int __hvc(unsigned int, ...))
329 __MACHINEX86_X64(unsigned char __inbyte(unsigned short))
330 __MACHINEX86_X64(void __inbytestring(unsigned short, unsigned char *, unsigned long))
331 __MACHINEX86(void __incfsbyte(unsigned long))
332 __MACHINEX86(void __incfsdword(unsigned long))
333 __MACHINEX86(void __incfsword(unsigned long))
334 __MACHINEX64(void __incgsbyte(unsigned long))
335 __MACHINEX64(void __incgsdword(unsigned long))
336 __MACHINEX64(void __incgsqword(unsigned long))
337 __MACHINEX64(void __incgsword(unsigned long))
338 __MACHINEX86_X64(unsigned long __indword(unsigned short))
339 __MACHINEX86_X64(void __indwordstring(unsigned short, unsigned long *, unsigned long))
340 __MACHINEX86_X64(void __int2c(void))
341 __MACHINEX86_X64(void __invlpg(void *))
342 __MACHINEX86_X64(unsigned short __inword(unsigned short))
343 __MACHINEX86_X64(void __inwordstring(unsigned short, unsigned short *, unsigned long))
344 __MACHINEARM(__int16 __iso_volatile_load16(const volatile __int16 *))
345 __MACHINEARM(__int32 __iso_volatile_load32(const volatile __int32 *))
346 __MACHINEARM(__int64 __iso_volatile_load64(const volatile __int64 *))
347 __MACHINEARM(__int8 __iso_volatile_load8(const volatile __int8 *))
348 __MACHINEARM(void __iso_volatile_store16(volatile __int16 *, __int16))
349 __MACHINEARM(void __iso_volatile_store32(volatile __int32 *, __int32))
350 __MACHINEARM(void __iso_volatile_store64(volatile __int64 *, __int64))
351 __MACHINEARM(void __iso_volatile_store8(volatile __int8 *, __int8))
352 __MACHINEARM(__int64 __ldrexd(const volatile __int64 *))
353 __MACHINEX86_X64(void __lidt(void *))
354 __MACHINEX86_X64(unsigned __int64 __ll_lshift(unsigned __int64, int))
355 __MACHINEX86_X64(__int64 __ll_rshift(__int64, int))
356 __MACHINEX86_X64(unsigned int __lzcnt(unsigned int))
357 __MACHINEX86_X64(unsigned short __lzcnt16(unsigned short))
358 __MACHINEX64(unsigned __int64 __lzcnt64(unsigned __int64))
359 __MACHINEX86_X64(void __movsb(unsigned char *, unsigned char const *, size_t))
360 __MACHINEX86_X64(void __movsd(unsigned long *, unsigned long const *, size_t))
361 __MACHINEX64(void __movsq(unsigned long long *, unsigned long long const *, size_t))
362 __MACHINEX86_X64(void __movsw(unsigned short *, unsigned short const *, size_t))
363 __MACHINEX64(__int64 __mulh(__int64, __int64))
364 __MACHINE(void __nop(void))
365 __MACHINEX86_X64(void __nvreg_restore_fence(void))
366 __MACHINEX86_X64(void __nvreg_save_fence(void))
367 __MACHINEX86_X64(void __outbyte(unsigned short, unsigned char))
368 __MACHINEX86_X64(void __outbytestring(unsigned short, unsigned char *, unsigned long))
369 __MACHINEX86_X64(void __outdword(unsigned short, unsigned long))
370 __MACHINEX86_X64(void __outdwordstring(unsigned short, unsigned long *, unsigned long))
371 __MACHINEX86_X64(void __outword(unsigned short, unsigned short))
372 __MACHINEX86_X64(void __outwordstring(unsigned short, unsigned short *, unsigned long))
373 __MACHINEX86_X64(unsigned int __popcnt(unsigned int))
374 __MACHINEX86_X64(unsigned short __popcnt16(unsigned short))
375 __MACHINEX64(unsigned __int64 __popcnt64(unsigned __int64))
376 __MACHINEARM(void __cdecl __prefetch(const void *))
377 __MACHINEARM(void __cdecl __prefetchw(const void *))
378 __MACHINEARM(unsigned __int64 __rdpmccntr64(void))
379 __MACHINEX86_X64(unsigned __int64 __rdtsc(void))
380 __MACHINEX86_X64(unsigned __int64 __rdtscp(unsigned int *))
381 __MACHINEX64(unsigned __int64 __readcr0(void))
382 __MACHINEX86(unsigned long __readcr0(void))
383 __MACHINEX64(unsigned __int64 __readcr2(void))
384 __MACHINEX86(unsigned long __readcr2(void))
385 __MACHINEX64(unsigned __int64 __readcr3(void))
386 __MACHINEX86(unsigned long __readcr3(void))
387 __MACHINEX64(unsigned __int64 __readcr4(void))
388 __MACHINEX86(unsigned long __readcr4(void))
389 __MACHINEX64(unsigned __int64 __readcr8(void))
390 __MACHINEX86(unsigned long __readcr8(void))
391 __MACHINEX64(unsigned __int64 __readdr(unsigned int))
392 __MACHINEX86(unsigned int __readdr(unsigned int))
393 __MACHINEX64(unsigned __int64 __readeflags(void))
394 __MACHINEX86(unsigned int __readeflags(void))
395 __MACHINEX86(unsigned char __readfsbyte(unsigned long))
396 __MACHINEX86(unsigned long __readfsdword(unsigned long))
397 __MACHINEX86(unsigned __int64 __readfsqword(unsigned long))
398 __MACHINEX86(unsigned short __readfsword(unsigned long))
399 __MACHINEX64(unsigned char __readgsbyte(unsigned long))
400 __MACHINEX64(unsigned long __readgsdword(unsigned long))
401 __MACHINEX64(unsigned __int64 __readgsqword(unsigned long))
402 __MACHINEX64(unsigned short __readgsword(unsigned long))
403 __MACHINEX86_X64(unsigned __int64 __readmsr(unsigned long))
404 __MACHINEX86_X64(unsigned __int64 __readpmc(unsigned long))
405 __MACHINEX86_X64(unsigned long __segmentlimit(unsigned long))
406 __MACHINEARM(void __sev(void))
407 __MACHINEX64(unsigned __int64 __shiftleft128(unsigned __int64 _LowPart, unsigned __int64 _HighPart, unsigned char _Shift))
408 __MACHINEX64(unsigned __int64 __shiftright128(unsigned __int64 _LowPart, unsigned __int64 _HighPart, unsigned char _Shift))
409 __MACHINEX86_X64(void __sidt(void *))
410 __MACHINEARM(void __static_assert(int, const char *))
411 __MACHINEX86_X64(void __stosb(unsigned char *, unsigned char, size_t))
412 __MACHINEX86_X64(void __stosd(unsigned long *, unsigned long, size_t))
413 __MACHINEX64(void __stosq(unsigned __int64 *, unsigned __int64, size_t))
414 __MACHINEX86_X64(void __stosw(unsigned short *, unsigned short, size_t))
415 __MACHINEX86_X64(void __svm_clgi(void))
416 __MACHINEX86_X64(void __svm_invlpga(void *, int))
417 __MACHINEX86_X64(void __svm_skinit(int))
418 __MACHINEX86_X64(void __svm_stgi(void))
419 __MACHINEX86_X64(void __svm_vmload(size_t))
420 __MACHINEX86_X64(void __svm_vmrun(size_t))
421 __MACHINEX86_X64(void __svm_vmsave(size_t))
422 __MACHINEARM(unsigned int __swi(unsigned int, ...))
423 __MACHINEARM(unsigned int __svc(unsigned int, ...))
424 __MACHINEARM(int __trap(int, ...))
425 __MACHINEX86_X64(void __ud2(void))
426 __MACHINEX86_X64(unsigned __int64 __ull_rshift(unsigned __int64, int))
427 __MACHINEX64(unsigned __int64 __umulh(unsigned __int64, unsigned __int64))
428 __MACHINEX86_X64(void __vmx_off(void))
429 __MACHINEX64(unsigned char __vmx_on(unsigned __int64 *))
430 __MACHINEX64(unsigned char __vmx_vmclear(unsigned __int64 *))
431 __MACHINEX64(unsigned char __vmx_vmlaunch(void))
432 __MACHINEX64(unsigned char __vmx_vmptrld(unsigned __int64 *))
433 __MACHINEX86_X64(void __vmx_vmptrst(unsigned __int64 *))
434 __MACHINEX64(unsigned char __vmx_vmread(size_t, size_t *))
435 __MACHINEX64(unsigned char __vmx_vmresume(void))
436 __MACHINEX64(unsigned char __vmx_vmwrite(size_t, size_t))
437 __MACHINEX86_X64(void __wbinvd(void))
438 __MACHINEARM(void __wfe(void))
439 __MACHINEARM(void __wfi(void))
440 __MACHINEX64(void __writecr0(unsigned __int64))
441 __MACHINEX86(void __writecr0(unsigned int))
442 __MACHINEX64(void __writecr3(unsigned __int64))
443 __MACHINEX86(void __writecr3(unsigned int))
444 __MACHINEX64(void __writecr4(unsigned __int64))
445 __MACHINEX86(void __writecr4(unsigned int))
446 __MACHINEX64(void __writecr8(unsigned __int64))
447 __MACHINEX86(void __writecr8(unsigned int))
448 __MACHINEX64(void __writedr(unsigned int, unsigned __int64))
449 __MACHINEX86(void __writedr(unsigned int, unsigned int))
450 __MACHINEX64(void __writeeflags(unsigned __int64))
451 __MACHINEX86(void __writeeflags(unsigned int))
452 __MACHINEX86(void __writefsbyte(unsigned long, unsigned char))
453 __MACHINEX86(void __writefsdword(unsigned long, unsigned long))
454 __MACHINEX86(void __writefsqword(unsigned long, unsigned __int64))
455 __MACHINEX86(void __writefsword(unsigned long, unsigned short))
456 __MACHINEX64(void __writegsbyte(unsigned long, unsigned char))
457 __MACHINEX64(void __writegsdword(unsigned long, unsigned long))
458 __MACHINEX64(void __writegsqword(unsigned long, unsigned __int64))
459 __MACHINEX64(void __writegsword(unsigned long, unsigned short))
460 __MACHINEX86_X64(void __writemsr(unsigned long, unsigned __int64))
461 __MACHINEARM(void __yield(void))
462 __MACHINE(unsigned char _bittest(long const *, long))
463 __MACHINEX64(unsigned char _bittest64(__int64 const *, __int64))
464 __MACHINE(unsigned char _bittestandcomplement(long *, long))
465 __MACHINEX64(unsigned char _bittestandcomplement64(__int64 *, __int64))
466 __MACHINE(unsigned char _bittestandreset(long *, long))
467 __MACHINEX64(unsigned char _bittestandreset64(__int64 *, __int64))
468 __MACHINE(unsigned char _bittestandset(long *, long))
469 __MACHINEX64(unsigned char _bittestandset64(__int64 *, __int64))
470 __MACHINE(_Check_return_ unsigned __int64 __cdecl _byteswap_uint64(_In_ unsigned __int64))
471 __MACHINE(_Check_return_ unsigned long __cdecl _byteswap_ulong(_In_ unsigned long))
472 __MACHINE(_Check_return_ unsigned short __cdecl _byteswap_ushort(_In_ unsigned short))
473 __MACHINE(void __cdecl _disable(void))
474 __MACHINE(void __cdecl _enable(void))
475 __MACHINE(unsigned char _interlockedbittestandreset(long volatile *, long))
476 __MACHINEX64(unsigned char _interlockedbittestandreset64(__int64 volatile *, __int64))
477 __MACHINEARM(unsigned char _interlockedbittestandreset_acq(long volatile *, long))
478 __MACHINEARM(unsigned char _interlockedbittestandreset_nf(long volatile *, long))
479 __MACHINEARM(unsigned char _interlockedbittestandreset_rel(long volatile *, long))
480 __MACHINE(unsigned char _interlockedbittestandset(long volatile *, long))
481 __MACHINEX64(unsigned char _interlockedbittestandset64(__int64 volatile *, __int64))
482 __MACHINEARM(unsigned char _interlockedbittestandset_acq(long volatile *, long))
483 __MACHINEARM(unsigned char _interlockedbittestandset_nf(long volatile *, long))
484 __MACHINEARM(unsigned char _interlockedbittestandset_rel(long volatile *, long))
485 __MACHINEARM(int _isunordered(double, double))
486 __MACHINEARM(int _isunorderedf(float, float))
487 __MACHINE(_Check_return_ unsigned long __cdecl _lrotl(_In_ unsigned long, _In_ int))
488 __MACHINE(_Check_return_ unsigned long __cdecl _lrotr(_In_ unsigned long, _In_ int))
/*
** First part of the _m_* declarations (_m_empty through _m_por).  Every entry
** here is wrapped in __MACHINEX86, which the legend at the top of this header
** describes as "x86 only".  Apart from _m_empty/_m_femms (no operands) and the
** int-returning _m_pextrw/_m_pmovmskb, the prototypes take and return __m64.
**
** NOTE(review): the listing numbers jump from 490 to 493, so two declarations
** appear to be missing from this extract -- confirm against the real header.
*/
489 __MACHINEX86(void _m_empty(void))
490 __MACHINEX86(void _m_femms(void))
493 __MACHINEX86(void _m_maskmovq(__m64, __m64, char *))
494 __MACHINEX86(__m64 _m_packssdw(__m64, __m64))
495 __MACHINEX86(__m64 _m_packsswb(__m64, __m64))
496 __MACHINEX86(__m64 _m_packuswb(__m64, __m64))
497 __MACHINEX86(__m64 _m_paddb(__m64, __m64))
498 __MACHINEX86(__m64 _m_paddd(__m64, __m64))
499 __MACHINEX86(__m64 _m_paddsb(__m64, __m64))
500 __MACHINEX86(__m64 _m_paddsw(__m64, __m64))
501 __MACHINEX86(__m64 _m_paddusb(__m64, __m64))
502 __MACHINEX86(__m64 _m_paddusw(__m64, __m64))
503 __MACHINEX86(__m64 _m_paddw(__m64, __m64))
504 __MACHINEX86(__m64 _m_pand(__m64, __m64))
505 __MACHINEX86(__m64 _m_pandn(__m64, __m64))
506 __MACHINEX86(__m64 _m_pavgb(__m64, __m64))
507 __MACHINEX86(__m64 _m_pavgusb(__m64, __m64))
508 __MACHINEX86(__m64 _m_pavgw(__m64, __m64))
509 __MACHINEX86(__m64 _m_pcmpeqb(__m64, __m64))
510 __MACHINEX86(__m64 _m_pcmpeqd(__m64, __m64))
511 __MACHINEX86(__m64 _m_pcmpeqw(__m64, __m64))
512 __MACHINEX86(__m64 _m_pcmpgtb(__m64, __m64))
513 __MACHINEX86(__m64 _m_pcmpgtd(__m64, __m64))
514 __MACHINEX86(__m64 _m_pcmpgtw(__m64, __m64))
515 __MACHINEX86(int _m_pextrw(__m64, int))
516 __MACHINEX86(__m64 _m_pf2id(__m64))
517 __MACHINEX86(__m64 _m_pf2iw(__m64))
518 __MACHINEX86(__m64 _m_pfacc(__m64, __m64))
519 __MACHINEX86(__m64 _m_pfadd(__m64, __m64))
520 __MACHINEX86(__m64 _m_pfcmpeq(__m64, __m64))
521 __MACHINEX86(__m64 _m_pfcmpge(__m64, __m64))
522 __MACHINEX86(__m64 _m_pfcmpgt(__m64, __m64))
523 __MACHINEX86(__m64 _m_pfmax(__m64, __m64))
524 __MACHINEX86(__m64 _m_pfmin(__m64, __m64))
525 __MACHINEX86(__m64 _m_pfmul(__m64, __m64))
526 __MACHINEX86(__m64 _m_pfnacc(__m64, __m64))
527 __MACHINEX86(__m64 _m_pfpnacc(__m64, __m64))
528 __MACHINEX86(__m64 _m_pfrcp(__m64))
529 __MACHINEX86(__m64 _m_pfrcpit1(__m64, __m64))
530 __MACHINEX86(__m64 _m_pfrcpit2(__m64, __m64))
531 __MACHINEX86(__m64 _m_pfrsqit1(__m64, __m64))
532 __MACHINEX86(__m64 _m_pfrsqrt(__m64))
533 __MACHINEX86(__m64 _m_pfsub(__m64, __m64))
534 __MACHINEX86(__m64 _m_pfsubr(__m64, __m64))
535 __MACHINEX86(__m64 _m_pi2fd(__m64))
536 __MACHINEX86(__m64 _m_pi2fw(__m64))
537 __MACHINEX86(__m64 _m_pinsrw(__m64, int, int))
538 __MACHINEX86(__m64 _m_pmaddwd(__m64, __m64))
539 __MACHINEX86(__m64 _m_pmaxsw(__m64, __m64))
540 __MACHINEX86(__m64 _m_pmaxub(__m64, __m64))
541 __MACHINEX86(__m64 _m_pminsw(__m64, __m64))
542 __MACHINEX86(__m64 _m_pminub(__m64, __m64))
543 __MACHINEX86(int _m_pmovmskb(__m64))
544 __MACHINEX86(__m64 _m_pmulhrw(__m64, __m64))
545 __MACHINEX86(__m64 _m_pmulhuw(__m64, __m64))
546 __MACHINEX86(__m64 _m_pmulhw(__m64, __m64))
547 __MACHINEX86(__m64 _m_pmullw(__m64, __m64))
548 __MACHINEX86(__m64 _m_por(__m64, __m64))
/*
** Second part of the _m_* declarations (_m_prefetch through _m_to_int).
** _m_prefetch and _m_prefetchw are wrapped in __MACHINEX86_X64 ("x86 and x64
** only" in the legend at the top of this header); every other entry is
** __MACHINEX86 ("x86 only").  The *i-suffixed shift entries (_m_pslldi,
** _m_psrawi, ...) take an int as their second operand where the unsuffixed
** forms take a second __m64.
*/
549 __MACHINEX86_X64(void _m_prefetch(void *))
550 __MACHINEX86_X64(void _m_prefetchw(volatile const void *))
551 __MACHINEX86(__m64 _m_psadbw(__m64, __m64))
552 __MACHINEX86(__m64 _m_pshufw(__m64, int))
553 __MACHINEX86(__m64 _m_pslld(__m64, __m64))
554 __MACHINEX86(__m64 _m_pslldi(__m64, int))
555 __MACHINEX86(__m64 _m_psllq(__m64, __m64))
556 __MACHINEX86(__m64 _m_psllqi(__m64, int))
557 __MACHINEX86(__m64 _m_psllw(__m64, __m64))
558 __MACHINEX86(__m64 _m_psllwi(__m64, int))
559 __MACHINEX86(__m64 _m_psrad(__m64, __m64))
560 __MACHINEX86(__m64 _m_psradi(__m64, int))
561 __MACHINEX86(__m64 _m_psraw(__m64, __m64))
562 __MACHINEX86(__m64 _m_psrawi(__m64, int))
563 __MACHINEX86(__m64 _m_psrld(__m64, __m64))
564 __MACHINEX86(__m64 _m_psrldi(__m64, int))
565 __MACHINEX86(__m64 _m_psrlq(__m64, __m64))
566 __MACHINEX86(__m64 _m_psrlqi(__m64, int))
567 __MACHINEX86(__m64 _m_psrlw(__m64, __m64))
568 __MACHINEX86(__m64 _m_psrlwi(__m64, int))
569 __MACHINEX86(__m64 _m_psubb(__m64, __m64))
570 __MACHINEX86(__m64 _m_psubd(__m64, __m64))
571 __MACHINEX86(__m64 _m_psubsb(__m64, __m64))
572 __MACHINEX86(__m64 _m_psubsw(__m64, __m64))
573 __MACHINEX86(__m64 _m_psubusb(__m64, __m64))
574 __MACHINEX86(__m64 _m_psubusw(__m64, __m64))
575 __MACHINEX86(__m64 _m_psubw(__m64, __m64))
576 __MACHINEX86(__m64 _m_pswapd(__m64))
577 __MACHINEX86(__m64 _m_punpckhbw(__m64, __m64))
578 __MACHINEX86(__m64 _m_punpckhdq(__m64, __m64))
579 __MACHINEX86(__m64 _m_punpckhwd(__m64, __m64))
580 __MACHINEX86(__m64 _m_punpcklbw(__m64, __m64))
581 __MACHINEX86(__m64 _m_punpckldq(__m64, __m64))
582 __MACHINEX86(__m64 _m_punpcklwd(__m64, __m64))
583 __MACHINEX86(__m64 _m_pxor(__m64, __m64))
584 __MACHINEX86(float _m_to_float(__m64))
585 __MACHINEX86(int _m_to_int(__m64))
/*
** _mm_abs_*, _mm_add*, _mm_adds_*, _mm_addsub_*, _mm_alignr_*, _mm_and*,
** _mm_andnot_*, _mm_avg_* and _mm_blend*/_mm_blendv_* declarations.
** All entries are __MACHINEX86_X64 ("x86 and x64 only" in the legend at the
** top of this header) except _mm_add_si64, which is __MACHINEX86 ("x86 only").
** The _mm_alignr_* and _mm_blend_* prototypes take a trailing int operand;
** the _mm_blendv_* prototypes take a third vector operand instead.
**
** NOTE(review): the listing numbers skip 592 and 596-597 inside this group
** (and 586-588 just before it), so some declarations appear to be missing
** from this extract -- confirm against the real header.
*/
589 __MACHINEX86_X64(__m64 _mm_abs_pi16(__m64))
590 __MACHINEX86_X64(__m64 _mm_abs_pi32(__m64))
591 __MACHINEX86_X64(__m64 _mm_abs_pi8(__m64))
593 __MACHINEX86_X64(__m128i _mm_add_epi32(__m128i, __m128i))
594 __MACHINEX86_X64(__m128i _mm_add_epi64(__m128i, __m128i))
595 __MACHINEX86_X64(__m128i _mm_add_epi8(__m128i, __m128i))
598 __MACHINEX86_X64(__m128d _mm_add_sd(__m128d, __m128d))
599 __MACHINEX86(__m64 _mm_add_si64(__m64, __m64))
600 __MACHINEX86_X64(__m128 _mm_add_ss(__m128, __m128))
601 __MACHINEX86_X64(__m128i _mm_adds_epi16(__m128i, __m128i))
602 __MACHINEX86_X64(__m128i _mm_adds_epi8(__m128i, __m128i))
603 __MACHINEX86_X64(__m128i _mm_adds_epu16(__m128i, __m128i))
604 __MACHINEX86_X64(__m128i _mm_adds_epu8(__m128i, __m128i))
605 __MACHINEX86_X64(__m128d _mm_addsub_pd(__m128d, __m128d))
606 __MACHINEX86_X64(__m128 _mm_addsub_ps(__m128, __m128))
607 __MACHINEX86_X64(__m128i _mm_alignr_epi8(__m128i, __m128i, int))
608 __MACHINEX86_X64(__m64 _mm_alignr_pi8(__m64, __m64, int))
609 __MACHINEX86_X64(__m128d _mm_and_pd(__m128d, __m128d))
610 __MACHINEX86_X64(__m128 _mm_and_ps(__m128, __m128))
611 __MACHINEX86_X64(__m128i _mm_and_si128(__m128i, __m128i))
612 __MACHINEX86_X64(__m128d _mm_andnot_pd(__m128d, __m128d))
613 __MACHINEX86_X64(__m128 _mm_andnot_ps(__m128, __m128))
614 __MACHINEX86_X64(__m128i _mm_andnot_si128(__m128i, __m128i))
615 __MACHINEX86_X64(__m128i _mm_avg_epu16(__m128i, __m128i))
616 __MACHINEX86_X64(__m128i _mm_avg_epu8(__m128i, __m128i))
617 __MACHINEX86_X64(__m128i _mm_blend_epi16(__m128i, __m128i, int))
618 __MACHINEX86_X64(__m128d _mm_blend_pd(__m128d, __m128d, int))
619 __MACHINEX86_X64(__m128 _mm_blend_ps(__m128, __m128, int))
620 __MACHINEX86_X64(__m128i _mm_blendv_epi8(__m128i, __m128i, __m128i))
621 __MACHINEX86_X64(__m128d _mm_blendv_pd(__m128d, __m128d, __m128d))
622 __MACHINEX86_X64(__m128 _mm_blendv_ps(__m128, __m128, __m128))
/*
** _mm_clflush followed by the _mm_cmpeq_*, _mm_cmpestr*, _mm_cmpge_*,
** _mm_cmpgt_* and _mm_cmpistr* declarations.  Every entry is
** __MACHINEX86_X64 ("x86 and x64 only" in the legend at the top of this
** header).
**
** The _mm_cmpestr* prototypes take (__m128i, int, __m128i, int, int) and the
** _mm_cmpistr* prototypes take (__m128i, __m128i, int); in both families the
** ...m variant returns __m128i and the others return int.
*/
623 __MACHINEX86_X64(void _mm_clflush(void const *))
624 __MACHINEX86_X64(__m128i _mm_cmpeq_epi16(__m128i, __m128i))
625 __MACHINEX86_X64(__m128i _mm_cmpeq_epi32(__m128i, __m128i))
626 __MACHINEX86_X64(__m128i _mm_cmpeq_epi64(__m128i, __m128i))
627 __MACHINEX86_X64(__m128i _mm_cmpeq_epi8(__m128i, __m128i))
628 __MACHINEX86_X64(__m128d _mm_cmpeq_pd(__m128d, __m128d))
629 __MACHINEX86_X64(__m128 _mm_cmpeq_ps(__m128, __m128))
630 __MACHINEX86_X64(__m128d _mm_cmpeq_sd(__m128d, __m128d))
631 __MACHINEX86_X64(__m128 _mm_cmpeq_ss(__m128, __m128))
632 __MACHINEX86_X64(int _mm_cmpestra(__m128i, int, __m128i, int, int))
633 __MACHINEX86_X64(int _mm_cmpestrc(__m128i, int, __m128i, int, int))
634 __MACHINEX86_X64(int _mm_cmpestri(__m128i, int, __m128i, int, int))
635 __MACHINEX86_X64(__m128i _mm_cmpestrm(__m128i, int, __m128i, int, int))
636 __MACHINEX86_X64(int _mm_cmpestro(__m128i, int, __m128i, int, int))
637 __MACHINEX86_X64(int _mm_cmpestrs(__m128i, int, __m128i, int, int))
638 __MACHINEX86_X64(int _mm_cmpestrz(__m128i, int, __m128i, int, int))
639 __MACHINEX86_X64(__m128d _mm_cmpge_pd(__m128d, __m128d))
640 __MACHINEX86_X64(__m128 _mm_cmpge_ps(__m128, __m128))
641 __MACHINEX86_X64(__m128d _mm_cmpge_sd(__m128d, __m128d))
642 __MACHINEX86_X64(__m128 _mm_cmpge_ss(__m128, __m128))
643 __MACHINEX86_X64(__m128i _mm_cmpgt_epi16(__m128i, __m128i))
644 __MACHINEX86_X64(__m128i _mm_cmpgt_epi32(__m128i, __m128i))
645 __MACHINEX86_X64(__m128i _mm_cmpgt_epi64(__m128i, __m128i))
646 __MACHINEX86_X64(__m128i _mm_cmpgt_epi8(__m128i, __m128i))
647 __MACHINEX86_X64(__m128d _mm_cmpgt_pd(__m128d, __m128d))
648 __MACHINEX86_X64(__m128 _mm_cmpgt_ps(__m128, __m128))
649 __MACHINEX86_X64(__m128d _mm_cmpgt_sd(__m128d, __m128d))
650 __MACHINEX86_X64(__m128 _mm_cmpgt_ss(__m128, __m128))
651 __MACHINEX86_X64(int _mm_cmpistra(__m128i, __m128i, int))
652 __MACHINEX86_X64(int _mm_cmpistrc(__m128i, __m128i, int))
653 __MACHINEX86_X64(int _mm_cmpistri(__m128i, __m128i, int))
654 __MACHINEX86_X64(__m128i _mm_cmpistrm(__m128i, __m128i, int))
655 __MACHINEX86_X64(int _mm_cmpistro(__m128i, __m128i, int))
656 __MACHINEX86_X64(int _mm_cmpistrs(__m128i, __m128i, int))
657 __MACHINEX86_X64(int _mm_cmpistrz(__m128i, __m128i, int))
/*
** Remaining _mm_cmp* declarations (_mm_cmple_* through _mm_cmpunord_*)
** followed by the _mm_comi* declarations.  Every entry is __MACHINEX86_X64
** ("x86 and x64 only" in the legend at the top of this header).
**
** The _mm_cmp* prototypes here return a vector of the same type as their
** operands; the _mm_comi* prototypes take two vectors and return int.
*/
658 __MACHINEX86_X64(__m128d _mm_cmple_pd(__m128d, __m128d))
659 __MACHINEX86_X64(__m128 _mm_cmple_ps(__m128, __m128))
660 __MACHINEX86_X64(__m128d _mm_cmple_sd(__m128d, __m128d))
661 __MACHINEX86_X64(__m128 _mm_cmple_ss(__m128, __m128))
662 __MACHINEX86_X64(__m128i _mm_cmplt_epi16(__m128i, __m128i))
663 __MACHINEX86_X64(__m128i _mm_cmplt_epi32(__m128i, __m128i))
664 __MACHINEX86_X64(__m128i _mm_cmplt_epi8(__m128i, __m128i))
665 __MACHINEX86_X64(__m128d _mm_cmplt_pd(__m128d, __m128d))
666 __MACHINEX86_X64(__m128 _mm_cmplt_ps(__m128, __m128))
667 __MACHINEX86_X64(__m128d _mm_cmplt_sd(__m128d, __m128d))
668 __MACHINEX86_X64(__m128 _mm_cmplt_ss(__m128, __m128))
669 __MACHINEX86_X64(__m128d _mm_cmpneq_pd(__m128d, __m128d))
670 __MACHINEX86_X64(__m128 _mm_cmpneq_ps(__m128, __m128))
671 __MACHINEX86_X64(__m128d _mm_cmpneq_sd(__m128d, __m128d))
672 __MACHINEX86_X64(__m128 _mm_cmpneq_ss(__m128, __m128))
673 __MACHINEX86_X64(__m128d _mm_cmpnge_pd(__m128d, __m128d))
674 __MACHINEX86_X64(__m128 _mm_cmpnge_ps(__m128, __m128))
675 __MACHINEX86_X64(__m128d _mm_cmpnge_sd(__m128d, __m128d))
676 __MACHINEX86_X64(__m128 _mm_cmpnge_ss(__m128, __m128))
677 __MACHINEX86_X64(__m128d _mm_cmpngt_pd(__m128d, __m128d))
678 __MACHINEX86_X64(__m128 _mm_cmpngt_ps(__m128, __m128))
679 __MACHINEX86_X64(__m128d _mm_cmpngt_sd(__m128d, __m128d))
680 __MACHINEX86_X64(__m128 _mm_cmpngt_ss(__m128, __m128))
681 __MACHINEX86_X64(__m128d _mm_cmpnle_pd(__m128d, __m128d))
682 __MACHINEX86_X64(__m128 _mm_cmpnle_ps(__m128, __m128))
683 __MACHINEX86_X64(__m128d _mm_cmpnle_sd(__m128d, __m128d))
684 __MACHINEX86_X64(__m128 _mm_cmpnle_ss(__m128, __m128))
685 __MACHINEX86_X64(__m128d _mm_cmpnlt_pd(__m128d, __m128d))
686 __MACHINEX86_X64(__m128 _mm_cmpnlt_ps(__m128, __m128))
687 __MACHINEX86_X64(__m128d _mm_cmpnlt_sd(__m128d, __m128d))
688 __MACHINEX86_X64(__m128 _mm_cmpnlt_ss(__m128, __m128))
689 __MACHINEX86_X64(__m128d _mm_cmpord_pd(__m128d, __m128d))
690 __MACHINEX86_X64(__m128 _mm_cmpord_ps(__m128, __m128))
691 __MACHINEX86_X64(__m128d _mm_cmpord_sd(__m128d, __m128d))
692 __MACHINEX86_X64(__m128 _mm_cmpord_ss(__m128, __m128))
693 __MACHINEX86_X64(__m128d _mm_cmpunord_pd(__m128d, __m128d))
694 __MACHINEX86_X64(__m128 _mm_cmpunord_ps(__m128, __m128))
695 __MACHINEX86_X64(__m128d _mm_cmpunord_sd(__m128d, __m128d))
696 __MACHINEX86_X64(__m128 _mm_cmpunord_ss(__m128, __m128))
697 __MACHINEX86_X64(int _mm_comieq_sd(__m128d, __m128d))
698 __MACHINEX86_X64(int _mm_comieq_ss(__m128, __m128))
699 __MACHINEX86_X64(int _mm_comige_sd(__m128d, __m128d))
700 __MACHINEX86_X64(int _mm_comige_ss(__m128, __m128))
701 __MACHINEX86_X64(int _mm_comigt_sd(__m128d, __m128d))
702 __MACHINEX86_X64(int _mm_comigt_ss(__m128, __m128))
703 __MACHINEX86_X64(int _mm_comile_sd(__m128d, __m128d))
704 __MACHINEX86_X64(int _mm_comile_ss(__m128, __m128))
705 __MACHINEX86_X64(int _mm_comilt_sd(__m128d, __m128d))
706 __MACHINEX86_X64(int _mm_comilt_ss(__m128, __m128))
707 __MACHINEX86_X64(int _mm_comineq_sd(__m128d, __m128d))
708 __MACHINEX86_X64(int _mm_comineq_ss(__m128, __m128))
/*
** _mm_crc32_* and _mm_cvt* declarations.
**
** Availability follows the operand types in this group (see the legend at
** the top of this header for the macro meanings):
**   - entries that take or return a 64-bit integer (__int64 or
**     unsigned __int64) are __MACHINEX64, i.e. x64 only;
**   - entries that take or return __m64 are __MACHINEX86, i.e. x86 only;
**   - everything else is __MACHINEX86_X64.
**
** NOTE(review): the listing numbers skip 741 and 745, so two declarations
** appear to be missing from this extract -- confirm against the real header.
*/
709 __MACHINEX86_X64(unsigned int _mm_crc32_u16(unsigned int, unsigned short))
710 __MACHINEX86_X64(unsigned int _mm_crc32_u32(unsigned int, unsigned int))
711 __MACHINEX64(unsigned __int64 _mm_crc32_u64(unsigned __int64, unsigned __int64))
712 __MACHINEX86_X64(unsigned int _mm_crc32_u8(unsigned int, unsigned char))
713 __MACHINEX86(__m128 _mm_cvt_pi2ps(__m128, __m64))
714 __MACHINEX86(__m64 _mm_cvt_ps2pi(__m128))
715 __MACHINEX86_X64(__m128 _mm_cvt_si2ss(__m128, int))
716 __MACHINEX86_X64(int _mm_cvt_ss2si(__m128))
717 __MACHINEX86_X64(__m128i _mm_cvtepi16_epi32(__m128i))
718 __MACHINEX86_X64(__m128i _mm_cvtepi16_epi64(__m128i))
719 __MACHINEX86_X64(__m128i _mm_cvtepi32_epi64(__m128i))
720 __MACHINEX86_X64(__m128d _mm_cvtepi32_pd(__m128i))
721 __MACHINEX86_X64(__m128 _mm_cvtepi32_ps(__m128i))
722 __MACHINEX86_X64(__m128i _mm_cvtepi8_epi16(__m128i))
723 __MACHINEX86_X64(__m128i _mm_cvtepi8_epi32(__m128i))
724 __MACHINEX86_X64(__m128i _mm_cvtepi8_epi64(__m128i))
725 __MACHINEX86_X64(__m128i _mm_cvtepu16_epi32(__m128i))
726 __MACHINEX86_X64(__m128i _mm_cvtepu16_epi64(__m128i))
727 __MACHINEX86_X64(__m128i _mm_cvtepu32_epi64(__m128i))
728 __MACHINEX86_X64(__m128i _mm_cvtepu8_epi16(__m128i))
729 __MACHINEX86_X64(__m128i _mm_cvtepu8_epi32(__m128i))
730 __MACHINEX86_X64(__m128i _mm_cvtepu8_epi64(__m128i))
731 __MACHINEX86_X64(__m128i _mm_cvtpd_epi32(__m128d))
732 __MACHINEX86(__m64 _mm_cvtpd_pi32(__m128d))
733 __MACHINEX86_X64(__m128 _mm_cvtpd_ps(__m128d))
734 __MACHINEX86(__m128d _mm_cvtpi32_pd(__m64))
735 __MACHINEX86_X64(__m128i _mm_cvtps_epi32(__m128))
736 __MACHINEX86_X64(__m128d _mm_cvtps_pd(__m128))
737 __MACHINEX86_X64(int _mm_cvtsd_si32(__m128d))
738 __MACHINEX64(__int64 _mm_cvtsd_si64(__m128d))
739 __MACHINEX64(__int64 _mm_cvtsd_si64x(__m128d))
740 __MACHINEX86_X64(__m128 _mm_cvtsd_ss(__m128, __m128d))
742 __MACHINEX64(__int64 _mm_cvtsi128_si64(__m128i))
743 __MACHINEX64(__int64 _mm_cvtsi128_si64x(__m128i))
744 __MACHINEX86_X64(__m128d _mm_cvtsi32_sd(__m128d, int))
746 __MACHINEX64(__m128d _mm_cvtsi64_sd(__m128d, __int64))
747 __MACHINEX64(__m128i _mm_cvtsi64_si128(__int64))
748 __MACHINEX64(__m128 _mm_cvtsi64_ss(__m128, __int64))
749 __MACHINEX64(__m128d _mm_cvtsi64x_sd(__m128d, __int64))
750 __MACHINEX64(__m128i _mm_cvtsi64x_si128(__int64))
751 __MACHINEX64(__m128 _mm_cvtsi64x_ss(__m128, __int64))
752 __MACHINEX86_X64(__m128d _mm_cvtss_sd(__m128d, __m128))
753 __MACHINEX64(__int64 _mm_cvtss_si64(__m128))
754 __MACHINEX64(__int64 _mm_cvtss_si64x(__m128))
755 __MACHINEX86(__m64 _mm_cvtt_ps2pi(__m128))
756 __MACHINEX86_X64(int _mm_cvtt_ss2si(__m128))
757 __MACHINEX86_X64(__m128i _mm_cvttpd_epi32(__m128d))
758 __MACHINEX86(__m64 _mm_cvttpd_pi32(__m128d))
759 __MACHINEX86_X64(__m128i _mm_cvttps_epi32(__m128))
760 __MACHINEX86_X64(int _mm_cvttsd_si32(__m128d))
761 __MACHINEX64(__int64 _mm_cvttsd_si64(__m128d))
762 __MACHINEX64(__int64 _mm_cvttsd_si64x(__m128d))
763 __MACHINEX64(__int64 _mm_cvttss_si64(__m128))
764 __MACHINEX64(__int64 _mm_cvttss_si64x(__m128))
/*
** _mm_div_*, _mm_dp_*, _mm_extract*, _mm_getcsr, _mm_hadd*, _mm_hsub* and
** _mm_insert* declarations.
**
** _mm_extract_epi64 and _mm_insert_epi64 (the two prototypes that use
** __int64) are __MACHINEX64, i.e. x64 only per the legend at the top of this
** header; every other entry, including the __m64 forms of _mm_hadd*/_mm_hsub*,
** is __MACHINEX86_X64.
*/
765 __MACHINEX86_X64(__m128d _mm_div_pd(__m128d, __m128d))
766 __MACHINEX86_X64(__m128 _mm_div_ps(__m128, __m128))
767 __MACHINEX86_X64(__m128d _mm_div_sd(__m128d, __m128d))
768 __MACHINEX86_X64(__m128 _mm_div_ss(__m128, __m128))
769 __MACHINEX86_X64(__m128d _mm_dp_pd(__m128d, __m128d, int))
770 __MACHINEX86_X64(__m128 _mm_dp_ps(__m128, __m128, int))
771 __MACHINEX86_X64(int _mm_extract_epi16(__m128i, int))
772 __MACHINEX86_X64(int _mm_extract_epi32(__m128i, int))
773 __MACHINEX64(__int64 _mm_extract_epi64(__m128i, int))
774 __MACHINEX86_X64(int _mm_extract_epi8(__m128i, int))
775 __MACHINEX86_X64(int _mm_extract_ps(__m128, int))
776 __MACHINEX86_X64(__m128i _mm_extract_si64(__m128i, __m128i))
777 __MACHINEX86_X64(__m128i _mm_extracti_si64(__m128i, int, int))
778 __MACHINEX86_X64(unsigned int _mm_getcsr(void))
779 __MACHINEX86_X64(__m128i _mm_hadd_epi16(__m128i, __m128i))
780 __MACHINEX86_X64(__m128i _mm_hadd_epi32(__m128i, __m128i))
781 __MACHINEX86_X64(__m128d _mm_hadd_pd(__m128d, __m128d))
782 __MACHINEX86_X64(__m64 _mm_hadd_pi16(__m64, __m64))
783 __MACHINEX86_X64(__m64 _mm_hadd_pi32(__m64, __m64))
784 __MACHINEX86_X64(__m128 _mm_hadd_ps(__m128, __m128))
785 __MACHINEX86_X64(__m128i _mm_hadds_epi16(__m128i, __m128i))
786 __MACHINEX86_X64(__m64 _mm_hadds_pi16(__m64, __m64))
787 __MACHINEX86_X64(__m128i _mm_hsub_epi16(__m128i, __m128i))
788 __MACHINEX86_X64(__m128i _mm_hsub_epi32(__m128i, __m128i))
789 __MACHINEX86_X64(__m128d _mm_hsub_pd(__m128d, __m128d))
790 __MACHINEX86_X64(__m64 _mm_hsub_pi16(__m64, __m64))
791 __MACHINEX86_X64(__m64 _mm_hsub_pi32(__m64, __m64))
792 __MACHINEX86_X64(__m128 _mm_hsub_ps(__m128, __m128))
793 __MACHINEX86_X64(__m128i _mm_hsubs_epi16(__m128i, __m128i))
794 __MACHINEX86_X64(__m64 _mm_hsubs_pi16(__m64, __m64))
795 __MACHINEX86_X64(__m128i _mm_insert_epi16(__m128i, int, int))
796 __MACHINEX86_X64(__m128i _mm_insert_epi32(__m128i, int, int))
797 __MACHINEX64(__m128i _mm_insert_epi64(__m128i, __int64, int))
798 __MACHINEX86_X64(__m128i _mm_insert_epi8(__m128i, int, int))
799 __MACHINEX86_X64(__m128 _mm_insert_ps(__m128, __m128, int))
800 __MACHINEX86_X64(__m128i _mm_insert_si64(__m128i, __m128i))
801 __MACHINEX86_X64(__m128i _mm_inserti_si64(__m128i, __m128i, int, int))
/*
** _mm_lddqu_si128, _mm_lfence and the _mm_load* declarations.  Every entry
** is __MACHINEX86_X64 ("x86 and x64 only" in the legend at the top of this
** header).  All pointer parameters in this group are pointers to const; the
** _mm_loadh_* and _mm_loadl_* prototypes additionally take a vector as their
** first operand.
*/
802 __MACHINEX86_X64(__m128i _mm_lddqu_si128(__m128i const *))
803 __MACHINEX86_X64(void _mm_lfence(void))
804 __MACHINEX86_X64(__m128d _mm_load1_pd(double const *))
805 __MACHINEX86_X64(__m128d _mm_load_pd(double const *))
806 __MACHINEX86_X64(__m128 _mm_load_ps(float const *))
807 __MACHINEX86_X64(__m128 _mm_load_ps1(float const *))
808 __MACHINEX86_X64(__m128d _mm_load_sd(double const *))
809 __MACHINEX86_X64(__m128i _mm_load_si128(__m128i const *))
810 __MACHINEX86_X64(__m128 _mm_load_ss(float const *))
811 __MACHINEX86_X64(__m128d _mm_loaddup_pd(double const *))
812 __MACHINEX86_X64(__m128d _mm_loadh_pd(__m128d, double const *))
813 __MACHINEX86_X64(__m128 _mm_loadh_pi(__m128, __m64 const *))
814 __MACHINEX86_X64(__m128i _mm_loadl_epi64(__m128i const *))
815 __MACHINEX86_X64(__m128d _mm_loadl_pd(__m128d, double const *))
816 __MACHINEX86_X64(__m128 _mm_loadl_pi(__m128, __m64 const *))
817 __MACHINEX86_X64(__m128d _mm_loadr_pd(double const *))
818 __MACHINEX86_X64(__m128 _mm_loadr_ps(float const *))
819 __MACHINEX86_X64(__m128d _mm_loadu_pd(double const *))
820 __MACHINEX86_X64(__m128 _mm_loadu_ps(float const *))
821 __MACHINEX86_X64(__m128i _mm_loadu_si128(__m128i const *))
/*
** _mm_madd*, _mm_maskmoveu_si128, _mm_max_*, _mm_mfence, _mm_min*,
** _mm_monitor, _mm_move*, _mm_mpsadbw_epu8, _mm_mul*, _mm_mwait, _mm_or_*,
** _mm_packs_*/_mm_packus_* and _mm_pause declarations.
**
** _mm_movepi64_pi64, _mm_movpi64_epi64 and _mm_mul_su32 are __MACHINEX86
** ("x86 only" in the legend at the top of this header); every other entry is
** __MACHINEX86_X64.
**
** NOTE(review): the listing numbers skip 857 and 859, so two declarations
** appear to be missing from this extract -- confirm against the real header.
*/
822 __MACHINEX86_X64(__m128i _mm_madd_epi16(__m128i, __m128i))
823 __MACHINEX86_X64(__m128i _mm_maddubs_epi16(__m128i, __m128i))
824 __MACHINEX86_X64(__m64 _mm_maddubs_pi16(__m64, __m64))
825 __MACHINEX86_X64(void _mm_maskmoveu_si128(__m128i, __m128i, char *))
826 __MACHINEX86_X64(__m128i _mm_max_epi16(__m128i, __m128i))
827 __MACHINEX86_X64(__m128i _mm_max_epi32(__m128i, __m128i))
828 __MACHINEX86_X64(__m128i _mm_max_epi8(__m128i, __m128i))
829 __MACHINEX86_X64(__m128i _mm_max_epu16(__m128i, __m128i))
830 __MACHINEX86_X64(__m128i _mm_max_epu32(__m128i, __m128i))
831 __MACHINEX86_X64(__m128i _mm_max_epu8(__m128i, __m128i))
832 __MACHINEX86_X64(__m128d _mm_max_pd(__m128d, __m128d))
833 __MACHINEX86_X64(__m128 _mm_max_ps(__m128, __m128))
834 __MACHINEX86_X64(__m128d _mm_max_sd(__m128d, __m128d))
835 __MACHINEX86_X64(__m128 _mm_max_ss(__m128, __m128))
836 __MACHINEX86_X64(void _mm_mfence(void))
837 __MACHINEX86_X64(__m128i _mm_min_epi16(__m128i, __m128i))
838 __MACHINEX86_X64(__m128i _mm_min_epi32(__m128i, __m128i))
839 __MACHINEX86_X64(__m128i _mm_min_epi8(__m128i, __m128i))
840 __MACHINEX86_X64(__m128i _mm_min_epu16(__m128i, __m128i))
841 __MACHINEX86_X64(__m128i _mm_min_epu32(__m128i, __m128i))
842 __MACHINEX86_X64(__m128i _mm_min_epu8(__m128i, __m128i))
843 __MACHINEX86_X64(__m128d _mm_min_pd(__m128d, __m128d))
844 __MACHINEX86_X64(__m128 _mm_min_ps(__m128, __m128))
845 __MACHINEX86_X64(__m128d _mm_min_sd(__m128d, __m128d))
846 __MACHINEX86_X64(__m128 _mm_min_ss(__m128, __m128))
847 __MACHINEX86_X64(__m128i _mm_minpos_epu16(__m128i))
848 __MACHINEX86_X64(void _mm_monitor(void const *, unsigned int, unsigned int))
849 __MACHINEX86_X64(__m128i _mm_move_epi64(__m128i))
850 __MACHINEX86_X64(__m128d _mm_move_sd(__m128d, __m128d))
851 __MACHINEX86_X64(__m128 _mm_move_ss(__m128, __m128))
852 __MACHINEX86_X64(__m128d _mm_movedup_pd(__m128d))
853 __MACHINEX86_X64(__m128 _mm_movehdup_ps(__m128))
854 __MACHINEX86_X64(__m128 _mm_movehl_ps(__m128, __m128))
855 __MACHINEX86_X64(__m128 _mm_moveldup_ps(__m128))
856 __MACHINEX86_X64(__m128 _mm_movelh_ps(__m128, __m128))
858 __MACHINEX86_X64(int _mm_movemask_pd(__m128d))
860 __MACHINEX86(__m64 _mm_movepi64_pi64(__m128i))
861 __MACHINEX86(__m128i _mm_movpi64_epi64(__m64))
862 __MACHINEX86_X64(__m128i _mm_mpsadbw_epu8(__m128i, __m128i, int))
863 __MACHINEX86_X64(__m128i _mm_mul_epi32(__m128i, __m128i))
864 __MACHINEX86_X64(__m128i _mm_mul_epu32(__m128i, __m128i))
865 __MACHINEX86_X64(__m128d _mm_mul_pd(__m128d, __m128d))
866 __MACHINEX86_X64(__m128 _mm_mul_ps(__m128, __m128))
867 __MACHINEX86_X64(__m128d _mm_mul_sd(__m128d, __m128d))
868 __MACHINEX86_X64(__m128 _mm_mul_ss(__m128, __m128))
869 __MACHINEX86(__m64 _mm_mul_su32(__m64, __m64))
870 __MACHINEX86_X64(__m128i _mm_mulhi_epi16(__m128i, __m128i))
871 __MACHINEX86_X64(__m128i _mm_mulhi_epu16(__m128i, __m128i))
872 __MACHINEX86_X64(__m128i _mm_mulhrs_epi16(__m128i, __m128i))
873 __MACHINEX86_X64(__m64 _mm_mulhrs_pi16(__m64, __m64))
874 __MACHINEX86_X64(__m128i _mm_mullo_epi16(__m128i, __m128i))
875 __MACHINEX86_X64(__m128i _mm_mullo_epi32(__m128i, __m128i))
876 __MACHINEX86_X64(void _mm_mwait(unsigned int, unsigned int))
877 __MACHINEX86_X64(__m128d _mm_or_pd(__m128d, __m128d))
878 __MACHINEX86_X64(__m128 _mm_or_ps(__m128, __m128))
879 __MACHINEX86_X64(__m128i _mm_or_si128(__m128i, __m128i))
880 __MACHINEX86_X64(__m128i _mm_packs_epi16(__m128i, __m128i))
881 __MACHINEX86_X64(__m128i _mm_packs_epi32(__m128i, __m128i))
882 __MACHINEX86_X64(__m128i _mm_packus_epi16(__m128i, __m128i))
883 __MACHINEX86_X64(__m128i _mm_packus_epi32(__m128i, __m128i))
884 __MACHINEX86_X64(void _mm_pause(void))
/*
** _mm_popcnt_*, _mm_prefetch, _mm_rcp_*, _mm_round_*, _mm_rsqrt_*,
** _mm_sad_epu8, the _mm_set1_*/_mm_set_*/_mm_setr_*/_mm_setzero_* families,
** _mm_setcsr, _mm_setl_epi64 and _mm_sfence.
**
** Availability (macro meanings are in the legend at the top of this header):
**   - __MACHINEX64 (x64 only): _mm_popcnt_u64, _mm_set1_epi64x and
**     _mm_set_epi64x, i.e. the prototypes that use a 64-bit integer;
**   - __MACHINEX86 (x86 only): the prototypes that take or return __m64
**     (_mm_set1_epi64, _mm_set_epi64, _mm_setr_epi64, the *_pi8/_pi16/_pi32
**     forms and _mm_setzero_si64);
**   - __MACHINEX86_X64: everything else.
*/
885 __MACHINEX86_X64(int _mm_popcnt_u32(unsigned int))
886 __MACHINEX64(__int64 _mm_popcnt_u64(unsigned __int64))
887 __MACHINEX86_X64(void _mm_prefetch(char const *, int))
888 __MACHINEX86_X64(__m128 _mm_rcp_ps(__m128))
889 __MACHINEX86_X64(__m128 _mm_rcp_ss(__m128))
890 __MACHINEX86_X64(__m128d _mm_round_pd(__m128d, int))
891 __MACHINEX86_X64(__m128 _mm_round_ps(__m128, int))
892 __MACHINEX86_X64(__m128d _mm_round_sd(__m128d, __m128d, int))
893 __MACHINEX86_X64(__m128 _mm_round_ss(__m128, __m128, int))
894 __MACHINEX86_X64(__m128 _mm_rsqrt_ps(__m128))
895 __MACHINEX86_X64(__m128 _mm_rsqrt_ss(__m128))
896 __MACHINEX86_X64(__m128i _mm_sad_epu8(__m128i, __m128i))
897 __MACHINEX86_X64(__m128i _mm_set1_epi16(short))
898 __MACHINEX86_X64(__m128i _mm_set1_epi32(int))
899 __MACHINEX86(__m128i _mm_set1_epi64(__m64))
900 __MACHINEX64(__m128i _mm_set1_epi64x(__int64))
901 __MACHINEX86_X64(__m128i _mm_set1_epi8(char))
902 __MACHINEX86_X64(__m128d _mm_set1_pd(double))
903 __MACHINEX86(__m64 _mm_set1_pi16(short))
904 __MACHINEX86(__m64 _mm_set1_pi32(int))
905 __MACHINEX86(__m64 _mm_set1_pi8(char))
906 __MACHINEX86_X64(__m128i _mm_set_epi16(short, short, short, short, short, short, short, short))
907 __MACHINEX86_X64(__m128i _mm_set_epi32(int, int, int, int))
908 __MACHINEX86(__m128i _mm_set_epi64(__m64, __m64))
909 __MACHINEX64(__m128i _mm_set_epi64x(__int64, __int64))
910 __MACHINEX86_X64(__m128i _mm_set_epi8(char, char, char, char, char, char, char, char, char, char, char, char, char, char, char, char))
911 __MACHINEX86_X64(__m128d _mm_set_pd(double, double))
912 __MACHINEX86(__m64 _mm_set_pi16(short, short, short, short))
913 __MACHINEX86(__m64 _mm_set_pi32(int, int))
914 __MACHINEX86(__m64 _mm_set_pi8(char, char, char, char, char, char, char, char))
915 __MACHINEX86_X64(__m128 _mm_set_ps(float, float, float, float))
916 __MACHINEX86_X64(__m128 _mm_set_ps1(float))
917 __MACHINEX86_X64(__m128d _mm_set_sd(double))
918 __MACHINEX86_X64(__m128 _mm_set_ss(float))
919 __MACHINEX86_X64(void _mm_setcsr(unsigned int))
920 __MACHINEX86_X64(__m128i _mm_setl_epi64(__m128i))
921 __MACHINEX86_X64(__m128i _mm_setr_epi16(short, short, short, short, short, short, short, short))
922 __MACHINEX86_X64(__m128i _mm_setr_epi32(int, int, int, int))
923 __MACHINEX86(__m128i _mm_setr_epi64(__m64, __m64))
924 __MACHINEX86_X64(__m128i _mm_setr_epi8(char, char, char, char, char, char, char, char, char, char, char, char, char, char, char, char))
925 __MACHINEX86_X64(__m128d _mm_setr_pd(double, double))
926 __MACHINEX86(__m64 _mm_setr_pi16(short, short, short, short))
927 __MACHINEX86(__m64 _mm_setr_pi32(int, int))
928 __MACHINEX86(__m64 _mm_setr_pi8(char, char, char, char, char, char, char, char))
929 __MACHINEX86_X64(__m128 _mm_setr_ps(float, float, float, float))
930 __MACHINEX86_X64(__m128d _mm_setzero_pd(void))
931 __MACHINEX86_X64(__m128 _mm_setzero_ps(void))
932 __MACHINEX86_X64(__m128i _mm_setzero_si128(void))
933 __MACHINEX86(__m64 _mm_setzero_si64(void))
934 __MACHINEX86_X64(void _mm_sfence(void))
/*
** _mm_shuffle*, _mm_sign_*, _mm_sll*/_mm_slli_*, _mm_sqrt_*,
** _mm_sra*/_mm_srai_* and _mm_srl*/_mm_srli_* declarations.  Every entry is
** __MACHINEX86_X64 ("x86 and x64 only" in the legend at the top of this
** header).
**
** In the shift families the i-suffixed names (_mm_slli_*, _mm_srai_*,
** _mm_srli_*) take an int second operand where the unsuffixed names take a
** second __m128i.  Note that _mm_shuffle_ps declares its last operand as
** unsigned int, unlike the int used by the other shuffle prototypes here.
*/
935 __MACHINEX86_X64(__m128i _mm_shuffle_epi32(__m128i, int))
936 __MACHINEX86_X64(__m128i _mm_shuffle_epi8(__m128i, __m128i))
937 __MACHINEX86_X64(__m128d _mm_shuffle_pd(__m128d, __m128d, int))
938 __MACHINEX86_X64(__m64 _mm_shuffle_pi8(__m64, __m64))
939 __MACHINEX86_X64(__m128 _mm_shuffle_ps(__m128, __m128, unsigned int))
940 __MACHINEX86_X64(__m128i _mm_shufflehi_epi16(__m128i, int))
941 __MACHINEX86_X64(__m128i _mm_shufflelo_epi16(__m128i, int))
942 __MACHINEX86_X64(__m128i _mm_sign_epi16(__m128i, __m128i))
943 __MACHINEX86_X64(__m128i _mm_sign_epi32(__m128i, __m128i))
944 __MACHINEX86_X64(__m128i _mm_sign_epi8(__m128i, __m128i))
945 __MACHINEX86_X64(__m64 _mm_sign_pi16(__m64, __m64))
946 __MACHINEX86_X64(__m64 _mm_sign_pi32(__m64, __m64))
947 __MACHINEX86_X64(__m64 _mm_sign_pi8(__m64, __m64))
948 __MACHINEX86_X64(__m128i _mm_sll_epi16(__m128i, __m128i))
949 __MACHINEX86_X64(__m128i _mm_sll_epi32(__m128i, __m128i))
950 __MACHINEX86_X64(__m128i _mm_sll_epi64(__m128i, __m128i))
951 __MACHINEX86_X64(__m128i _mm_slli_epi16(__m128i, int))
952 __MACHINEX86_X64(__m128i _mm_slli_epi32(__m128i, int))
953 __MACHINEX86_X64(__m128i _mm_slli_epi64(__m128i, int))
954 __MACHINEX86_X64(__m128i _mm_slli_si128(__m128i, int))
955 __MACHINEX86_X64(__m128d _mm_sqrt_pd(__m128d))
956 __MACHINEX86_X64(__m128 _mm_sqrt_ps(__m128))
957 __MACHINEX86_X64(__m128d _mm_sqrt_sd(__m128d, __m128d))
958 __MACHINEX86_X64(__m128 _mm_sqrt_ss(__m128))
959 __MACHINEX86_X64(__m128i _mm_sra_epi16(__m128i, __m128i))
960 __MACHINEX86_X64(__m128i _mm_sra_epi32(__m128i, __m128i))
961 __MACHINEX86_X64(__m128i _mm_srai_epi16(__m128i, int))
962 __MACHINEX86_X64(__m128i _mm_srai_epi32(__m128i, int))
963 __MACHINEX86_X64(__m128i _mm_srl_epi16(__m128i, __m128i))
964 __MACHINEX86_X64(__m128i _mm_srl_epi32(__m128i, __m128i))
965 __MACHINEX86_X64(__m128i _mm_srl_epi64(__m128i, __m128i))
966 __MACHINEX86_X64(__m128i _mm_srli_epi16(__m128i, int))
967 __MACHINEX86_X64(__m128i _mm_srli_epi32(__m128i, int))
968 __MACHINEX86_X64(__m128i _mm_srli_epi64(__m128i, int))
969 __MACHINEX86_X64(__m128i _mm_srli_si128(__m128i, int))
/*
** _mm_store* and _mm_stream_* declarations.  Apart from
** _mm_stream_load_si128, which returns __m128i, every prototype returns void
** and takes a destination pointer followed by the value.
**
** _mm_stream_pi (uses __m64) is __MACHINEX86 and _mm_stream_si64x (uses
** __int64) is __MACHINEX64; every other entry is __MACHINEX86_X64.  See the
** legend at the top of this header for the macro meanings.
*/
970 __MACHINEX86_X64(void _mm_store1_pd(double *, __m128d))
971 __MACHINEX86_X64(void _mm_store_pd(double *, __m128d))
972 __MACHINEX86_X64(void _mm_store_ps(float *, __m128))
973 __MACHINEX86_X64(void _mm_store_ps1(float *, __m128))
974 __MACHINEX86_X64(void _mm_store_sd(double *, __m128d))
975 __MACHINEX86_X64(void _mm_store_si128(__m128i *, __m128i))
976 __MACHINEX86_X64(void _mm_store_ss(float *, __m128))
977 __MACHINEX86_X64(void _mm_storeh_pd(double *, __m128d))
978 __MACHINEX86_X64(void _mm_storeh_pi(__m64 *, __m128))
979 __MACHINEX86_X64(void _mm_storel_epi64(__m128i *, __m128i))
980 __MACHINEX86_X64(void _mm_storel_pd(double *, __m128d))
981 __MACHINEX86_X64(void _mm_storel_pi(__m64 *, __m128))
982 __MACHINEX86_X64(void _mm_storer_pd(double *, __m128d))
983 __MACHINEX86_X64(void _mm_storer_ps(float *, __m128))
984 __MACHINEX86_X64(void _mm_storeu_pd(double *, __m128d))
985 __MACHINEX86_X64(void _mm_storeu_ps(float *, __m128))
986 __MACHINEX86_X64(void _mm_storeu_si128(__m128i *, __m128i))
987 __MACHINEX86_X64(__m128i _mm_stream_load_si128(__m128i *))
988 __MACHINEX86_X64(void _mm_stream_pd(double *, __m128d))
989 __MACHINEX86(void _mm_stream_pi(__m64 *, __m64))
990 __MACHINEX86_X64(void _mm_stream_ps(float *, __m128))
991 __MACHINEX86_X64(void _mm_stream_sd(double *, __m128d))
992 __MACHINEX86_X64(void _mm_stream_si128(__m128i *, __m128i))
993 __MACHINEX86_X64(void _mm_stream_si32(int *, int))
994 __MACHINEX64(void _mm_stream_si64x(__int64 *, __int64))
995 __MACHINEX86_X64(void _mm_stream_ss(float *, __m128))
/*
** _mm_sub*, _mm_subs_*, _mm_test*_si128, _mm_ucomi*, _mm_unpackhi_*,
** _mm_unpacklo_* and _mm_xor_* declarations.
**
** _mm_sub_si64 (the only __m64 prototype in this group) is __MACHINEX86
** ("x86 only" in the legend at the top of this header); every other entry is
** __MACHINEX86_X64.  The _mm_test*_si128 and _mm_ucomi* prototypes take two
** vectors and return int; the rest return a vector of the operand type.
*/
996 __MACHINEX86_X64(__m128i _mm_sub_epi16(__m128i, __m128i))
997 __MACHINEX86_X64(__m128i _mm_sub_epi32(__m128i, __m128i))
998 __MACHINEX86_X64(__m128i _mm_sub_epi64(__m128i, __m128i))
999 __MACHINEX86_X64(__m128i _mm_sub_epi8(__m128i, __m128i))
1000 __MACHINEX86_X64(__m128d _mm_sub_pd(__m128d, __m128d))
1001 __MACHINEX86_X64(__m128 _mm_sub_ps(__m128, __m128))
1002 __MACHINEX86_X64(__m128d _mm_sub_sd(__m128d, __m128d))
1003 __MACHINEX86(__m64 _mm_sub_si64(__m64, __m64))
1004 __MACHINEX86_X64(__m128 _mm_sub_ss(__m128, __m128))
1005 __MACHINEX86_X64(__m128i _mm_subs_epi16(__m128i, __m128i))
1006 __MACHINEX86_X64(__m128i _mm_subs_epi8(__m128i, __m128i))
1007 __MACHINEX86_X64(__m128i _mm_subs_epu16(__m128i, __m128i))
1008 __MACHINEX86_X64(__m128i _mm_subs_epu8(__m128i, __m128i))
1009 __MACHINEX86_X64(int _mm_testc_si128(__m128i, __m128i))
1010 __MACHINEX86_X64(int _mm_testnzc_si128(__m128i, __m128i))
1011 __MACHINEX86_X64(int _mm_testz_si128(__m128i, __m128i))
1012 __MACHINEX86_X64(int _mm_ucomieq_sd(__m128d, __m128d))
1013 __MACHINEX86_X64(int _mm_ucomieq_ss(__m128, __m128))
1014 __MACHINEX86_X64(int _mm_ucomige_sd(__m128d, __m128d))
1015 __MACHINEX86_X64(int _mm_ucomige_ss(__m128, __m128))
1016 __MACHINEX86_X64(int _mm_ucomigt_sd(__m128d, __m128d))
1017 __MACHINEX86_X64(int _mm_ucomigt_ss(__m128, __m128))
1018 __MACHINEX86_X64(int _mm_ucomile_sd(__m128d, __m128d))
1019 __MACHINEX86_X64(int _mm_ucomile_ss(__m128, __m128))
1020 __MACHINEX86_X64(int _mm_ucomilt_sd(__m128d, __m128d))
1021 __MACHINEX86_X64(int _mm_ucomilt_ss(__m128, __m128))
1022 __MACHINEX86_X64(int _mm_ucomineq_sd(__m128d, __m128d))
1023 __MACHINEX86_X64(int _mm_ucomineq_ss(__m128, __m128))
1024 __MACHINEX86_X64(__m128i _mm_unpackhi_epi16(__m128i, __m128i))
1025 __MACHINEX86_X64(__m128i _mm_unpackhi_epi32(__m128i, __m128i))
1026 __MACHINEX86_X64(__m128i _mm_unpackhi_epi64(__m128i, __m128i))
1027 __MACHINEX86_X64(__m128i _mm_unpackhi_epi8(__m128i, __m128i))
1028 __MACHINEX86_X64(__m128d _mm_unpackhi_pd(__m128d, __m128d))
1029 __MACHINEX86_X64(__m128 _mm_unpackhi_ps(__m128, __m128))
1030 __MACHINEX86_X64(__m128i _mm_unpacklo_epi16(__m128i, __m128i))
1031 __MACHINEX86_X64(__m128i _mm_unpacklo_epi32(__m128i, __m128i))
1032 __MACHINEX86_X64(__m128i _mm_unpacklo_epi64(__m128i, __m128i))
1033 __MACHINEX86_X64(__m128i _mm_unpacklo_epi8(__m128i, __m128i))
1034 __MACHINEX86_X64(__m128d _mm_unpacklo_pd(__m128d, __m128d))
1035 __MACHINEX86_X64(__m128 _mm_unpacklo_ps(__m128, __m128))
1036 __MACHINEX86_X64(__m128d _mm_xor_pd(__m128d, __m128d))
1037 __MACHINEX86_X64(__m128 _mm_xor_ps(__m128, __m128))
1038 __MACHINEX86_X64(__m128i _mm_xor_si128(__m128i, __m128i))
/*
** Final group of declarations: _mul128/_umul128, the _rotl*/_rotr* family,
** _setjmp/_setjmpex, _rsm, _lgdt/_sgdt, _clac/_stac and the
** _addcarry_u*/_subborrow_u* family.
**
** Availability (macro meanings are in the legend at the top of this header):
**   - __MACHINE (everything): the _rotl*/_rotr* family and _setjmp;
**   - __MACHINEARM_X64 (ARM and x64 only): _setjmpex;
**   - __MACHINEX64 (x64 only): _mul128, _umul128, _addcarry_u64 and
**     _subborrow_u64;
**   - __MACHINEX86_X64: the remaining entries.
**
** _mul128, _umul128 and the rotate prototypes name their parameters
** (_Multiplier, _Multiplicand, _HighProduct, _Value, _Shift).  Each
** _addcarry_u* / _subborrow_u* prototype takes an unsigned char, two operands
** of the named width and a pointer to that width, and returns unsigned char.
*/
1039 __MACHINEX64(__int64 _mul128(__int64 _Multiplier, __int64 _Multiplicand, __int64 * _HighProduct))
1040 __MACHINE(unsigned int __cdecl _rotl(_In_ unsigned int _Value, _In_ int _Shift))
1041 __MACHINE(unsigned short __cdecl _rotl16(unsigned short _Value, unsigned char _Shift))
1042 __MACHINE(unsigned __int64 __cdecl _rotl64(_In_ unsigned __int64 _Value, _In_ int _Shift))
1043 __MACHINE(unsigned char __cdecl _rotl8(unsigned char _Value, unsigned char _Shift))
1044 __MACHINE(unsigned int __cdecl _rotr(_In_ unsigned int _Value, _In_ int _Shift))
1045 __MACHINE(unsigned short __cdecl _rotr16(unsigned short _Value, unsigned char _Shift))
1046 __MACHINE(unsigned __int64 __cdecl _rotr64(_In_ unsigned __int64 _Value, _In_ int _Shift))
1047 __MACHINE(unsigned char __cdecl _rotr8(unsigned char _Value, unsigned char _Shift))
1048 __MACHINE(int __cdecl _setjmp(jmp_buf))
1049 __MACHINEARM_X64(int __cdecl _setjmpex(jmp_buf))
1050 __MACHINEX64(unsigned __int64 _umul128(unsigned __int64 _Multiplier, unsigned __int64 _Multiplicand, unsigned __int64 * _HighProduct))
1051 __MACHINEX86_X64(void _rsm(void))
1052 __MACHINEX86_X64(void _lgdt(void *))
1053 __MACHINEX86_X64(void _sgdt(void *))
1054 __MACHINEX86_X64(void _clac(void))
1055 __MACHINEX86_X64(void _stac(void))
1056 __MACHINEX86_X64(unsigned char __cdecl _addcarry_u8(unsigned char, unsigned char, unsigned char, unsigned char *))
1057 __MACHINEX86_X64(unsigned char __cdecl _subborrow_u8(unsigned char, unsigned char, unsigned char, unsigned char *))
1058 __MACHINEX86_X64(unsigned char __cdecl _addcarry_u16(unsigned char, unsigned short, unsigned short, unsigned short *))
1059 __MACHINEX86_X64(unsigned char __cdecl _subborrow_u16(unsigned char, unsigned short, unsigned short, unsigned short *))
1060 __MACHINEX86_X64(unsigned char __cdecl _addcarry_u32(unsigned char, unsigned int, unsigned int, unsigned int *))
1061 __MACHINEX86_X64(unsigned char __cdecl _subborrow_u32(unsigned char, unsigned int, unsigned int, unsigned int *))
1062 __MACHINEX64(unsigned char __cdecl _addcarry_u64(unsigned char, unsigned __int64, unsigned __int64, unsigned __int64 *))
1063 __MACHINEX64(unsigned char __cdecl _subborrow_u64(unsigned char, unsigned __int64, unsigned __int64, unsigned __int64 *))
1064 
/*
** Close the extern "C" block that the top of this header opens when compiling
** as C++, then close the __midl and RC_INVOKED guards that wrap the header.
*/
1065 #if defined (__cplusplus)
1066 }
1067 #endif /* defined (__cplusplus) */
1068 #endif /* __midl */
1069 #endif /* RC_INVOKED */
__m128i _mm_sub_epi32(__m128i _A, __m128i _B)
__m128i _mm_adds_epi8(__m128i _A, __m128i _B)
__m128i _mm_cvttps_epi32(__m128 _A)
__m64 _m_pslld(__m64 _M, __m64 _Count)
__m128 _mm_set_ps(float _A, float _B, float _C, float _D)
int _mm_movemask_epi8(__m128i _A)
__m128d _mm_round_sd(__m128d dst, __m128d val, int iRoundMode)
void _mm_store_sd(double *_Dp, __m128d _A)
__m64 _m_psadbw(__m64, __m64)
__m128i _mm_mulhi_epi16(__m128i _A, __m128i _B)
__m128i _mm_hsub_epi16(__m128i a, __m128i b)
__m128d _mm_cmpngt_pd(__m128d _A, __m128d _B)
__m128 _mm_insert_ps(__m128 dst, __m128 src, const int ndx)
int _mm_comineq_sd(__m128d _A, __m128d _B)
int _mm_extract_epi16(__m128i _A, int _Imm)
__m64 _m_punpckhwd(__m64 _MM1, __m64 _MM2)
__m128i _mm_xor_si128(__m128i _A, __m128i _B)
__m64 _m_pslldi(__m64 _M, int _Count)
__m128 _mm_and_ps(__m128 _A, __m128 _B)
__m128d _mm_move_sd(__m128d _A, __m128d _B)
__m64 _m_paddb(__m64 _MM1, __m64 _MM2)
void _mm_store_ps1(float *_V, __m128 _A)
__m128i _mm_hadd_epi16(__m128i a, __m128i b)
__m128 _mm_setr_ps(float _A, float _B, float _C, float _D)
__m128i _mm_loadu_si128(__m128i const *_P)
unsigned int _mm_crc32_u8(unsigned int crc, unsigned char v)
__m64 _mm_set_pi16(short _S3, short _S2, short _S1, short _S0)
__m128d _mm_load_sd(double const *_Dp)
int _mm_ucomilt_ss(__m128 _A, __m128 _B)
__m128i _mm_sign_epi32(__m128i a, __m128i b)
__m128i _mm_srai_epi32(__m128i _A, int _Count)
__m128d _mm_cmpord_sd(__m128d _A, __m128d _B)
__m128 _mm_movehl_ps(__m128, __m128)
__m128 _mm_rsqrt_ss(__m128 _A)
__m128 _mm_dp_ps(__m128 val1, __m128 val2, const int mask)
__m128 _mm_sqrt_ps(__m128 _A)
__m128 _mm_max_ps(__m128 _A, __m128 _B)
int _mm_cmpistri(__m128i a, __m128i b, const int mode)
__m128i _mm_packs_epi32(__m128i _A, __m128i _B)
_CRTIMP _In_ int _Value
Definition: setjmp.h:190
__m128d _mm_min_pd(__m128d _A, __m128d _B)
__m128d _mm_cmpeq_pd(__m128d _A, __m128d _B)
int _mm_cmpistrz(__m128i a, __m128i b, const int mode)
__m128i _mm_sra_epi16(__m128i _A, __m128i _Count)
__m128 _mm_cmpgt_ss(__m128 _A, __m128 _B)
__m128 _mm_cmpngt_ps(__m128 _A, __m128 _B)
__m64 _mm_set1_pi16(short _S)
int _mm_ucomilt_sd(__m128d _A, __m128d _B)
__m64 _mm_cvt_ps2pi(__m128 _A)
__m128i _mm_cvtepi32_epi64(__m128i intValues)
__m64 _mm_setr_pi16(short _S3, short _S2, short _S1, short _S0)
__m128d _mm_cmpneq_sd(__m128d _A, __m128d _B)
int _mm_comieq_sd(__m128d _A, __m128d _B)
__m128i _mm_minpos_epu16(__m128i shortValues)
void _mm_stream_pi(__m64 *, __m64)
__m64 _m_pmullw(__m64 _MM1, __m64 _MM2)
int _mm_comigt_ss(__m128 _A, __m128 _B)
__m128d _mm_loadu_pd(double const *_Dp)
__m64 _m_pfrcp(__m64)
__m128i _mm_cvtepi8_epi16(__m128i byteValues)
void _mm_storeu_ps(float *_V, __m128 _A)
__m128i _mm_cvtepu32_epi64(__m128i intValues)
int _mm_ucomigt_sd(__m128d _A, __m128d _B)
__m128i _mm_min_epu32(__m128i val1, __m128i val2)
__m128d _mm_cvtsi32_sd(__m128d _A, int _B)
__m64 _m_punpckhdq(__m64 _MM1, __m64 _MM2)
__m128i _mm_blendv_epi8(__m128i v1, __m128i v2, __m128i mask)
__m64 _m_pfrsqrt(__m64)
int _mm_ucomigt_ss(__m128 _A, __m128 _B)
__m128d _mm_dp_pd(__m128d val1, __m128d val2, const int mask)
__m128 _mm_cmpord_ss(__m128 _A, __m128 _B)
__m128d _mm_cmplt_pd(__m128d _A, __m128d _B)
__m128 _mm_blendv_ps(__m128 v1, __m128 v2, __m128 v3)
__m128i _mm_move_epi64(__m128i _Q)
__m128i _mm_cmpgt_epi32(__m128i _A, __m128i _B)
__m128d _mm_cmpgt_sd(__m128d _A, __m128d _B)
__m64 _m_pfpnacc(__m64, __m64)
__m64 _m_pinsrw(__m64, int, int)
__m128i _mm_set1_epi64(__m64 _Q)
int _mm_cmpestrz(__m128i a, int la, __m128i b, int lb, const int mode)
void _mm_pause(void)
__m128i _mm_set_epi64(__m64 _Q1, __m64 _Q0)
__m128 _mm_cmpord_ps(__m128 _A, __m128 _B)
__m128d _mm_set1_pd(double _A)
__m128d _mm_unpacklo_pd(__m128d _A, __m128d _B)
void _m_prefetchw(volatile const void *_Source)
__m64 _m_pfmin(__m64, __m64)
int _mm_ucomieq_sd(__m128d _A, __m128d _B)
void _mm_store1_pd(double *_Dp, __m128d _A)
__m64 _mm_cvtt_ps2pi(__m128 _A)
__m64 _m_punpcklbw(__m64 _MM1, __m64 _MM2)
__m64 _mm_add_si64(__m64 _A, __m64 _B)
__m128d _mm_cmple_pd(__m128d _A, __m128d _B)
__m128i _mm_max_epi16(__m128i _A, __m128i _B)
__m128d _mm_cmpunord_sd(__m128d _A, __m128d _B)
__m128d _mm_cmpge_sd(__m128d _A, __m128d _B)
__m128i _mm_shuffle_epi8(__m128i a, __m128i b)
__m128d
Definition: emmintrin.h:48
__m64 _mm_sign_pi8(__m64 a, __m64 b)
__m128i _mm_stream_load_si128(__m128i *v1)
__m128i _mm_unpacklo_epi16(__m128i _A, __m128i _B)
__m64 _m_psrlwi(__m64 _M, int _Count)
__m64 _mm_hsub_pi16(__m64 a, __m64 b)
__m128 _mm_round_ss(__m128 dst, __m128 val, int iRoundMode)
int _mm_cmpestra(__m128i a, int la, __m128i b, int lb, const int mode)
__m128 _mm_sqrt_ss(__m128 _A)
int _mm_comige_sd(__m128d _A, __m128d _B)
__m128i _mm_cvtepi16_epi32(__m128i shortValues)
__m64 _m_psubw(__m64 _MM1, __m64 _MM2)
__m128i _mm_add_epi64(__m128i _A, __m128i _B)
__m128i _mm_set1_epi16(short _W)
int _mm_comigt_sd(__m128d _A, __m128d _B)
__m64 _m_pand(__m64 _MM1, __m64 _MM2)
__m128 _mm_blend_ps(__m128 v1, __m128 v2, const int mask)
int _mm_testnzc_si128(__m128i mask, __m128i s2)
__m128i _mm_set1_epi8(char _B)
__m128i _mm_setl_epi64(__m128i _Q)
__m64 _m_pshufw(__m64, int)
__m128i _mm_srli_epi16(__m128i _A, int _Count)
__m128d _mm_loadh_pd(__m128d _A, double const *_Dp)
__m64 _m_psllw(__m64 _M, __m64 _Count)
__m64 _m_pfnacc(__m64, __m64)
__m128d _mm_shuffle_pd(__m128d _A, __m128d _B, int _I)
__m128 _mm_round_ps(__m128 val, int iRoundMode)
__m64 _m_pfadd(__m64, __m64)
__m128i _mm_cmplt_epi8(__m128i _A, __m128i _B)
int _mm_cvtsd_si32(__m128d _A)
__m128i _mm_set_epi16(short _W7, short _W6, short _W5, short _W4, short _W3, short _W2, short _W1, short _W0)
__m128i _mm_packs_epi16(__m128i _A, __m128i _B)
__m64 _m_pavgusb(__m64, __m64)
__m128 _mm_addsub_ps(__m128 a, __m128 b)
void _m_femms(void)
__m128i _mm_cmpistrm(__m128i a, __m128i b, const int mode)
__m128 _mm_cvt_pi2ps(__m128, __m64)
__m128 _mm_shuffle_ps(__m128 _A, __m128 _B, unsigned int _Imm8)
__m64 _mm_set1_pi8(char _B)
__m128i _mm_add_epi8(__m128i _A, __m128i _B)
void _mm_storeh_pi(__m64 *, __m128)
__m64 _m_psrad(__m64 _M, __m64 _Count)
#define __MACHINEWVMPURE(X)
Definition: intrin.h:69
__m128i _mm_setr_epi8(char _B15, char _B14, char _B13, char _B12, char _B11, char _B10, char _B9, char _B8, char _B7, char _B6, char _B5, char _B4, char _B3, char _B2, char _B1, char _B0)
__m128d _mm_set_pd(double _Z, double _Y)
__m128d _mm_cvtpi32_pd(__m64 _A)
int _mm_comile_ss(__m128 _A, __m128 _B)
__m64 _m_pfrsqit1(__m64, __m64)
__m128 _mm_hsub_ps(__m128 a, __m128 b)
__m128i _mm_srl_epi32(__m128i _A, __m128i _Count)
int _mm_comige_ss(__m128 _A, __m128 _B)
__m128i _mm_set1_epi32(int _I)
__m128 _mm_cmpngt_ss(__m128 _A, __m128 _B)
__m64 _mm_hsub_pi32(__m64 a, __m64 b)
_Check_return_ unsigned short __cdecl _byteswap_ushort(_In_ unsigned short _Short)
__m128i _mm_cvtepu8_epi16(__m128i byteValues)
void _m_empty(void)
__m64 _m_psubusb(__m64 _MM1, __m64 _MM2)
void _m_maskmovq(__m64, __m64, char *)
__m128 _mm_loadu_ps(float const *_A)
__m128i _mm_hsubs_epi16(__m128i a, __m128i b)
__m128i _mm_sra_epi32(__m128i _A, __m128i _Count)
__m128i _mm_setzero_si128(void)
int _mm_ucomineq_ss(__m128 _A, __m128 _B)
__m64 _mm_set_pi32(int _I1, int _I0)
__m128i _mm_min_epi32(__m128i val1, __m128i val2)
int _mm_comineq_ss(__m128 _A, __m128 _B)
__m128i _mm_srli_epi32(__m128i _A, int _Count)
__m64 _m_psubsb(__m64 _MM1, __m64 _MM2)
__m128d _mm_cmpnge_sd(__m128d _A, __m128d _B)
__m128d _mm_cmplt_sd(__m128d _A, __m128d _B)
__m128i _mm_max_epu32(__m128i val1, __m128i val2)
__m128i _mm_set_epi32(int _I3, int _I2, int _I1, int _I0)
__m128d _mm_movedup_pd(__m128d a)
__m128i _mm_sll_epi16(__m128i _A, __m128i _Count)
__m64 _m_psrlw(__m64 _M, __m64 _Count)
int _mm_extract_epi32(__m128i src, const int ndx)
__m64 _m_punpckhbw(__m64 _MM1, __m64 _MM2)
__m128 _mm_cmple_ps(__m128 _A, __m128 _B)
_Check_return_ unsigned long __cdecl _lrotr(_In_ unsigned long _Val, _In_ int _Shift)
__m128i _mm_avg_epu16(__m128i _A, __m128i _B)
__m64 _mm_cvtpd_pi32(__m128d _A)
void _mm_monitor(void const *p, unsigned extensions, unsigned hints)
__m64 _mm_hsubs_pi16(__m64 a, __m64 b)
__m64 _m_pfrcpit1(__m64, __m64)
__m128i _mm_insert_epi16(__m128i _A, int _B, int _Imm)
__m128i _mm_cvtepu16_epi32(__m128i shortValues)
__m128d _mm_load_pd(double const *_Dp)
__m128i _mm_min_epi16(__m128i _A, __m128i _B)
__m64 _m_psrldi(__m64 _M, int _Count)
unsigned __int64 __cdecl _rotl64(_In_ unsigned __int64 _Val, _In_ int _Shift)
__m128 _mm_add_ps(__m128 _A, __m128 _B)
__m64 _mm_hadd_pi16(__m64 a, __m64 b)
__m64 _m_pfsub(__m64, __m64)
#define __MACHINECALL_CDECL_OR_DEFAULT
Definition: intrin.h:103
__m128i _mm_mulhrs_epi16(__m128i a, __m128i b)
__m64 _m_psrawi(__m64 _M, int _Count)
void _mm_mfence(void)
__m64 _m_pcmpeqw(__m64 _MM1, __m64 _MM2)
__m128i _mm_unpacklo_epi32(__m128i _A, __m128i _B)
__m64 _mm_movepi64_pi64(__m128i _Q)
void _mm_mwait(unsigned extensions, unsigned hints)
__m64 _mm_set_pi8(char _B7, char _B6, char _B5, char _B4, char _B3, char _B2, char _B1, char _B0)
__m128i _mm_adds_epu8(__m128i _A, __m128i _B)
__m64 _m_pfrcpit2(__m64, __m64)
__m128d _mm_sqrt_sd(__m128d _A, __m128d _B)
int _mm_cmpistra(__m128i a, __m128i b, const int mode)
int _mm_extract_epi8(__m128i src, const int ndx)
__m64 _m_psubusw(__m64 _MM1, __m64 _MM2)
int _m_pmovmskb(__m64)
__m128 _mm_cvtpd_ps(__m128d _A)
__m128i _mm_cvtepi8_epi32(__m128i byteValues)
int _mm_ucomile_sd(__m128d _A, __m128d _B)
__m64 _mm_maddubs_pi16(__m64 a, __m64 b)
__m128 _mm_hadd_ps(__m128 a, __m128 b)
__m128i _mm_sll_epi32(__m128i _A, __m128i _Count)
_JBTYPE jmp_buf[_JBLEN]
Definition: setjmp.h:167
void _mm_store_ss(float *_V, __m128 _A)
__m128d _mm_loaddup_pd(double const *dp)
__m128i _mm_unpackhi_epi16(__m128i _A, __m128i _B)
__m128 _mm_sub_ps(__m128 _A, __m128 _B)
__m128 _mm_div_ps(__m128 _A, __m128 _B)
__m128d _mm_cmpnle_pd(__m128d _A, __m128d _B)
__m64 _m_psraw(__m64 _M, __m64 _Count)
__m128 _mm_set_ss(float _A)
__m64 _m_packsswb(__m64 _MM1, __m64 _MM2)
__m64 _m_paddusw(__m64 _MM1, __m64 _MM2)
__m128i _mm_slli_epi16(__m128i _A, int _Count)
int _mm_movemask_pd(__m128d _A)
__m64 _mm_hadds_pi16(__m64 a, __m64 b)
__m128d _mm_cmpngt_sd(__m128d _A, __m128d _B)
__m64 _mm_mulhrs_pi16(__m64 a, __m64 b)
int _mm_cvttsd_si32(__m128d _A)
__m128i _mm_cvtepu8_epi64(__m128i shortValues)
__m128i _mm_sad_epu8(__m128i _A, __m128i _B)
__m128i _mm_setr_epi16(short _W0, short _W1, short _W2, short _W3, short _W4, short _W5, short _W6, short _W7)
__m64 _m_psllwi(__m64 _M, int _Count)
__m64 _mm_setr_pi32(int _I1, int _I0)
__m64 _m_por(__m64 _MM1, __m64 _MM2)
__m128i _mm_cvtpd_epi32(__m128d _A)
__m128 _mm_cmplt_ss(__m128 _A, __m128 _B)
__m128i _mm_max_epu8(__m128i _A, __m128i _B)
__m128d _mm_cmpneq_pd(__m128d _A, __m128d _B)
int _mm_ucomile_ss(__m128 _A, __m128 _B)
__m64 _m_pmulhrw(__m64, __m64)
float _m_to_float(__m64)
__m64 _m_pmaddwd(__m64 _MM1, __m64 _MM2)
#define _Check_return_
Definition: sal.h:563
__m128d _mm_round_pd(__m128d val, int iRoundMode)
int _mm_comile_sd(__m128d _A, __m128d _B)
__m128i _mm_insert_epi32(__m128i dst, int s, const int ndx)
__m64 _m_pandn(__m64 _MM1, __m64 _MM2)
__m128d _mm_cmpnlt_sd(__m128d _A, __m128d _B)
__m64 _m_pi2fd(__m64)
__m128d _mm_hadd_pd(__m128d a, __m128d b)
__m64 _mm_abs_pi8(__m64 a)
#define _In_
Definition: sal.h:314
__m128d _mm_cmpnge_pd(__m128d _A, __m128d _B)
__m128d _mm_add_pd(__m128d _A, __m128d _B)
__m128d _mm_or_pd(__m128d _A, __m128d _B)
__m64 _mm_sub_si64(__m64 _A, __m64 _B)
__m128 _mm_rcp_ps(__m128 _A)
__m64 _m_punpckldq(__m64 _MM1, __m64 _MM2)
_CRTIMP __declspec(noreturn) void __cdecl terminate(void)
Definition: eh.h:55
__m64 _m_paddsw(__m64 _MM1, __m64 _MM2)
__m128i _mm_mul_epu32(__m128i _A, __m128i _B)
__m64 _m_punpcklwd(__m64 _MM1, __m64 _MM2)
__m128i _mm_min_epu8(__m128i _A, __m128i _B)
__m128 _mm_cmpeq_ps(__m128 _A, __m128 _B)
__m64 _m_psrld(__m64 _M, __m64 _Count)
__m128d _mm_cmpord_pd(__m128d _A, __m128d _B)
__m128i _mm_cmplt_epi32(__m128i _A, __m128i _B)
__m128d _mm_div_pd(__m128d _A, __m128d _B)
void _mm_setcsr(unsigned int)
__m128i _mm_min_epi8(__m128i val1, __m128i val2)
void _mm_storel_pd(double *_Dp, __m128d _A)
__m128d _mm_cvtepi32_pd(__m128i _A)
int _mm_comilt_sd(__m128d _A, __m128d _B)
__m128i _mm_slli_si128(__m128i _A, int _Imm)
__m128 _mm_cmpneq_ps(__m128 _A, __m128 _B)
__m64
Definition: mmintrin.h:42
__m128i _mm_srli_si128(__m128i _A, int _Imm)
__m64 _mm_mul_su32(__m64 _A, __m64 _B)
__m128d _mm_and_pd(__m128d _A, __m128d _B)
__m128i _mm_srl_epi16(__m128i _A, __m128i _Count)
__m64 _m_pmulhw(__m64 _MM1, __m64 _MM2)
__m64 _mm_alignr_pi8(__m64 a, __m64 b, int n)
void _mm_stream_ps(float *, __m128)
void _mm_store_pd(double *_Dp, __m128d _A)
__m128i _mm_sign_epi8(__m128i a, __m128i b)
unsigned int __cdecl _rotr(_In_ unsigned int _Val, _In_ int _Shift)
int _m_to_int(__m64 _M)
__m128i _mm_slli_epi64(__m128i _A, int _Count)
__m128i _mm_mul_epi32(__m128i a, __m128i b)
int _mm_popcnt_u32(unsigned int v)
__m128i _mm_cmpgt_epi8(__m128i _A, __m128i _B)
void _mm_clflush(void const *_P)
int _mm_ucomige_sd(__m128d _A, __m128d _B)
__m64 _m_pfacc(__m64, __m64)
__m64 _m_psubb(__m64 _MM1, __m64 _MM2)
__m64 _m_pf2id(__m64)
__m128i _mm_unpackhi_epi32(__m128i _A, __m128i _B)
__m64 _m_pfcmpeq(__m64, __m64)
__m128 _mm_andnot_ps(__m128 _A, __m128 _B)
__m128d _mm_cmpgt_pd(__m128d _A, __m128d _B)
__m128d _mm_max_pd(__m128d _A, __m128d _B)
_Check_return_ unsigned __int64 __cdecl _byteswap_uint64(_In_ unsigned __int64 _Int64)
__m64 _m_psllq(__m64 _M, __m64 _Count)
__m128 _mm_cvtepi32_ps(__m128i _A)
__m128 _mm_cmpnlt_ps(__m128 _A, __m128 _B)
__m128i _mm_cvttpd_epi32(__m128d _A)
__m128i
Definition: emmintrin.h:44
void _mm_store_si128(__m128i *_P, __m128i _B)
__m128d _mm_cmpnlt_pd(__m128d _A, __m128d _B)
__m128i _mm_srli_epi64(__m128i _A, int _Count)
__m128i _mm_maddubs_epi16(__m128i a, __m128i b)
__m64 _m_psrlq(__m64 _M, __m64 _Count)
__m128 _mm_cmpnlt_ss(__m128 _A, __m128 _B)
__m128 _mm_xor_ps(__m128 _A, __m128 _B)
__m128i _mm_unpackhi_epi64(__m128i _A, __m128i _B)
__m128i _mm_setr_epi64(__m64 _Q0, __m64 _Q1)
__m128i _mm_abs_epi16(__m128i a)
int _mm_comieq_ss(__m128 _A, __m128 _B)
__m64 _m_pmaxub(__m64, __m64)
__m128i _mm_cmpestrm(__m128i a, int la, __m128i b, int lb, const int mode)
int _mm_cvtsi128_si32(__m128i _A)
__m128d _mm_unpackhi_pd(__m128d _A, __m128d _B)
void * _InterlockedCompareExchangePointer(void *volatile *, void *, void *)
__m128
Definition: xmmintrin.h:70
__m128 _mm_load_ps1(float const *_A)
void _mm_storeu_pd(double *_Dp, __m128d _A)
__m128i _mm_cmpgt_epi16(__m128i _A, __m128i _B)
__m128i _mm_hsub_epi32(__m128i a, __m128i b)
int _mm_cmpistrc(__m128i a, __m128i b, const int mode)
void _mm_storeh_pd(double *_Dp, __m128d _A)
__m128i _mm_mullo_epi32(__m128i a, __m128i b)
__m128d _mm_load1_pd(double const *_Dp)
__m128d _mm_xor_pd(__m128d _A, __m128d _B)
int _mm_cvt_ss2si(__m128 _A)
__m128 _mm_mul_ps(__m128 _A, __m128 _B)
void _mm_sfence(void)
__m128d _mm_loadr_pd(double const *_Dp)
__m64 _m_from_float(float)
int _mm_cmpestrc(__m128i a, int la, __m128i b, int lb, const int mode)
int _mm_ucomige_ss(__m128 _A, __m128 _B)
__m128i _mm_shufflelo_epi16(__m128i _A, int _Imm)
__m128d _mm_loadl_pd(__m128d _A, double const *_Dp)
__m128i _mm_sign_epi16(__m128i a, __m128i b)
__m64 _mm_set1_pi32(int _I)
__m128i _mm_cmplt_epi16(__m128i _A, __m128i _B)
__m128i _mm_avg_epu8(__m128i _A, __m128i _B)
__m128i _mm_cvtsi32_si128(int _A)
__m128i _mm_mullo_epi16(__m128i _A, __m128i _B)
__m128i _mm_cmpeq_epi64(__m128i val1, __m128i val2)
__m128 _mm_set_ps1(float _A)
__m128d _mm_setzero_pd(void)
__m128i _mm_subs_epu8(__m128i _A, __m128i _B)
__m128i _mm_max_epi8(__m128i val1, __m128i val2)
_Check_return_ unsigned long __cdecl _lrotl(_In_ unsigned long _Val, _In_ int _Shift)
#define __MACHINE(X)
Definition: intrin.h:68
__m128 _mm_movehdup_ps(__m128 a)
#define __MACHINEARM
Definition: intrin.h:96
void _mm_storer_pd(double *_Dp, __m128d _A)
__m128 _mm_cmpneq_ss(__m128 _A, __m128 _B)
__m128i _mm_blend_epi16(__m128i v1, __m128i v2, const int mask)
__m128 _mm_cvt_si2ss(__m128, int)
__m64 _m_from_int(int _I)
unsigned int _mm_crc32_u32(unsigned int crc, unsigned int v)
int _mm_extract_ps(__m128 src, const int ndx)
__m128i _mm_cmpeq_epi16(__m128i _A, __m128i _B)
__m128i _mm_or_si128(__m128i _A, __m128i _B)
__m128i _mm_shufflehi_epi16(__m128i _A, int _Imm)
__m128i _mm_sll_epi64(__m128i _A, __m128i _Count)
__m64 _mm_setr_pi8(char _B7, char _B6, char _B5, char _B4, char _B3, char _B2, char _B1, char _B0)
__m128i _mm_cmpeq_epi32(__m128i _A, __m128i _B)
__m128i _mm_load_si128(__m128i const *_P)
__m128 _mm_add_ss(__m128 _A, __m128 _B)
__m128d _mm_blend_pd(__m128d v1, __m128d v2, const int mask)
#define __MACHINEARM_X64
Definition: intrin.h:91
__m128i _mm_adds_epu16(__m128i _A, __m128i _B)
__m128i _mm_setr_epi32(int _I0, int _I1, int _I2, int _I3)
__m128 _mm_min_ss(__m128 _A, __m128 _B)
__m128i _mm_add_epi32(__m128i _A, __m128i _B)
int _mm_cmpestro(__m128i a, int la, __m128i b, int lb, const int mode)
__m128i _mm_min_epu16(__m128i val1, __m128i val2)
__m64 _m_pi2fw(__m64)
__m128d _mm_cmpnle_sd(__m128d _A, __m128d _B)
__m128 _mm_min_ps(__m128 _A, __m128 _B)
__m64 _m_pcmpgtw(__m64 _MM1, __m64 _MM2)
__m128i _mm_unpacklo_epi8(__m128i _A, __m128i _B)
__m128i _mm_cvtepu8_epi32(__m128i byteValues)
void _m_prefetch(void *)
int _mm_ucomieq_ss(__m128 _A, __m128 _B)
__m64 _m_pswapd(__m64)
void _mm_storel_epi64(__m128i *_P, __m128i _Q)
__m128i _mm_cvtepi16_epi64(__m128i shortValues)
int _mm_comilt_ss(__m128 _A, __m128 _B)
__m128d _mm_blendv_pd(__m128d v1, __m128d v2, __m128d v3)
int _mm_cmpestri(__m128i a, int la, __m128i b, int lb, const int mode)
__m128 _mm_cmpnle_ss(__m128 _A, __m128 _B)
__m128 _mm_cmpgt_ps(__m128 _A, __m128 _B)
void _mm_store_ps(float *_V, __m128 _A)
int _mm_movemask_ps(__m128 _A)
__m64 _mm_sign_pi16(__m64 a, __m64 b)
__m64 _m_paddw(__m64 _MM1, __m64 _MM2)
__m128 _mm_setzero_ps(void)
__m64 _m_pminub(__m64, __m64)
__m64 _mm_abs_pi32(__m64 a)
__m128 _mm_moveldup_ps(__m128 a)
__m64 _mm_setzero_si64(void)
#define __MACHINEX86_X64
Definition: intrin.h:86
#define __MACHINEX86
Definition: intrin.h:76
__m64 _m_pcmpgtb(__m64 _MM1, __m64 _MM2)
__m64 _m_pavgw(__m64, __m64)
__m128i _mm_max_epi32(__m128i val1, __m128i val2)
long __cdecl _InterlockedDecrement(long volatile *)
__m64 _mm_abs_pi16(__m64 a)
__m128d _mm_sub_pd(__m128d _A, __m128d _B)
__m128 _mm_rcp_ss(__m128 _A)
unsigned int _mm_crc32_u16(unsigned int crc, unsigned short v)
__m64 _mm_hadd_pi32(__m64 a, __m64 b)
int _mm_testc_si128(__m128i mask, __m128i val)
__m128 _mm_cmplt_ps(__m128 _A, __m128 _B)
__m128d _mm_sub_sd(__m128d _A, __m128d _B)
unsigned int __cdecl _rotl(_In_ unsigned int _Val, _In_ int _Shift)
__m128i _mm_abs_epi32(__m128i a)
__m128d _mm_cvtss_sd(__m128d _A, __m128 _B)
__m128i _mm_cvtepu16_epi64(__m128i shortValues)
__m64 _m_pmulhuw(__m64, __m64)
__m128 _mm_move_ss(__m128 _A, __m128 _B)
__m128i _mm_slli_epi32(__m128i _A, int _Count)
__m128 _mm_sub_ss(__m128 _A, __m128 _B)
__m128i _mm_movpi64_epi64(__m64 _Q)
__m128i _mm_sub_epi16(__m128i _A, __m128i _B)
void _mm_stream_pd(double *_Dp, __m128d _A)
__m64 _m_pcmpeqb(__m64 _MM1, __m64 _MM2)
__m128d _mm_cmple_sd(__m128d _A, __m128d _B)
__m128 _mm_loadr_ps(float const *_A)
__m64 _m_pfmul(__m64, __m64)
__m128 _mm_cmpnle_ps(__m128 _A, __m128 _B)
__m128 _mm_cmpnge_ps(__m128 _A, __m128 _B)
__m128i _mm_hadd_epi32(__m128i a, __m128i b)
__m128d _mm_mul_sd(__m128d _A, __m128d _B)
__m128 _mm_cmpeq_ss(__m128 _A, __m128 _B)
__m128 _mm_unpackhi_ps(__m128 _A, __m128 _B)
__m64 _m_paddusb(__m64 _MM1, __m64 _MM2)
__m64 _m_packuswb(__m64 _MM1, __m64 _MM2)
int _mm_ucomineq_sd(__m128d _A, __m128d _B)
__m128 _mm_unpacklo_ps(__m128 _A, __m128 _B)
__m128i _mm_subs_epu16(__m128i _A, __m128i _B)
__m128i _mm_abs_epi8(__m128i a)
__m128 _mm_div_ss(__m128 _A, __m128 _B)
__m128i _mm_sub_epi8(__m128i _A, __m128i _B)
void _mm_storel_pi(__m64 *, __m128)
__m128i _mm_shuffle_epi32(__m128i _A, int _Imm)
__m64 _m_pfcmpgt(__m64, __m64)
__m128 _mm_rsqrt_ps(__m128 _A)
__m64 _m_pcmpeqd(__m64 _MM1, __m64 _MM2)
__m128i _mm_alignr_epi8(__m128i a, __m128i b, int n)
__m64 _m_paddd(__m64 _MM1, __m64 _MM2)
void _mm_storeu_si128(__m128i *_P, __m128i _B)
__m128i _mm_unpacklo_epi64(__m128i _A, __m128i _B)
__m128 _mm_max_ss(__m128 _A, __m128 _B)
_CRT_MANAGED_FP_DEPRECATE _In_ unsigned int _Mask
Definition: float.h:120
void _mm_stream_si32(int *_P, int _I)
__m128 _mm_or_ps(__m128 _A, __m128 _B)
__m128 _mm_cmple_ss(__m128 _A, __m128 _B)
__m128i _mm_andnot_si128(__m128i _A, __m128i _B)
__m64 _mm_cvttpd_pi32(__m128d _A)
__m128d _mm_max_sd(__m128d _A, __m128d _B)
void _mm_prefetch(char const *_A, int _Sel)
__m64 _m_pavgb(__m64, __m64)
int _mm_cmpestrs(__m128i a, int la, __m128i b, int lb, const int mode)
__m128d _mm_div_sd(__m128d _A, __m128d _B)
long __cdecl _InterlockedIncrement(long volatile *)
__m128 _mm_loadh_pi(__m128, __m64 const *)
__m128i _mm_loadl_epi64(__m128i const *_P)
__m128d _mm_set_sd(double _W)
void _mm_storer_ps(float *_V, __m128 _A)
__m128i _mm_srai_epi16(__m128i _A, int _Count)
__m128i _mm_cvtps_epi32(__m128 _A)
__m64 _m_pfcmpge(__m64, __m64)
__m128i _mm_max_epu16(__m128i val1, __m128i val2)
__m128i _mm_subs_epi8(__m128i _A, __m128i _B)
__m64 _mm_shuffle_pi8(__m64 a, __m64 b)
__m128 _mm_cmpunord_ps(__m128 _A, __m128 _B)
__m64 _m_psrlqi(__m64 _M, int _Count)
__m64 _mm_sign_pi32(__m64 a, __m64 b)
__m128 _mm_mul_ss(__m128 _A, __m128 _B)
__m128 _mm_loadl_pi(__m128, __m64 const *)
__m64 _m_paddsb(__m64 _MM1, __m64 _MM2)
int _mm_testz_si128(__m128i mask, __m128i val)
__m128 _mm_load_ps(float const *_A)
__m128d _mm_mul_pd(__m128d _A, __m128d _B)
__m128d _mm_min_sd(__m128d _A, __m128d _B)
int _mm_cmpistrs(__m128i a, __m128i b, const int mode)
__m64 _m_psubsw(__m64 _MM1, __m64 _MM2)
__m128i _mm_add_epi16(__m128i _A, __m128i _B)
void _mm_maskmoveu_si128(__m128i _D, __m128i _N, char *_P)
__m64 _m_pfmax(__m64, __m64)
__m64 _m_psradi(__m64 _M, int _Count)
__m128i _mm_set_epi8(char _B15, char _B14, char _B13, char _B12, char _B11, char _B10, char _B9, char _B8, char _B7, char _B6, char _B5, char _B4, char _B3, char _B2, char _B1, char _B0)
__m128 _mm_cmpunord_ss(__m128 _A, __m128 _B)
__m128i _mm_cmpeq_epi8(__m128i _A, __m128i _B)
__m64 _m_pxor(__m64 _MM1, __m64 _MM2)
int _mm_cvtt_ss2si(__m128 _A)
__m64 _m_psubd(__m64 _MM1, __m64 _MM2)
_Check_return_ unsigned long __cdecl _byteswap_ulong(_In_ unsigned long _Long)
__m128i _mm_unpackhi_epi8(__m128i _A, __m128i _B)
__m64 _m_pcmpgtd(__m64 _MM1, __m64 _MM2)
__m128i _mm_adds_epi16(__m128i _A, __m128i _B)
__m128d _mm_cvtps_pd(__m128 _A)
__m64 _m_pfsubr(__m64, __m64)
__m128d _mm_andnot_pd(__m128d _A, __m128d _B)
__m128i _mm_sub_epi64(__m128i _A, __m128i _B)
__m128 _mm_cvtsd_ss(__m128 _A, __m128d _B)
__m128d _mm_cmpeq_sd(__m128d _A, __m128d _B)
__m128i _mm_cmpgt_epi64(__m128i val1, __m128i val2)
__m64 _m_pf2iw(__m64)
__m128 _mm_load_ss(float const *_A)
__m128i _mm_insert_epi8(__m128i dst, int s, const int ndx)
__m128 _mm_cmpnge_ss(__m128 _A, __m128 _B)
__m128i _mm_packus_epi16(__m128i _A, __m128i _B)
long __cdecl _InterlockedCompareExchange(long volatile *, long, long)
__m128 _mm_movelh_ps(__m128, __m128)
unsigned int _mm_getcsr(void)
__m128i _mm_mulhi_epu16(__m128i _A, __m128i _B)
__m128d _mm_cmpge_pd(__m128d _A, __m128d _B)
__m64 _m_psllqi(__m64 _M, int _Count)
__m128d _mm_hsub_pd(__m128d a, __m128d b)
unsigned __int64 __cdecl _rotr64(_In_ unsigned __int64 _Val, _In_ int _Shift)
__m128 _mm_cmpge_ps(__m128 _A, __m128 _B)
__m128i _mm_lddqu_si128(__m128i const *p)
__m128i _mm_hadds_epi16(__m128i a, __m128i b)
__m128i _mm_srl_epi64(__m128i _A, __m128i _Count)
__m128d _mm_setr_pd(double _Y, double _Z)
void _mm_lfence(void)
__m128d _mm_addsub_pd(__m128d a, __m128d b)
__m128d _mm_add_sd(__m128d _A, __m128d _B)
__m128i _mm_and_si128(__m128i _A, __m128i _B)
#define __MACHINEX64
Definition: intrin.h:81
int _mm_cmpistro(__m128i a, __m128i b, const int mode)
__m128i _mm_madd_epi16(__m128i _A, __m128i _B)
__m64 _m_pminsw(__m64, __m64)
void _mm_stream_si128(__m128i *_P, __m128i _A)
__m128d _mm_sqrt_pd(__m128d _A)
__m128i _mm_packus_epi32(__m128i val1, __m128i val2)
int _m_pextrw(__m64, int)
__m128i _mm_subs_epi16(__m128i _A, __m128i _B)
__m128i _mm_mpsadbw_epu8(__m128i s1, __m128i s2, const int msk)
__m64 _m_pmaxsw(__m64, __m64)
__m128 _mm_cmpge_ss(__m128 _A, __m128 _B)
__m64 _m_packssdw(__m64 _MM1, __m64 _MM2)
__m128i _mm_cvtepi8_epi64(__m128i byteValues)
__m128d _mm_cmpunord_pd(__m128d _A, __m128d _B)