blob: a13715dd7d6cb5ecf836ea44720328ea6f6fc465 [file] [log] [blame]
Eric Christopherd1428bf2013-08-31 00:22:48 +00001/* ===-------- Intrin.h ---------------------------------------------------===
2 *
3 * Permission is hereby granted, free of charge, to any person obtaining a copy
4 * of this software and associated documentation files (the "Software"), to deal
5 * in the Software without restriction, including without limitation the rights
6 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
7 * copies of the Software, and to permit persons to whom the Software is
8 * furnished to do so, subject to the following conditions:
9 *
10 * The above copyright notice and this permission notice shall be included in
11 * all copies or substantial portions of the Software.
12 *
13 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
15 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
16 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
17 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
18 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
19 * THE SOFTWARE.
20 *
21 *===-----------------------------------------------------------------------===
22 */
23
24/* Only include this if we're compiling for the windows platform. */
25#ifndef _MSC_VER
26#include_next <Intrin.h>
27#else
28
29#ifndef __INTRIN_H
30#define __INTRIN_H
31
32/* First include the standard intrinsics. */
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +000033#if defined(__i386__) || defined(__x86_64__)
Eric Christopherd1428bf2013-08-31 00:22:48 +000034#include <x86intrin.h>
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +000035#endif
Eric Christopherd1428bf2013-08-31 00:22:48 +000036
Hans Wennborg1fd6dd32014-01-28 23:01:59 +000037/* For the definition of jmp_buf. */
Nico Webera62cffa2014-07-08 18:34:46 +000038#if __STDC_HOSTED__
Hans Wennborg1fd6dd32014-01-28 23:01:59 +000039#include <setjmp.h>
Nico Webera62cffa2014-07-08 18:34:46 +000040#endif
Hans Wennborg1fd6dd32014-01-28 23:01:59 +000041
Eric Christopher0db88a72013-09-18 22:24:01 +000042#ifdef __cplusplus
43extern "C" {
44#endif
45
Saleem Abdulrasoolc4ebb122014-07-08 05:46:04 +000046#if defined(__MMX__)
Eric Christopherd1428bf2013-08-31 00:22:48 +000047/* And the random ones that aren't in those files. */
48__m64 _m_from_float(float);
49__m64 _m_from_int(int _l);
50void _m_prefetch(void *);
51float _m_to_float(__m64);
52int _m_to_int(__m64 _M);
Saleem Abdulrasoolc4ebb122014-07-08 05:46:04 +000053#endif
Eric Christopherd1428bf2013-08-31 00:22:48 +000054
55/* Other assorted instruction intrinsics. */
56void __addfsbyte(unsigned long, unsigned char);
57void __addfsdword(unsigned long, unsigned long);
58void __addfsword(unsigned long, unsigned short);
59void __code_seg(const char *);
Hans Wennborg854f7d32014-01-16 23:39:35 +000060static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000061void __cpuid(int[4], int);
Hans Wennborg12fb89e2014-01-31 19:44:55 +000062static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000063void __cpuidex(int[4], int, int);
Eric Christopher0db88a72013-09-18 22:24:01 +000064void __debugbreak(void);
Eric Christopherd1428bf2013-08-31 00:22:48 +000065__int64 __emul(int, int);
66unsigned __int64 __emulu(unsigned int, unsigned int);
Eric Christopher0db88a72013-09-18 22:24:01 +000067void __cdecl __fastfail(unsigned int);
Eric Christopherd1428bf2013-08-31 00:22:48 +000068unsigned int __getcallerseflags(void);
Hans Wennborg740a4d62014-01-28 22:55:01 +000069static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000070void __halt(void);
71unsigned char __inbyte(unsigned short);
72void __inbytestring(unsigned short, unsigned char *, unsigned long);
73void __incfsbyte(unsigned long);
74void __incfsdword(unsigned long);
75void __incfsword(unsigned long);
76unsigned long __indword(unsigned short);
77void __indwordstring(unsigned short, unsigned long *, unsigned long);
78void __int2c(void);
79void __invlpg(void *);
80unsigned short __inword(unsigned short);
81void __inwordstring(unsigned short, unsigned short *, unsigned long);
82void __lidt(void *);
83unsigned __int64 __ll_lshift(unsigned __int64, int);
84__int64 __ll_rshift(__int64, int);
85void __llwpcb(void *);
86unsigned char __lwpins32(unsigned int, unsigned int, unsigned int);
87void __lwpval32(unsigned int, unsigned int, unsigned int);
88unsigned int __lzcnt(unsigned int);
89unsigned short __lzcnt16(unsigned short);
Hans Wennborgd9be72e2014-03-12 22:00:32 +000090static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000091void __movsb(unsigned char *, unsigned char const *, size_t);
Hans Wennborgd9be72e2014-03-12 22:00:32 +000092static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000093void __movsd(unsigned long *, unsigned long const *, size_t);
Hans Wennborgd9be72e2014-03-12 22:00:32 +000094static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000095void __movsw(unsigned short *, unsigned short const *, size_t);
96void __nop(void);
97void __nvreg_restore_fence(void);
98void __nvreg_save_fence(void);
99void __outbyte(unsigned short, unsigned char);
100void __outbytestring(unsigned short, unsigned char *, unsigned long);
101void __outdword(unsigned short, unsigned long);
102void __outdwordstring(unsigned short, unsigned long *, unsigned long);
103void __outword(unsigned short, unsigned short);
104void __outwordstring(unsigned short, unsigned short *, unsigned long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000105static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000106unsigned int __popcnt(unsigned int);
Warren Huntd6ffae92013-09-27 23:57:26 +0000107static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000108unsigned short __popcnt16(unsigned short);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000109unsigned long __readcr0(void);
110unsigned long __readcr2(void);
Reid Kleckner592dc612014-04-08 00:28:22 +0000111static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000112unsigned long __readcr3(void);
Eric Christopher439137e2014-01-24 12:13:47 +0000113unsigned long __readcr4(void);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000114unsigned long __readcr8(void);
115unsigned int __readdr(unsigned int);
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000116#ifdef __i386__
117static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000118unsigned char __readfsbyte(unsigned long);
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000119static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000120unsigned long __readfsdword(unsigned long);
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000121static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000122unsigned __int64 __readfsqword(unsigned long);
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000123static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000124unsigned short __readfsword(unsigned long);
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000125#endif
Reid Kleckner592dc612014-04-08 00:28:22 +0000126static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000127unsigned __int64 __readmsr(unsigned long);
128unsigned __int64 __readpmc(unsigned long);
129unsigned long __segmentlimit(unsigned long);
130void __sidt(void *);
131void *__slwpcb(void);
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000132static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000133void __stosb(unsigned char *, unsigned char, size_t);
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000134static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000135void __stosd(unsigned long *, unsigned long, size_t);
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000136static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000137void __stosw(unsigned short *, unsigned short, size_t);
138void __svm_clgi(void);
139void __svm_invlpga(void *, int);
140void __svm_skinit(int);
141void __svm_stgi(void);
142void __svm_vmload(size_t);
143void __svm_vmrun(size_t);
144void __svm_vmsave(size_t);
145void __ud2(void);
146unsigned __int64 __ull_rshift(unsigned __int64, int);
147void __vmx_off(void);
148void __vmx_vmptrst(unsigned __int64 *);
149void __wbinvd(void);
150void __writecr0(unsigned int);
Reid Kleckner592dc612014-04-08 00:28:22 +0000151static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000152void __writecr3(unsigned int);
153void __writecr4(unsigned int);
154void __writecr8(unsigned int);
155void __writedr(unsigned int, unsigned int);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000156void __writefsbyte(unsigned long, unsigned char);
157void __writefsdword(unsigned long, unsigned long);
158void __writefsqword(unsigned long, unsigned __int64);
159void __writefsword(unsigned long, unsigned short);
160void __writemsr(unsigned long, unsigned __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000161static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000162void *_AddressOfReturnAddress(void);
Warren Huntd6ffae92013-09-27 23:57:26 +0000163static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000164unsigned char _BitScanForward(unsigned long *_Index, unsigned long _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000165static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000166unsigned char _BitScanReverse(unsigned long *_Index, unsigned long _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000167static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000168unsigned char _bittest(long const *, long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000169static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000170unsigned char _bittestandcomplement(long *, long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000171static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000172unsigned char _bittestandreset(long *, long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000173static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000174unsigned char _bittestandset(long *, long);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000175unsigned __int64 __cdecl _byteswap_uint64(unsigned __int64);
176unsigned long __cdecl _byteswap_ulong(unsigned long);
177unsigned short __cdecl _byteswap_ushort(unsigned short);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000178void __cdecl _disable(void);
179void __cdecl _enable(void);
180void __cdecl _fxrstor(void const *);
181void __cdecl _fxsave(void *);
182long _InterlockedAddLargeStatistic(__int64 volatile *_Addend, long _Value);
Warren Huntd6ffae92013-09-27 23:57:26 +0000183static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000184long _InterlockedAnd(long volatile *_Value, long _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000185static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000186short _InterlockedAnd16(short volatile *_Value, short _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000187static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000188char _InterlockedAnd8(char volatile *_Value, char _Mask);
189unsigned char _interlockedbittestandreset(long volatile *, long);
Hans Wennborga3169332014-03-13 17:05:09 +0000190static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000191unsigned char _interlockedbittestandset(long volatile *, long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000192static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000193long __cdecl _InterlockedCompareExchange(long volatile *_Destination,
194 long _Exchange, long _Comparand);
195long _InterlockedCompareExchange_HLEAcquire(long volatile *, long, long);
196long _InterlockedCompareExchange_HLERelease(long volatile *, long, long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000197static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000198short _InterlockedCompareExchange16(short volatile *_Destination,
199 short _Exchange, short _Comparand);
Warren Huntd6ffae92013-09-27 23:57:26 +0000200static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000201__int64 _InterlockedCompareExchange64(__int64 volatile *_Destination,
202 __int64 _Exchange, __int64 _Comparand);
203__int64 _InterlockedcompareExchange64_HLEAcquire(__int64 volatile *, __int64,
204 __int64);
205__int64 _InterlockedCompareExchange64_HLERelease(__int64 volatile *, __int64,
206 __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000207static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000208char _InterlockedCompareExchange8(char volatile *_Destination, char _Exchange,
209 char _Comparand);
210void *_InterlockedCompareExchangePointer_HLEAcquire(void *volatile *, void *,
211 void *);
212void *_InterlockedCompareExchangePointer_HLERelease(void *volatile *, void *,
213 void *);
Warren Huntd6ffae92013-09-27 23:57:26 +0000214static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000215long __cdecl _InterlockedDecrement(long volatile *_Addend);
Warren Huntd6ffae92013-09-27 23:57:26 +0000216static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000217short _InterlockedDecrement16(short volatile *_Addend);
Saleem Abdulrasool114efe02014-06-18 20:51:10 +0000218long _InterlockedExchange(long volatile *_Target, long _Value);
Warren Huntd6ffae92013-09-27 23:57:26 +0000219static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000220short _InterlockedExchange16(short volatile *_Target, short _Value);
Warren Huntd6ffae92013-09-27 23:57:26 +0000221static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000222char _InterlockedExchange8(char volatile *_Target, char _Value);
Warren Huntd6ffae92013-09-27 23:57:26 +0000223static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000224long __cdecl _InterlockedExchangeAdd(long volatile *_Addend, long _Value);
225long _InterlockedExchangeAdd_HLEAcquire(long volatile *, long);
226long _InterlockedExchangeAdd_HLERelease(long volatile *, long);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000227static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000228short _InterlockedExchangeAdd16(short volatile *_Addend, short _Value);
229__int64 _InterlockedExchangeAdd64_HLEAcquire(__int64 volatile *, __int64);
230__int64 _InterlockedExchangeAdd64_HLERelease(__int64 volatile *, __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000231static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000232char _InterlockedExchangeAdd8(char volatile *_Addend, char _Value);
Warren Huntd6ffae92013-09-27 23:57:26 +0000233static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000234long __cdecl _InterlockedIncrement(long volatile *_Addend);
Warren Huntd6ffae92013-09-27 23:57:26 +0000235static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000236short _InterlockedIncrement16(short volatile *_Addend);
Warren Huntd6ffae92013-09-27 23:57:26 +0000237static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000238long _InterlockedOr(long volatile *_Value, long _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000239static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000240short _InterlockedOr16(short volatile *_Value, short _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000241static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000242char _InterlockedOr8(char volatile *_Value, char _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000243static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000244long _InterlockedXor(long volatile *_Value, long _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000245static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000246short _InterlockedXor16(short volatile *_Value, short _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000247static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000248char _InterlockedXor8(char volatile *_Value, char _Mask);
249void __cdecl _invpcid(unsigned int, void *);
Warren Huntd6ffae92013-09-27 23:57:26 +0000250static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000251unsigned long __cdecl _lrotl(unsigned long, int);
Warren Huntd6ffae92013-09-27 23:57:26 +0000252static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000253unsigned long __cdecl _lrotr(unsigned long, int);
/* Forward declaration; the specifier must appear only once. */
static __inline__
void _ReadBarrier(void);
Reid Kleckner00d33a52013-10-17 01:29:48 +0000257static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000258void _ReadWriteBarrier(void);
Warren Huntd6ffae92013-09-27 23:57:26 +0000259static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000260void *_ReturnAddress(void);
261unsigned int _rorx_u32(unsigned int, const unsigned int);
Warren Huntd6ffae92013-09-27 23:57:26 +0000262static __inline__
Eric Christopherfb4b4332013-08-31 00:27:38 +0000263unsigned int __cdecl _rotl(unsigned int _Value, int _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000264static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000265unsigned short _rotl16(unsigned short _Value, unsigned char _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000266static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000267unsigned __int64 __cdecl _rotl64(unsigned __int64 _Value, int _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000268static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000269unsigned char _rotl8(unsigned char _Value, unsigned char _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000270static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000271unsigned int __cdecl _rotr(unsigned int _Value, int _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000272static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000273unsigned short _rotr16(unsigned short _Value, unsigned char _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000274static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000275unsigned __int64 __cdecl _rotr64(unsigned __int64 _Value, int _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000276static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000277unsigned char _rotr8(unsigned char _Value, unsigned char _Shift);
278int _sarx_i32(int, unsigned int);
Nico Webera62cffa2014-07-08 18:34:46 +0000279#if __STDC_HOSTED__
Hans Wennborg1fd6dd32014-01-28 23:01:59 +0000280int __cdecl _setjmp(jmp_buf);
Nico Webera62cffa2014-07-08 18:34:46 +0000281#endif
Eric Christopherd1428bf2013-08-31 00:22:48 +0000282unsigned int _shlx_u32(unsigned int, unsigned int);
283unsigned int _shrx_u32(unsigned int, unsigned int);
284void _Store_HLERelease(long volatile *, long);
285void _Store64_HLERelease(__int64 volatile *, __int64);
286void _StorePointer_HLERelease(void *volatile *, void *);
Reid Kleckner00d33a52013-10-17 01:29:48 +0000287static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000288void _WriteBarrier(void);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000289unsigned __int32 xbegin(void);
290void _xend(void);
Hans Wennborg854f7d32014-01-16 23:39:35 +0000291static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000292unsigned __int64 __cdecl _xgetbv(unsigned int);
293void __cdecl _xrstor(void const *, unsigned __int64);
294void __cdecl _xsave(void *, unsigned __int64);
295void __cdecl _xsaveopt(void *, unsigned __int64);
296void __cdecl _xsetbv(unsigned int, unsigned __int64);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000297
298/* These additional intrinsics are turned on in x64/amd64/x86_64 mode. */
Warren Hunt3f987942013-09-30 21:08:05 +0000299#ifdef __x86_64__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000300void __addgsbyte(unsigned long, unsigned char);
301void __addgsdword(unsigned long, unsigned long);
302void __addgsqword(unsigned long, unsigned __int64);
303void __addgsword(unsigned long, unsigned short);
Reid Klecknerf08d6582014-01-27 19:16:35 +0000304static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000305void __faststorefence(void);
306void __incgsbyte(unsigned long);
307void __incgsdword(unsigned long);
308void __incgsqword(unsigned long);
309void __incgsword(unsigned long);
Eric Christopher439137e2014-01-24 12:13:47 +0000310unsigned char __lwpins64(unsigned __int64, unsigned int, unsigned int);
311void __lwpval64(unsigned __int64, unsigned int, unsigned int);
312unsigned __int64 __lzcnt64(unsigned __int64);
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000313static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000314void __movsq(unsigned long long *, unsigned long long const *, size_t);
315__int64 __mulh(__int64, __int64);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000316static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000317unsigned __int64 __popcnt64(unsigned __int64);
Hans Wennborga4421e02014-03-12 21:09:05 +0000318static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000319unsigned char __readgsbyte(unsigned long);
Hans Wennborga4421e02014-03-12 21:09:05 +0000320static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000321unsigned long __readgsdword(unsigned long);
Hans Wennborga4421e02014-03-12 21:09:05 +0000322static __inline__
323unsigned __int64 __readgsqword(unsigned long);
Eric Christopher439137e2014-01-24 12:13:47 +0000324unsigned short __readgsword(unsigned long);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000325unsigned __int64 __shiftleft128(unsigned __int64 _LowPart,
326 unsigned __int64 _HighPart,
327 unsigned char _Shift);
328unsigned __int64 __shiftright128(unsigned __int64 _LowPart,
329 unsigned __int64 _HighPart,
330 unsigned char _Shift);
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000331static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000332void __stosq(unsigned __int64 *, unsigned __int64, size_t);
Eric Christopher439137e2014-01-24 12:13:47 +0000333unsigned __int64 __umulh(unsigned __int64, unsigned __int64);
334unsigned char __vmx_on(unsigned __int64 *);
335unsigned char __vmx_vmclear(unsigned __int64 *);
336unsigned char __vmx_vmlaunch(void);
337unsigned char __vmx_vmptrld(unsigned __int64 *);
338unsigned char __vmx_vmread(size_t, size_t *);
339unsigned char __vmx_vmresume(void);
340unsigned char __vmx_vmwrite(size_t, size_t);
341void __writegsbyte(unsigned long, unsigned char);
342void __writegsdword(unsigned long, unsigned long);
343void __writegsqword(unsigned long, unsigned __int64);
344void __writegsword(unsigned long, unsigned short);
Warren Huntd6ffae92013-09-27 23:57:26 +0000345static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000346unsigned char _BitScanForward64(unsigned long *_Index, unsigned __int64 _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000347static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000348unsigned char _BitScanReverse64(unsigned long *_Index, unsigned __int64 _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000349static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000350unsigned char _bittest64(__int64 const *, __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000351static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000352unsigned char _bittestandcomplement64(__int64 *, __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000353static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000354unsigned char _bittestandreset64(__int64 *, __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000355static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000356unsigned char _bittestandset64(__int64 *, __int64);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000357unsigned __int64 __cdecl _byteswap_uint64(unsigned __int64);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000358void __cdecl _fxrstor64(void const *);
359void __cdecl _fxsave64(void *);
360long _InterlockedAnd_np(long volatile *_Value, long _Mask);
361short _InterlockedAnd16_np(short volatile *_Value, short _Mask);
362__int64 _InterlockedAnd64_np(__int64 volatile *_Value, __int64 _Mask);
363char _InterlockedAnd8_np(char volatile *_Value, char _Mask);
364unsigned char _interlockedbittestandreset64(__int64 volatile *, __int64);
Hans Wennborga3169332014-03-13 17:05:09 +0000365static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000366unsigned char _interlockedbittestandset64(__int64 volatile *, __int64);
367long _InterlockedCompareExchange_np(long volatile *_Destination, long _Exchange,
368 long _Comparand);
369unsigned char _InterlockedCompareExchange128(__int64 volatile *_Destination,
370 __int64 _ExchangeHigh,
371 __int64 _ExchangeLow,
372 __int64 *_CompareandResult);
373unsigned char _InterlockedCompareExchange128_np(__int64 volatile *_Destination,
374 __int64 _ExchangeHigh,
375 __int64 _ExchangeLow,
376 __int64 *_ComparandResult);
377short _InterlockedCompareExchange16_np(short volatile *_Destination,
378 short _Exchange, short _Comparand);
Eric Christopher439137e2014-01-24 12:13:47 +0000379__int64 _InterlockedCompareExchange64_HLEAcquire(__int64 volatile *, __int64,
380 __int64);
381__int64 _InterlockedCompareExchange64_HLERelease(__int64 volatile *, __int64,
382 __int64);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000383__int64 _InterlockedCompareExchange64_np(__int64 volatile *_Destination,
384 __int64 _Exchange, __int64 _Comparand);
Eric Christopher58b40432014-01-25 01:38:30 +0000385void *_InterlockedCompareExchangePointer(void *volatile *_Destination,
386 void *_Exchange, void *_Comparand);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000387void *_InterlockedCompareExchangePointer_np(void *volatile *_Destination,
388 void *_Exchange, void *_Comparand);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000389static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000390__int64 _InterlockedDecrement64(__int64 volatile *_Addend);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000391static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000392__int64 _InterlockedExchange64(__int64 volatile *_Target, __int64 _Value);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000393static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000394__int64 _InterlockedExchangeAdd64(__int64 volatile *_Addend, __int64 _Value);
395void *_InterlockedExchangePointer(void *volatile *_Target, void *_Value);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000396static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000397__int64 _InterlockedIncrement64(__int64 volatile *_Addend);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000398long _InterlockedOr_np(long volatile *_Value, long _Mask);
399short _InterlockedOr16_np(short volatile *_Value, short _Mask);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000400static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000401__int64 _InterlockedOr64(__int64 volatile *_Value, __int64 _Mask);
Warren Hunt41a993f2013-09-28 00:15:41 +0000402__int64 _InterlockedOr64_np(__int64 volatile *_Value, __int64 _Mask);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000403char _InterlockedOr8_np(char volatile *_Value, char _Mask);
404long _InterlockedXor_np(long volatile *_Value, long _Mask);
405short _InterlockedXor16_np(short volatile *_Value, short _Mask);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000406static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000407__int64 _InterlockedXor64(__int64 volatile *_Value, __int64 _Mask);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000408__int64 _InterlockedXor64_np(__int64 volatile *_Value, __int64 _Mask);
409char _InterlockedXor8_np(char volatile *_Value, char _Mask);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000410static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000411__int64 _mul128(__int64 _Multiplier, __int64 _Multiplicand,
412 __int64 *_HighProduct);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000413unsigned __int64 _rorx_u64(unsigned __int64, const unsigned int);
Eric Christopher439137e2014-01-24 12:13:47 +0000414__int64 _sarx_i64(__int64, unsigned int);
Nico Webera62cffa2014-07-08 18:34:46 +0000415#if __STDC_HOSTED__
416int __cdecl _setjmpex(jmp_buf);
417#endif
Eric Christopher439137e2014-01-24 12:13:47 +0000418unsigned __int64 _shlx_u64(unsigned __int64, unsigned int);
David Majnemer54507632014-12-02 23:30:26 +0000419unsigned __int64 _shrx_u64(unsigned __int64, unsigned int);
David Majnemer5f9afc52014-12-02 23:30:24 +0000420/*
421 * Multiply two 64-bit integers and obtain a 64-bit result.
422 * The low-half is returned directly and the high half is in an out parameter.
423 */
424static __inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
425_umul128(unsigned __int64 _Multiplier, unsigned __int64 _Multiplicand,
426 unsigned __int64 *_HighProduct) {
427 unsigned __int128 _FullProduct =
428 (unsigned __int128)_Multiplier * (unsigned __int128)_Multiplicand;
429 *_HighProduct = FullProduct >> 64;
430 return FullProduct;
431}
Eric Christopherd1428bf2013-08-31 00:22:48 +0000432void __cdecl _xrstor64(void const *, unsigned __int64);
433void __cdecl _xsave64(void *, unsigned __int64);
434void __cdecl _xsaveopt64(void *, unsigned __int64);
Eric Christopher0db88a72013-09-18 22:24:01 +0000435
Warren Hunt3f987942013-09-30 21:08:05 +0000436#endif /* __x86_64__ */
Reid Klecknerf0e23222013-09-19 00:19:53 +0000437
Warren Huntd6ffae92013-09-27 23:57:26 +0000438/*----------------------------------------------------------------------------*\
439|* Bit Twiddling
440\*----------------------------------------------------------------------------*/
/*
 * Rotate an 8-bit value left. Only the low 3 bits of _Shift are used, so a
 * shift of 8 (or any multiple of 8) returns _Value unchanged.
 */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_rotl8(unsigned char _Value, unsigned char _Shift) {
  _Shift &= 0x7;
  if (!_Shift)
    return _Value;
  /* The operands promote to int; the cast keeps only the low 8 bits. */
  return (unsigned char)((_Value << _Shift) | (_Value >> (8 - _Shift)));
}
/*
 * Rotate an 8-bit value right. Only the low 3 bits of _Shift are used, so a
 * shift of 8 (or any multiple of 8) returns _Value unchanged.
 */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_rotr8(unsigned char _Value, unsigned char _Shift) {
  _Shift &= 0x7;
  if (!_Shift)
    return _Value;
  /* The operands promote to int; the cast keeps only the low 8 bits. */
  return (unsigned char)((_Value >> _Shift) | (_Value << (8 - _Shift)));
}
/*
 * Rotate a 16-bit value left. Only the low 4 bits of _Shift are used, so a
 * shift of 16 returns _Value unchanged.
 */
static __inline__ unsigned short __attribute__((__always_inline__, __nodebug__))
_rotl16(unsigned short _Value, unsigned char _Shift) {
  _Shift &= 0xf;
  if (!_Shift)
    return _Value;
  /* The operands promote to int; the cast keeps only the low 16 bits. */
  return (unsigned short)((_Value << _Shift) | (_Value >> (16 - _Shift)));
}
/*
 * Rotate a 16-bit value right. Only the low 4 bits of _Shift are used, so a
 * shift of 16 returns _Value unchanged.
 */
static __inline__ unsigned short __attribute__((__always_inline__, __nodebug__))
_rotr16(unsigned short _Value, unsigned char _Shift) {
  _Shift &= 0xf;
  if (!_Shift)
    return _Value;
  /* The operands promote to int; the cast keeps only the low 16 bits. */
  return (unsigned short)((_Value >> _Shift) | (_Value << (16 - _Shift)));
}
/*
 * Rotate a 32-bit value left. Only the low 5 bits of _Shift are used, so
 * negative counts and counts of 32 or more wrap around.
 */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__))
_rotl(unsigned int _Value, int _Shift) {
  _Shift &= 0x1f;
  /* A zero count is special-cased: shifting by 32 would be undefined. */
  if (!_Shift)
    return _Value;
  return (_Value << _Shift) | (_Value >> (32 - _Shift));
}
/*
 * Rotate a 32-bit value right. Only the low 5 bits of _Shift are used, so
 * negative counts and counts of 32 or more wrap around.
 */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__))
_rotr(unsigned int _Value, int _Shift) {
  _Shift &= 0x1f;
  /* A zero count is special-cased: shifting by 32 would be undefined. */
  if (!_Shift)
    return _Value;
  return (_Value >> _Shift) | (_Value << (32 - _Shift));
}
/*
 * Rotate an unsigned long left. The rotation width is taken from the type
 * itself, so the result is correct whether unsigned long is 32 bits (as on
 * Windows) or 64 bits. The count is reduced modulo that width.
 */
static __inline__ unsigned long __attribute__((__always_inline__, __nodebug__))
_lrotl(unsigned long _Value, int _Shift) {
  const int _Bits = (int)(sizeof(_Value) * __CHAR_BIT__);
  _Shift &= _Bits - 1;
  /* A zero count is special-cased: shifting by the full width is undefined. */
  if (!_Shift)
    return _Value;
  return (_Value << _Shift) | (_Value >> (_Bits - _Shift));
}
/*
 * Rotate an unsigned long right. The rotation width is taken from the type
 * itself, so the result is correct whether unsigned long is 32 bits (as on
 * Windows) or 64 bits. The count is reduced modulo that width.
 */
static __inline__ unsigned long __attribute__((__always_inline__, __nodebug__))
_lrotr(unsigned long _Value, int _Shift) {
  const int _Bits = (int)(sizeof(_Value) * __CHAR_BIT__);
  _Shift &= _Bits - 1;
  /* A zero count is special-cased: shifting by the full width is undefined. */
  if (!_Shift)
    return _Value;
  return (_Value >> _Shift) | (_Value << (_Bits - _Shift));
}
481static
482__inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
483_rotl64(unsigned __int64 _Value, int _Shift) {
484 _Shift &= 0x3f;
485 return _Shift ? (_Value << _Shift) | (_Value >> (64 - _Shift)) : _Value;
486}
487static
488__inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
489_rotr64(unsigned __int64 _Value, int _Shift) {
490 _Shift &= 0x3f;
491 return _Shift ? (_Value >> _Shift) | (_Value << (64 - _Shift)) : _Value;
492}
493/*----------------------------------------------------------------------------*\
494|* Bit Counting and Testing
495\*----------------------------------------------------------------------------*/
/*
 * Find the lowest set bit of _Mask.
 * Returns 0 and leaves *_Index untouched when _Mask is zero; otherwise stores
 * the zero-based position of the least significant set bit in *_Index and
 * returns 1.
 */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_BitScanForward(unsigned long *_Index, unsigned long _Mask) {
  /* __builtin_ctzl is undefined for 0, so that case is handled first. */
  if (_Mask == 0)
    return 0;
  *_Index = (unsigned long)__builtin_ctzl(_Mask);
  return 1;
}
/* Find the highest set bit of _Mask. When _Mask is non-zero, store the bit's
 * index in *_Index and return 1; when _Mask is zero, return 0 and leave
 * *_Index untouched. The top bit index is derived from sizeof(_Mask) instead
 * of the literal 31, so the index is right even where long is wider than 32
 * bits; with a 32-bit long the result is unchanged. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_BitScanReverse(unsigned long *_Index, unsigned long _Mask) {
  if (!_Mask)
    return 0;
  *_Index =
      (unsigned long)((int)(sizeof(_Mask) * 8) - 1 - __builtin_clzl(_Mask));
  return 1;
}
/* Return the number of set bits in the 16-bit value. */
static __inline__ unsigned short __attribute__((__always_inline__, __nodebug__))
__popcnt16(unsigned short value) {
  const int __set_bits = __builtin_popcount((int)value);
  return __set_bits;
}
/* Return the number of set bits in the unsigned int value. */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__))
__popcnt(unsigned int value) {
  const int __set_bits = __builtin_popcount(value);
  return __set_bits;
}
/* Return bit number b of the long pointed to by a (0 or 1). */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittest(long const *a, long b) {
  const long __shifted = *a >> b;
  return __shifted & 1;
}
/* Toggle bit number b of *a and return the bit's previous value (0 or 1).
 * The mask is built in unsigned long: the former int expression `1 << b`
 * overflowed at b == 31 and, where long is wider than int, produced a
 * sign-extended mask that flipped every higher bit as well. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittestandcomplement(long *a, long b) {
  const unsigned long __mask = 1UL << b;
  const unsigned char __old = (*a >> b) & 1;
  *a = (long)((unsigned long)*a ^ __mask);
  return __old;
}
/* Clear bit number b of *a and return the bit's previous value (0 or 1).
 * The mask is built in unsigned long: the former int expression `~(1 << b)`
 * overflowed at b == 31 and, where long is wider than int, widened to a mask
 * that also cleared every bit above bit 31. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittestandreset(long *a, long b) {
  const unsigned long __mask = 1UL << b;
  const unsigned char __old = (*a >> b) & 1;
  *a = (long)((unsigned long)*a & ~__mask);
  return __old;
}
/* Set bit number b of *a and return the bit's previous value (0 or 1).
 * The mask is built in unsigned long: the former int expression `1 << b`
 * overflowed at b == 31 and, where long is wider than int, produced a
 * sign-extended mask that set every higher bit as well. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittestandset(long *a, long b) {
  const unsigned long __mask = 1UL << b;
  const unsigned char __old = (*a >> b) & 1;
  *a = (long)((unsigned long)*a | __mask);
  return __old;
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000540#if defined(__i386__) || defined(__x86_64__)
/* Atomically set bit __BitPos of *__BitBase and return the bit's previous
 * value (0 or 1), with sequentially consistent ordering.
 *
 * This replaces an inline-asm sequence whose byte output lacked an
 * early-clobber, so the leading `xor` could overwrite the register holding
 * __BitPos before `bts` read it, and which declared neither a "memory" nor a
 * "cc" clobber.
 *
 * NOTE(review): __BitPos is expected to lie within the addressed long; bit
 * positions beyond it are not supported by this implementation. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_interlockedbittestandset(long volatile *__BitBase, long __BitPos) {
  const long __mask = (long)(1UL << __BitPos);
  const long __prev = __atomic_fetch_or(__BitBase, __mask, __ATOMIC_SEQ_CST);
  return (__prev >> __BitPos) & 1;
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000551#endif
Warren Hunt3f987942013-09-30 21:08:05 +0000552#ifdef __x86_64__
/* Find the lowest set bit of the 64-bit _Mask. When _Mask is non-zero, store
 * the bit's index in *_Index and return 1; when _Mask is zero, return 0 and
 * leave *_Index untouched. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_BitScanForward64(unsigned long *_Index, unsigned __int64 _Mask) {
  if (_Mask != 0) {
    *_Index = __builtin_ctzll(_Mask);
    return 1;
  }
  return 0;
}
/* Find the highest set bit of the 64-bit _Mask. When _Mask is non-zero, store
 * the bit's index in *_Index and return 1; when _Mask is zero, return 0 and
 * leave *_Index untouched. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_BitScanReverse64(unsigned long *_Index, unsigned __int64 _Mask) {
  if (_Mask != 0) {
    *_Index = 63 - __builtin_clzll(_Mask);
    return 1;
  }
  return 0;
}
/* Return the number of set bits in the 64-bit value. */
static __inline__
unsigned __int64 __attribute__((__always_inline__, __nodebug__))
__popcnt64(unsigned __int64 value) {
  const int __set_bits = __builtin_popcountll(value);
  return __set_bits;
}
/* Return bit number b of the 64-bit integer pointed to by a (0 or 1). */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittest64(__int64 const *a, __int64 b) {
  const __int64 __shifted = *a >> b;
  return __shifted & 1;
}
/* Toggle bit number b of the 64-bit *a and return the bit's previous value
 * (0 or 1). The mask is built as an unsigned 64-bit value because the signed
 * expression `1ll << 63` overflows, which is undefined behaviour. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittestandcomplement64(__int64 *a, __int64 b) {
  const unsigned __int64 __mask = 1ULL << b;
  const unsigned char __old = (*a >> b) & 1;
  *a = (__int64)((unsigned __int64)*a ^ __mask);
  return __old;
}
/* Clear bit number b of the 64-bit *a and return the bit's previous value
 * (0 or 1). The mask is built as an unsigned 64-bit value because the signed
 * expression `1ll << 63` overflows, which is undefined behaviour. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittestandreset64(__int64 *a, __int64 b) {
  const unsigned __int64 __mask = 1ULL << b;
  const unsigned char __old = (*a >> b) & 1;
  *a = (__int64)((unsigned __int64)*a & ~__mask);
  return __old;
}
/* Set bit number b of the 64-bit *a and return the bit's previous value
 * (0 or 1). The mask is built as an unsigned 64-bit value because the signed
 * expression `1ll << 63` overflows, which is undefined behaviour. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittestandset64(__int64 *a, __int64 b) {
  const unsigned __int64 __mask = 1ULL << b;
  const unsigned char __old = (*a >> b) & 1;
  *a = (__int64)((unsigned __int64)*a | __mask);
  return __old;
}
/* Atomically set bit __BitPos of the 64-bit *__BitBase and return the bit's
 * previous value (0 or 1), with sequentially consistent ordering.
 *
 * This replaces an inline-asm sequence whose byte output lacked an
 * early-clobber, so the leading `xor` could overwrite the register holding
 * __BitPos before `bts` read it, and which declared neither a "memory" nor a
 * "cc" clobber.
 *
 * NOTE(review): __BitPos is expected to lie in [0, 63]; bit positions beyond
 * the addressed 64-bit word are not supported by this implementation. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_interlockedbittestandset64(__int64 volatile *__BitBase, __int64 __BitPos) {
  const __int64 __mask = (__int64)(1ULL << __BitPos);
  const __int64 __prev = __atomic_fetch_or(__BitBase, __mask, __ATOMIC_SEQ_CST);
  return (__prev >> __BitPos) & 1;
}
Warren Huntd6ffae92013-09-27 23:57:26 +0000604#endif
605/*----------------------------------------------------------------------------*\
606|* Interlocked Exchange Add
607\*----------------------------------------------------------------------------*/
/* Atomically add _Value to *_Addend and return the value *_Addend held before
 * the addition. Uses sequentially consistent ordering; the previous literal
 * memory order 0 is __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeAdd8(char volatile *_Addend, char _Value) {
  return __atomic_fetch_add(_Addend, _Value, __ATOMIC_SEQ_CST);
}
/* Atomically add _Value to *_Addend and return the value *_Addend held before
 * the addition. Uses sequentially consistent ordering; the previous literal
 * memory order 0 is __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeAdd16(short volatile *_Addend, short _Value) {
  return __atomic_fetch_add(_Addend, _Value, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000616#ifdef __x86_64__
/* Atomically add _Value to *_Addend and return the value *_Addend held before
 * the addition. Uses sequentially consistent ordering; the previous literal
 * memory order 0 is __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeAdd64(__int64 volatile *_Addend, __int64 _Value) {
  return __atomic_fetch_add(_Addend, _Value, __ATOMIC_SEQ_CST);
}
621#endif
622/*----------------------------------------------------------------------------*\
623|* Interlocked Exchange Sub
624\*----------------------------------------------------------------------------*/
/* Atomically subtract _Value from *_Subend and return the value *_Subend held
 * before the subtraction. Uses sequentially consistent ordering; the previous
 * literal memory order 0 is __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeSub8(char volatile *_Subend, char _Value) {
  return __atomic_fetch_sub(_Subend, _Value, __ATOMIC_SEQ_CST);
}
/* Atomically subtract _Value from *_Subend and return the value *_Subend held
 * before the subtraction. Uses sequentially consistent ordering; the previous
 * literal memory order 0 is __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeSub16(short volatile *_Subend, short _Value) {
  return __atomic_fetch_sub(_Subend, _Value, __ATOMIC_SEQ_CST);
}
/* Atomically subtract _Value from *_Subend and return the value *_Subend held
 * before the subtraction. Uses sequentially consistent ordering; the previous
 * literal memory order 0 is __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ long __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeSub(long volatile *_Subend, long _Value) {
  return __atomic_fetch_sub(_Subend, _Value, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000637#ifdef __x86_64__
/* Atomically subtract _Value from *_Subend and return the value *_Subend held
 * before the subtraction. Uses sequentially consistent ordering; the previous
 * literal memory order 0 is __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeSub64(__int64 volatile *_Subend, __int64 _Value) {
  return __atomic_fetch_sub(_Subend, _Value, __ATOMIC_SEQ_CST);
}
642#endif
643/*----------------------------------------------------------------------------*\
644|* Interlocked Increment
645\*----------------------------------------------------------------------------*/
/* Atomically increment *_Value and return the incremented value. Uses
 * sequentially consistent ordering; the previous literal memory order 0 is
 * __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedIncrement16(short volatile *_Value) {
  return __atomic_add_fetch(_Value, 1, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000650#ifdef __x86_64__
/* Atomically increment *_Value and return the incremented value. Uses
 * sequentially consistent ordering; the previous literal memory order 0 is
 * __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
_InterlockedIncrement64(__int64 volatile *_Value) {
  return __atomic_add_fetch(_Value, 1, __ATOMIC_SEQ_CST);
}
655#endif
656/*----------------------------------------------------------------------------*\
657|* Interlocked Decrement
658\*----------------------------------------------------------------------------*/
/* Atomically decrement *_Value and return the decremented value. Uses
 * sequentially consistent ordering; the previous literal memory order 0 is
 * __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedDecrement16(short volatile *_Value) {
  return __atomic_sub_fetch(_Value, 1, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000663#ifdef __x86_64__
/* Atomically decrement *_Value and return the decremented value. Uses
 * sequentially consistent ordering; the previous literal memory order 0 is
 * __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
_InterlockedDecrement64(__int64 volatile *_Value) {
  return __atomic_sub_fetch(_Value, 1, __ATOMIC_SEQ_CST);
}
668#endif
669/*----------------------------------------------------------------------------*\
670|* Interlocked And
671\*----------------------------------------------------------------------------*/
/* Atomically AND _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedAnd8(char volatile *_Value, char _Mask) {
  return __atomic_fetch_and(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/* Atomically AND _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedAnd16(short volatile *_Value, short _Mask) {
  return __atomic_fetch_and(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/* Atomically AND _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ long __attribute__((__always_inline__, __nodebug__))
_InterlockedAnd(long volatile *_Value, long _Mask) {
  return __atomic_fetch_and(_Value, _Mask, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000684#ifdef __x86_64__
/* Atomically AND _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
_InterlockedAnd64(__int64 volatile *_Value, __int64 _Mask) {
  return __atomic_fetch_and(_Value, _Mask, __ATOMIC_SEQ_CST);
}
689#endif
690/*----------------------------------------------------------------------------*\
691|* Interlocked Or
692\*----------------------------------------------------------------------------*/
/* Atomically OR _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedOr8(char volatile *_Value, char _Mask) {
  return __atomic_fetch_or(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/* Atomically OR _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedOr16(short volatile *_Value, short _Mask) {
  return __atomic_fetch_or(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/* Atomically OR _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ long __attribute__((__always_inline__, __nodebug__))
_InterlockedOr(long volatile *_Value, long _Mask) {
  return __atomic_fetch_or(_Value, _Mask, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000705#ifdef __x86_64__
/* Atomically OR _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
_InterlockedOr64(__int64 volatile *_Value, __int64 _Mask) {
  return __atomic_fetch_or(_Value, _Mask, __ATOMIC_SEQ_CST);
}
710#endif
711/*----------------------------------------------------------------------------*\
712|* Interlocked Xor
713\*----------------------------------------------------------------------------*/
/* Atomically XOR _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedXor8(char volatile *_Value, char _Mask) {
  return __atomic_fetch_xor(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/* Atomically XOR _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedXor16(short volatile *_Value, short _Mask) {
  return __atomic_fetch_xor(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/* Atomically XOR _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ long __attribute__((__always_inline__, __nodebug__))
_InterlockedXor(long volatile *_Value, long _Mask) {
  return __atomic_fetch_xor(_Value, _Mask, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000726#ifdef __x86_64__
/* Atomically XOR _Mask into *_Value and return the ORIGINAL contents of
 * *_Value, as the MSVC intrinsic of this name does (the previous code
 * returned the new value). Uses sequentially consistent ordering instead of
 * the former relaxed order 0. */
static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
_InterlockedXor64(__int64 volatile *_Value, __int64 _Mask) {
  return __atomic_fetch_xor(_Value, _Mask, __ATOMIC_SEQ_CST);
}
731#endif
732/*----------------------------------------------------------------------------*\
733|* Interlocked Exchange
734\*----------------------------------------------------------------------------*/
/* Atomically store _Value into *_Target and return the value *_Target held
 * before the store. Uses sequentially consistent ordering; the previous
 * literal memory order 0 is __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedExchange8(char volatile *_Target, char _Value) {
  return __atomic_exchange_n(_Target, _Value, __ATOMIC_SEQ_CST);
}
/* Atomically store _Value into *_Target and return the value *_Target held
 * before the store. Uses sequentially consistent ordering; the previous
 * literal memory order 0 is __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedExchange16(short volatile *_Target, short _Value) {
  return __atomic_exchange_n(_Target, _Value, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000745#ifdef __x86_64__
/* Atomically store _Value into *_Target and return the value *_Target held
 * before the store. Uses sequentially consistent ordering; the previous
 * literal memory order 0 is __ATOMIC_RELAXED, which provides no barrier. */
static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
_InterlockedExchange64(__int64 volatile *_Target, __int64 _Value) {
  return __atomic_exchange_n(_Target, _Value, __ATOMIC_SEQ_CST);
}
751#endif
752/*----------------------------------------------------------------------------*\
753|* Interlocked Compare Exchange
754\*----------------------------------------------------------------------------*/
/* Atomically compare *_Destination with _Comparand and, if they are equal,
 * store _Exchange into *_Destination. Returns the value *_Destination held
 * before the operation in either case. Both the success and failure orderings
 * are sequentially consistent; the previous literal 0 is __ATOMIC_RELAXED. */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedCompareExchange8(char volatile *_Destination,
                             char _Exchange, char _Comparand) {
  /* On failure the builtin writes the observed value back into _Comparand;
   * on success _Comparand already equals the old value. */
  __atomic_compare_exchange_n(_Destination, &_Comparand, _Exchange, 0,
                              __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST);
  return _Comparand;
}
/* Atomically compare *_Destination with _Comparand and, if they are equal,
 * store _Exchange into *_Destination. Returns the value *_Destination held
 * before the operation in either case. Both the success and failure orderings
 * are sequentially consistent; the previous literal 0 is __ATOMIC_RELAXED. */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedCompareExchange16(short volatile *_Destination,
                              short _Exchange, short _Comparand) {
  /* On failure the builtin writes the observed value back into _Comparand;
   * on success _Comparand already equals the old value. */
  __atomic_compare_exchange_n(_Destination, &_Comparand, _Exchange, 0,
                              __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST);
  return _Comparand;
}
/* Atomically compare *_Destination with _Comparand and, if they are equal,
 * store _Exchange into *_Destination. Returns the value *_Destination held
 * before the operation in either case. Both the success and failure orderings
 * are sequentially consistent; the previous literal 0 is __ATOMIC_RELAXED. */
static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
_InterlockedCompareExchange64(__int64 volatile *_Destination,
                              __int64 _Exchange, __int64 _Comparand) {
  /* On failure the builtin writes the observed value back into _Comparand;
   * on success _Comparand already equals the old value. */
  __atomic_compare_exchange_n(_Destination, &_Comparand, _Exchange, 0,
                              __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST);
  return _Comparand;
}
Warren Huntd6ffae92013-09-27 23:57:26 +0000773/*----------------------------------------------------------------------------*\
Reid Kleckner00d33a52013-10-17 01:29:48 +0000774|* Barriers
775\*----------------------------------------------------------------------------*/
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000776#if defined(__i386__) || defined(__x86_64__)
/* Deprecated compiler-level barrier: an empty asm statement with a "memory"
 * clobber. No machine instruction is emitted. */
static __inline__ void
__attribute__((__always_inline__, __nodebug__,
               __deprecated__("use other intrinsics or C++11 atomics instead")))
_ReadWriteBarrier(void) {
  __asm__ __volatile__("" : : : "memory");
}
/* Deprecated compiler-level barrier: an empty asm statement with a "memory"
 * clobber. No machine instruction is emitted. */
static __inline__ void
__attribute__((__always_inline__, __nodebug__,
               __deprecated__("use other intrinsics or C++11 atomics instead")))
_ReadBarrier(void) {
  __asm__ __volatile__("" : : : "memory");
}
/* Deprecated compiler-level barrier: an empty asm statement with a "memory"
 * clobber. No machine instruction is emitted. */
static __inline__ void
__attribute__((__always_inline__, __nodebug__,
               __deprecated__("use other intrinsics or C++11 atomics instead")))
_WriteBarrier(void) {
  __asm__ __volatile__("" : : : "memory");
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000792#endif
Reid Klecknerf08d6582014-01-27 19:16:35 +0000793#ifdef __x86_64__
/* Issue a locked OR of zero on the word at the top of the stack. The memory
 * contents are unchanged; the "memory" clobber additionally stops the
 * compiler from moving memory accesses across this point. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__faststorefence(void) {
  __asm__ __volatile__("lock orq $0, (%%rsp)" : : : "memory");
}
798#endif
Reid Kleckner00d33a52013-10-17 01:29:48 +0000799/*----------------------------------------------------------------------------*\
Hans Wennborga4421e02014-03-12 21:09:05 +0000800|* readfs, readgs
801|* (Pointers in address space #256 and #257 are relative to the GS and FS
802|* segment registers, respectively.)
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000803\*----------------------------------------------------------------------------*/
/* Cast the integer __offset to a pointer to volatile __type that lives in
 * address space number __addr_space_nbr. */
#define __ptr_to_addr_space(__addr_space_nbr, __type, __offset)               \
  ((volatile __type __attribute__((__address_space__(__addr_space_nbr))) *)   \
       (__offset))
807
Hans Wennborga4421e02014-03-12 21:09:05 +0000808#ifdef __i386__
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000809static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
810__readfsbyte(unsigned long __offset) {
811 return *__ptr_to_addr_space(257, unsigned char, __offset);
812}
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000813static __inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
814__readfsqword(unsigned long __offset) {
815 return *__ptr_to_addr_space(257, unsigned __int64, __offset);
816}
817static __inline__ unsigned short __attribute__((__always_inline__, __nodebug__))
818__readfsword(unsigned long __offset) {
819 return *__ptr_to_addr_space(257, unsigned short, __offset);
820}
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000821#endif
Hans Wennborga4421e02014-03-12 21:09:05 +0000822#ifdef __x86_64__
823static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
824__readgsbyte(unsigned long __offset) {
825 return *__ptr_to_addr_space(256, unsigned char, __offset);
826}
827static __inline__ unsigned long __attribute__((__always_inline__, __nodebug__))
828__readgsdword(unsigned long __offset) {
829 return *__ptr_to_addr_space(256, unsigned long, __offset);
830}
831static __inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
832__readgsqword(unsigned long __offset) {
833 return *__ptr_to_addr_space(256, unsigned __int64, __offset);
834}
835static __inline__ unsigned short __attribute__((__always_inline__, __nodebug__))
836__readgsword(unsigned long __offset) {
837 return *__ptr_to_addr_space(256, unsigned short, __offset);
838}
839#endif
840#undef __ptr_to_addr_space
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000841/*----------------------------------------------------------------------------*\
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000842|* movs, stos
843\*----------------------------------------------------------------------------*/
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000844#if defined(__i386__) || defined(__x86_64__)
/* Copy __n bytes from __src to __dst with `rep movsb`.
 *
 * The destination, source and count registers are modified by the
 * instruction, so they are declared as read-write operands instead of being
 * listed as both inputs and clobbers. The "memory" clobber and __volatile__
 * tell the compiler that memory is written and the statement must be kept. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__movsb(unsigned char *__dst, unsigned char const *__src, size_t __n) {
  __asm__ __volatile__("rep movsb"
                       : "+D"(__dst), "+S"(__src), "+c"(__n)
                       :
                       : "memory");
}
/* Copy __n 32-bit units from __src to __dst with `rep movsl`.
 *
 * The destination, source and count registers are modified by the
 * instruction, so they are declared as read-write operands instead of being
 * listed as both inputs and clobbers. The "memory" clobber and __volatile__
 * tell the compiler that memory is written and the statement must be kept. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__movsd(unsigned long *__dst, unsigned long const *__src, size_t __n) {
  __asm__ __volatile__("rep movsl"
                       : "+D"(__dst), "+S"(__src), "+c"(__n)
                       :
                       : "memory");
}
/* Copy __n 16-bit units from __src to __dst with `rep movsw`.
 *
 * The previous mnemonic `movsh` is not an x86 instruction; the word-sized
 * string move is `movsw`. The destination, source and count registers are
 * modified by the instruction, so they are declared as read-write operands
 * instead of being listed as both inputs and clobbers. The "memory" clobber
 * and __volatile__ tell the compiler that memory is written and the statement
 * must be kept. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__movsw(unsigned short *__dst, unsigned short const *__src, size_t __n) {
  __asm__ __volatile__("rep movsw"
                       : "+D"(__dst), "+S"(__src), "+c"(__n)
                       :
                       : "memory");
}
/* Store the byte __x into __n consecutive bytes starting at __dst with
 * `rep stosb`.
 *
 * The destination and count registers are modified by the instruction, so
 * they are declared as read-write operands instead of being listed as both
 * inputs and clobbers. The "memory" clobber and __volatile__ tell the
 * compiler that memory is written and the statement must be kept. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__stosb(unsigned char *__dst, unsigned char __x, size_t __n) {
  __asm__ __volatile__("rep stosb"
                       : "+D"(__dst), "+c"(__n)
                       : "a"(__x)
                       : "memory");
}
/* Store the low 32 bits of __x into __n consecutive 32-bit units starting at
 * __dst with `rep stosl`.
 *
 * The destination and count registers are modified by the instruction, so
 * they are declared as read-write operands instead of being listed as both
 * inputs and clobbers. The "memory" clobber and __volatile__ tell the
 * compiler that memory is written and the statement must be kept. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__stosd(unsigned long *__dst, unsigned long __x, size_t __n) {
  __asm__ __volatile__("rep stosl"
                       : "+D"(__dst), "+c"(__n)
                       : "a"(__x)
                       : "memory");
}
/* Store the 16-bit __x into __n consecutive 16-bit units starting at __dst
 * with `rep stosw`.
 *
 * The previous mnemonic `stosh` is not an x86 instruction; the word-sized
 * string store is `stosw`. The destination and count registers are modified
 * by the instruction, so they are declared as read-write operands instead of
 * being listed as both inputs and clobbers. The "memory" clobber and
 * __volatile__ tell the compiler that memory is written and the statement
 * must be kept. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__stosw(unsigned short *__dst, unsigned short __x, size_t __n) {
  __asm__ __volatile__("rep stosw"
                       : "+D"(__dst), "+c"(__n)
                       : "a"(__x)
                       : "memory");
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000875#endif
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000876#ifdef __x86_64__
/* Copy __n 64-bit units from __src to __dst with `rep movsq`.
 *
 * The destination, source and count registers are modified by the
 * instruction, so they are declared as read-write operands; the previous
 * clobber list named the 32-bit registers and duplicated the inputs. The
 * "memory" clobber and __volatile__ tell the compiler that memory is written
 * and the statement must be kept. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__movsq(unsigned long long *__dst, unsigned long long const *__src, size_t __n) {
  __asm__ __volatile__("rep movsq"
                       : "+D"(__dst), "+S"(__src), "+c"(__n)
                       :
                       : "memory");
}
/* Store the 64-bit __x into __n consecutive 64-bit units starting at __dst
 * with `rep stosq`.
 *
 * The destination and count registers are modified by the instruction, so
 * they are declared as read-write operands; the previous clobber list named
 * the 32-bit registers and duplicated the inputs. The "memory" clobber and
 * __volatile__ tell the compiler that memory is written and the statement
 * must be kept. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__stosq(unsigned __int64 *__dst, unsigned __int64 __x, size_t __n) {
  __asm__ __volatile__("rep stosq"
                       : "+D"(__dst), "+c"(__n)
                       : "a"(__x)
                       : "memory");
}
887#endif
888
889/*----------------------------------------------------------------------------*\
Warren Huntd6ffae92013-09-27 23:57:26 +0000890|* Misc
891\*----------------------------------------------------------------------------*/
/* Return the address one pointer-size above __builtin_frame_address(0), i.e.
 * the slot this header treats as holding the return address. */
static __inline__ void * __attribute__((__always_inline__, __nodebug__))
_AddressOfReturnAddress(void) {
  char *const __frame = (char *)__builtin_frame_address(0);
  return (void *)(__frame + sizeof(void *));
}
/* Return the result of __builtin_return_address(0). */
static __inline__ void * __attribute__((__always_inline__, __nodebug__))
_ReturnAddress(void) {
  void *const __caller = __builtin_return_address(0);
  return __caller;
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000900#if defined(__i386__) || defined(__x86_64__)
/* Execute CPUID for leaf __level and store EAX, EBX, ECX and EDX in
 * __info[0] .. __info[3] respectively.
 *
 * ECX is explicitly zeroed before the instruction: several leaves take a
 * sub-leaf index in ECX, and leaving it uninitialized made their results
 * depend on whatever the register happened to hold. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__cpuid(int __info[4], int __level) {
  __asm__ ("cpuid"
           : "=a"(__info[0]), "=b"(__info[1]), "=c"(__info[2]), "=d"(__info[3])
           : "a"(__level), "c"(0));
}
/* Execute CPUID with EAX = __level and ECX = __ecx, and store the resulting
 * EAX, EBX, ECX and EDX in __info[0] .. __info[3] respectively. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__cpuidex(int __info[4], int __level, int __ecx) {
  __asm__ ("cpuid"
           : "=a"(__info[0]), "=b"(__info[1]), "=c"(__info[2]), "=d"(__info[3])
           : "a"(__level), "c"(__ecx));
}
/* Execute XGETBV with ECX = __xcr_no and return EDX:EAX combined into one
 * 64-bit value (EDX in the upper 32 bits, EAX in the lower 32 bits). */
static __inline__ unsigned __int64 __cdecl __attribute__((__always_inline__, __nodebug__))
_xgetbv(unsigned int __xcr_no) {
  unsigned int __low_half, __high_half;
  __asm__ ("xgetbv" : "=a" (__low_half), "=d" (__high_half) : "c" (__xcr_no));
  const unsigned __int64 __upper = (unsigned __int64)__high_half << 32;
  return __upper | __low_half;
}
/* Execute the HLT instruction. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__halt(void) {
  __asm__ __volatile__("hlt");
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000921#endif
Warren Huntd6ffae92013-09-27 23:57:26 +0000922
Reid Kleckner592dc612014-04-08 00:28:22 +0000923/*----------------------------------------------------------------------------*\
924|* Privileged intrinsics
925\*----------------------------------------------------------------------------*/
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000926#if defined(__i386__) || defined(__x86_64__)
Reid Kleckner592dc612014-04-08 00:28:22 +0000927static __inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
928__readmsr(unsigned long __register) {
929 // Loads the contents of a 64-bit model specific register (MSR) specified in
930 // the ECX register into registers EDX:EAX. The EDX register is loaded with
931 // the high-order 32 bits of the MSR and the EAX register is loaded with the
932 // low-order 32 bits. If less than 64 bits are implemented in the MSR being
933 // read, the values returned to EDX:EAX in unimplemented bit locations are
934 // undefined.
935 unsigned long __edx;
936 unsigned long __eax;
Reid Kleckner6df52542014-04-08 17:49:16 +0000937 __asm__ ("rdmsr" : "=d"(__edx), "=a"(__eax) : "c"(__register));
Reid Kleckner592dc612014-04-08 00:28:22 +0000938 return (((unsigned __int64)__edx) << 32) | (unsigned __int64)__eax;
939}
940
/* Return the contents of control register CR3.
 *
 * The attribute is spelled __always_inline__ (reserved form) like every other
 * intrinsic in this header, so a user macro named `always_inline` cannot
 * break the declaration.
 *
 * NOTE(review): the return type is unsigned long; confirm it is wide enough
 * for CR3 on every target this header supports. */
static __inline__ unsigned long __attribute__((__always_inline__, __nodebug__))
__readcr3(void) {
  unsigned long __cr3_val;
  __asm__ __volatile__ ("mov %%cr3, %0" : "=q"(__cr3_val) : : "memory");
  return __cr3_val;
}
947
/* Load __cr3_val into control register CR3.
 *
 * The attribute is spelled __always_inline__ (reserved form) like every other
 * intrinsic in this header, so a user macro named `always_inline` cannot
 * break the declaration. The asm has no outputs and is therefore implicitly
 * volatile; the "memory" clobber keeps memory accesses from being moved
 * across the write. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__writecr3(unsigned int __cr3_val) {
  __asm__ ("mov %0, %%cr3" : : "q"(__cr3_val) : "memory");
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000952#endif
Reid Kleckner592dc612014-04-08 00:28:22 +0000953
Eric Christophercc872532013-09-18 22:40:18 +0000954#ifdef __cplusplus
Eric Christopher0db88a72013-09-18 22:24:01 +0000955}
Eric Christopherd1428bf2013-08-31 00:22:48 +0000956#endif
Reid Klecknerf0e23222013-09-19 00:19:53 +0000957
958#endif /* __INTRIN_H */
959#endif /* _MSC_VER */