blob: 9592cccb15c72bde18cc6e6dc3ff615ca5186d73 [file] [log] [blame]
Eric Christopherd1428bf2013-08-31 00:22:48 +00001/* ===-------- Intrin.h ---------------------------------------------------===
2 *
3 * Permission is hereby granted, free of charge, to any person obtaining a copy
4 * of this software and associated documentation files (the "Software"), to deal
5 * in the Software without restriction, including without limitation the rights
6 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
7 * copies of the Software, and to permit persons to whom the Software is
8 * furnished to do so, subject to the following conditions:
9 *
10 * The above copyright notice and this permission notice shall be included in
11 * all copies or substantial portions of the Software.
12 *
13 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
15 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
16 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
17 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
18 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
19 * THE SOFTWARE.
20 *
21 *===-----------------------------------------------------------------------===
22 */
23
24/* Only include this if we're compiling for the windows platform. */
25#ifndef _MSC_VER
26#include_next <Intrin.h>
27#else
28
29#ifndef __INTRIN_H
30#define __INTRIN_H
31
32/* First include the standard intrinsics. */
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +000033#if defined(__i386__) || defined(__x86_64__)
Eric Christopherd1428bf2013-08-31 00:22:48 +000034#include <x86intrin.h>
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +000035#endif
Eric Christopherd1428bf2013-08-31 00:22:48 +000036
Hans Wennborg1fd6dd32014-01-28 23:01:59 +000037/* For the definition of jmp_buf. */
Nico Webera62cffa2014-07-08 18:34:46 +000038#if __STDC_HOSTED__
Hans Wennborg1fd6dd32014-01-28 23:01:59 +000039#include <setjmp.h>
Nico Webera62cffa2014-07-08 18:34:46 +000040#endif
Hans Wennborg1fd6dd32014-01-28 23:01:59 +000041
Eric Christopher0db88a72013-09-18 22:24:01 +000042#ifdef __cplusplus
43extern "C" {
44#endif
45
Saleem Abdulrasoolc4ebb122014-07-08 05:46:04 +000046#if defined(__MMX__)
Eric Christopherd1428bf2013-08-31 00:22:48 +000047/* And the random ones that aren't in those files. */
48__m64 _m_from_float(float);
49__m64 _m_from_int(int _l);
50void _m_prefetch(void *);
51float _m_to_float(__m64);
52int _m_to_int(__m64 _M);
Saleem Abdulrasoolc4ebb122014-07-08 05:46:04 +000053#endif
Eric Christopherd1428bf2013-08-31 00:22:48 +000054
55/* Other assorted instruction intrinsics. */
56void __addfsbyte(unsigned long, unsigned char);
57void __addfsdword(unsigned long, unsigned long);
58void __addfsword(unsigned long, unsigned short);
59void __code_seg(const char *);
Hans Wennborg854f7d32014-01-16 23:39:35 +000060static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000061void __cpuid(int[4], int);
Hans Wennborg12fb89e2014-01-31 19:44:55 +000062static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000063void __cpuidex(int[4], int, int);
Eric Christopher0db88a72013-09-18 22:24:01 +000064void __debugbreak(void);
Eric Christopherd1428bf2013-08-31 00:22:48 +000065__int64 __emul(int, int);
66unsigned __int64 __emulu(unsigned int, unsigned int);
Eric Christopher0db88a72013-09-18 22:24:01 +000067void __cdecl __fastfail(unsigned int);
Eric Christopherd1428bf2013-08-31 00:22:48 +000068unsigned int __getcallerseflags(void);
Hans Wennborg740a4d62014-01-28 22:55:01 +000069static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000070void __halt(void);
71unsigned char __inbyte(unsigned short);
72void __inbytestring(unsigned short, unsigned char *, unsigned long);
73void __incfsbyte(unsigned long);
74void __incfsdword(unsigned long);
75void __incfsword(unsigned long);
76unsigned long __indword(unsigned short);
77void __indwordstring(unsigned short, unsigned long *, unsigned long);
78void __int2c(void);
79void __invlpg(void *);
80unsigned short __inword(unsigned short);
81void __inwordstring(unsigned short, unsigned short *, unsigned long);
82void __lidt(void *);
83unsigned __int64 __ll_lshift(unsigned __int64, int);
84__int64 __ll_rshift(__int64, int);
85void __llwpcb(void *);
86unsigned char __lwpins32(unsigned int, unsigned int, unsigned int);
87void __lwpval32(unsigned int, unsigned int, unsigned int);
88unsigned int __lzcnt(unsigned int);
89unsigned short __lzcnt16(unsigned short);
Hans Wennborgd9be72e2014-03-12 22:00:32 +000090static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000091void __movsb(unsigned char *, unsigned char const *, size_t);
Hans Wennborgd9be72e2014-03-12 22:00:32 +000092static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000093void __movsd(unsigned long *, unsigned long const *, size_t);
Hans Wennborgd9be72e2014-03-12 22:00:32 +000094static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +000095void __movsw(unsigned short *, unsigned short const *, size_t);
96void __nop(void);
97void __nvreg_restore_fence(void);
98void __nvreg_save_fence(void);
99void __outbyte(unsigned short, unsigned char);
100void __outbytestring(unsigned short, unsigned char *, unsigned long);
101void __outdword(unsigned short, unsigned long);
102void __outdwordstring(unsigned short, unsigned long *, unsigned long);
103void __outword(unsigned short, unsigned short);
104void __outwordstring(unsigned short, unsigned short *, unsigned long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000105static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000106unsigned int __popcnt(unsigned int);
Warren Huntd6ffae92013-09-27 23:57:26 +0000107static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000108unsigned short __popcnt16(unsigned short);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000109unsigned long __readcr0(void);
110unsigned long __readcr2(void);
Reid Kleckner592dc612014-04-08 00:28:22 +0000111static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000112unsigned long __readcr3(void);
Eric Christopher439137e2014-01-24 12:13:47 +0000113unsigned long __readcr4(void);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000114unsigned long __readcr8(void);
115unsigned int __readdr(unsigned int);
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000116#ifdef __i386__
117static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000118unsigned char __readfsbyte(unsigned long);
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000119static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000120unsigned long __readfsdword(unsigned long);
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000121static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000122unsigned __int64 __readfsqword(unsigned long);
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000123static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000124unsigned short __readfsword(unsigned long);
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000125#endif
Reid Kleckner592dc612014-04-08 00:28:22 +0000126static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000127unsigned __int64 __readmsr(unsigned long);
128unsigned __int64 __readpmc(unsigned long);
129unsigned long __segmentlimit(unsigned long);
130void __sidt(void *);
131void *__slwpcb(void);
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000132static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000133void __stosb(unsigned char *, unsigned char, size_t);
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000134static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000135void __stosd(unsigned long *, unsigned long, size_t);
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000136static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000137void __stosw(unsigned short *, unsigned short, size_t);
138void __svm_clgi(void);
139void __svm_invlpga(void *, int);
140void __svm_skinit(int);
141void __svm_stgi(void);
142void __svm_vmload(size_t);
143void __svm_vmrun(size_t);
144void __svm_vmsave(size_t);
145void __ud2(void);
146unsigned __int64 __ull_rshift(unsigned __int64, int);
147void __vmx_off(void);
148void __vmx_vmptrst(unsigned __int64 *);
149void __wbinvd(void);
150void __writecr0(unsigned int);
Reid Kleckner592dc612014-04-08 00:28:22 +0000151static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000152void __writecr3(unsigned int);
153void __writecr4(unsigned int);
154void __writecr8(unsigned int);
155void __writedr(unsigned int, unsigned int);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000156void __writefsbyte(unsigned long, unsigned char);
157void __writefsdword(unsigned long, unsigned long);
158void __writefsqword(unsigned long, unsigned __int64);
159void __writefsword(unsigned long, unsigned short);
160void __writemsr(unsigned long, unsigned __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000161static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000162void *_AddressOfReturnAddress(void);
Warren Huntd6ffae92013-09-27 23:57:26 +0000163static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000164unsigned char _BitScanForward(unsigned long *_Index, unsigned long _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000165static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000166unsigned char _BitScanReverse(unsigned long *_Index, unsigned long _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000167static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000168unsigned char _bittest(long const *, long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000169static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000170unsigned char _bittestandcomplement(long *, long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000171static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000172unsigned char _bittestandreset(long *, long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000173static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000174unsigned char _bittestandset(long *, long);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000175unsigned __int64 __cdecl _byteswap_uint64(unsigned __int64);
176unsigned long __cdecl _byteswap_ulong(unsigned long);
177unsigned short __cdecl _byteswap_ushort(unsigned short);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000178void __cdecl _disable(void);
179void __cdecl _enable(void);
180void __cdecl _fxrstor(void const *);
181void __cdecl _fxsave(void *);
182long _InterlockedAddLargeStatistic(__int64 volatile *_Addend, long _Value);
Warren Huntd6ffae92013-09-27 23:57:26 +0000183static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000184long _InterlockedAnd(long volatile *_Value, long _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000185static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000186short _InterlockedAnd16(short volatile *_Value, short _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000187static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000188char _InterlockedAnd8(char volatile *_Value, char _Mask);
189unsigned char _interlockedbittestandreset(long volatile *, long);
Hans Wennborga3169332014-03-13 17:05:09 +0000190static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000191unsigned char _interlockedbittestandset(long volatile *, long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000192static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000193long __cdecl _InterlockedCompareExchange(long volatile *_Destination,
194 long _Exchange, long _Comparand);
195long _InterlockedCompareExchange_HLEAcquire(long volatile *, long, long);
196long _InterlockedCompareExchange_HLERelease(long volatile *, long, long);
Warren Huntd6ffae92013-09-27 23:57:26 +0000197static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000198short _InterlockedCompareExchange16(short volatile *_Destination,
199 short _Exchange, short _Comparand);
Warren Huntd6ffae92013-09-27 23:57:26 +0000200static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000201__int64 _InterlockedCompareExchange64(__int64 volatile *_Destination,
202 __int64 _Exchange, __int64 _Comparand);
203__int64 _InterlockedcompareExchange64_HLEAcquire(__int64 volatile *, __int64,
204 __int64);
205__int64 _InterlockedCompareExchange64_HLERelease(__int64 volatile *, __int64,
206 __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000207static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000208char _InterlockedCompareExchange8(char volatile *_Destination, char _Exchange,
209 char _Comparand);
210void *_InterlockedCompareExchangePointer_HLEAcquire(void *volatile *, void *,
211 void *);
212void *_InterlockedCompareExchangePointer_HLERelease(void *volatile *, void *,
213 void *);
Warren Huntd6ffae92013-09-27 23:57:26 +0000214static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000215long __cdecl _InterlockedDecrement(long volatile *_Addend);
Warren Huntd6ffae92013-09-27 23:57:26 +0000216static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000217short _InterlockedDecrement16(short volatile *_Addend);
Saleem Abdulrasool114efe02014-06-18 20:51:10 +0000218long _InterlockedExchange(long volatile *_Target, long _Value);
Warren Huntd6ffae92013-09-27 23:57:26 +0000219static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000220short _InterlockedExchange16(short volatile *_Target, short _Value);
Warren Huntd6ffae92013-09-27 23:57:26 +0000221static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000222char _InterlockedExchange8(char volatile *_Target, char _Value);
Warren Huntd6ffae92013-09-27 23:57:26 +0000223static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000224long __cdecl _InterlockedExchangeAdd(long volatile *_Addend, long _Value);
225long _InterlockedExchangeAdd_HLEAcquire(long volatile *, long);
226long _InterlockedExchangeAdd_HLERelease(long volatile *, long);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000227static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000228short _InterlockedExchangeAdd16(short volatile *_Addend, short _Value);
229__int64 _InterlockedExchangeAdd64_HLEAcquire(__int64 volatile *, __int64);
230__int64 _InterlockedExchangeAdd64_HLERelease(__int64 volatile *, __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000231static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000232char _InterlockedExchangeAdd8(char volatile *_Addend, char _Value);
Warren Huntd6ffae92013-09-27 23:57:26 +0000233static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000234long __cdecl _InterlockedIncrement(long volatile *_Addend);
Warren Huntd6ffae92013-09-27 23:57:26 +0000235static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000236short _InterlockedIncrement16(short volatile *_Addend);
Warren Huntd6ffae92013-09-27 23:57:26 +0000237static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000238long _InterlockedOr(long volatile *_Value, long _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000239static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000240short _InterlockedOr16(short volatile *_Value, short _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000241static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000242char _InterlockedOr8(char volatile *_Value, char _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000243static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000244long _InterlockedXor(long volatile *_Value, long _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000245static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000246short _InterlockedXor16(short volatile *_Value, short _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000247static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000248char _InterlockedXor8(char volatile *_Value, char _Mask);
249void __cdecl _invpcid(unsigned int, void *);
Warren Huntd6ffae92013-09-27 23:57:26 +0000250static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000251unsigned long __cdecl _lrotl(unsigned long, int);
Warren Huntd6ffae92013-09-27 23:57:26 +0000252static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000253unsigned long __cdecl _lrotr(unsigned long, int);
/* Declared once with a single storage-class/inline specifier pair. */
static __inline__
void _ReadBarrier(void);
Reid Kleckner00d33a52013-10-17 01:29:48 +0000257static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000258void _ReadWriteBarrier(void);
Warren Huntd6ffae92013-09-27 23:57:26 +0000259static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000260void *_ReturnAddress(void);
261unsigned int _rorx_u32(unsigned int, const unsigned int);
Warren Huntd6ffae92013-09-27 23:57:26 +0000262static __inline__
Eric Christopherfb4b4332013-08-31 00:27:38 +0000263unsigned int __cdecl _rotl(unsigned int _Value, int _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000264static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000265unsigned short _rotl16(unsigned short _Value, unsigned char _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000266static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000267unsigned __int64 __cdecl _rotl64(unsigned __int64 _Value, int _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000268static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000269unsigned char _rotl8(unsigned char _Value, unsigned char _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000270static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000271unsigned int __cdecl _rotr(unsigned int _Value, int _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000272static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000273unsigned short _rotr16(unsigned short _Value, unsigned char _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000274static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000275unsigned __int64 __cdecl _rotr64(unsigned __int64 _Value, int _Shift);
Warren Huntd6ffae92013-09-27 23:57:26 +0000276static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000277unsigned char _rotr8(unsigned char _Value, unsigned char _Shift);
278int _sarx_i32(int, unsigned int);
Nico Webera62cffa2014-07-08 18:34:46 +0000279#if __STDC_HOSTED__
Hans Wennborg1fd6dd32014-01-28 23:01:59 +0000280int __cdecl _setjmp(jmp_buf);
Nico Webera62cffa2014-07-08 18:34:46 +0000281#endif
Eric Christopherd1428bf2013-08-31 00:22:48 +0000282unsigned int _shlx_u32(unsigned int, unsigned int);
283unsigned int _shrx_u32(unsigned int, unsigned int);
284void _Store_HLERelease(long volatile *, long);
285void _Store64_HLERelease(__int64 volatile *, __int64);
286void _StorePointer_HLERelease(void *volatile *, void *);
Reid Kleckner00d33a52013-10-17 01:29:48 +0000287static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000288void _WriteBarrier(void);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000289unsigned __int32 xbegin(void);
290void _xend(void);
Hans Wennborg854f7d32014-01-16 23:39:35 +0000291static __inline__
Hans Wennborg2e56d952015-01-27 23:34:35 +0000292#define _XCR_XFEATURE_ENABLED_MASK 0
Eric Christopherd1428bf2013-08-31 00:22:48 +0000293unsigned __int64 __cdecl _xgetbv(unsigned int);
294void __cdecl _xrstor(void const *, unsigned __int64);
295void __cdecl _xsave(void *, unsigned __int64);
296void __cdecl _xsaveopt(void *, unsigned __int64);
297void __cdecl _xsetbv(unsigned int, unsigned __int64);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000298
299/* These additional intrinsics are turned on in x64/amd64/x86_64 mode. */
Warren Hunt3f987942013-09-30 21:08:05 +0000300#ifdef __x86_64__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000301void __addgsbyte(unsigned long, unsigned char);
302void __addgsdword(unsigned long, unsigned long);
303void __addgsqword(unsigned long, unsigned __int64);
304void __addgsword(unsigned long, unsigned short);
Reid Klecknerf08d6582014-01-27 19:16:35 +0000305static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000306void __faststorefence(void);
307void __incgsbyte(unsigned long);
308void __incgsdword(unsigned long);
309void __incgsqword(unsigned long);
310void __incgsword(unsigned long);
Eric Christopher439137e2014-01-24 12:13:47 +0000311unsigned char __lwpins64(unsigned __int64, unsigned int, unsigned int);
312void __lwpval64(unsigned __int64, unsigned int, unsigned int);
313unsigned __int64 __lzcnt64(unsigned __int64);
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000314static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000315void __movsq(unsigned long long *, unsigned long long const *, size_t);
316__int64 __mulh(__int64, __int64);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000317static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000318unsigned __int64 __popcnt64(unsigned __int64);
Hans Wennborga4421e02014-03-12 21:09:05 +0000319static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000320unsigned char __readgsbyte(unsigned long);
Hans Wennborga4421e02014-03-12 21:09:05 +0000321static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000322unsigned long __readgsdword(unsigned long);
Hans Wennborga4421e02014-03-12 21:09:05 +0000323static __inline__
324unsigned __int64 __readgsqword(unsigned long);
Eric Christopher439137e2014-01-24 12:13:47 +0000325unsigned short __readgsword(unsigned long);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000326unsigned __int64 __shiftleft128(unsigned __int64 _LowPart,
327 unsigned __int64 _HighPart,
328 unsigned char _Shift);
329unsigned __int64 __shiftright128(unsigned __int64 _LowPart,
330 unsigned __int64 _HighPart,
331 unsigned char _Shift);
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000332static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000333void __stosq(unsigned __int64 *, unsigned __int64, size_t);
Eric Christopher439137e2014-01-24 12:13:47 +0000334unsigned char __vmx_on(unsigned __int64 *);
335unsigned char __vmx_vmclear(unsigned __int64 *);
336unsigned char __vmx_vmlaunch(void);
337unsigned char __vmx_vmptrld(unsigned __int64 *);
338unsigned char __vmx_vmread(size_t, size_t *);
339unsigned char __vmx_vmresume(void);
340unsigned char __vmx_vmwrite(size_t, size_t);
341void __writegsbyte(unsigned long, unsigned char);
342void __writegsdword(unsigned long, unsigned long);
343void __writegsqword(unsigned long, unsigned __int64);
344void __writegsword(unsigned long, unsigned short);
Warren Huntd6ffae92013-09-27 23:57:26 +0000345static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000346unsigned char _BitScanForward64(unsigned long *_Index, unsigned __int64 _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000347static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000348unsigned char _BitScanReverse64(unsigned long *_Index, unsigned __int64 _Mask);
Warren Huntd6ffae92013-09-27 23:57:26 +0000349static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000350unsigned char _bittest64(__int64 const *, __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000351static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000352unsigned char _bittestandcomplement64(__int64 *, __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000353static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000354unsigned char _bittestandreset64(__int64 *, __int64);
Warren Huntd6ffae92013-09-27 23:57:26 +0000355static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000356unsigned char _bittestandset64(__int64 *, __int64);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000357unsigned __int64 __cdecl _byteswap_uint64(unsigned __int64);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000358void __cdecl _fxrstor64(void const *);
359void __cdecl _fxsave64(void *);
360long _InterlockedAnd_np(long volatile *_Value, long _Mask);
361short _InterlockedAnd16_np(short volatile *_Value, short _Mask);
362__int64 _InterlockedAnd64_np(__int64 volatile *_Value, __int64 _Mask);
363char _InterlockedAnd8_np(char volatile *_Value, char _Mask);
364unsigned char _interlockedbittestandreset64(__int64 volatile *, __int64);
Hans Wennborga3169332014-03-13 17:05:09 +0000365static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000366unsigned char _interlockedbittestandset64(__int64 volatile *, __int64);
367long _InterlockedCompareExchange_np(long volatile *_Destination, long _Exchange,
368 long _Comparand);
369unsigned char _InterlockedCompareExchange128(__int64 volatile *_Destination,
370 __int64 _ExchangeHigh,
371 __int64 _ExchangeLow,
372 __int64 *_CompareandResult);
373unsigned char _InterlockedCompareExchange128_np(__int64 volatile *_Destination,
374 __int64 _ExchangeHigh,
375 __int64 _ExchangeLow,
376 __int64 *_ComparandResult);
377short _InterlockedCompareExchange16_np(short volatile *_Destination,
378 short _Exchange, short _Comparand);
Eric Christopher439137e2014-01-24 12:13:47 +0000379__int64 _InterlockedCompareExchange64_HLEAcquire(__int64 volatile *, __int64,
380 __int64);
381__int64 _InterlockedCompareExchange64_HLERelease(__int64 volatile *, __int64,
382 __int64);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000383__int64 _InterlockedCompareExchange64_np(__int64 volatile *_Destination,
384 __int64 _Exchange, __int64 _Comparand);
Eric Christopher58b40432014-01-25 01:38:30 +0000385void *_InterlockedCompareExchangePointer(void *volatile *_Destination,
386 void *_Exchange, void *_Comparand);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000387void *_InterlockedCompareExchangePointer_np(void *volatile *_Destination,
388 void *_Exchange, void *_Comparand);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000389static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000390__int64 _InterlockedDecrement64(__int64 volatile *_Addend);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000391static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000392__int64 _InterlockedExchange64(__int64 volatile *_Target, __int64 _Value);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000393static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000394__int64 _InterlockedExchangeAdd64(__int64 volatile *_Addend, __int64 _Value);
395void *_InterlockedExchangePointer(void *volatile *_Target, void *_Value);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000396static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000397__int64 _InterlockedIncrement64(__int64 volatile *_Addend);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000398long _InterlockedOr_np(long volatile *_Value, long _Mask);
399short _InterlockedOr16_np(short volatile *_Value, short _Mask);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000400static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000401__int64 _InterlockedOr64(__int64 volatile *_Value, __int64 _Mask);
Warren Hunt41a993f2013-09-28 00:15:41 +0000402__int64 _InterlockedOr64_np(__int64 volatile *_Value, __int64 _Mask);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000403char _InterlockedOr8_np(char volatile *_Value, char _Mask);
404long _InterlockedXor_np(long volatile *_Value, long _Mask);
405short _InterlockedXor16_np(short volatile *_Value, short _Mask);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000406static __inline__
Eric Christopher439137e2014-01-24 12:13:47 +0000407__int64 _InterlockedXor64(__int64 volatile *_Value, __int64 _Mask);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000408__int64 _InterlockedXor64_np(__int64 volatile *_Value, __int64 _Mask);
409char _InterlockedXor8_np(char volatile *_Value, char _Mask);
Reid Kleckner924eb2a2014-01-27 18:48:02 +0000410static __inline__
Eric Christopherd1428bf2013-08-31 00:22:48 +0000411__int64 _mul128(__int64 _Multiplier, __int64 _Multiplicand,
412 __int64 *_HighProduct);
Eric Christopherd1428bf2013-08-31 00:22:48 +0000413unsigned __int64 _rorx_u64(unsigned __int64, const unsigned int);
Eric Christopher439137e2014-01-24 12:13:47 +0000414__int64 _sarx_i64(__int64, unsigned int);
Nico Webera62cffa2014-07-08 18:34:46 +0000415#if __STDC_HOSTED__
416int __cdecl _setjmpex(jmp_buf);
417#endif
Eric Christopher439137e2014-01-24 12:13:47 +0000418unsigned __int64 _shlx_u64(unsigned __int64, unsigned int);
David Majnemer54507632014-12-02 23:30:26 +0000419unsigned __int64 _shrx_u64(unsigned __int64, unsigned int);
/*
 * Multiply two unsigned 64-bit integers and obtain the full 128-bit product.
 * The low 64 bits are returned directly; the high 64 bits are written through
 * the _HighProduct out parameter.
 */
static __inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
_umul128(unsigned __int64 _Multiplier, unsigned __int64 _Multiplicand,
         unsigned __int64 *_HighProduct) {
  /* Widen one operand first so the multiplication is carried out in 128 bits. */
  unsigned __int128 _Wide = _Multiplier;
  _Wide *= _Multiplicand;
  *_HighProduct = (unsigned __int64)(_Wide >> 64);
  return (unsigned __int64)_Wide;
}
/*
 * Multiply two unsigned 64-bit integers and return only the upper 64 bits of
 * the 128-bit product.
 */
static __inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
__umulh(unsigned __int64 _Multiplier, unsigned __int64 _Multiplicand) {
  /* Widen one operand first so the multiplication is carried out in 128 bits. */
  unsigned __int128 _Wide = _Multiplier;
  _Wide *= _Multiplicand;
  return (unsigned __int64)(_Wide >> 64);
}
Eric Christopherd1428bf2013-08-31 00:22:48 +0000438void __cdecl _xrstor64(void const *, unsigned __int64);
439void __cdecl _xsave64(void *, unsigned __int64);
440void __cdecl _xsaveopt64(void *, unsigned __int64);
Eric Christopher0db88a72013-09-18 22:24:01 +0000441
Warren Hunt3f987942013-09-30 21:08:05 +0000442#endif /* __x86_64__ */
Reid Klecknerf0e23222013-09-19 00:19:53 +0000443
Warren Huntd6ffae92013-09-27 23:57:26 +0000444/*----------------------------------------------------------------------------*\
445|* Bit Twiddling
446\*----------------------------------------------------------------------------*/
/* Rotate an 8-bit value left. Only the low three bits of _Shift are used, so
 * the effective count is always in [0, 7]. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_rotl8(unsigned char _Value, unsigned char _Shift) {
  const unsigned int _Count = _Shift & 0x7u;
  if (_Count == 0)
    return _Value;
  /* The operands are promoted to int; the cast keeps only the low 8 bits. */
  return (unsigned char)((_Value << _Count) | (_Value >> (8 - _Count)));
}
/* Rotate an 8-bit value right. Only the low three bits of _Shift are used, so
 * the effective count is always in [0, 7]. */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_rotr8(unsigned char _Value, unsigned char _Shift) {
  const unsigned int _Count = _Shift & 0x7u;
  if (_Count == 0)
    return _Value;
  /* The operands are promoted to int; the cast keeps only the low 8 bits. */
  return (unsigned char)((_Value >> _Count) | (_Value << (8 - _Count)));
}
/* Rotate a 16-bit value left. Only the low four bits of _Shift are used, so
 * the effective count is always in [0, 15]. */
static __inline__ unsigned short __attribute__((__always_inline__, __nodebug__))
_rotl16(unsigned short _Value, unsigned char _Shift) {
  const unsigned int _Count = _Shift & 0xfu;
  if (_Count == 0)
    return _Value;
  /* The operands are promoted to int; the cast keeps only the low 16 bits. */
  return (unsigned short)((_Value << _Count) | (_Value >> (16 - _Count)));
}
/* Rotate a 16-bit value right. Only the low four bits of _Shift are used, so
 * the effective count is always in [0, 15]. */
static __inline__ unsigned short __attribute__((__always_inline__, __nodebug__))
_rotr16(unsigned short _Value, unsigned char _Shift) {
  const unsigned int _Count = _Shift & 0xfu;
  if (_Count == 0)
    return _Value;
  /* The operands are promoted to int; the cast keeps only the low 16 bits. */
  return (unsigned short)((_Value >> _Count) | (_Value << (16 - _Count)));
}
/* Rotate a 32-bit unsigned int left. The count is reduced with a 0x1f mask, so
 * negative or oversized _Shift values wrap into [0, 31]. */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__))
_rotl(unsigned int _Value, int _Shift) {
  const int _Count = _Shift & 0x1f;
  if (_Count == 0)
    return _Value; /* avoids the out-of-range shift by 32 below */
  return (_Value << _Count) | (_Value >> (32 - _Count));
}
/* Rotate a 32-bit unsigned int right. The count is reduced with a 0x1f mask,
 * so negative or oversized _Shift values wrap into [0, 31]. */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__))
_rotr(unsigned int _Value, int _Shift) {
  const int _Count = _Shift & 0x1f;
  if (_Count == 0)
    return _Value; /* avoids the out-of-range shift by 32 below */
  return (_Value >> _Count) | (_Value << (32 - _Count));
}
/*
 * Rotate an unsigned long left by _Shift bits.
 *
 * The rotation width is taken from the type itself rather than assumed to be
 * 32, so the result is a true rotation whether long is 32 bits (Windows) or
 * 64 bits. The count is reduced modulo the width, so negative or oversized
 * _Shift values wrap; a reduced count of zero returns _Value unchanged.
 */
static __inline__ unsigned long __attribute__((__always_inline__, __nodebug__))
_lrotl(unsigned long _Value, int _Shift) {
  const int _Width = (int)(sizeof(_Value) * __CHAR_BIT__);
  _Shift &= _Width - 1; /* width is a power of two, so this is "mod width" */
  /* The zero check avoids shifting by the full width, which is undefined. */
  return _Shift ? (_Value << _Shift) | (_Value >> (_Width - _Shift)) : _Value;
}
/*
 * Rotate an unsigned long right by _Shift bits.
 *
 * The rotation width is taken from the type itself rather than assumed to be
 * 32, so the result is a true rotation whether long is 32 bits (Windows) or
 * 64 bits. The count is reduced modulo the width, so negative or oversized
 * _Shift values wrap; a reduced count of zero returns _Value unchanged.
 */
static __inline__ unsigned long __attribute__((__always_inline__, __nodebug__))
_lrotr(unsigned long _Value, int _Shift) {
  const int _Width = (int)(sizeof(_Value) * __CHAR_BIT__);
  _Shift &= _Width - 1; /* width is a power of two, so this is "mod width" */
  /* The zero check avoids shifting by the full width, which is undefined. */
  return _Shift ? (_Value >> _Shift) | (_Value << (_Width - _Shift)) : _Value;
}
/* Rotate a 64-bit value left. The count is reduced with a 0x3f mask, so
 * negative or oversized _Shift values wrap into [0, 63]. */
static
__inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
_rotl64(unsigned __int64 _Value, int _Shift) {
  const int _Count = _Shift & 0x3f;
  if (_Count == 0)
    return _Value; /* avoids the out-of-range shift by 64 below */
  return (_Value << _Count) | (_Value >> (64 - _Count));
}
493static
494__inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
495_rotr64(unsigned __int64 _Value, int _Shift) {
496 _Shift &= 0x3f;
497 return _Shift ? (_Value >> _Shift) | (_Value << (64 - _Shift)) : _Value;
498}
499/*----------------------------------------------------------------------------*\
500|* Bit Counting and Testing
501\*----------------------------------------------------------------------------*/
/*
 * Finds the lowest set bit of _Mask. Returns 1 and stores its zero-based
 * position in *_Index when _Mask is non-zero; returns 0 and leaves *_Index
 * untouched when _Mask is zero.
 */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_BitScanForward(unsigned long *_Index, unsigned long _Mask) {
  const unsigned char __found = (unsigned char)(_Mask != 0);
  if (__found)
    *_Index = __builtin_ctzl(_Mask);
  return __found;
}
/*
 * Finds the highest set bit of _Mask. Returns 1 and stores its zero-based
 * position in *_Index when _Mask is non-zero; returns 0 and leaves *_Index
 * untouched when _Mask is zero.
 */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_BitScanReverse(unsigned long *_Index, unsigned long _Mask) {
  /* __builtin_clzl counts over the full width of unsigned long, so the top
     bit index must come from the type's width, not a fixed 31. */
  const int __top = (int)(sizeof(_Mask) * __CHAR_BIT__) - 1;
  if (!_Mask)
    return 0;
  *_Index = (unsigned long)(__top - __builtin_clzl(_Mask));
  return 1;
}
/* Returns the number of set bits in the 16-bit value. */
static __inline__ unsigned short __attribute__((__always_inline__, __nodebug__))
__popcnt16(unsigned short value) {
  const int __ones = __builtin_popcount((int)value);
  return (unsigned short)__ones;
}
/* Returns the number of set bits in the 32-bit value. */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__))
__popcnt(unsigned int value) {
  const int __ones = __builtin_popcount(value);
  return (unsigned int)__ones;
}
/* Returns bit number b of the long pointed to by a (0 or 1). */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittest(long const *a, long b) {
  const long __word = *a;
  return (unsigned char)((__word >> b) & 1);
}
/*
 * Toggles bit number b of *a and returns the value that bit had beforehand.
 * The mask is built as an unsigned long so every bit of the word, including
 * the sign bit, can be addressed without overflowing a signed int shift.
 */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittestandcomplement(long *a, long b) {
  const unsigned long __bit = 1UL << b;
  unsigned char x = (unsigned char)((*a >> b) & 1);
  *a = (long)((unsigned long)*a ^ __bit);
  return x;
}
/*
 * Clears bit number b of *a and returns the value that bit had beforehand.
 * The mask is built as an unsigned long so every bit of the word, including
 * the sign bit, can be addressed without overflowing a signed int shift.
 */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittestandreset(long *a, long b) {
  const unsigned long __bit = 1UL << b;
  unsigned char x = (unsigned char)((*a >> b) & 1);
  *a = (long)((unsigned long)*a & ~__bit);
  return x;
}
/*
 * Sets bit number b of *a and returns the value that bit had beforehand.
 * The mask is built as an unsigned long so every bit of the word, including
 * the sign bit, can be addressed without overflowing a signed int shift.
 */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_bittestandset(long *a, long b) {
  const unsigned long __bit = 1UL << b;
  unsigned char x = (unsigned char)((*a >> b) & 1);
  *a = (long)((unsigned long)*a | __bit);
  return x;
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000546#if defined(__i386__) || defined(__x86_64__)
/*
 * Atomically sets bit number __BitPos of *__BitBase with sequentially
 * consistent ordering and returns the value that bit had beforehand.
 * The mask is built as an unsigned long so any bit of the word can be
 * addressed without overflowing a signed int shift.
 */
static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
_interlockedbittestandset(long volatile *__BitBase, long __BitPos) {
  const long __Mask = (long)(1UL << __BitPos);
  long __OldVal = __atomic_fetch_or(__BitBase, __Mask, __ATOMIC_SEQ_CST);
  return (__OldVal >> __BitPos) & 1;
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000552#endif
Warren Hunt3f987942013-09-30 21:08:05 +0000553#ifdef __x86_64__
Warren Huntd6ffae92013-09-27 23:57:26 +0000554static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
555_BitScanForward64(unsigned long *_Index, unsigned __int64 _Mask) {
556 if (!_Mask)
557 return 0;
558 *_Index = __builtin_ctzll(_Mask);
559 return 1;
560}
561static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
562_BitScanReverse64(unsigned long *_Index, unsigned __int64 _Mask) {
563 if (!_Mask)
564 return 0;
565 *_Index = 63 - __builtin_clzll(_Mask);
566 return 1;
567}
Warren Huntd6ffae92013-09-27 23:57:26 +0000568static __inline__
569unsigned __int64 __attribute__((__always_inline__, __nodebug__))
570 __popcnt64(unsigned __int64 value) {
571 return __builtin_popcountll(value);
572}
573static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
574_bittest64(__int64 const *a, __int64 b) {
575 return (*a >> b) & 1;
576}
577static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
578_bittestandcomplement64(__int64 *a, __int64 b) {
579 unsigned char x = (*a >> b) & 1;
580 *a = *a ^ (1ll << b);
581 return x;
582}
583static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
584_bittestandreset64(__int64 *a, __int64 b) {
585 unsigned char x = (*a >> b) & 1;
586 *a = *a & ~(1ll << b);
587 return x;
588}
589static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
590_bittestandset64(__int64 *a, __int64 b) {
591 unsigned char x = (*a >> b) & 1;
Warren Hunt2731e3e2013-10-01 17:12:40 +0000592 *a = *a | (1ll << b);
Warren Huntd6ffae92013-09-27 23:57:26 +0000593 return x;
594}
Hans Wennborga3169332014-03-13 17:05:09 +0000595static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
596_interlockedbittestandset64(__int64 volatile *__BitBase, __int64 __BitPos) {
597 unsigned char __Res;
598 __asm__ ("xor %0, %0\n"
599 "lock bts %2, %1\n"
600 "setc %0\n"
601 : "=r" (__Res), "+m"(*__BitBase)
602 : "Ir"(__BitPos));
603 return __Res;
604}
Warren Huntd6ffae92013-09-27 23:57:26 +0000605#endif
606/*----------------------------------------------------------------------------*\
607|* Interlocked Exchange Add
608\*----------------------------------------------------------------------------*/
/*
 * Atomically adds _Value to *_Addend and returns the value *_Addend held
 * before the addition. Sequentially consistent, so neither the compiler nor
 * the CPU may reorder surrounding memory accesses across it.
 */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeAdd8(char volatile *_Addend, char _Value) {
  return __atomic_fetch_add(_Addend, _Value, __ATOMIC_SEQ_CST);
}
/*
 * Atomically adds _Value to *_Addend and returns the value *_Addend held
 * before the addition. Sequentially consistent, so neither the compiler nor
 * the CPU may reorder surrounding memory accesses across it.
 */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeAdd16(short volatile *_Addend, short _Value) {
  return __atomic_fetch_add(_Addend, _Value, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000617#ifdef __x86_64__
Warren Huntd6ffae92013-09-27 23:57:26 +0000618static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
619_InterlockedExchangeAdd64(__int64 volatile *_Addend, __int64 _Value) {
620 return __atomic_add_fetch(_Addend, _Value, 0) - _Value;
621}
622#endif
623/*----------------------------------------------------------------------------*\
624|* Interlocked Exchange Sub
625\*----------------------------------------------------------------------------*/
/*
 * Atomically subtracts _Value from *_Subend and returns the value *_Subend
 * held before the subtraction. Sequentially consistent, so neither the
 * compiler nor the CPU may reorder surrounding memory accesses across it.
 */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeSub8(char volatile *_Subend, char _Value) {
  return __atomic_fetch_sub(_Subend, _Value, __ATOMIC_SEQ_CST);
}
/*
 * Atomically subtracts _Value from *_Subend and returns the value *_Subend
 * held before the subtraction. Sequentially consistent, so neither the
 * compiler nor the CPU may reorder surrounding memory accesses across it.
 */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeSub16(short volatile *_Subend, short _Value) {
  return __atomic_fetch_sub(_Subend, _Value, __ATOMIC_SEQ_CST);
}
/*
 * Atomically subtracts _Value from *_Subend and returns the value *_Subend
 * held before the subtraction. Sequentially consistent, so neither the
 * compiler nor the CPU may reorder surrounding memory accesses across it.
 */
static __inline__ long __attribute__((__always_inline__, __nodebug__))
_InterlockedExchangeSub(long volatile *_Subend, long _Value) {
  return __atomic_fetch_sub(_Subend, _Value, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000638#ifdef __x86_64__
Warren Huntd6ffae92013-09-27 23:57:26 +0000639static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
640_InterlockedExchangeSub64(__int64 volatile *_Subend, __int64 _Value) {
641 return __atomic_sub_fetch(_Subend, _Value, 0) + _Value;
642}
643#endif
644/*----------------------------------------------------------------------------*\
645|* Interlocked Increment
646\*----------------------------------------------------------------------------*/
/*
 * Atomically increments *_Value by one and returns the incremented value.
 * Sequentially consistent, so neither the compiler nor the CPU may reorder
 * surrounding memory accesses across it.
 */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedIncrement16(short volatile *_Value) {
  return __atomic_add_fetch(_Value, 1, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000651#ifdef __x86_64__
Warren Huntd6ffae92013-09-27 23:57:26 +0000652static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
653_InterlockedIncrement64(__int64 volatile *_Value) {
654 return __atomic_add_fetch(_Value, 1, 0);
655}
656#endif
657/*----------------------------------------------------------------------------*\
658|* Interlocked Decrement
659\*----------------------------------------------------------------------------*/
/*
 * Atomically decrements *_Value by one and returns the decremented value.
 * Sequentially consistent, so neither the compiler nor the CPU may reorder
 * surrounding memory accesses across it.
 */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedDecrement16(short volatile *_Value) {
  return __atomic_sub_fetch(_Value, 1, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000664#ifdef __x86_64__
Warren Huntd6ffae92013-09-27 23:57:26 +0000665static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
666_InterlockedDecrement64(__int64 volatile *_Value) {
667 return __atomic_sub_fetch(_Value, 1, 0);
668}
669#endif
670/*----------------------------------------------------------------------------*\
671|* Interlocked And
672\*----------------------------------------------------------------------------*/
/*
 * Atomically replaces *_Value with (*_Value & _Mask) and returns the value
 * *_Value held BEFORE the operation, as the MSVC intrinsic does.
 * Sequentially consistent ordering.
 */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedAnd8(char volatile *_Value, char _Mask) {
  return __atomic_fetch_and(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/*
 * Atomically replaces *_Value with (*_Value & _Mask) and returns the value
 * *_Value held BEFORE the operation, as the MSVC intrinsic does.
 * Sequentially consistent ordering.
 */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedAnd16(short volatile *_Value, short _Mask) {
  return __atomic_fetch_and(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/*
 * Atomically replaces *_Value with (*_Value & _Mask) and returns the value
 * *_Value held BEFORE the operation, as the MSVC intrinsic does.
 * Sequentially consistent ordering.
 */
static __inline__ long __attribute__((__always_inline__, __nodebug__))
_InterlockedAnd(long volatile *_Value, long _Mask) {
  return __atomic_fetch_and(_Value, _Mask, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000685#ifdef __x86_64__
Warren Huntd6ffae92013-09-27 23:57:26 +0000686static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
687_InterlockedAnd64(__int64 volatile *_Value, __int64 _Mask) {
688 return __atomic_and_fetch(_Value, _Mask, 0);
689}
690#endif
691/*----------------------------------------------------------------------------*\
692|* Interlocked Or
693\*----------------------------------------------------------------------------*/
/*
 * Atomically replaces *_Value with (*_Value | _Mask) and returns the value
 * *_Value held BEFORE the operation, as the MSVC intrinsic does.
 * Sequentially consistent ordering.
 */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedOr8(char volatile *_Value, char _Mask) {
  return __atomic_fetch_or(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/*
 * Atomically replaces *_Value with (*_Value | _Mask) and returns the value
 * *_Value held BEFORE the operation, as the MSVC intrinsic does.
 * Sequentially consistent ordering.
 */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedOr16(short volatile *_Value, short _Mask) {
  return __atomic_fetch_or(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/*
 * Atomically replaces *_Value with (*_Value | _Mask) and returns the value
 * *_Value held BEFORE the operation, as the MSVC intrinsic does.
 * Sequentially consistent ordering.
 */
static __inline__ long __attribute__((__always_inline__, __nodebug__))
_InterlockedOr(long volatile *_Value, long _Mask) {
  return __atomic_fetch_or(_Value, _Mask, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000706#ifdef __x86_64__
Warren Huntd6ffae92013-09-27 23:57:26 +0000707static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
708_InterlockedOr64(__int64 volatile *_Value, __int64 _Mask) {
709 return __atomic_or_fetch(_Value, _Mask, 0);
710}
711#endif
712/*----------------------------------------------------------------------------*\
713|* Interlocked Xor
714\*----------------------------------------------------------------------------*/
/*
 * Atomically replaces *_Value with (*_Value ^ _Mask) and returns the value
 * *_Value held BEFORE the operation, as the MSVC intrinsic does.
 * Sequentially consistent ordering.
 */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedXor8(char volatile *_Value, char _Mask) {
  return __atomic_fetch_xor(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/*
 * Atomically replaces *_Value with (*_Value ^ _Mask) and returns the value
 * *_Value held BEFORE the operation, as the MSVC intrinsic does.
 * Sequentially consistent ordering.
 */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedXor16(short volatile *_Value, short _Mask) {
  return __atomic_fetch_xor(_Value, _Mask, __ATOMIC_SEQ_CST);
}
/*
 * Atomically replaces *_Value with (*_Value ^ _Mask) and returns the value
 * *_Value held BEFORE the operation, as the MSVC intrinsic does.
 * Sequentially consistent ordering.
 */
static __inline__ long __attribute__((__always_inline__, __nodebug__))
_InterlockedXor(long volatile *_Value, long _Mask) {
  return __atomic_fetch_xor(_Value, _Mask, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000727#ifdef __x86_64__
Warren Huntd6ffae92013-09-27 23:57:26 +0000728static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
729_InterlockedXor64(__int64 volatile *_Value, __int64 _Mask) {
730 return __atomic_xor_fetch(_Value, _Mask, 0);
731}
732#endif
733/*----------------------------------------------------------------------------*\
734|* Interlocked Exchange
735\*----------------------------------------------------------------------------*/
/*
 * Atomically stores _Value into *_Target and returns the value *_Target held
 * beforehand. Sequentially consistent, so neither the compiler nor the CPU
 * may reorder surrounding memory accesses across it.
 */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedExchange8(char volatile *_Target, char _Value) {
  return __atomic_exchange_n(_Target, _Value, __ATOMIC_SEQ_CST);
}
/*
 * Atomically stores _Value into *_Target and returns the value *_Target held
 * beforehand. Sequentially consistent, so neither the compiler nor the CPU
 * may reorder surrounding memory accesses across it.
 */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedExchange16(short volatile *_Target, short _Value) {
  return __atomic_exchange_n(_Target, _Value, __ATOMIC_SEQ_CST);
}
Warren Hunt3f987942013-09-30 21:08:05 +0000746#ifdef __x86_64__
Warren Huntd6ffae92013-09-27 23:57:26 +0000747static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
748_InterlockedExchange64(__int64 volatile *_Target, __int64 _Value) {
749 __atomic_exchange(_Target, &_Value, &_Value, 0);
750 return _Value;
751}
752#endif
753/*----------------------------------------------------------------------------*\
754|* Interlocked Compare Exchange
755\*----------------------------------------------------------------------------*/
/*
 * Atomically compares *_Destination with _Comparand and, if they are equal,
 * stores _Exchange into *_Destination. Returns the value *_Destination held
 * before the operation in either case. Sequentially consistent ordering on
 * both the success and the failure path.
 */
static __inline__ char __attribute__((__always_inline__, __nodebug__))
_InterlockedCompareExchange8(char volatile *_Destination,
                             char _Exchange, char _Comparand) {
  /* On failure the builtin writes the observed value into _Comparand; on
     success _Comparand already equals the previous value. */
  __atomic_compare_exchange_n(_Destination, &_Comparand, _Exchange, 0,
                              __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST);
  return _Comparand;
}
/*
 * Atomically compares *_Destination with _Comparand and, if they are equal,
 * stores _Exchange into *_Destination. Returns the value *_Destination held
 * before the operation in either case. Sequentially consistent ordering on
 * both the success and the failure path.
 */
static __inline__ short __attribute__((__always_inline__, __nodebug__))
_InterlockedCompareExchange16(short volatile *_Destination,
                              short _Exchange, short _Comparand) {
  /* On failure the builtin writes the observed value into _Comparand; on
     success _Comparand already equals the previous value. */
  __atomic_compare_exchange_n(_Destination, &_Comparand, _Exchange, 0,
                              __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST);
  return _Comparand;
}
Warren Huntd6ffae92013-09-27 23:57:26 +0000768static __inline__ __int64 __attribute__((__always_inline__, __nodebug__))
769_InterlockedCompareExchange64(__int64 volatile *_Destination,
770 __int64 _Exchange, __int64 _Comparand) {
771 __atomic_compare_exchange(_Destination, &_Comparand, &_Exchange, 0, 0, 0);
772 return _Comparand;
773}
Warren Huntd6ffae92013-09-27 23:57:26 +0000774/*----------------------------------------------------------------------------*\
Reid Kleckner00d33a52013-10-17 01:29:48 +0000775|* Barriers
776\*----------------------------------------------------------------------------*/
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000777#if defined(__i386__) || defined(__x86_64__)
/*
 * Compiler-level barrier: an empty asm statement with a "memory" clobber.
 * It emits no instruction; it only stops the compiler from moving memory
 * accesses across this point. Marked deprecated.
 */
static __inline__ void
__attribute__((__always_inline__, __nodebug__,
               __deprecated__("use other intrinsics or C++11 atomics instead")))
_ReadWriteBarrier(void) {
  __asm__ __volatile__("" : : : "memory");
}
/*
 * Compiler-level barrier: an empty asm statement with a "memory" clobber.
 * It emits no instruction; it only stops the compiler from moving memory
 * accesses across this point. Marked deprecated.
 */
static __inline__ void
__attribute__((__always_inline__, __nodebug__,
               __deprecated__("use other intrinsics or C++11 atomics instead")))
_ReadBarrier(void) {
  __asm__ __volatile__("" : : : "memory");
}
/*
 * Compiler-level barrier: an empty asm statement with a "memory" clobber.
 * It emits no instruction; it only stops the compiler from moving memory
 * accesses across this point. Marked deprecated.
 */
static __inline__ void
__attribute__((__always_inline__, __nodebug__,
               __deprecated__("use other intrinsics or C++11 atomics instead")))
_WriteBarrier(void) {
  __asm__ __volatile__("" : : : "memory");
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000793#endif
Reid Klecknerf08d6582014-01-27 19:16:35 +0000794#ifdef __x86_64__
/*
 * Issues a locked OR of zero into the quadword at the top of the stack.
 * The stored value is unchanged; the locked read-modify-write is what
 * provides the fence, and the "memory" clobber keeps the compiler from
 * reordering memory accesses around it.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__faststorefence(void) {
  __asm__ __volatile__("lock orq $0, (%%rsp)" : : : "memory");
}
799#endif
Reid Kleckner00d33a52013-10-17 01:29:48 +0000800/*----------------------------------------------------------------------------*\
Hans Wennborga4421e02014-03-12 21:09:05 +0000801|* readfs, readgs
802|* (Pointers in address space #256 and #257 are relative to the GS and FS
803|* segment registers, respectively.)
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000804\*----------------------------------------------------------------------------*/
/*
 * Converts the integer __offset into a pointer to volatile __type that lives
 * in address space number __addr_space_nbr.
 */
#define __ptr_to_addr_space(__addr_space_nbr, __type, __offset)               \
  ((volatile __type __attribute__((__address_space__(__addr_space_nbr))) *)   \
       (__offset))
808
Hans Wennborga4421e02014-03-12 21:09:05 +0000809#ifdef __i386__
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000810static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
811__readfsbyte(unsigned long __offset) {
812 return *__ptr_to_addr_space(257, unsigned char, __offset);
813}
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000814static __inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
815__readfsqword(unsigned long __offset) {
816 return *__ptr_to_addr_space(257, unsigned __int64, __offset);
817}
818static __inline__ unsigned short __attribute__((__always_inline__, __nodebug__))
819__readfsword(unsigned long __offset) {
820 return *__ptr_to_addr_space(257, unsigned short, __offset);
821}
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000822#endif
Hans Wennborga4421e02014-03-12 21:09:05 +0000823#ifdef __x86_64__
824static __inline__ unsigned char __attribute__((__always_inline__, __nodebug__))
825__readgsbyte(unsigned long __offset) {
826 return *__ptr_to_addr_space(256, unsigned char, __offset);
827}
828static __inline__ unsigned long __attribute__((__always_inline__, __nodebug__))
829__readgsdword(unsigned long __offset) {
830 return *__ptr_to_addr_space(256, unsigned long, __offset);
831}
832static __inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
833__readgsqword(unsigned long __offset) {
834 return *__ptr_to_addr_space(256, unsigned __int64, __offset);
835}
836static __inline__ unsigned short __attribute__((__always_inline__, __nodebug__))
837__readgsword(unsigned long __offset) {
838 return *__ptr_to_addr_space(256, unsigned short, __offset);
839}
840#endif
841#undef __ptr_to_addr_space
Hans Wennborg74ca0c42014-01-24 00:52:39 +0000842/*----------------------------------------------------------------------------*\
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000843|* movs, stos
844\*----------------------------------------------------------------------------*/
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000845#if defined(__i386__) || defined(__x86_64__)
/*
 * Copies __n bytes from __src to __dst with "rep movsb".
 *
 * The instruction advances the destination/source pointers and counts the
 * count register down to zero, so all three are read-write operands rather
 * than clobbers. The "memory" clobber tells the compiler that memory is read
 * and written behind its back.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__movsb(unsigned char *__dst, unsigned char const *__src, size_t __n) {
  __asm__ __volatile__("rep movsb"
                       : "+D"(__dst), "+S"(__src), "+c"(__n)
                       :
                       : "memory");
}
/*
 * Copies __n 32-bit units from __src to __dst with "rep movsl".
 *
 * The instruction advances the destination/source pointers and counts the
 * count register down to zero, so all three are read-write operands rather
 * than clobbers. The "memory" clobber tells the compiler that memory is read
 * and written behind its back.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__movsd(unsigned long *__dst, unsigned long const *__src, size_t __n) {
  __asm__ __volatile__("rep movsl"
                       : "+D"(__dst), "+S"(__src), "+c"(__n)
                       :
                       : "memory");
}
/*
 * Copies __n 16-bit units from __src to __dst with "rep movsw".
 *
 * The instruction advances the destination/source pointers and counts the
 * count register down to zero, so all three are read-write operands rather
 * than clobbers. The "memory" clobber tells the compiler that memory is read
 * and written behind its back.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__movsw(unsigned short *__dst, unsigned short const *__src, size_t __n) {
  __asm__ __volatile__("rep movsw"
                       : "+D"(__dst), "+S"(__src), "+c"(__n)
                       :
                       : "memory");
}
/*
 * Stores the byte __x into __n consecutive bytes starting at __dst with
 * "rep stosb".
 *
 * The instruction advances the destination pointer and counts the count
 * register down to zero, so both are read-write operands rather than
 * clobbers. The "memory" clobber tells the compiler that memory is written
 * behind its back.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__stosb(unsigned char *__dst, unsigned char __x, size_t __n) {
  __asm__ __volatile__("rep stosb"
                       : "+D"(__dst), "+c"(__n)
                       : "a"(__x)
                       : "memory");
}
/*
 * Stores the low 32 bits of __x into __n consecutive 32-bit units starting
 * at __dst with "rep stosl".
 *
 * The instruction advances the destination pointer and counts the count
 * register down to zero, so both are read-write operands rather than
 * clobbers. The "memory" clobber tells the compiler that memory is written
 * behind its back.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__stosd(unsigned long *__dst, unsigned long __x, size_t __n) {
  __asm__ __volatile__("rep stosl"
                       : "+D"(__dst), "+c"(__n)
                       : "a"(__x)
                       : "memory");
}
/*
 * Stores the 16-bit __x into __n consecutive 16-bit units starting at __dst
 * with "rep stosw".
 *
 * The instruction advances the destination pointer and counts the count
 * register down to zero, so both are read-write operands rather than
 * clobbers. The "memory" clobber tells the compiler that memory is written
 * behind its back.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__stosw(unsigned short *__dst, unsigned short __x, size_t __n) {
  __asm__ __volatile__("rep stosw"
                       : "+D"(__dst), "+c"(__n)
                       : "a"(__x)
                       : "memory");
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000876#endif
Hans Wennborgd9be72e2014-03-12 22:00:32 +0000877#ifdef __x86_64__
/*
 * Copies __n 64-bit units from __src to __dst with "rep movsq".
 *
 * The instruction advances the destination/source pointers and counts the
 * count register down to zero, so all three are read-write operands rather
 * than clobbers. The "memory" clobber tells the compiler that memory is read
 * and written behind its back.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__movsq(unsigned long long *__dst, unsigned long long const *__src, size_t __n) {
  __asm__ __volatile__("rep movsq"
                       : "+D"(__dst), "+S"(__src), "+c"(__n)
                       :
                       : "memory");
}
883static __inline__ void __attribute__((__always_inline__, __nodebug__))
884__stosq(unsigned __int64 *__dst, unsigned __int64 __x, size_t __n) {
885 __asm__("rep stosq" : : "D"(__dst), "a"(__x), "c"(__n)
886 : "%edi", "%ecx");
887}
888#endif
889
890/*----------------------------------------------------------------------------*\
Warren Huntd6ffae92013-09-27 23:57:26 +0000891|* Misc
892\*----------------------------------------------------------------------------*/
/*
 * Returns the address one pointer-size above the current frame address, i.e.
 * the slot where the return address is expected to be stored.
 */
static __inline__ void * __attribute__((__always_inline__, __nodebug__))
_AddressOfReturnAddress(void) {
  char *__frame = (char *)__builtin_frame_address(0);
  return (void *)(__frame + sizeof(void *));
}
/* Returns the return address of the current (innermost) function frame. */
static __inline__ void * __attribute__((__always_inline__, __nodebug__))
_ReturnAddress(void) {
  void *__ret_addr = __builtin_return_address(0);
  return __ret_addr;
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000901#if defined(__i386__) || defined(__x86_64__)
/*
 * Executes CPUID for leaf __level and stores EAX, EBX, ECX and EDX in
 * __info[0], __info[1], __info[2] and __info[3] respectively.
 *
 * ECX is zeroed before the instruction so that leaves which take a sub-leaf
 * index in ECX return deterministic data instead of depending on whatever
 * the register happened to hold.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__cpuid(int __info[4], int __level) {
  __asm__ ("cpuid" : "=a"(__info[0]), "=b" (__info[1]), "=c"(__info[2]), "=d"(__info[3])
                   : "a"(__level), "c"(0));
}
/*
 * Executes CPUID for leaf __level with sub-leaf __ecx and stores EAX, EBX,
 * ECX and EDX in __info[0], __info[1], __info[2] and __info[3] respectively.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__cpuidex(int __info[4], int __level, int __ecx) {
  int __a, __b, __c, __d;
  __asm__ ("cpuid"
           : "=a"(__a), "=b"(__b), "=c"(__c), "=d"(__d)
           : "a"(__level), "c"(__ecx));
  __info[0] = __a;
  __info[1] = __b;
  __info[2] = __c;
  __info[3] = __d;
}
912static __inline__ unsigned __int64 __cdecl __attribute__((__always_inline__, __nodebug__))
913_xgetbv(unsigned int __xcr_no) {
914 unsigned int __eax, __edx;
915 __asm__ ("xgetbv" : "=a" (__eax), "=d" (__edx) : "c" (__xcr_no));
916 return ((unsigned __int64)__edx << 32) | __eax;
917}
/* Executes the HLT instruction. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__halt(void) {
  __asm__ __volatile__("hlt");
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000922#endif
Warren Huntd6ffae92013-09-27 23:57:26 +0000923
Reid Kleckner592dc612014-04-08 00:28:22 +0000924/*----------------------------------------------------------------------------*\
925|* Privileged intrinsics
926\*----------------------------------------------------------------------------*/
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000927#if defined(__i386__) || defined(__x86_64__)
Reid Kleckner592dc612014-04-08 00:28:22 +0000928static __inline__ unsigned __int64 __attribute__((__always_inline__, __nodebug__))
929__readmsr(unsigned long __register) {
930 // Loads the contents of a 64-bit model specific register (MSR) specified in
931 // the ECX register into registers EDX:EAX. The EDX register is loaded with
932 // the high-order 32 bits of the MSR and the EAX register is loaded with the
933 // low-order 32 bits. If less than 64 bits are implemented in the MSR being
934 // read, the values returned to EDX:EAX in unimplemented bit locations are
935 // undefined.
936 unsigned long __edx;
937 unsigned long __eax;
Reid Kleckner6df52542014-04-08 17:49:16 +0000938 __asm__ ("rdmsr" : "=d"(__edx), "=a"(__eax) : "c"(__register));
Reid Kleckner592dc612014-04-08 00:28:22 +0000939 return (((unsigned __int64)__edx) << 32) | (unsigned __int64)__eax;
940}
941
/* Reads control register CR3 and returns its value. */
static __inline__ unsigned long __attribute__((__always_inline__, __nodebug__))
__readcr3(void) {
  unsigned long __value;
  __asm__ __volatile__ ("mov %%cr3, %[val]" : [val] "=q"(__value) : : "memory");
  return __value;
}
948
/* Writes __cr3_val into control register CR3. */
static __inline__ void __attribute__((__always_inline__, __nodebug__))
__writecr3(unsigned int __cr3_val) {
  __asm__ ("mov %[val], %%cr3" : : [val] "q"(__cr3_val) : "memory");
}
Saleem Abdulrasool702eefe2014-06-25 16:48:40 +0000953#endif
Reid Kleckner592dc612014-04-08 00:28:22 +0000954
Eric Christophercc872532013-09-18 22:40:18 +0000955#ifdef __cplusplus
Eric Christopher0db88a72013-09-18 22:24:01 +0000956}
Eric Christopherd1428bf2013-08-31 00:22:48 +0000957#endif
Reid Klecknerf0e23222013-09-19 00:19:53 +0000958
959#endif /* __INTRIN_H */
960#endif /* _MSC_VER */