Blame - darwin-x86/lib64/clang/12.0.1/include/__clang_hip_math.h - platform/prebuilts/clang-tools

blob: f2365e8844fed3091e0d9e1dc34eb01808cb7ed9 [file] [log] [blame]

Sasha Smundak	4b1f33a	2021-01-11 15:05:07 -0800	[diff] [blame^]	1	/*===---- __clang_hip_math.h - Device-side HIP math support ----------------===
				2	*
				3	* Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
				4	* See https://llvm.org/LICENSE.txt for license information.
				5	* SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
				6	*
				7	*===-----------------------------------------------------------------------===
				8	*/
				9	#ifndef __CLANG_HIP_MATH_H__
				10	#define __CLANG_HIP_MATH_H__
				11
				12	#if !defined(__HIP__)
				13	#error "This file is for HIP and OpenMP AMDGCN device compilation only."
				14	#endif
				15
				16	#if defined(__cplusplus)
				17	#include <algorithm>
				18	#endif
				19	#include <limits.h>
				20	#include <stdint.h>
				21
				22	#pragma push_macro("__DEVICE__")
				23	#define __DEVICE__ static __device__ inline __attribute__((always_inline))
				24
				25	// A few functions return bool type starting only in C++11.
				26	#pragma push_macro("__RETURN_TYPE")
				27	#if defined(__cplusplus)
				28	#define __RETURN_TYPE bool
				29	#else
				30	#define __RETURN_TYPE int
				31	#endif
				32
				33	#if defined (__cplusplus) && __cplusplus < 201103L
				34	// emulate static_assert on type sizes
				35	template<bool>
				36	struct __compare_result{};
				37	template<>
				38	struct __compare_result<true> {
				39	static const bool valid;
				40	};
				41
				42	__DEVICE__
				43	void __suppress_unused_warning(bool b){};
				44	template <unsigned int S, unsigned int T>
				45	__DEVICE__ void __static_assert_equal_size() {
				46	__suppress_unused_warning(__compare_result<S == T>::valid);
				47	}
				48
				49	#define __static_assert_type_size_equal(A, B) \
				50	__static_assert_equal_size<A,B>()
				51
				52	#else
				53	#define __static_assert_type_size_equal(A,B) \
				54	static_assert((A) == (B), "")
				55
				56	#endif
				57
				58	__DEVICE__
				59	uint64_t __make_mantissa_base8(const char *__tagp) {
				60	uint64_t __r = 0;
				61	while (__tagp) {
				62	char __tmp = *__tagp;
				63
				64	if (__tmp >= '0' && __tmp <= '7')
				65	__r = (__r * 8u) + __tmp - '0';
				66	else
				67	return 0;
				68
				69	++__tagp;
				70	}
				71
				72	return __r;
				73	}
				74
				75	__DEVICE__
				76	uint64_t __make_mantissa_base10(const char *__tagp) {
				77	uint64_t __r = 0;
				78	while (__tagp) {
				79	char __tmp = *__tagp;
				80
				81	if (__tmp >= '0' && __tmp <= '9')
				82	__r = (__r * 10u) + __tmp - '0';
				83	else
				84	return 0;
				85
				86	++__tagp;
				87	}
				88
				89	return __r;
				90	}
				91
				92	__DEVICE__
				93	uint64_t __make_mantissa_base16(const char *__tagp) {
				94	uint64_t __r = 0;
				95	while (__tagp) {
				96	char __tmp = *__tagp;
				97
				98	if (__tmp >= '0' && __tmp <= '9')
				99	__r = (__r * 16u) + __tmp - '0';
				100	else if (__tmp >= 'a' && __tmp <= 'f')
				101	__r = (__r * 16u) + __tmp - 'a' + 10;
				102	else if (__tmp >= 'A' && __tmp <= 'F')
				103	__r = (__r * 16u) + __tmp - 'A' + 10;
				104	else
				105	return 0;
				106
				107	++__tagp;
				108	}
				109
				110	return __r;
				111	}
				112
				113	__DEVICE__
				114	uint64_t __make_mantissa(const char *__tagp) {
				115	if (!__tagp)
				116	return 0u;
				117
				118	if (*__tagp == '0') {
				119	++__tagp;
				120
				121	if (__tagp == 'x' \|\| __tagp == 'X')
				122	return __make_mantissa_base16(__tagp);
				123	else
				124	return __make_mantissa_base8(__tagp);
				125	}
				126
				127	return __make_mantissa_base10(__tagp);
				128	}
				129
				130	// BEGIN FLOAT
				131	#if defined(__cplusplus)
				132	__DEVICE__
				133	int abs(int __x) {
				134	int __sgn = __x >> (sizeof(int) * CHAR_BIT - 1);
				135	return (__x ^ __sgn) - __sgn;
				136	}
				137	__DEVICE__
				138	long labs(long __x) {
				139	long __sgn = __x >> (sizeof(long) * CHAR_BIT - 1);
				140	return (__x ^ __sgn) - __sgn;
				141	}
				142	__DEVICE__
				143	long long llabs(long long __x) {
				144	long long __sgn = __x >> (sizeof(long long) * CHAR_BIT - 1);
				145	return (__x ^ __sgn) - __sgn;
				146	}
				147	#endif
				148
				149	__DEVICE__
				150	float acosf(float __x) { return __ocml_acos_f32(__x); }
				151
				152	__DEVICE__
				153	float acoshf(float __x) { return __ocml_acosh_f32(__x); }
				154
				155	__DEVICE__
				156	float asinf(float __x) { return __ocml_asin_f32(__x); }
				157
				158	__DEVICE__
				159	float asinhf(float __x) { return __ocml_asinh_f32(__x); }
				160
				161	__DEVICE__
				162	float atan2f(float __x, float __y) { return __ocml_atan2_f32(__x, __y); }
				163
				164	__DEVICE__
				165	float atanf(float __x) { return __ocml_atan_f32(__x); }
				166
				167	__DEVICE__
				168	float atanhf(float __x) { return __ocml_atanh_f32(__x); }
				169
				170	__DEVICE__
				171	float cbrtf(float __x) { return __ocml_cbrt_f32(__x); }
				172
				173	__DEVICE__
				174	float ceilf(float __x) { return __ocml_ceil_f32(__x); }
				175
				176	__DEVICE__
				177	float copysignf(float __x, float __y) { return __ocml_copysign_f32(__x, __y); }
				178
				179	__DEVICE__
				180	float cosf(float __x) { return __ocml_cos_f32(__x); }
				181
				182	__DEVICE__
				183	float coshf(float __x) { return __ocml_cosh_f32(__x); }
				184
				185	__DEVICE__
				186	float cospif(float __x) { return __ocml_cospi_f32(__x); }
				187
				188	__DEVICE__
				189	float cyl_bessel_i0f(float __x) { return __ocml_i0_f32(__x); }
				190
				191	__DEVICE__
				192	float cyl_bessel_i1f(float __x) { return __ocml_i1_f32(__x); }
				193
				194	__DEVICE__
				195	float erfcf(float __x) { return __ocml_erfc_f32(__x); }
				196
				197	__DEVICE__
				198	float erfcinvf(float __x) { return __ocml_erfcinv_f32(__x); }
				199
				200	__DEVICE__
				201	float erfcxf(float __x) { return __ocml_erfcx_f32(__x); }
				202
				203	__DEVICE__
				204	float erff(float __x) { return __ocml_erf_f32(__x); }
				205
				206	__DEVICE__
				207	float erfinvf(float __x) { return __ocml_erfinv_f32(__x); }
				208
				209	__DEVICE__
				210	float exp10f(float __x) { return __ocml_exp10_f32(__x); }
				211
				212	__DEVICE__
				213	float exp2f(float __x) { return __ocml_exp2_f32(__x); }
				214
				215	__DEVICE__
				216	float expf(float __x) { return __ocml_exp_f32(__x); }
				217
				218	__DEVICE__
				219	float expm1f(float __x) { return __ocml_expm1_f32(__x); }
				220
				221	__DEVICE__
				222	float fabsf(float __x) { return __ocml_fabs_f32(__x); }
				223
				224	__DEVICE__
				225	float fdimf(float __x, float __y) { return __ocml_fdim_f32(__x, __y); }
				226
				227	__DEVICE__
				228	float fdividef(float __x, float __y) { return __x / __y; }
				229
				230	__DEVICE__
				231	float floorf(float __x) { return __ocml_floor_f32(__x); }
				232
				233	__DEVICE__
				234	float fmaf(float __x, float __y, float __z) {
				235	return __ocml_fma_f32(__x, __y, __z);
				236	}
				237
				238	__DEVICE__
				239	float fmaxf(float __x, float __y) { return __ocml_fmax_f32(__x, __y); }
				240
				241	__DEVICE__
				242	float fminf(float __x, float __y) { return __ocml_fmin_f32(__x, __y); }
				243
				244	__DEVICE__
				245	float fmodf(float __x, float __y) { return __ocml_fmod_f32(__x, __y); }
				246
				247	__DEVICE__
				248	float frexpf(float __x, int *__nptr) {
				249	int __tmp;
				250	float __r =
				251	__ocml_frexp_f32(__x, (__attribute__((address_space(5))) int *)&__tmp);
				252	*__nptr = __tmp;
				253
				254	return __r;
				255	}
				256
				257	__DEVICE__
				258	float hypotf(float __x, float __y) { return __ocml_hypot_f32(__x, __y); }
				259
				260	__DEVICE__
				261	int ilogbf(float __x) { return __ocml_ilogb_f32(__x); }
				262
				263	__DEVICE__
				264	__RETURN_TYPE __finitef(float __x) { return __ocml_isfinite_f32(__x); }
				265
				266	__DEVICE__
				267	__RETURN_TYPE __isinff(float __x) { return __ocml_isinf_f32(__x); }
				268
				269	__DEVICE__
				270	__RETURN_TYPE __isnanf(float __x) { return __ocml_isnan_f32(__x); }
				271
				272	__DEVICE__
				273	float j0f(float __x) { return __ocml_j0_f32(__x); }
				274
				275	__DEVICE__
				276	float j1f(float __x) { return __ocml_j1_f32(__x); }
				277
				278	__DEVICE__
				279	float jnf(int __n, float __x) { // TODO: we could use Ahmes multiplication
				280	// and the Miller & Brown algorithm
				281	// for linear recurrences to get O(log n) steps, but it's unclear if
				282	// it'd be beneficial in this case.
				283	if (__n == 0)
				284	return j0f(__x);
				285	if (__n == 1)
				286	return j1f(__x);
				287
				288	float __x0 = j0f(__x);
				289	float __x1 = j1f(__x);
				290	for (int __i = 1; __i < __n; ++__i) {
				291	float __x2 = (2 * __i) / __x * __x1 - __x0;
				292	__x0 = __x1;
				293	__x1 = __x2;
				294	}
				295
				296	return __x1;
				297	}
				298
				299	__DEVICE__
				300	float ldexpf(float __x, int __e) { return __ocml_ldexp_f32(__x, __e); }
				301
				302	__DEVICE__
				303	float lgammaf(float __x) { return __ocml_lgamma_f32(__x); }
				304
				305	__DEVICE__
				306	long long int llrintf(float __x) { return __ocml_rint_f32(__x); }
				307
				308	__DEVICE__
				309	long long int llroundf(float __x) { return __ocml_round_f32(__x); }
				310
				311	__DEVICE__
				312	float log10f(float __x) { return __ocml_log10_f32(__x); }
				313
				314	__DEVICE__
				315	float log1pf(float __x) { return __ocml_log1p_f32(__x); }
				316
				317	__DEVICE__
				318	float log2f(float __x) { return __ocml_log2_f32(__x); }
				319
				320	__DEVICE__
				321	float logbf(float __x) { return __ocml_logb_f32(__x); }
				322
				323	__DEVICE__
				324	float logf(float __x) { return __ocml_log_f32(__x); }
				325
				326	__DEVICE__
				327	long int lrintf(float __x) { return __ocml_rint_f32(__x); }
				328
				329	__DEVICE__
				330	long int lroundf(float __x) { return __ocml_round_f32(__x); }
				331
				332	__DEVICE__
				333	float modff(float __x, float *__iptr) {
				334	float __tmp;
				335	float __r =
				336	__ocml_modf_f32(__x, (__attribute__((address_space(5))) float *)&__tmp);
				337	*__iptr = __tmp;
				338	return __r;
				339	}
				340
				341	__DEVICE__
				342	float nanf(const char *__tagp) {
				343	union {
				344	float val;
				345	struct ieee_float {
				346	unsigned int mantissa : 22;
				347	unsigned int quiet : 1;
				348	unsigned int exponent : 8;
				349	unsigned int sign : 1;
				350	} bits;
				351	} __tmp;
				352	__static_assert_type_size_equal(sizeof(__tmp.val), sizeof(__tmp.bits));
				353
				354	__tmp.bits.sign = 0u;
				355	__tmp.bits.exponent = ~0u;
				356	__tmp.bits.quiet = 1u;
				357	__tmp.bits.mantissa = __make_mantissa(__tagp);
				358
				359	return __tmp.val;
				360	}
				361
				362	__DEVICE__
				363	float nearbyintf(float __x) { return __ocml_nearbyint_f32(__x); }
				364
				365	__DEVICE__
				366	float nextafterf(float __x, float __y) {
				367	return __ocml_nextafter_f32(__x, __y);
				368	}
				369
				370	__DEVICE__
				371	float norm3df(float __x, float __y, float __z) {
				372	return __ocml_len3_f32(__x, __y, __z);
				373	}
				374
				375	__DEVICE__
				376	float norm4df(float __x, float __y, float __z, float __w) {
				377	return __ocml_len4_f32(__x, __y, __z, __w);
				378	}
				379
				380	__DEVICE__
				381	float normcdff(float __x) { return __ocml_ncdf_f32(__x); }
				382
				383	__DEVICE__
				384	float normcdfinvf(float __x) { return __ocml_ncdfinv_f32(__x); }
				385
				386	__DEVICE__
				387	float normf(int __dim,
				388	const float *__a) { // TODO: placeholder until OCML adds support.
				389	float __r = 0;
				390	while (__dim--) {
				391	__r += __a[0] * __a[0];
				392	++__a;
				393	}
				394
				395	return __ocml_sqrt_f32(__r);
				396	}
				397
				398	__DEVICE__
				399	float powf(float __x, float __y) { return __ocml_pow_f32(__x, __y); }
				400
				401	__DEVICE__
				402	float powif(float __x, int __y) { return __ocml_pown_f32(__x, __y); }
				403
				404	__DEVICE__
				405	float rcbrtf(float __x) { return __ocml_rcbrt_f32(__x); }
				406
				407	__DEVICE__
				408	float remainderf(float __x, float __y) {
				409	return __ocml_remainder_f32(__x, __y);
				410	}
				411
				412	__DEVICE__
				413	float remquof(float __x, float __y, int *__quo) {
				414	int __tmp;
				415	float __r = __ocml_remquo_f32(
				416	__x, __y, (__attribute__((address_space(5))) int *)&__tmp);
				417	*__quo = __tmp;
				418
				419	return __r;
				420	}
				421
				422	__DEVICE__
				423	float rhypotf(float __x, float __y) { return __ocml_rhypot_f32(__x, __y); }
				424
				425	__DEVICE__
				426	float rintf(float __x) { return __ocml_rint_f32(__x); }
				427
				428	__DEVICE__
				429	float rnorm3df(float __x, float __y, float __z) {
				430	return __ocml_rlen3_f32(__x, __y, __z);
				431	}
				432
				433	__DEVICE__
				434	float rnorm4df(float __x, float __y, float __z, float __w) {
				435	return __ocml_rlen4_f32(__x, __y, __z, __w);
				436	}
				437
				438	__DEVICE__
				439	float rnormf(int __dim,
				440	const float *__a) { // TODO: placeholder until OCML adds support.
				441	float __r = 0;
				442	while (__dim--) {
				443	__r += __a[0] * __a[0];
				444	++__a;
				445	}
				446
				447	return __ocml_rsqrt_f32(__r);
				448	}
				449
				450	__DEVICE__
				451	float roundf(float __x) { return __ocml_round_f32(__x); }
				452
				453	__DEVICE__
				454	float rsqrtf(float __x) { return __ocml_rsqrt_f32(__x); }
				455
				456	__DEVICE__
				457	float scalblnf(float __x, long int __n) {
				458	return (__n < INT_MAX) ? __ocml_scalbn_f32(__x, __n)
				459	: __ocml_scalb_f32(__x, __n);
				460	}
				461
				462	__DEVICE__
				463	float scalbnf(float __x, int __n) { return __ocml_scalbn_f32(__x, __n); }
				464
				465	__DEVICE__
				466	__RETURN_TYPE __signbitf(float __x) { return __ocml_signbit_f32(__x); }
				467
				468	__DEVICE__
				469	void sincosf(float __x, float __sinptr, float __cosptr) {
				470	float __tmp;
				471	*__sinptr =
				472	__ocml_sincos_f32(__x, (__attribute__((address_space(5))) float *)&__tmp);
				473	*__cosptr = __tmp;
				474	}
				475
				476	__DEVICE__
				477	void sincospif(float __x, float __sinptr, float __cosptr) {
				478	float __tmp;
				479	*__sinptr = __ocml_sincospi_f32(
				480	__x, (__attribute__((address_space(5))) float *)&__tmp);
				481	*__cosptr = __tmp;
				482	}
				483
				484	__DEVICE__
				485	float sinf(float __x) { return __ocml_sin_f32(__x); }
				486
				487	__DEVICE__
				488	float sinhf(float __x) { return __ocml_sinh_f32(__x); }
				489
				490	__DEVICE__
				491	float sinpif(float __x) { return __ocml_sinpi_f32(__x); }
				492
				493	__DEVICE__
				494	float sqrtf(float __x) { return __ocml_sqrt_f32(__x); }
				495
				496	__DEVICE__
				497	float tanf(float __x) { return __ocml_tan_f32(__x); }
				498
				499	__DEVICE__
				500	float tanhf(float __x) { return __ocml_tanh_f32(__x); }
				501
				502	__DEVICE__
				503	float tgammaf(float __x) { return __ocml_tgamma_f32(__x); }
				504
				505	__DEVICE__
				506	float truncf(float __x) { return __ocml_trunc_f32(__x); }
				507
				508	__DEVICE__
				509	float y0f(float __x) { return __ocml_y0_f32(__x); }
				510
				511	__DEVICE__
				512	float y1f(float __x) { return __ocml_y1_f32(__x); }
				513
				514	__DEVICE__
				515	float ynf(int __n, float __x) { // TODO: we could use Ahmes multiplication
				516	// and the Miller & Brown algorithm
				517	// for linear recurrences to get O(log n) steps, but it's unclear if
				518	// it'd be beneficial in this case. Placeholder until OCML adds
				519	// support.
				520	if (__n == 0)
				521	return y0f(__x);
				522	if (__n == 1)
				523	return y1f(__x);
				524
				525	float __x0 = y0f(__x);
				526	float __x1 = y1f(__x);
				527	for (int __i = 1; __i < __n; ++__i) {
				528	float __x2 = (2 * __i) / __x * __x1 - __x0;
				529	__x0 = __x1;
				530	__x1 = __x2;
				531	}
				532
				533	return __x1;
				534	}
				535
				536	// BEGIN INTRINSICS
				537
				538	__DEVICE__
				539	float __cosf(float __x) { return __ocml_native_cos_f32(__x); }
				540
				541	__DEVICE__
				542	float __exp10f(float __x) { return __ocml_native_exp10_f32(__x); }
				543
				544	__DEVICE__
				545	float __expf(float __x) { return __ocml_native_exp_f32(__x); }
				546
				547	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				548	__DEVICE__
				549	float __fadd_rd(float __x, float __y) { return __ocml_add_rtn_f32(__x, __y); }
				550	#endif
				551	__DEVICE__
				552	float __fadd_rn(float __x, float __y) { return __ocml_add_rte_f32(__x, __y); }
				553	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				554	__DEVICE__
				555	float __fadd_ru(float __x, float __y) { return __ocml_add_rtp_f32(__x, __y); }
				556
				557	__DEVICE__
				558	float __fadd_rz(float __x, float __y) { return __ocml_add_rtz_f32(__x, __y); }
				559
				560	__DEVICE__
				561	float __fdiv_rd(float __x, float __y) { return __ocml_div_rtn_f32(__x, __y); }
				562	#endif
				563	__DEVICE__
				564	float __fdiv_rn(float __x, float __y) { return __ocml_div_rte_f32(__x, __y); }
				565	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				566	__DEVICE__
				567	float __fdiv_ru(float __x, float __y) { return __ocml_div_rtp_f32(__x, __y); }
				568
				569	__DEVICE__
				570	float __fdiv_rz(float __x, float __y) { return __ocml_div_rtz_f32(__x, __y); }
				571	#endif
				572	__DEVICE__
				573	float __fdividef(float __x, float __y) { return __x / __y; }
				574	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				575	__DEVICE__
				576	float __fmaf_rd(float __x, float __y, float __z) {
				577	return __ocml_fma_rtn_f32(__x, __y, __z);
				578	}
				579	#endif
				580	__DEVICE__
				581	float __fmaf_rn(float __x, float __y, float __z) {
				582	return __ocml_fma_rte_f32(__x, __y, __z);
				583	}
				584	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				585	__DEVICE__
				586	float __fmaf_ru(float __x, float __y, float __z) {
				587	return __ocml_fma_rtp_f32(__x, __y, __z);
				588	}
				589
				590	__DEVICE__
				591	float __fmaf_rz(float __x, float __y, float __z) {
				592	return __ocml_fma_rtz_f32(__x, __y, __z);
				593	}
				594
				595	__DEVICE__
				596	float __fmul_rd(float __x, float __y) { return __ocml_mul_rtn_f32(__x, __y); }
				597	#endif
				598	__DEVICE__
				599	float __fmul_rn(float __x, float __y) { return __ocml_mul_rte_f32(__x, __y); }
				600	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				601	__DEVICE__
				602	float __fmul_ru(float __x, float __y) { return __ocml_mul_rtp_f32(__x, __y); }
				603
				604	__DEVICE__
				605	float __fmul_rz(float __x, float __y) { return __ocml_mul_rtz_f32(__x, __y); }
				606
				607	__DEVICE__
				608	float __frcp_rd(float __x) { return __llvm_amdgcn_rcp_f32(__x); }
				609	#endif
				610	__DEVICE__
				611	float __frcp_rn(float __x) { return __llvm_amdgcn_rcp_f32(__x); }
				612	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				613	__DEVICE__
				614	float __frcp_ru(float __x) { return __llvm_amdgcn_rcp_f32(__x); }
				615
				616	__DEVICE__
				617	float __frcp_rz(float __x) { return __llvm_amdgcn_rcp_f32(__x); }
				618	#endif
				619	__DEVICE__
				620	float __frsqrt_rn(float __x) { return __llvm_amdgcn_rsq_f32(__x); }
				621	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				622	__DEVICE__
				623	float __fsqrt_rd(float __x) { return __ocml_sqrt_rtn_f32(__x); }
				624	#endif
				625	__DEVICE__
				626	float __fsqrt_rn(float __x) { return __ocml_sqrt_rte_f32(__x); }
				627	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				628	__DEVICE__
				629	float __fsqrt_ru(float __x) { return __ocml_sqrt_rtp_f32(__x); }
				630
				631	__DEVICE__
				632	float __fsqrt_rz(float __x) { return __ocml_sqrt_rtz_f32(__x); }
				633
				634	__DEVICE__
				635	float __fsub_rd(float __x, float __y) { return __ocml_sub_rtn_f32(__x, __y); }
				636	#endif
				637	__DEVICE__
				638	float __fsub_rn(float __x, float __y) { return __ocml_sub_rte_f32(__x, __y); }
				639	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				640	__DEVICE__
				641	float __fsub_ru(float __x, float __y) { return __ocml_sub_rtp_f32(__x, __y); }
				642
				643	__DEVICE__
				644	float __fsub_rz(float __x, float __y) { return __ocml_sub_rtz_f32(__x, __y); }
				645	#endif
				646	__DEVICE__
				647	float __log10f(float __x) { return __ocml_native_log10_f32(__x); }
				648
				649	__DEVICE__
				650	float __log2f(float __x) { return __ocml_native_log2_f32(__x); }
				651
				652	__DEVICE__
				653	float __logf(float __x) { return __ocml_native_log_f32(__x); }
				654
				655	__DEVICE__
				656	float __powf(float __x, float __y) { return __ocml_pow_f32(__x, __y); }
				657
				658	__DEVICE__
				659	float __saturatef(float __x) { return (__x < 0) ? 0 : ((__x > 1) ? 1 : __x); }
				660
				661	__DEVICE__
				662	void __sincosf(float __x, float __sinptr, float __cosptr) {
				663	*__sinptr = __ocml_native_sin_f32(__x);
				664	*__cosptr = __ocml_native_cos_f32(__x);
				665	}
				666
				667	__DEVICE__
				668	float __sinf(float __x) { return __ocml_native_sin_f32(__x); }
				669
				670	__DEVICE__
				671	float __tanf(float __x) { return __ocml_tan_f32(__x); }
				672	// END INTRINSICS
				673	// END FLOAT
				674
				675	// BEGIN DOUBLE
				676	__DEVICE__
				677	double acos(double __x) { return __ocml_acos_f64(__x); }
				678
				679	__DEVICE__
				680	double acosh(double __x) { return __ocml_acosh_f64(__x); }
				681
				682	__DEVICE__
				683	double asin(double __x) { return __ocml_asin_f64(__x); }
				684
				685	__DEVICE__
				686	double asinh(double __x) { return __ocml_asinh_f64(__x); }
				687
				688	__DEVICE__
				689	double atan(double __x) { return __ocml_atan_f64(__x); }
				690
				691	__DEVICE__
				692	double atan2(double __x, double __y) { return __ocml_atan2_f64(__x, __y); }
				693
				694	__DEVICE__
				695	double atanh(double __x) { return __ocml_atanh_f64(__x); }
				696
				697	__DEVICE__
				698	double cbrt(double __x) { return __ocml_cbrt_f64(__x); }
				699
				700	__DEVICE__
				701	double ceil(double __x) { return __ocml_ceil_f64(__x); }
				702
				703	__DEVICE__
				704	double copysign(double __x, double __y) {
				705	return __ocml_copysign_f64(__x, __y);
				706	}
				707
				708	__DEVICE__
				709	double cos(double __x) { return __ocml_cos_f64(__x); }
				710
				711	__DEVICE__
				712	double cosh(double __x) { return __ocml_cosh_f64(__x); }
				713
				714	__DEVICE__
				715	double cospi(double __x) { return __ocml_cospi_f64(__x); }
				716
				717	__DEVICE__
				718	double cyl_bessel_i0(double __x) { return __ocml_i0_f64(__x); }
				719
				720	__DEVICE__
				721	double cyl_bessel_i1(double __x) { return __ocml_i1_f64(__x); }
				722
				723	__DEVICE__
				724	double erf(double __x) { return __ocml_erf_f64(__x); }
				725
				726	__DEVICE__
				727	double erfc(double __x) { return __ocml_erfc_f64(__x); }
				728
				729	__DEVICE__
				730	double erfcinv(double __x) { return __ocml_erfcinv_f64(__x); }
				731
				732	__DEVICE__
				733	double erfcx(double __x) { return __ocml_erfcx_f64(__x); }
				734
				735	__DEVICE__
				736	double erfinv(double __x) { return __ocml_erfinv_f64(__x); }
				737
				738	__DEVICE__
				739	double exp(double __x) { return __ocml_exp_f64(__x); }
				740
				741	__DEVICE__
				742	double exp10(double __x) { return __ocml_exp10_f64(__x); }
				743
				744	__DEVICE__
				745	double exp2(double __x) { return __ocml_exp2_f64(__x); }
				746
				747	__DEVICE__
				748	double expm1(double __x) { return __ocml_expm1_f64(__x); }
				749
				750	__DEVICE__
				751	double fabs(double __x) { return __ocml_fabs_f64(__x); }
				752
				753	__DEVICE__
				754	double fdim(double __x, double __y) { return __ocml_fdim_f64(__x, __y); }
				755
				756	__DEVICE__
				757	double floor(double __x) { return __ocml_floor_f64(__x); }
				758
				759	__DEVICE__
				760	double fma(double __x, double __y, double __z) {
				761	return __ocml_fma_f64(__x, __y, __z);
				762	}
				763
				764	__DEVICE__
				765	double fmax(double __x, double __y) { return __ocml_fmax_f64(__x, __y); }
				766
				767	__DEVICE__
				768	double fmin(double __x, double __y) { return __ocml_fmin_f64(__x, __y); }
				769
				770	__DEVICE__
				771	double fmod(double __x, double __y) { return __ocml_fmod_f64(__x, __y); }
				772
				773	__DEVICE__
				774	double frexp(double __x, int *__nptr) {
				775	int __tmp;
				776	double __r =
				777	__ocml_frexp_f64(__x, (__attribute__((address_space(5))) int *)&__tmp);
				778	*__nptr = __tmp;
				779	return __r;
				780	}
				781
				782	__DEVICE__
				783	double hypot(double __x, double __y) { return __ocml_hypot_f64(__x, __y); }
				784
				785	__DEVICE__
				786	int ilogb(double __x) { return __ocml_ilogb_f64(__x); }
				787
				788	__DEVICE__
				789	__RETURN_TYPE __finite(double __x) { return __ocml_isfinite_f64(__x); }
				790
				791	__DEVICE__
				792	__RETURN_TYPE __isinf(double __x) { return __ocml_isinf_f64(__x); }
				793
				794	__DEVICE__
				795	__RETURN_TYPE __isnan(double __x) { return __ocml_isnan_f64(__x); }
				796
				797	__DEVICE__
				798	double j0(double __x) { return __ocml_j0_f64(__x); }
				799
				800	__DEVICE__
				801	double j1(double __x) { return __ocml_j1_f64(__x); }
				802
				803	__DEVICE__
				804	double jn(int __n, double __x) { // TODO: we could use Ahmes multiplication
				805	// and the Miller & Brown algorithm
				806	// for linear recurrences to get O(log n) steps, but it's unclear if
				807	// it'd be beneficial in this case. Placeholder until OCML adds
				808	// support.
				809	if (__n == 0)
				810	return j0(__x);
				811	if (__n == 1)
				812	return j1(__x);
				813
				814	double __x0 = j0(__x);
				815	double __x1 = j1(__x);
				816	for (int __i = 1; __i < __n; ++__i) {
				817	double __x2 = (2 * __i) / __x * __x1 - __x0;
				818	__x0 = __x1;
				819	__x1 = __x2;
				820	}
				821	return __x1;
				822	}
				823
				824	__DEVICE__
				825	double ldexp(double __x, int __e) { return __ocml_ldexp_f64(__x, __e); }
				826
				827	__DEVICE__
				828	double lgamma(double __x) { return __ocml_lgamma_f64(__x); }
				829
				830	__DEVICE__
				831	long long int llrint(double __x) { return __ocml_rint_f64(__x); }
				832
				833	__DEVICE__
				834	long long int llround(double __x) { return __ocml_round_f64(__x); }
				835
				836	__DEVICE__
				837	double log(double __x) { return __ocml_log_f64(__x); }
				838
				839	__DEVICE__
				840	double log10(double __x) { return __ocml_log10_f64(__x); }
				841
				842	__DEVICE__
				843	double log1p(double __x) { return __ocml_log1p_f64(__x); }
				844
				845	__DEVICE__
				846	double log2(double __x) { return __ocml_log2_f64(__x); }
				847
				848	__DEVICE__
				849	double logb(double __x) { return __ocml_logb_f64(__x); }
				850
				851	__DEVICE__
				852	long int lrint(double __x) { return __ocml_rint_f64(__x); }
				853
				854	__DEVICE__
				855	long int lround(double __x) { return __ocml_round_f64(__x); }
				856
				857	__DEVICE__
				858	double modf(double __x, double *__iptr) {
				859	double __tmp;
				860	double __r =
				861	__ocml_modf_f64(__x, (__attribute__((address_space(5))) double *)&__tmp);
				862	*__iptr = __tmp;
				863
				864	return __r;
				865	}
				866
				867	__DEVICE__
				868	double nan(const char *__tagp) {
				869	#if !_WIN32
				870	union {
				871	double val;
				872	struct ieee_double {
				873	uint64_t mantissa : 51;
				874	uint32_t quiet : 1;
				875	uint32_t exponent : 11;
				876	uint32_t sign : 1;
				877	} bits;
				878	} __tmp;
				879	__static_assert_type_size_equal(sizeof(__tmp.val), sizeof(__tmp.bits));
				880
				881	__tmp.bits.sign = 0u;
				882	__tmp.bits.exponent = ~0u;
				883	__tmp.bits.quiet = 1u;
				884	__tmp.bits.mantissa = __make_mantissa(__tagp);
				885
				886	return __tmp.val;
				887	#else
				888	__static_assert_type_size_equal(sizeof(uint64_t), sizeof(double));
				889	uint64_t __val = __make_mantissa(__tagp);
				890	__val \|= 0xFFF << 51;
				891	return reinterpret_cast<double >(&__val);
				892	#endif
				893	}
				894
				895	__DEVICE__
				896	double nearbyint(double __x) { return __ocml_nearbyint_f64(__x); }
				897
				898	__DEVICE__
				899	double nextafter(double __x, double __y) {
				900	return __ocml_nextafter_f64(__x, __y);
				901	}
				902
				903	__DEVICE__
				904	double norm(int __dim,
				905	const double *__a) { // TODO: placeholder until OCML adds support.
				906	double __r = 0;
				907	while (__dim--) {
				908	__r += __a[0] * __a[0];
				909	++__a;
				910	}
				911
				912	return __ocml_sqrt_f64(__r);
				913	}
				914
				915	__DEVICE__
				916	double norm3d(double __x, double __y, double __z) {
				917	return __ocml_len3_f64(__x, __y, __z);
				918	}
				919
				920	__DEVICE__
				921	double norm4d(double __x, double __y, double __z, double __w) {
				922	return __ocml_len4_f64(__x, __y, __z, __w);
				923	}
				924
				925	__DEVICE__
				926	double normcdf(double __x) { return __ocml_ncdf_f64(__x); }
				927
				928	__DEVICE__
				929	double normcdfinv(double __x) { return __ocml_ncdfinv_f64(__x); }
				930
				931	__DEVICE__
				932	double pow(double __x, double __y) { return __ocml_pow_f64(__x, __y); }
				933
				934	__DEVICE__
				935	double powi(double __x, int __y) { return __ocml_pown_f64(__x, __y); }
				936
				937	__DEVICE__
				938	double rcbrt(double __x) { return __ocml_rcbrt_f64(__x); }
				939
				940	__DEVICE__
				941	double remainder(double __x, double __y) {
				942	return __ocml_remainder_f64(__x, __y);
				943	}
				944
				945	__DEVICE__
				946	double remquo(double __x, double __y, int *__quo) {
				947	int __tmp;
				948	double __r = __ocml_remquo_f64(
				949	__x, __y, (__attribute__((address_space(5))) int *)&__tmp);
				950	*__quo = __tmp;
				951
				952	return __r;
				953	}
				954
				955	__DEVICE__
				956	double rhypot(double __x, double __y) { return __ocml_rhypot_f64(__x, __y); }
				957
				958	__DEVICE__
				959	double rint(double __x) { return __ocml_rint_f64(__x); }
				960
				961	__DEVICE__
				962	double rnorm(int __dim,
				963	const double *__a) { // TODO: placeholder until OCML adds support.
				964	double __r = 0;
				965	while (__dim--) {
				966	__r += __a[0] * __a[0];
				967	++__a;
				968	}
				969
				970	return __ocml_rsqrt_f64(__r);
				971	}
				972
				973	__DEVICE__
				974	double rnorm3d(double __x, double __y, double __z) {
				975	return __ocml_rlen3_f64(__x, __y, __z);
				976	}
				977
				978	__DEVICE__
				979	double rnorm4d(double __x, double __y, double __z, double __w) {
				980	return __ocml_rlen4_f64(__x, __y, __z, __w);
				981	}
				982
				983	__DEVICE__
				984	double round(double __x) { return __ocml_round_f64(__x); }
				985
				986	__DEVICE__
				987	double rsqrt(double __x) { return __ocml_rsqrt_f64(__x); }
				988
				989	__DEVICE__
				990	double scalbln(double __x, long int __n) {
				991	return (__n < INT_MAX) ? __ocml_scalbn_f64(__x, __n)
				992	: __ocml_scalb_f64(__x, __n);
				993	}
				994	__DEVICE__
				995	double scalbn(double __x, int __n) { return __ocml_scalbn_f64(__x, __n); }
				996
				997	__DEVICE__
				998	__RETURN_TYPE __signbit(double __x) { return __ocml_signbit_f64(__x); }
				999
				1000	__DEVICE__
				1001	double sin(double __x) { return __ocml_sin_f64(__x); }
				1002
				1003	__DEVICE__
				1004	void sincos(double __x, double __sinptr, double __cosptr) {
				1005	double __tmp;
				1006	*__sinptr = __ocml_sincos_f64(
				1007	__x, (__attribute__((address_space(5))) double *)&__tmp);
				1008	*__cosptr = __tmp;
				1009	}
				1010
				1011	__DEVICE__
				1012	void sincospi(double __x, double __sinptr, double __cosptr) {
				1013	double __tmp;
				1014	*__sinptr = __ocml_sincospi_f64(
				1015	__x, (__attribute__((address_space(5))) double *)&__tmp);
				1016	*__cosptr = __tmp;
				1017	}
				1018
				1019	__DEVICE__
				1020	double sinh(double __x) { return __ocml_sinh_f64(__x); }
				1021
				1022	__DEVICE__
				1023	double sinpi(double __x) { return __ocml_sinpi_f64(__x); }
				1024
				1025	__DEVICE__
				1026	double sqrt(double __x) { return __ocml_sqrt_f64(__x); }
				1027
				1028	__DEVICE__
				1029	double tan(double __x) { return __ocml_tan_f64(__x); }
				1030
				1031	__DEVICE__
				1032	double tanh(double __x) { return __ocml_tanh_f64(__x); }
				1033
				1034	__DEVICE__
				1035	double tgamma(double __x) { return __ocml_tgamma_f64(__x); }
				1036
				1037	__DEVICE__
				1038	double trunc(double __x) { return __ocml_trunc_f64(__x); }
				1039
				1040	__DEVICE__
				1041	double y0(double __x) { return __ocml_y0_f64(__x); }
				1042
				1043	__DEVICE__
				1044	double y1(double __x) { return __ocml_y1_f64(__x); }
				1045
				1046	__DEVICE__
				1047	double yn(int __n, double __x) { // TODO: we could use Ahmes multiplication
				1048	// and the Miller & Brown algorithm
				1049	// for linear recurrences to get O(log n) steps, but it's unclear if
				1050	// it'd be beneficial in this case. Placeholder until OCML adds
				1051	// support.
				1052	if (__n == 0)
				1053	return y0(__x);
				1054	if (__n == 1)
				1055	return y1(__x);
				1056
				1057	double __x0 = y0(__x);
				1058	double __x1 = y1(__x);
				1059	for (int __i = 1; __i < __n; ++__i) {
				1060	double __x2 = (2 * __i) / __x * __x1 - __x0;
				1061	__x0 = __x1;
				1062	__x1 = __x2;
				1063	}
				1064
				1065	return __x1;
				1066	}
				1067
				1068	// BEGIN INTRINSICS
				1069	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				1070	__DEVICE__
				1071	double __dadd_rd(double __x, double __y) {
				1072	return __ocml_add_rtn_f64(__x, __y);
				1073	}
				1074	#endif
				1075	__DEVICE__
				1076	double __dadd_rn(double __x, double __y) {
				1077	return __ocml_add_rte_f64(__x, __y);
				1078	}
				1079	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				1080	__DEVICE__
				1081	double __dadd_ru(double __x, double __y) {
				1082	return __ocml_add_rtp_f64(__x, __y);
				1083	}
				1084
				1085	__DEVICE__
				1086	double __dadd_rz(double __x, double __y) {
				1087	return __ocml_add_rtz_f64(__x, __y);
				1088	}
				1089
				1090	__DEVICE__
				1091	double __ddiv_rd(double __x, double __y) {
				1092	return __ocml_div_rtn_f64(__x, __y);
				1093	}
				1094	#endif
				1095	__DEVICE__
				1096	double __ddiv_rn(double __x, double __y) {
				1097	return __ocml_div_rte_f64(__x, __y);
				1098	}
				1099	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				1100	__DEVICE__
				1101	double __ddiv_ru(double __x, double __y) {
				1102	return __ocml_div_rtp_f64(__x, __y);
				1103	}
				1104
				1105	__DEVICE__
				1106	double __ddiv_rz(double __x, double __y) {
				1107	return __ocml_div_rtz_f64(__x, __y);
				1108	}
				1109
				1110	__DEVICE__
				1111	double __dmul_rd(double __x, double __y) {
				1112	return __ocml_mul_rtn_f64(__x, __y);
				1113	}
				1114	#endif
				1115	__DEVICE__
				1116	double __dmul_rn(double __x, double __y) {
				1117	return __ocml_mul_rte_f64(__x, __y);
				1118	}
				1119	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				1120	__DEVICE__
				1121	double __dmul_ru(double __x, double __y) {
				1122	return __ocml_mul_rtp_f64(__x, __y);
				1123	}
				1124
				1125	__DEVICE__
				1126	double __dmul_rz(double __x, double __y) {
				1127	return __ocml_mul_rtz_f64(__x, __y);
				1128	}
				1129
				1130	__DEVICE__
				1131	double __drcp_rd(double __x) { return __llvm_amdgcn_rcp_f64(__x); }
				1132	#endif
				1133	__DEVICE__
				1134	double __drcp_rn(double __x) { return __llvm_amdgcn_rcp_f64(__x); }
				1135	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				1136	__DEVICE__
				1137	double __drcp_ru(double __x) { return __llvm_amdgcn_rcp_f64(__x); }
				1138
				1139	__DEVICE__
				1140	double __drcp_rz(double __x) { return __llvm_amdgcn_rcp_f64(__x); }
				1141
				1142	__DEVICE__
				1143	double __dsqrt_rd(double __x) { return __ocml_sqrt_rtn_f64(__x); }
				1144	#endif
				1145	__DEVICE__
				1146	double __dsqrt_rn(double __x) { return __ocml_sqrt_rte_f64(__x); }
				1147	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				1148	__DEVICE__
				1149	double __dsqrt_ru(double __x) { return __ocml_sqrt_rtp_f64(__x); }
				1150
				1151	__DEVICE__
				1152	double __dsqrt_rz(double __x) { return __ocml_sqrt_rtz_f64(__x); }
				1153
				1154	__DEVICE__
				1155	double __dsub_rd(double __x, double __y) {
				1156	return __ocml_sub_rtn_f64(__x, __y);
				1157	}
				1158	#endif
				1159	__DEVICE__
				1160	double __dsub_rn(double __x, double __y) {
				1161	return __ocml_sub_rte_f64(__x, __y);
				1162	}
				1163	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				1164	__DEVICE__
				1165	double __dsub_ru(double __x, double __y) {
				1166	return __ocml_sub_rtp_f64(__x, __y);
				1167	}
				1168
				1169	__DEVICE__
				1170	double __dsub_rz(double __x, double __y) {
				1171	return __ocml_sub_rtz_f64(__x, __y);
				1172	}
				1173
				1174	__DEVICE__
				1175	double __fma_rd(double __x, double __y, double __z) {
				1176	return __ocml_fma_rtn_f64(__x, __y, __z);
				1177	}
				1178	#endif
				1179	__DEVICE__
				1180	double __fma_rn(double __x, double __y, double __z) {
				1181	return __ocml_fma_rte_f64(__x, __y, __z);
				1182	}
				1183	#if defined OCML_BASIC_ROUNDED_OPERATIONS
				1184	__DEVICE__
				1185	double __fma_ru(double __x, double __y, double __z) {
				1186	return __ocml_fma_rtp_f64(__x, __y, __z);
				1187	}
				1188
				1189	__DEVICE__
				1190	double __fma_rz(double __x, double __y, double __z) {
				1191	return __ocml_fma_rtz_f64(__x, __y, __z);
				1192	}
				1193	#endif
				1194	// END INTRINSICS
				1195	// END DOUBLE
				1196
				1197	// C only macros
				1198	#if !defined(__cplusplus) && __STDC_VERSION__ >= 201112L
				1199	#define isfinite(__x) _Generic((__x), float : __finitef, double : __finite)(__x)
				1200	#define isinf(__x) _Generic((__x), float : __isinff, double : __isinf)(__x)
				1201	#define isnan(__x) _Generic((__x), float : __isnanf, double : __isnan)(__x)
				1202	#define signbit(__x) \
				1203	_Generic((__x), float : __signbitf, double : __signbit)(__x)
				1204	#endif // !defined(__cplusplus) && __STDC_VERSION__ >= 201112L
				1205
				1206	#if defined(__cplusplus)
				1207	template <class T> __DEVICE__ T min(T __arg1, T __arg2) {
				1208	return (__arg1 < __arg2) ? __arg1 : __arg2;
				1209	}
				1210
				1211	template <class T> __DEVICE__ T max(T __arg1, T __arg2) {
				1212	return (__arg1 > __arg2) ? __arg1 : __arg2;
				1213	}
				1214
				1215	__DEVICE__ int min(int __arg1, int __arg2) {
				1216	return (__arg1 < __arg2) ? __arg1 : __arg2;
				1217	}
				1218	__DEVICE__ int max(int __arg1, int __arg2) {
				1219	return (__arg1 > __arg2) ? __arg1 : __arg2;
				1220	}
				1221
				1222	__DEVICE__
				1223	float max(float __x, float __y) { return fmaxf(__x, __y); }
				1224
				1225	__DEVICE__
				1226	double max(double __x, double __y) { return fmax(__x, __y); }
				1227
				1228	__DEVICE__
				1229	float min(float __x, float __y) { return fminf(__x, __y); }
				1230
				1231	__DEVICE__
				1232	double min(double __x, double __y) { return fmin(__x, __y); }
				1233
				1234	__host__ inline static int min(int __arg1, int __arg2) {
				1235	return std::min(__arg1, __arg2);
				1236	}
				1237
				1238	__host__ inline static int max(int __arg1, int __arg2) {
				1239	return std::max(__arg1, __arg2);
				1240	}
				1241	#endif
				1242
				1243	#pragma pop_macro("__DEVICE__")
				1244	#pragma pop_macro("__RETURN_TYPE")
				1245
				1246	#endif // __CLANG_HIP_MATH_H__