https://github.com/arsenm created https://github.com/llvm/llvm-project/pull/128022
These should probably be dropped from the library. >From c6c75b5d7a9a1869bfcdc413a98b00fe4b9f07d1 Mon Sep 17 00:00:00 2001 From: Matt Arsenault <matthew.arsena...@amd.com> Date: Tue, 22 Nov 2022 12:05:12 -0500 Subject: [PATCH] clang/HIP: Remove some unused ocml function declarations These should probably be dropped from the library. --- .../Headers/__clang_hip_libdevice_declares.h | 86 ---------- clang/lib/Headers/__clang_hip_math.h | 150 ++++++++++++++++++ 2 files changed, 150 insertions(+), 86 deletions(-) diff --git a/clang/lib/Headers/__clang_hip_libdevice_declares.h b/clang/lib/Headers/__clang_hip_libdevice_declares.h index f15198b3d9f93..c9f20300eb268 100644 --- a/clang/lib/Headers/__clang_hip_libdevice_declares.h +++ b/clang/lib/Headers/__clang_hip_libdevice_declares.h @@ -27,9 +27,6 @@ __device__ __attribute__((const)) float __ocml_atan2_f32(float, float); __device__ __attribute__((const)) float __ocml_atan_f32(float); __device__ __attribute__((pure)) float __ocml_atanh_f32(float); __device__ __attribute__((pure)) float __ocml_cbrt_f32(float); -__device__ __attribute__((const)) float __ocml_ceil_f32(float); -__device__ __attribute__((const)) __device__ float __ocml_copysign_f32(float, - float); __device__ float __ocml_cos_f32(float); __device__ float __ocml_native_cos_f32(float); __device__ __attribute__((pure)) __device__ float __ocml_cosh_f32(float); @@ -43,40 +40,22 @@ __device__ __attribute__((pure)) float __ocml_erf_f32(float); __device__ __attribute__((pure)) float __ocml_erfinv_f32(float); __device__ __attribute__((pure)) float __ocml_exp10_f32(float); __device__ __attribute__((pure)) float __ocml_native_exp10_f32(float); -__device__ __attribute__((pure)) float __ocml_exp2_f32(float); -__device__ __attribute__((pure)) float __ocml_exp_f32(float); -__device__ __attribute__((pure)) float __ocml_native_exp_f32(float); __device__ __attribute__((pure)) float __ocml_expm1_f32(float); -__device__ __attribute__((const)) float __ocml_fabs_f32(float); __device__ __attribute__((const)) float __ocml_fdim_f32(float, float); -__device__ __attribute__((const)) float __ocml_floor_f32(float); -__device__ __attribute__((const)) float __ocml_fma_f32(float, float, float); -__device__ __attribute__((const)) float __ocml_fmax_f32(float, float); -__device__ __attribute__((const)) float __ocml_fmin_f32(float, float); __device__ __attribute__((const)) __device__ float __ocml_fmod_f32(float, float); __device__ float __ocml_frexp_f32(float, __attribute__((address_space(5))) int *); __device__ __attribute__((const)) float __ocml_hypot_f32(float, float); __device__ __attribute__((const)) int __ocml_ilogb_f32(float); -__device__ __attribute__((const)) int __ocml_isfinite_f32(float); -__device__ __attribute__((const)) int __ocml_isinf_f32(float); -__device__ __attribute__((const)) int __ocml_isnan_f32(float); __device__ float __ocml_j0_f32(float); __device__ float __ocml_j1_f32(float); -__device__ __attribute__((const)) float __ocml_ldexp_f32(float, int); __device__ float __ocml_lgamma_f32(float); -__device__ __attribute__((pure)) float __ocml_log10_f32(float); __device__ __attribute__((pure)) float __ocml_native_log10_f32(float); __device__ __attribute__((pure)) float __ocml_log1p_f32(float); -__device__ __attribute__((pure)) float __ocml_log2_f32(float); -__device__ __attribute__((pure)) float __ocml_native_log2_f32(float); __device__ __attribute__((const)) float __ocml_logb_f32(float); -__device__ __attribute__((pure)) float __ocml_log_f32(float); -__device__ __attribute__((pure)) float __ocml_native_log_f32(float); __device__ float __ocml_modf_f32(float, __attribute__((address_space(5))) float *); -__device__ __attribute__((const)) float __ocml_nearbyint_f32(float); __device__ __attribute__((const)) float __ocml_nextafter_f32(float, float); __device__ __attribute__((const)) float __ocml_len3_f32(float, float, float); __device__ __attribute__((const)) float __ocml_len4_f32(float, float, float, @@ -90,15 +69,10 @@ __device__ __attribute__((const)) float __ocml_remainder_f32(float, float); __device__ float __ocml_remquo_f32(float, float, __attribute__((address_space(5))) int *); __device__ __attribute__((const)) float __ocml_rhypot_f32(float, float); -__device__ __attribute__((const)) float __ocml_rint_f32(float); __device__ __attribute__((const)) float __ocml_rlen3_f32(float, float, float); __device__ __attribute__((const)) float __ocml_rlen4_f32(float, float, float, float); -__device__ __attribute__((const)) float __ocml_round_f32(float); __device__ __attribute__((pure)) float __ocml_rsqrt_f32(float); -__device__ __attribute__((const)) float __ocml_scalb_f32(float, float); -__device__ __attribute__((const)) float __ocml_scalbn_f32(float, int); -__device__ __attribute__((const)) int __ocml_signbit_f32(float); __device__ float __ocml_sincos_f32(float, __attribute__((address_space(5))) float *); __device__ float __ocml_sincospi_f32(float, @@ -108,11 +82,9 @@ __device__ float __ocml_native_sin_f32(float); __device__ __attribute__((pure)) float __ocml_sinh_f32(float); __device__ float __ocml_sinpi_f32(float); __device__ __attribute__((const)) float __ocml_sqrt_f32(float); -__device__ __attribute__((const)) float __ocml_native_sqrt_f32(float); __device__ float __ocml_tan_f32(float); __device__ __attribute__((pure)) float __ocml_tanh_f32(float); __device__ float __ocml_tgamma_f32(float); -__device__ __attribute__((const)) float __ocml_trunc_f32(float); __device__ float __ocml_y0_f32(float); __device__ float __ocml_y1_f32(float); @@ -153,8 +125,6 @@ __device__ __attribute__((const)) double __ocml_atan2_f64(double, double); __device__ __attribute__((const)) double __ocml_atan_f64(double); __device__ __attribute__((pure)) double __ocml_atanh_f64(double); __device__ __attribute__((pure)) double __ocml_cbrt_f64(double); -__device__ __attribute__((const)) double __ocml_ceil_f64(double); -__device__ __attribute__((const)) double __ocml_copysign_f64(double, double); __device__ double __ocml_cos_f64(double); __device__ __attribute__((pure)) double __ocml_cosh_f64(double); __device__ double __ocml_cospi_f64(double); @@ -169,23 +139,12 @@ __device__ __attribute__((pure)) double __ocml_exp10_f64(double); __device__ __attribute__((pure)) double __ocml_exp2_f64(double); __device__ __attribute__((pure)) double __ocml_exp_f64(double); __device__ __attribute__((pure)) double __ocml_expm1_f64(double); -__device__ __attribute__((const)) double __ocml_fabs_f64(double); __device__ __attribute__((const)) double __ocml_fdim_f64(double, double); -__device__ __attribute__((const)) double __ocml_floor_f64(double); -__device__ __attribute__((const)) double __ocml_fma_f64(double, double, double); -__device__ __attribute__((const)) double __ocml_fmax_f64(double, double); -__device__ __attribute__((const)) double __ocml_fmin_f64(double, double); __device__ __attribute__((const)) double __ocml_fmod_f64(double, double); -__device__ double __ocml_frexp_f64(double, - __attribute__((address_space(5))) int *); __device__ __attribute__((const)) double __ocml_hypot_f64(double, double); __device__ __attribute__((const)) int __ocml_ilogb_f64(double); -__device__ __attribute__((const)) int __ocml_isfinite_f64(double); -__device__ __attribute__((const)) int __ocml_isinf_f64(double); -__device__ __attribute__((const)) int __ocml_isnan_f64(double); __device__ double __ocml_j0_f64(double); __device__ double __ocml_j1_f64(double); -__device__ __attribute__((const)) double __ocml_ldexp_f64(double, int); __device__ double __ocml_lgamma_f64(double); __device__ __attribute__((pure)) double __ocml_log10_f64(double); __device__ __attribute__((pure)) double __ocml_log1p_f64(double); @@ -194,7 +153,6 @@ __device__ __attribute__((const)) double __ocml_logb_f64(double); __device__ __attribute__((pure)) double __ocml_log_f64(double); __device__ double __ocml_modf_f64(double, __attribute__((address_space(5))) double *); -__device__ __attribute__((const)) double __ocml_nearbyint_f64(double); __device__ __attribute__((const)) double __ocml_nextafter_f64(double, double); __device__ __attribute__((const)) double __ocml_len3_f64(double, double, double); @@ -209,16 +167,11 @@ __device__ __attribute__((const)) double __ocml_remainder_f64(double, double); __device__ double __ocml_remquo_f64(double, double, __attribute__((address_space(5))) int *); __device__ __attribute__((const)) double __ocml_rhypot_f64(double, double); -__device__ __attribute__((const)) double __ocml_rint_f64(double); __device__ __attribute__((const)) double __ocml_rlen3_f64(double, double, double); __device__ __attribute__((const)) double __ocml_rlen4_f64(double, double, double, double); -__device__ __attribute__((const)) double __ocml_round_f64(double); __device__ __attribute__((pure)) double __ocml_rsqrt_f64(double); -__device__ __attribute__((const)) double __ocml_scalb_f64(double, double); -__device__ __attribute__((const)) double __ocml_scalbn_f64(double, int); -__device__ __attribute__((const)) int __ocml_signbit_f64(double); __device__ double __ocml_sincos_f64(double, __attribute__((address_space(5))) double *); __device__ double @@ -230,7 +183,6 @@ __device__ __attribute__((const)) double __ocml_sqrt_f64(double); __device__ double __ocml_tan_f64(double); __device__ __attribute__((pure)) double __ocml_tanh_f64(double); __device__ double __ocml_tgamma_f64(double); -__device__ __attribute__((const)) double __ocml_trunc_f64(double); __device__ double __ocml_y0_f64(double); __device__ double __ocml_y1_f64(double); @@ -264,30 +216,13 @@ __device__ __attribute__((const)) double __ocml_fma_rtp_f64(double, double, __device__ __attribute__((const)) double __ocml_fma_rtz_f64(double, double, double); -__device__ __attribute__((const)) _Float16 __ocml_ceil_f16(_Float16); __device__ _Float16 __ocml_cos_f16(_Float16); __device__ __attribute__((const)) _Float16 __ocml_cvtrtn_f16_f32(float); __device__ __attribute__((const)) _Float16 __ocml_cvtrtp_f16_f32(float); __device__ __attribute__((const)) _Float16 __ocml_cvtrtz_f16_f32(float); -__device__ __attribute__((pure)) _Float16 __ocml_exp_f16(_Float16); __device__ __attribute__((pure)) _Float16 __ocml_exp10_f16(_Float16); -__device__ __attribute__((pure)) _Float16 __ocml_exp2_f16(_Float16); -__device__ __attribute__((const)) _Float16 __ocml_floor_f16(_Float16); -__device__ __attribute__((const)) _Float16 __ocml_fma_f16(_Float16, _Float16, - _Float16); -__device__ __attribute__((const)) _Float16 __ocml_fmax_f16(_Float16, _Float16); -__device__ __attribute__((const)) _Float16 __ocml_fmin_f16(_Float16, _Float16); -__device__ __attribute__((const)) _Float16 __ocml_fabs_f16(_Float16); -__device__ __attribute__((const)) int __ocml_isinf_f16(_Float16); -__device__ __attribute__((const)) int __ocml_isnan_f16(_Float16); -__device__ __attribute__((pure)) _Float16 __ocml_log_f16(_Float16); -__device__ __attribute__((pure)) _Float16 __ocml_log10_f16(_Float16); -__device__ __attribute__((pure)) _Float16 __ocml_log2_f16(_Float16); -__device__ __attribute__((const)) _Float16 __ocml_rint_f16(_Float16); __device__ __attribute__((const)) _Float16 __ocml_rsqrt_f16(_Float16); __device__ _Float16 __ocml_sin_f16(_Float16); -__device__ __attribute__((const)) _Float16 __ocml_sqrt_f16(_Float16); -__device__ __attribute__((const)) _Float16 __ocml_trunc_f16(_Float16); __device__ __attribute__((pure)) _Float16 __ocml_pown_f16(_Float16, int); typedef _Float16 __2f16 __attribute__((ext_vector_type(2))); @@ -302,20 +237,6 @@ typedef _Bool __ockl_bool; __device__ __attribute__((const)) float __ockl_fdot2(__2f16 a, __2f16 b, float c, __ockl_bool s); -__device__ __attribute__((const)) __2f16 __ocml_ceil_2f16(__2f16); -__device__ __attribute__((const)) __2f16 __ocml_fabs_2f16(__2f16); -__device__ __2f16 __ocml_cos_2f16(__2f16); -__device__ __attribute__((pure)) __2f16 __ocml_exp_2f16(__2f16); -__device__ __attribute__((pure)) __2f16 __ocml_exp10_2f16(__2f16); -__device__ __attribute__((pure)) __2f16 __ocml_exp2_2f16(__2f16); -__device__ __attribute__((const)) __2f16 __ocml_floor_2f16(__2f16); -__device__ __attribute__((const)) -__2f16 __ocml_fma_2f16(__2f16, __2f16, __2f16); -__device__ __attribute__((const)) __2i16 __ocml_isinf_2f16(__2f16); -__device__ __attribute__((const)) __2i16 __ocml_isnan_2f16(__2f16); -__device__ __attribute__((pure)) __2f16 __ocml_log_2f16(__2f16); -__device__ __attribute__((pure)) __2f16 __ocml_log10_2f16(__2f16); -__device__ __attribute__((pure)) __2f16 __ocml_log2_2f16(__2f16); #if HIP_VERSION_MAJOR * 100 + HIP_VERSION_MINOR >= 560 #define __DEPRECATED_SINCE_HIP_560(X) __attribute__((deprecated(X))) @@ -339,13 +260,6 @@ __llvm_amdgcn_rcp_2f16(__2f16 __x) #undef __DEPRECATED_SINCE_HIP_560 -__device__ __attribute__((const)) __2f16 __ocml_rint_2f16(__2f16); -__device__ __attribute__((const)) __2f16 __ocml_rsqrt_2f16(__2f16); -__device__ __2f16 __ocml_sin_2f16(__2f16); -__device__ __attribute__((const)) __2f16 __ocml_sqrt_2f16(__2f16); -__device__ __attribute__((const)) __2f16 __ocml_trunc_2f16(__2f16); -__device__ __attribute__((const)) __2f16 __ocml_pown_2f16(__2f16, __2i16); - #ifdef __cplusplus } // extern "C" #endif diff --git a/clang/lib/Headers/__clang_hip_math.h b/clang/lib/Headers/__clang_hip_math.h index 8468751d9de26..79cb7906852c4 100644 --- a/clang/lib/Headers/__clang_hip_math.h +++ b/clang/lib/Headers/__clang_hip_math.h @@ -727,6 +727,156 @@ float ynf(int __n, float __x) { // TODO: we could use Ahmes multiplication } +__DEVICE__ +float __cosf(float __x) { return __ocml_native_cos_f32(__x); } + +__DEVICE__ +float __exp10f(float __x) { return __ocml_native_exp10_f32(__x); } + +__DEVICE__ +float __expf(float __x) { return __ocml_native_exp_f32(__x); } + +#if defined OCML_BASIC_ROUNDED_OPERATIONS +__DEVICE__ +float __fadd_rd(float __x, float __y) { return __ocml_add_rtn_f32(__x, __y); } +__DEVICE__ +float __fadd_rn(float __x, float __y) { return __ocml_add_rte_f32(__x, __y); } +__DEVICE__ +float __fadd_ru(float __x, float __y) { return __ocml_add_rtp_f32(__x, __y); } +__DEVICE__ +float __fadd_rz(float __x, float __y) { return __ocml_add_rtz_f32(__x, __y); } +#else +__DEVICE__ +float __fadd_rn(float __x, float __y) { return __x + __y; } +#endif + +#if defined OCML_BASIC_ROUNDED_OPERATIONS +__DEVICE__ +float __fdiv_rd(float __x, float __y) { return __ocml_div_rtn_f32(__x, __y); } +__DEVICE__ +float __fdiv_rn(float __x, float __y) { return __ocml_div_rte_f32(__x, __y); } +__DEVICE__ +float __fdiv_ru(float __x, float __y) { return __ocml_div_rtp_f32(__x, __y); } +__DEVICE__ +float __fdiv_rz(float __x, float __y) { return __ocml_div_rtz_f32(__x, __y); } +#else +__DEVICE__ +float __fdiv_rn(float __x, float __y) { return __x / __y; } +#endif + +__DEVICE__ +float __fdividef(float __x, float __y) { return __x / __y; } + +#if defined OCML_BASIC_ROUNDED_OPERATIONS +__DEVICE__ +float __fmaf_rd(float __x, float __y, float __z) { + return __ocml_fma_rtn_f32(__x, __y, __z); +} +__DEVICE__ +float __fmaf_rn(float __x, float __y, float __z) { + return __ocml_fma_rte_f32(__x, __y, __z); +} +__DEVICE__ +float __fmaf_ru(float __x, float __y, float __z) { + return __ocml_fma_rtp_f32(__x, __y, __z); +} +__DEVICE__ +float __fmaf_rz(float __x, float __y, float __z) { + return __ocml_fma_rtz_f32(__x, __y, __z); +} +#else +__DEVICE__ +float __fmaf_rn(float __x, float __y, float __z) { + return __builtin_fmaf(__x, __y, __z); +} +#endif + +#if defined OCML_BASIC_ROUNDED_OPERATIONS +__DEVICE__ +float __fmul_rd(float __x, float __y) { return __ocml_mul_rtn_f32(__x, __y); } +__DEVICE__ +float __fmul_rn(float __x, float __y) { return __ocml_mul_rte_f32(__x, __y); } +__DEVICE__ +float __fmul_ru(float __x, float __y) { return __ocml_mul_rtp_f32(__x, __y); } +__DEVICE__ +float __fmul_rz(float __x, float __y) { return __ocml_mul_rtz_f32(__x, __y); } +#else +__DEVICE__ +float __fmul_rn(float __x, float __y) { return __x * __y; } +#endif + +#if defined OCML_BASIC_ROUNDED_OPERATIONS +__DEVICE__ +float __frcp_rd(float __x) { return __ocml_div_rtn_f32(1.0f, __x); } +__DEVICE__ +float __frcp_rn(float __x) { return __ocml_div_rte_f32(1.0f, __x); } +__DEVICE__ +float __frcp_ru(float __x) { return __ocml_div_rtp_f32(1.0f, __x); } +__DEVICE__ +float __frcp_rz(float __x) { return __ocml_div_rtz_f32(1.0f, __x); } +#else +__DEVICE__ +float __frcp_rn(float __x) { return 1.0f / __x; } +#endif + +__DEVICE__ +float __frsqrt_rn(float __x) { return __builtin_amdgcn_rsqf(__x); } + +#if defined OCML_BASIC_ROUNDED_OPERATIONS +__DEVICE__ +float __fsqrt_rd(float __x) { return __ocml_sqrt_rtn_f32(__x); } +__DEVICE__ +float __fsqrt_rn(float __x) { return __ocml_sqrt_rte_f32(__x); } +__DEVICE__ +float __fsqrt_ru(float __x) { return __ocml_sqrt_rtp_f32(__x); } +__DEVICE__ +float __fsqrt_rz(float __x) { return __ocml_sqrt_rtz_f32(__x); } +#else +__DEVICE__ +float __fsqrt_rn(float __x) { return __builtin_sqrtf(__x); } +#endif + +#if defined OCML_BASIC_ROUNDED_OPERATIONS +__DEVICE__ +float __fsub_rd(float __x, float __y) { return __ocml_sub_rtn_f32(__x, __y); } +__DEVICE__ +float __fsub_rn(float __x, float __y) { return __ocml_sub_rte_f32(__x, __y); } +__DEVICE__ +float __fsub_ru(float __x, float __y) { return __ocml_sub_rtp_f32(__x, __y); } +__DEVICE__ +float __fsub_rz(float __x, float __y) { return __ocml_sub_rtz_f32(__x, __y); } +#else +__DEVICE__ +float __fsub_rn(float __x, float __y) { return __x - __y; } +#endif + +__DEVICE__ +float __log10f(float __x) { return __ocml_native_log10_f32(__x); } + +__DEVICE__ +float __log2f(float __x) { return __ocml_native_log2_f32(__x); } + +__DEVICE__ +float __logf(float __x) { return __ocml_native_log_f32(__x); } + +__DEVICE__ +float __powf(float __x, float __y) { return __ocml_pow_f32(__x, __y); } + +__DEVICE__ +float __saturatef(float __x) { return (__x < 0) ? 0 : ((__x > 1) ? 1 : __x); } + +__DEVICE__ +void __sincosf(float __x, float *__sinptr, float *__cosptr) { + *__sinptr = __ocml_native_sin_f32(__x); + *__cosptr = __ocml_native_cos_f32(__x); +} + +__DEVICE__ +float __sinf(float __x) { return __ocml_native_sin_f32(__x); } + +__DEVICE__ +float __tanf(float __x) { return __ocml_tan_f32(__x); } +// END INTRINSICS // END FLOAT // BEGIN DOUBLE _______________________________________________ cfe-commits mailing list cfe-commits@lists.llvm.org https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits