| /*===---- __clang_hip_libdevice_declares.h - HIP device library decls -------=== |
| * |
| * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| * See https://llvm.org/LICENSE.txt for license information. |
| * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| * |
| *===-----------------------------------------------------------------------=== |
| */ |
| |
| #ifndef __CLANG_HIP_LIBDEVICE_DECLARES_H__ |
| #define __CLANG_HIP_LIBDEVICE_DECLARES_H__ |
| |
| #ifdef __cplusplus |
| extern "C" { |
| #endif |
| |
| // BEGIN FLOAT |
| __device__ __attribute__((const)) float __ocml_acos_f32(float); |
| __device__ __attribute__((pure)) float __ocml_acosh_f32(float); |
| __device__ __attribute__((const)) float __ocml_asin_f32(float); |
| __device__ __attribute__((pure)) float __ocml_asinh_f32(float); |
| __device__ __attribute__((const)) float __ocml_atan2_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_atan_f32(float); |
| __device__ __attribute__((pure)) float __ocml_atanh_f32(float); |
| __device__ __attribute__((pure)) float __ocml_cbrt_f32(float); |
| __device__ __attribute__((const)) float __ocml_ceil_f32(float); |
| __device__ __attribute__((const)) __device__ float __ocml_copysign_f32(float, |
| float); |
| __device__ float __ocml_cos_f32(float); |
| __device__ float __ocml_native_cos_f32(float); |
| __device__ __attribute__((pure)) __device__ float __ocml_cosh_f32(float); |
| __device__ float __ocml_cospi_f32(float); |
| __device__ float __ocml_i0_f32(float); |
| __device__ float __ocml_i1_f32(float); |
| __device__ __attribute__((pure)) float __ocml_erfc_f32(float); |
| __device__ __attribute__((pure)) float __ocml_erfcinv_f32(float); |
| __device__ __attribute__((pure)) float __ocml_erfcx_f32(float); |
| __device__ __attribute__((pure)) float __ocml_erf_f32(float); |
| __device__ __attribute__((pure)) float __ocml_erfinv_f32(float); |
| __device__ __attribute__((pure)) float __ocml_exp10_f32(float); |
| __device__ __attribute__((pure)) float __ocml_native_exp10_f32(float); |
| __device__ __attribute__((pure)) float __ocml_exp2_f32(float); |
| __device__ __attribute__((pure)) float __ocml_exp_f32(float); |
| __device__ __attribute__((pure)) float __ocml_native_exp_f32(float); |
| __device__ __attribute__((pure)) float __ocml_expm1_f32(float); |
| __device__ __attribute__((const)) float __ocml_fabs_f32(float); |
| __device__ __attribute__((const)) float __ocml_fdim_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_floor_f32(float); |
| __device__ __attribute__((const)) float __ocml_fma_f32(float, float, float); |
| __device__ __attribute__((const)) float __ocml_fmax_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_fmin_f32(float, float); |
| __device__ __attribute__((const)) __device__ float __ocml_fmod_f32(float, |
| float); |
| __device__ float __ocml_frexp_f32(float, |
| __attribute__((address_space(5))) int *); |
| __device__ __attribute__((const)) float __ocml_hypot_f32(float, float); |
| __device__ __attribute__((const)) int __ocml_ilogb_f32(float); |
| __device__ __attribute__((const)) int __ocml_isfinite_f32(float); |
| __device__ __attribute__((const)) int __ocml_isinf_f32(float); |
| __device__ __attribute__((const)) int __ocml_isnan_f32(float); |
| __device__ float __ocml_j0_f32(float); |
| __device__ float __ocml_j1_f32(float); |
| __device__ __attribute__((const)) float __ocml_ldexp_f32(float, int); |
| __device__ float __ocml_lgamma_f32(float); |
| __device__ __attribute__((pure)) float __ocml_log10_f32(float); |
| __device__ __attribute__((pure)) float __ocml_native_log10_f32(float); |
| __device__ __attribute__((pure)) float __ocml_log1p_f32(float); |
| __device__ __attribute__((pure)) float __ocml_log2_f32(float); |
| __device__ __attribute__((pure)) float __ocml_native_log2_f32(float); |
| __device__ __attribute__((const)) float __ocml_logb_f32(float); |
| __device__ __attribute__((pure)) float __ocml_log_f32(float); |
| __device__ __attribute__((pure)) float __ocml_native_log_f32(float); |
| __device__ float __ocml_modf_f32(float, |
| __attribute__((address_space(5))) float *); |
| __device__ __attribute__((const)) float __ocml_nearbyint_f32(float); |
| __device__ __attribute__((const)) float __ocml_nextafter_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_len3_f32(float, float, float); |
| __device__ __attribute__((const)) float __ocml_len4_f32(float, float, float, |
| float); |
| __device__ __attribute__((pure)) float __ocml_ncdf_f32(float); |
| __device__ __attribute__((pure)) float __ocml_ncdfinv_f32(float); |
| __device__ __attribute__((pure)) float __ocml_pow_f32(float, float); |
| __device__ __attribute__((pure)) float __ocml_pown_f32(float, int); |
| __device__ __attribute__((pure)) float __ocml_rcbrt_f32(float); |
| __device__ __attribute__((const)) float __ocml_remainder_f32(float, float); |
| __device__ float __ocml_remquo_f32(float, float, |
| __attribute__((address_space(5))) int *); |
| __device__ __attribute__((const)) float __ocml_rhypot_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_rint_f32(float); |
| __device__ __attribute__((const)) float __ocml_rlen3_f32(float, float, float); |
| __device__ __attribute__((const)) float __ocml_rlen4_f32(float, float, float, |
| float); |
| __device__ __attribute__((const)) float __ocml_round_f32(float); |
| __device__ __attribute__((pure)) float __ocml_rsqrt_f32(float); |
| __device__ __attribute__((const)) float __ocml_scalb_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_scalbn_f32(float, int); |
| __device__ __attribute__((const)) int __ocml_signbit_f32(float); |
| __device__ float __ocml_sincos_f32(float, |
| __attribute__((address_space(5))) float *); |
| __device__ float __ocml_sincospi_f32(float, |
| __attribute__((address_space(5))) float *); |
| __device__ float __ocml_sin_f32(float); |
| __device__ float __ocml_native_sin_f32(float); |
| __device__ __attribute__((pure)) float __ocml_sinh_f32(float); |
| __device__ float __ocml_sinpi_f32(float); |
| __device__ __attribute__((const)) float __ocml_sqrt_f32(float); |
| __device__ __attribute__((const)) float __ocml_native_sqrt_f32(float); |
| __device__ float __ocml_tan_f32(float); |
| __device__ __attribute__((pure)) float __ocml_tanh_f32(float); |
| __device__ float __ocml_tgamma_f32(float); |
| __device__ __attribute__((const)) float __ocml_trunc_f32(float); |
| __device__ float __ocml_y0_f32(float); |
| __device__ float __ocml_y1_f32(float); |
| |
| // BEGIN INTRINSICS |
| __device__ __attribute__((const)) float __ocml_add_rte_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_add_rtn_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_add_rtp_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_add_rtz_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_sub_rte_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_sub_rtn_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_sub_rtp_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_sub_rtz_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_mul_rte_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_mul_rtn_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_mul_rtp_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_mul_rtz_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_div_rte_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_div_rtn_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_div_rtp_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_div_rtz_f32(float, float); |
| __device__ __attribute__((const)) float __ocml_sqrt_rte_f32(float); |
| __device__ __attribute__((const)) float __ocml_sqrt_rtn_f32(float); |
| __device__ __attribute__((const)) float __ocml_sqrt_rtp_f32(float); |
| __device__ __attribute__((const)) float __ocml_sqrt_rtz_f32(float); |
| __device__ __attribute__((const)) float __ocml_fma_rte_f32(float, float, float); |
| __device__ __attribute__((const)) float __ocml_fma_rtn_f32(float, float, float); |
| __device__ __attribute__((const)) float __ocml_fma_rtp_f32(float, float, float); |
| __device__ __attribute__((const)) float __ocml_fma_rtz_f32(float, float, float); |
| |
| __device__ inline __attribute__((const)) float |
| __llvm_amdgcn_cos_f32(float __x) { |
| return __builtin_amdgcn_cosf(__x); |
| } |
| __device__ inline __attribute__((const)) float |
| __llvm_amdgcn_rcp_f32(float __x) { |
| return __builtin_amdgcn_rcpf(__x); |
| } |
| __device__ inline __attribute__((const)) float |
| __llvm_amdgcn_rsq_f32(float __x) { |
| return __builtin_amdgcn_rsqf(__x); |
| } |
| __device__ inline __attribute__((const)) float |
| __llvm_amdgcn_sin_f32(float __x) { |
| return __builtin_amdgcn_sinf(__x); |
| } |
| // END INTRINSICS |
| // END FLOAT |
| |
| // BEGIN DOUBLE |
| __device__ __attribute__((const)) double __ocml_acos_f64(double); |
| __device__ __attribute__((pure)) double __ocml_acosh_f64(double); |
| __device__ __attribute__((const)) double __ocml_asin_f64(double); |
| __device__ __attribute__((pure)) double __ocml_asinh_f64(double); |
| __device__ __attribute__((const)) double __ocml_atan2_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_atan_f64(double); |
| __device__ __attribute__((pure)) double __ocml_atanh_f64(double); |
| __device__ __attribute__((pure)) double __ocml_cbrt_f64(double); |
| __device__ __attribute__((const)) double __ocml_ceil_f64(double); |
| __device__ __attribute__((const)) double __ocml_copysign_f64(double, double); |
| __device__ double __ocml_cos_f64(double); |
| __device__ __attribute__((pure)) double __ocml_cosh_f64(double); |
| __device__ double __ocml_cospi_f64(double); |
| __device__ double __ocml_i0_f64(double); |
| __device__ double __ocml_i1_f64(double); |
| __device__ __attribute__((pure)) double __ocml_erfc_f64(double); |
| __device__ __attribute__((pure)) double __ocml_erfcinv_f64(double); |
| __device__ __attribute__((pure)) double __ocml_erfcx_f64(double); |
| __device__ __attribute__((pure)) double __ocml_erf_f64(double); |
| __device__ __attribute__((pure)) double __ocml_erfinv_f64(double); |
| __device__ __attribute__((pure)) double __ocml_exp10_f64(double); |
| __device__ __attribute__((pure)) double __ocml_exp2_f64(double); |
| __device__ __attribute__((pure)) double __ocml_exp_f64(double); |
| __device__ __attribute__((pure)) double __ocml_expm1_f64(double); |
| __device__ __attribute__((const)) double __ocml_fabs_f64(double); |
| __device__ __attribute__((const)) double __ocml_fdim_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_floor_f64(double); |
| __device__ __attribute__((const)) double __ocml_fma_f64(double, double, double); |
| __device__ __attribute__((const)) double __ocml_fmax_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_fmin_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_fmod_f64(double, double); |
| __device__ double __ocml_frexp_f64(double, |
| __attribute__((address_space(5))) int *); |
| __device__ __attribute__((const)) double __ocml_hypot_f64(double, double); |
| __device__ __attribute__((const)) int __ocml_ilogb_f64(double); |
| __device__ __attribute__((const)) int __ocml_isfinite_f64(double); |
| __device__ __attribute__((const)) int __ocml_isinf_f64(double); |
| __device__ __attribute__((const)) int __ocml_isnan_f64(double); |
| __device__ double __ocml_j0_f64(double); |
| __device__ double __ocml_j1_f64(double); |
| __device__ __attribute__((const)) double __ocml_ldexp_f64(double, int); |
| __device__ double __ocml_lgamma_f64(double); |
| __device__ __attribute__((pure)) double __ocml_log10_f64(double); |
| __device__ __attribute__((pure)) double __ocml_log1p_f64(double); |
| __device__ __attribute__((pure)) double __ocml_log2_f64(double); |
| __device__ __attribute__((const)) double __ocml_logb_f64(double); |
| __device__ __attribute__((pure)) double __ocml_log_f64(double); |
| __device__ double __ocml_modf_f64(double, |
| __attribute__((address_space(5))) double *); |
| __device__ __attribute__((const)) double __ocml_nearbyint_f64(double); |
| __device__ __attribute__((const)) double __ocml_nextafter_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_len3_f64(double, double, |
| double); |
| __device__ __attribute__((const)) double __ocml_len4_f64(double, double, double, |
| double); |
| __device__ __attribute__((pure)) double __ocml_ncdf_f64(double); |
| __device__ __attribute__((pure)) double __ocml_ncdfinv_f64(double); |
| __device__ __attribute__((pure)) double __ocml_pow_f64(double, double); |
| __device__ __attribute__((pure)) double __ocml_pown_f64(double, int); |
| __device__ __attribute__((pure)) double __ocml_rcbrt_f64(double); |
| __device__ __attribute__((const)) double __ocml_remainder_f64(double, double); |
| __device__ double __ocml_remquo_f64(double, double, |
| __attribute__((address_space(5))) int *); |
| __device__ __attribute__((const)) double __ocml_rhypot_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_rint_f64(double); |
| __device__ __attribute__((const)) double __ocml_rlen3_f64(double, double, |
| double); |
| __device__ __attribute__((const)) double __ocml_rlen4_f64(double, double, |
| double, double); |
| __device__ __attribute__((const)) double __ocml_round_f64(double); |
| __device__ __attribute__((pure)) double __ocml_rsqrt_f64(double); |
| __device__ __attribute__((const)) double __ocml_scalb_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_scalbn_f64(double, int); |
| __device__ __attribute__((const)) int __ocml_signbit_f64(double); |
| __device__ double __ocml_sincos_f64(double, |
| __attribute__((address_space(5))) double *); |
| __device__ double |
| __ocml_sincospi_f64(double, __attribute__((address_space(5))) double *); |
| __device__ double __ocml_sin_f64(double); |
| __device__ __attribute__((pure)) double __ocml_sinh_f64(double); |
| __device__ double __ocml_sinpi_f64(double); |
| __device__ __attribute__((const)) double __ocml_sqrt_f64(double); |
| __device__ double __ocml_tan_f64(double); |
| __device__ __attribute__((pure)) double __ocml_tanh_f64(double); |
| __device__ double __ocml_tgamma_f64(double); |
| __device__ __attribute__((const)) double __ocml_trunc_f64(double); |
| __device__ double __ocml_y0_f64(double); |
| __device__ double __ocml_y1_f64(double); |
| |
| // BEGIN INTRINSICS |
| __device__ __attribute__((const)) double __ocml_add_rte_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_add_rtn_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_add_rtp_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_add_rtz_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_sub_rte_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_sub_rtn_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_sub_rtp_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_sub_rtz_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_mul_rte_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_mul_rtn_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_mul_rtp_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_mul_rtz_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_div_rte_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_div_rtn_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_div_rtp_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_div_rtz_f64(double, double); |
| __device__ __attribute__((const)) double __ocml_sqrt_rte_f64(double); |
| __device__ __attribute__((const)) double __ocml_sqrt_rtn_f64(double); |
| __device__ __attribute__((const)) double __ocml_sqrt_rtp_f64(double); |
| __device__ __attribute__((const)) double __ocml_sqrt_rtz_f64(double); |
| __device__ __attribute__((const)) double __ocml_fma_rte_f64(double, double, |
| double); |
| __device__ __attribute__((const)) double __ocml_fma_rtn_f64(double, double, |
| double); |
| __device__ __attribute__((const)) double __ocml_fma_rtp_f64(double, double, |
| double); |
| __device__ __attribute__((const)) double __ocml_fma_rtz_f64(double, double, |
| double); |
| |
| __device__ inline __attribute__((const)) double |
| __llvm_amdgcn_rcp_f64(double __x) { |
| return __builtin_amdgcn_rcp(__x); |
| } |
| __device__ inline __attribute__((const)) double |
| __llvm_amdgcn_rsq_f64(double __x) { |
| return __builtin_amdgcn_rsq(__x); |
| } |
| |
| __device__ __attribute__((const)) _Float16 __ocml_ceil_f16(_Float16); |
| __device__ _Float16 __ocml_cos_f16(_Float16); |
| __device__ __attribute__((pure)) _Float16 __ocml_exp_f16(_Float16); |
| __device__ __attribute__((pure)) _Float16 __ocml_exp10_f16(_Float16); |
| __device__ __attribute__((pure)) _Float16 __ocml_exp2_f16(_Float16); |
| __device__ __attribute__((const)) _Float16 __ocml_floor_f16(_Float16); |
| __device__ __attribute__((const)) _Float16 __ocml_fma_f16(_Float16, _Float16, |
| _Float16); |
| __device__ __attribute__((const)) _Float16 __ocml_fabs_f16(_Float16); |
| __device__ __attribute__((const)) int __ocml_isinf_f16(_Float16); |
| __device__ __attribute__((const)) int __ocml_isnan_f16(_Float16); |
| __device__ __attribute__((pure)) _Float16 __ocml_log_f16(_Float16); |
| __device__ __attribute__((pure)) _Float16 __ocml_log10_f16(_Float16); |
| __device__ __attribute__((pure)) _Float16 __ocml_log2_f16(_Float16); |
| __device__ __attribute__((const)) _Float16 __llvm_amdgcn_rcp_f16(_Float16); |
| __device__ __attribute__((const)) _Float16 __ocml_rint_f16(_Float16); |
| __device__ __attribute__((const)) _Float16 __ocml_rsqrt_f16(_Float16); |
| __device__ _Float16 __ocml_sin_f16(_Float16); |
| __device__ __attribute__((const)) _Float16 __ocml_sqrt_f16(_Float16); |
| __device__ __attribute__((const)) _Float16 __ocml_trunc_f16(_Float16); |
| __device__ __attribute__((pure)) _Float16 __ocml_pown_f16(_Float16, int); |
| |
| typedef _Float16 __2f16 __attribute__((ext_vector_type(2))); |
| typedef short __2i16 __attribute__((ext_vector_type(2))); |
| |
| __device__ __attribute__((const)) float __ockl_fdot2(__2f16 a, __2f16 b, |
| float c, bool s); |
| __device__ __attribute__((const)) __2f16 __ocml_ceil_2f16(__2f16); |
| __device__ __attribute__((const)) __2f16 __ocml_fabs_2f16(__2f16); |
| __device__ __2f16 __ocml_cos_2f16(__2f16); |
| __device__ __attribute__((pure)) __2f16 __ocml_exp_2f16(__2f16); |
| __device__ __attribute__((pure)) __2f16 __ocml_exp10_2f16(__2f16); |
| __device__ __attribute__((pure)) __2f16 __ocml_exp2_2f16(__2f16); |
| __device__ __attribute__((const)) __2f16 __ocml_floor_2f16(__2f16); |
| __device__ __attribute__((const)) |
| __2f16 __ocml_fma_2f16(__2f16, __2f16, __2f16); |
| __device__ __attribute__((const)) __2i16 __ocml_isinf_2f16(__2f16); |
| __device__ __attribute__((const)) __2i16 __ocml_isnan_2f16(__2f16); |
| __device__ __attribute__((pure)) __2f16 __ocml_log_2f16(__2f16); |
| __device__ __attribute__((pure)) __2f16 __ocml_log10_2f16(__2f16); |
| __device__ __attribute__((pure)) __2f16 __ocml_log2_2f16(__2f16); |
| __device__ inline __2f16 |
| __llvm_amdgcn_rcp_2f16(__2f16 __x) // Not currently exposed by ROCDL. |
| { |
| return (__2f16)(__llvm_amdgcn_rcp_f16(__x.x), __llvm_amdgcn_rcp_f16(__x.y)); |
| } |
| __device__ __attribute__((const)) __2f16 __ocml_rint_2f16(__2f16); |
| __device__ __attribute__((const)) __2f16 __ocml_rsqrt_2f16(__2f16); |
| __device__ __2f16 __ocml_sin_2f16(__2f16); |
| __device__ __attribute__((const)) __2f16 __ocml_sqrt_2f16(__2f16); |
| __device__ __attribute__((const)) __2f16 __ocml_trunc_2f16(__2f16); |
| __device__ __attribute__((const)) __2f16 __ocml_pown_2f16(__2f16, __2i16); |
| |
| #ifdef __cplusplus |
| } // extern "C" |
| #endif |
| |
| #endif // __CLANG_HIP_LIBDEVICE_DECLARES_H__ |