amd-builtins/math32/math32.h - libclc - Git at Google

 /*
  * Copyright (c) 2014 Advanced Micro Devices, Inc.
  *
  * Permission is hereby granted, free of charge, to any person obtaining a copy
  * of this software and associated documentation files (the "Software"), to deal
  * in the Software without restriction, including without limitation the rights
  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  * copies of the Software, and to permit persons to whom the Software is
  * furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice shall be included in
  * all copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
  * THE SOFTWARE.
  */
 #ifndef MATH32_H
 #define MATH32_H 1

 extern __attribute__((pure)) float  __amdil_copysign_f32(float, float);
 extern __attribute__((pure)) float  __amdil_fma_f32(float, float, float);
 extern __attribute__((pure)) float  __amdil_mad_f32(float, float, float);
 extern __attribute__((pure)) float  __amdil_min_f32(float, float);
 extern __attribute__((pure)) float  __amdil_max_f32(float, float);
 extern __attribute__((pure)) float  __ftz_f32(float);
 extern __attribute__((pure)) float  __amdil_round_nearest_f32(float);
 extern __attribute__((pure)) float  __amdil_round_neginf_f32(float);
 extern __attribute__((pure)) float  __amdil_round_posinf_f32(float);
 extern __attribute__((pure)) float  __amdil_round_zero_f32(float);
 extern __attribute__((pure)) float  __amdil_fabs_f32(float);
 extern __attribute__((pure)) float __amdil_improved_div_f32(float, float);
 extern __attribute__((pure)) float  __amdil_fraction_f32(float);
 extern __attribute__((pure)) uint  __amdil_cmov_logical_i32(uint,  uint,  uint);
 extern __attribute__((pure)) uint __amdil_is_asic_id_i32(uint);
 extern __attribute__((pure)) uint __amdil_is_constant_f32(float);

 #define SNAN 0x001
 #define QNAN 0x002
 #define NINF 0x004
 #define NNOR 0x008
 #define NSUB 0x010
 #define NZER 0x020
 #define PZER 0x040
 #define PSUB 0x080
 #define PNOR 0x100
 #define PINF 0x200

 extern __attribute__((pure)) int __amdil_class_f32(float, int);

 // HSA definitions for these macros
 #define HAVE_HW_FMA32() (1)
 #define HAVE_BITALIGN() (0)
 #define HAVE_FAST_FMA32() (0)


 // Allow control over how division is done
 #define MATH_DIVIDE(X, Y) native_divide(X, Y)
 // #define MATH_DIVIDE(X,Y) ((X) / (Y))
 #define MATH_RECIP(X) native_recip(X)
 // #define MATH_RECIP(X) (1.0f / (X))

 // Allow control over square root
 #define MATH_SQRT(X) native_sqrt(X)

 // Force a flush of a subnormal to zero by feeding it through a functional unit
 #define FTZ(X) __ftz_f32(X)

 // Table stuff
 #define TABLE_SPACE __constant

 #define TABLE_MANGLE(NAME) __math32_##NAME

 #define USE_TABLE(TYPE,PTR,NAME) \
     extern TABLE_SPACE TYPE TABLE_MANGLE(NAME) []; \
     TABLE_SPACE TYPE * PTR = TABLE_MANGLE(NAME)

 #define DECLARE_TABLE(TYPE,NAME,LENGTH,...) \
     TABLE_SPACE TYPE TABLE_MANGLE(NAME) [ LENGTH ] = { __VA_ARGS__ };

 /* These definitions, used by float functions,
    are for both 32 and 64 bit machines */
 #define SIGNBIT_SP32      0x80000000
 #define EXSIGNBIT_SP32    0x7fffffff
 #define EXPBITS_SP32      0x7f800000
 #define MANTBITS_SP32     0x007fffff
 #define ONEEXPBITS_SP32   0x3f800000
 #define TWOEXPBITS_SP32   0x40000000
 #define HALFEXPBITS_SP32  0x3f000000
 #define IMPBIT_SP32       0x00800000
 #define QNANBITPATT_SP32  0x7fc00000
 #define INDEFBITPATT_SP32 0xffc00000
 #define PINFBITPATT_SP32  0x7f800000
 #define NINFBITPATT_SP32  0xff800000
 #define EXPBIAS_SP32      127
 #define EXPSHIFTBITS_SP32 23
 #define BIASEDEMIN_SP32   1
 #define EMIN_SP32         -126
 #define BIASEDEMAX_SP32   254
 #define EMAX_SP32         127
 #define LAMBDA_SP32       1.0e30
 #define MANTLENGTH_SP32   24
 #define BASEDIGITS_SP32   7

 #define ALIGNED(x)	__attribute__((aligned(x)))

 // Workaround a bug in the Apple linker that prevents inlining of large,
 // frequently-used static functions that only have the inline attribute.
 // Force all inline functions to be always_inlined.
 #ifdef USE_APPLE
 #define inline __attribute__((always_inline))
 #endif

 #endif /* MATH32_H */
	/*
	* Copyright (c) 2014 Advanced Micro Devices, Inc.
	*
	* Permission is hereby granted, free of charge, to any person obtaining a copy
	* of this software and associated documentation files (the "Software"), to deal
	* in the Software without restriction, including without limitation the rights
	* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
	* copies of the Software, and to permit persons to whom the Software is
	* furnished to do so, subject to the following conditions:
	*
	* The above copyright notice and this permission notice shall be included in
	* all copies or substantial portions of the Software.
	*
	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
	* THE SOFTWARE.
	*/
	#ifndef MATH32_H
	#define MATH32_H 1

	extern __attribute__((pure)) float __amdil_copysign_f32(float, float);
	extern __attribute__((pure)) float __amdil_fma_f32(float, float, float);
	extern __attribute__((pure)) float __amdil_mad_f32(float, float, float);
	extern __attribute__((pure)) float __amdil_min_f32(float, float);
	extern __attribute__((pure)) float __amdil_max_f32(float, float);
	extern __attribute__((pure)) float __ftz_f32(float);
	extern __attribute__((pure)) float __amdil_round_nearest_f32(float);
	extern __attribute__((pure)) float __amdil_round_neginf_f32(float);
	extern __attribute__((pure)) float __amdil_round_posinf_f32(float);
	extern __attribute__((pure)) float __amdil_round_zero_f32(float);
	extern __attribute__((pure)) float __amdil_fabs_f32(float);
	extern __attribute__((pure)) float __amdil_improved_div_f32(float, float);
	extern __attribute__((pure)) float __amdil_fraction_f32(float);
	extern __attribute__((pure)) uint __amdil_cmov_logical_i32(uint, uint, uint);
	extern __attribute__((pure)) uint __amdil_is_asic_id_i32(uint);
	extern __attribute__((pure)) uint __amdil_is_constant_f32(float);

	#define SNAN 0x001
	#define QNAN 0x002
	#define NINF 0x004
	#define NNOR 0x008
	#define NSUB 0x010
	#define NZER 0x020
	#define PZER 0x040
	#define PSUB 0x080
	#define PNOR 0x100
	#define PINF 0x200

	extern __attribute__((pure)) int __amdil_class_f32(float, int);

	// HSA definitions for these macros
	#define HAVE_HW_FMA32() (1)
	#define HAVE_BITALIGN() (0)
	#define HAVE_FAST_FMA32() (0)


	// Allow control over how division is done
	#define MATH_DIVIDE(X, Y) native_divide(X, Y)
	// #define MATH_DIVIDE(X,Y) ((X) / (Y))
	#define MATH_RECIP(X) native_recip(X)
	// #define MATH_RECIP(X) (1.0f / (X))

	// Allow control over square root
	#define MATH_SQRT(X) native_sqrt(X)

	// Force a flush of a subnormal to zero by feeding it through a functional unit
	#define FTZ(X) __ftz_f32(X)

	// Table stuff
	#define TABLE_SPACE __constant

	#define TABLE_MANGLE(NAME) __math32_##NAME

	#define USE_TABLE(TYPE,PTR,NAME) \
	extern TABLE_SPACE TYPE TABLE_MANGLE(NAME) []; \
	TABLE_SPACE TYPE * PTR = TABLE_MANGLE(NAME)

	#define DECLARE_TABLE(TYPE,NAME,LENGTH,...) \
	TABLE_SPACE TYPE TABLE_MANGLE(NAME) [ LENGTH ] = { __VA_ARGS__ };

	/* These definitions, used by float functions,
	are for both 32 and 64 bit machines */
	#define SIGNBIT_SP32 0x80000000
	#define EXSIGNBIT_SP32 0x7fffffff
	#define EXPBITS_SP32 0x7f800000
	#define MANTBITS_SP32 0x007fffff
	#define ONEEXPBITS_SP32 0x3f800000
	#define TWOEXPBITS_SP32 0x40000000
	#define HALFEXPBITS_SP32 0x3f000000
	#define IMPBIT_SP32 0x00800000
	#define QNANBITPATT_SP32 0x7fc00000
	#define INDEFBITPATT_SP32 0xffc00000
	#define PINFBITPATT_SP32 0x7f800000
	#define NINFBITPATT_SP32 0xff800000
	#define EXPBIAS_SP32 127
	#define EXPSHIFTBITS_SP32 23
	#define BIASEDEMIN_SP32 1
	#define EMIN_SP32 -126
	#define BIASEDEMAX_SP32 254
	#define EMAX_SP32 127
	#define LAMBDA_SP32 1.0e30
	#define MANTLENGTH_SP32 24
	#define BASEDIGITS_SP32 7

	#define ALIGNED(x) __attribute__((aligned(x)))

	// Workaround a bug in the Apple linker that prevents inlining of large,
	// frequently-used static functions that only have the inline attribute.
	// Force all inline functions to be always_inlined.
	#ifdef USE_APPLE
	#define inline __attribute__((always_inline))
	#endif

	#endif /* MATH32_H */