clang/lib/Headers/avx512erintrin.h - llvm-project - Git at Google

 /*===---- avx512fintrin.h - AVX2 intrinsics -----------------------------------===
  *
  * Permission is hereby granted, free of charge, to any person obtaining a copy
  * of this software and associated documentation files (the "Software"), to deal
  * in the Software without restriction, including without limitation the rights
  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  * copies of the Software, and to permit persons to whom the Software is
  * furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice shall be included in
  * all copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
  * THE SOFTWARE.
  *
  *===-----------------------------------------------------------------------===
  */
 #ifndef __IMMINTRIN_H
 #error "Never use <avx512erintrin.h> directly; include <immintrin.h> instead."
 #endif

 #ifndef __AVX512ERINTRIN_H
 #define __AVX512ERINTRIN_H


 // rsqrt28
 static  __inline__ __m512d __attribute__((__always_inline__, __nodebug__))
 _mm512_rsqrt28_round_pd (__m512d __A, int __R)
 {
   return (__m512d)__builtin_ia32_rsqrt28pd_mask ((__v8df)__A,
                                                  (__v8df)_mm512_setzero_pd(),
                                                  (__mmask8)-1,
                                                  __R);
 }
 static  __inline__ __m512 __attribute__((__always_inline__, __nodebug__))
 _mm512_rsqrt28_round_ps(__m512 __A, int __R)
 {
   return (__m512)__builtin_ia32_rsqrt28ps_mask ((__v16sf)__A,
                                                 (__v16sf)_mm512_setzero_ps(),
                                                 (__mmask16)-1,
                                                 __R);
 }

 static  __inline__ __m128 __attribute__((__always_inline__, __nodebug__))
 _mm_rsqrt28_round_ss(__m128 __A, __m128 __B, int __R)
 {
   return (__m128) __builtin_ia32_rsqrt28ss_mask ((__v4sf) __A,
              (__v4sf) __B,
              (__v4sf)
              _mm_setzero_ps (),
              (__mmask8) -1,
              __R);
 }

 static  __inline__ __m128d __attribute__((__always_inline__, __nodebug__))
 _mm_rsqrt28_round_sd (__m128d __A, __m128d __B, int __R)
 {
   return (__m128d) __builtin_ia32_rsqrt28sd_mask ((__v2df) __A,
               (__v2df) __B,
               (__v2df)
               _mm_setzero_pd (),
               (__mmask8) -1,
              __R);
 }


 // rcp28
 static  __inline__ __m512d __attribute__((__always_inline__, __nodebug__))
 _mm512_rcp28_round_pd (__m512d __A, int __R)
 {
   return (__m512d)__builtin_ia32_rcp28pd_mask ((__v8df)__A,
                                                (__v8df)_mm512_setzero_pd(),
                                                (__mmask8)-1,
                                                __R);
 }

 static  __inline__ __m512 __attribute__((__always_inline__, __nodebug__))
 _mm512_rcp28_round_ps (__m512 __A, int __R)
 {
   return (__m512)__builtin_ia32_rcp28ps_mask ((__v16sf)__A,
                                               (__v16sf)_mm512_setzero_ps (),
                                               (__mmask16)-1,
                                               __R);
 }

 static  __inline__ __m128 __attribute__((__always_inline__, __nodebug__))
 _mm_rcp28_round_ss (__m128 __A, __m128 __B, int __R)
 {
   return (__m128) __builtin_ia32_rcp28ss_mask ((__v4sf) __A,
              (__v4sf) __B,
              (__v4sf)
              _mm_setzero_ps (),
              (__mmask8) -1,
              __R);
 }
 static  __inline__ __m128d __attribute__((__always_inline__, __nodebug__))
 _mm_rcp28_round_sd (__m128d __A, __m128d __B, int __R)
 {
   return (__m128d) __builtin_ia32_rcp28sd_mask ((__v2df) __A,
               (__v2df) __B,
               (__v2df)
               _mm_setzero_pd (),
               (__mmask8) -1,
              __R);
 }

 #endif // __AVX512ERINTRIN_H
	/*===---- avx512fintrin.h - AVX2 intrinsics -----------------------------------===
	*
	* Permission is hereby granted, free of charge, to any person obtaining a copy
	* of this software and associated documentation files (the "Software"), to deal
	* in the Software without restriction, including without limitation the rights
	* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
	* copies of the Software, and to permit persons to whom the Software is
	* furnished to do so, subject to the following conditions:
	*
	* The above copyright notice and this permission notice shall be included in
	* all copies or substantial portions of the Software.
	*
	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
	* THE SOFTWARE.
	*
	*===-----------------------------------------------------------------------===
	*/
	#ifndef __IMMINTRIN_H
	#error "Never use <avx512erintrin.h> directly; include <immintrin.h> instead."
	#endif

	#ifndef __AVX512ERINTRIN_H
	#define __AVX512ERINTRIN_H


	// rsqrt28
	static __inline__ __m512d __attribute__((__always_inline__, __nodebug__))
	_mm512_rsqrt28_round_pd (__m512d __A, int __R)
	{
	return (__m512d)__builtin_ia32_rsqrt28pd_mask ((__v8df)__A,
	(__v8df)_mm512_setzero_pd(),
	(__mmask8)-1,
	__R);
	}
	static __inline__ __m512 __attribute__((__always_inline__, __nodebug__))
	_mm512_rsqrt28_round_ps(__m512 __A, int __R)
	{
	return (__m512)__builtin_ia32_rsqrt28ps_mask ((__v16sf)__A,
	(__v16sf)_mm512_setzero_ps(),
	(__mmask16)-1,
	__R);
	}

	static __inline__ __m128 __attribute__((__always_inline__, __nodebug__))
	_mm_rsqrt28_round_ss(__m128 __A, __m128 __B, int __R)
	{
	return (__m128) __builtin_ia32_rsqrt28ss_mask ((__v4sf) __A,
	(__v4sf) __B,
	(__v4sf)
	_mm_setzero_ps (),
	(__mmask8) -1,
	__R);
	}

	static __inline__ __m128d __attribute__((__always_inline__, __nodebug__))
	_mm_rsqrt28_round_sd (__m128d __A, __m128d __B, int __R)
	{
	return (__m128d) __builtin_ia32_rsqrt28sd_mask ((__v2df) __A,
	(__v2df) __B,
	(__v2df)
	_mm_setzero_pd (),
	(__mmask8) -1,
	__R);
	}


	// rcp28
	static __inline__ __m512d __attribute__((__always_inline__, __nodebug__))
	_mm512_rcp28_round_pd (__m512d __A, int __R)
	{
	return (__m512d)__builtin_ia32_rcp28pd_mask ((__v8df)__A,
	(__v8df)_mm512_setzero_pd(),
	(__mmask8)-1,
	__R);
	}

	static __inline__ __m512 __attribute__((__always_inline__, __nodebug__))
	_mm512_rcp28_round_ps (__m512 __A, int __R)
	{
	return (__m512)__builtin_ia32_rcp28ps_mask ((__v16sf)__A,
	(__v16sf)_mm512_setzero_ps (),
	(__mmask16)-1,
	__R);
	}

	static __inline__ __m128 __attribute__((__always_inline__, __nodebug__))
	_mm_rcp28_round_ss (__m128 __A, __m128 __B, int __R)
	{
	return (__m128) __builtin_ia32_rcp28ss_mask ((__v4sf) __A,
	(__v4sf) __B,
	(__v4sf)
	_mm_setzero_ps (),
	(__mmask8) -1,
	__R);
	}
	static __inline__ __m128d __attribute__((__always_inline__, __nodebug__))
	_mm_rcp28_round_sd (__m128d __A, __m128d __B, int __R)
	{
	return (__m128d) __builtin_ia32_rcp28sd_mask ((__v2df) __A,
	(__v2df) __B,
	(__v2df)
	_mm_setzero_pd (),
	(__mmask8) -1,
	__R);
	}

	#endif // __AVX512ERINTRIN_H