src/__support/FPUtil/x86_64/sqrt.h - llvm-project/libc - Git at Google

 //===-- Square root of IEEE 754 floating point numbers ----------*- C++ -*-===//
 //
 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 // See https://llvm.org/LICENSE.txt for license information.
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 //
 //===----------------------------------------------------------------------===//

 #ifndef LLVM_LIBC_SRC___SUPPORT_FPUTIL_X86_64_SQRT_H
 #define LLVM_LIBC_SRC___SUPPORT_FPUTIL_X86_64_SQRT_H

 #include "src/__support/common.h"
 #include "src/__support/macros/properties/architectures.h"
 #include "src/__support/macros/properties/cpu_features.h"

 #if !(defined(LIBC_TARGET_ARCH_IS_X86_64) && defined(LIBC_TARGET_CPU_HAS_SSE2))
 #error "sqrtss / sqrtsd need SSE2"
 #endif

 #include "src/__support/FPUtil/generic/sqrt.h"

 namespace LIBC_NAMESPACE {
 namespace fputil {

 // Explicit specialization of fputil::sqrt for float.
 // Issues a single scalar single-precision SSE square-root instruction
 // (sqrtss) and returns the value it leaves in the destination register.
 template <> LIBC_INLINE float sqrt<float>(float x) {
   float root;
   // The "x" constraints request SSE registers for both operands; the asm is
   // marked volatile, as in the other specializations in this header.
   __asm__ __volatile__("sqrtss %x[src], %x[dst]"
                        : [dst] "=x"(root)
                        : [src] "x"(x));
   return root;
 }

 // Explicit specialization of fputil::sqrt for double.
 // Issues a single scalar double-precision SSE2 square-root instruction
 // (sqrtsd) and returns the value it leaves in the destination register.
 template <> LIBC_INLINE double sqrt<double>(double x) {
   double root;
   // Input and output are both constrained ("x") to SSE registers.
   __asm__ __volatile__("sqrtsd %x[src], %x[dst]"
                        : [dst] "=x"(root)
                        : [src] "x"(x));
   return root;
 }

 #ifdef LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64
 // Explicit specialization of fputil::sqrt for long double, compiled only when
 // LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64 is defined. It uses the same scalar
 // double-precision instruction (sqrtsd) as the double specialization.
 template <> LIBC_INLINE long double sqrt<long double>(long double x) {
   long double root;
   // Input and output are both constrained ("x") to SSE registers.
   __asm__ __volatile__("sqrtsd %x[src], %x[dst]"
                        : [dst] "=x"(root)
                        : [src] "x"(x));
   return root;
 }
 #else
 // Explicit specialization of fputil::sqrt for long double, compiled when
 // LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64 is not defined. Uses the x87 fsqrt
 // instruction, which replaces its operand with the square root in place.
 template <> LIBC_INLINE long double sqrt<long double>(long double x) {
   long double st0 = x;
   // "+t" marks the operand as read-write and pins it to the top of the x87
   // register stack, which is where fsqrt reads and writes.
   __asm__ __volatile__("fsqrt" : "+t"(st0));
   return st0;
 }
 #endif

 } // namespace fputil
 } // namespace LIBC_NAMESPACE

 #endif // LLVM_LIBC_SRC___SUPPORT_FPUTIL_X86_64_SQRT_H
	//===-- Square root of IEEE 754 floating point numbers ----------*- C++ -*-===//
	//
	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
	// See https://llvm.org/LICENSE.txt for license information.
	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
	//
	//===----------------------------------------------------------------------===//

	#ifndef LLVM_LIBC_SRC___SUPPORT_FPUTIL_X86_64_SQRT_H
	#define LLVM_LIBC_SRC___SUPPORT_FPUTIL_X86_64_SQRT_H

	#include "src/__support/common.h"
	#include "src/__support/macros/properties/architectures.h"
	#include "src/__support/macros/properties/cpu_features.h"

	#if !(defined(LIBC_TARGET_ARCH_IS_X86_64) && defined(LIBC_TARGET_CPU_HAS_SSE2))
	#error "sqrtss / sqrtsd need SSE2"
	#endif

	#include "src/__support/FPUtil/generic/sqrt.h"

	namespace LIBC_NAMESPACE {
	namespace fputil {

	// Explicit specialization of fputil::sqrt for float.
	// Computes the result with one scalar single-precision SSE instruction
	// (sqrtss); both asm operands are constrained ("x") to SSE registers.
	template <> LIBC_INLINE float sqrt<float>(float x) {
	  float root;
	  __asm__ __volatile__("sqrtss %x[src], %x[dst]"
	                       : [dst] "=x"(root)
	                       : [src] "x"(x));
	  return root;
	}

	// Explicit specialization of fputil::sqrt for double.
	// Computes the result with one scalar double-precision SSE2 instruction
	// (sqrtsd); both asm operands are constrained ("x") to SSE registers.
	template <> LIBC_INLINE double sqrt<double>(double x) {
	  double root;
	  __asm__ __volatile__("sqrtsd %x[src], %x[dst]"
	                       : [dst] "=x"(root)
	                       : [src] "x"(x));
	  return root;
	}

	#ifdef LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64
	// Explicit specialization of fputil::sqrt for long double, compiled only
	// when LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64 is defined. Uses the scalar
	// double-precision instruction (sqrtsd) with SSE-register operands.
	template <> LIBC_INLINE long double sqrt<long double>(long double x) {
	  long double root;
	  __asm__ __volatile__("sqrtsd %x[src], %x[dst]"
	                       : [dst] "=x"(root)
	                       : [src] "x"(x));
	  return root;
	}
	#else
	// Explicit specialization of fputil::sqrt for long double, compiled when
	// LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64 is not defined. Uses the x87 fsqrt
	// instruction on a read-write operand held at the top of the x87 stack.
	template <> LIBC_INLINE long double sqrt<long double>(long double x) {
	  long double st0 = x;
	  // "+t": operand is both input and output and lives in st(0).
	  __asm__ __volatile__("fsqrt" : "+t"(st0));
	  return st0;
	}
	#endif

	} // namespace fputil
	} // namespace LIBC_NAMESPACE

	#endif // LLVM_LIBC_SRC___SUPPORT_FPUTIL_X86_64_SQRT_H