blob: 95403aecae9bd902b4a58f67581e50803f5dcea6 [file] [log] [blame] [edit]
// REQUIRES: x86-registered-target
// RUN: %clang_cc1 -x c -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -emit-llvm -o - -Wall -Werror | FileCheck %s --check-prefix=UNCONSTRAINED --check-prefix=COMMON
// RUN: %clang_cc1 -x c -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -ffp-exception-behavior=maytrap -DSTRICT=1 -emit-llvm -o - -Wall -Werror | FileCheck %s --check-prefix=CONSTRAINED --check-prefix=COMMON
// RUN: %clang_cc1 -x c -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -S -o - -Wall -Werror | FileCheck %s --check-prefix=CHECK-ASM --check-prefix=COMMON
// RUN: %clang_cc1 -x c -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -ffp-exception-behavior=maytrap -DSTRICT=1 -S -o - -Wall -Werror | FileCheck %s --check-prefix=CHECK-ASM --check-prefix=COMMON
// RUN: %clang_cc1 -x c++ -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -emit-llvm -o - -Wall -Werror | FileCheck %s --check-prefix=UNCONSTRAINED --check-prefix=COMMON
// RUN: %clang_cc1 -x c++ -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -ffp-exception-behavior=maytrap -DSTRICT=1 -emit-llvm -o - -Wall -Werror | FileCheck %s --check-prefix=CONSTRAINED --check-prefix=COMMON
// RUN: %clang_cc1 -x c++ -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -S -o - -Wall -Werror | FileCheck %s --check-prefix=CHECK-ASM --check-prefix=COMMON
// RUN: %clang_cc1 -x c++ -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -ffp-exception-behavior=maytrap -DSTRICT=1 -S -o - -Wall -Werror | FileCheck %s --check-prefix=CHECK-ASM --check-prefix=COMMON
#ifdef STRICT
// Test that the constrained intrinsics are picking up the exception
// metadata from the AST instead of the global default from the command line.
#pragma float_control(except, on)
#endif
#include <immintrin.h>
__m128h test_mm_sqrt_sh(__m128h x, __m128h y) {
// COMMON-LABEL: test_mm_sqrt_sh
// UNCONSTRAINED: call {{.*}}half @llvm.sqrt.f16(half {{.*}})
// CONSTRAINED: call {{.*}}half @llvm.experimental.constrained.sqrt.f16(half {{.*}}, metadata !{{.*}})
// CHECK-ASM: vsqrtsh %xmm{{.*}},
return _mm_sqrt_sh(x, y);
}
__m128h test_mm_mask_sqrt_sh(__m128h __W, __mmask8 __U, __m128h __A, __m128h __B){
// COMMON-LABEL: test_mm_mask_sqrt_sh
// COMMONIR: extractelement <8 x half> %{{.*}}, i64 0
// UNCONSTRAINED: call {{.*}}half @llvm.sqrt.f16(half %{{.*}})
// CONSTRAINED: call {{.*}}half @llvm.experimental.constrained.sqrt.f16(half %{{.*}}, metadata !{{.*}})
// CHECK-ASM: vsqrtsh %xmm{{.*}},
// COMMONIR-NEXT: extractelement <8 x half> %{{.*}}, i64 0
// COMMONIR-NEXT: bitcast i8 %{{.*}} to <8 x i1>
// COMMONIR-NEXT: extractelement <8 x i1> %{{.*}}, i64 0
// COMMONIR-NEXT: select i1 {{.*}}, half {{.*}}, half {{.*}}
// COMMONIR-NEXT: insertelement <8 x half> %{{.*}}, half {{.*}}, i64 0
return _mm_mask_sqrt_sh(__W,__U,__A,__B);
}
__m128h test_mm_maskz_sqrt_sh(__mmask8 __U, __m128h __A, __m128h __B){
// COMMON-LABEL: test_mm_maskz_sqrt_sh
// COMMONIR: extractelement <2 x half> %{{.*}}, i64 0
// UNCONSTRAINED: call {{.*}}half @llvm.sqrt.f16(half %{{.*}})
// CONSTRAINED: call {{.*}}half @llvm.experimental.constrained.sqrt.f16(half %{{.*}}, metadata !{{.*}})
// CHECK-ASM: vsqrtsh %xmm{{.*}},
// COMMONIR-NEXT: extractelement <2 x half> %{{.*}}, i64 0
// COMMONIR-NEXT: bitcast i8 %{{.*}} to <8 x i1>
// COMMONIR-NEXT: extractelement <8 x i1> %{{.*}}, i64 0
// COMMONIR-NEXT: select i1 {{.*}}, half {{.*}}, half {{.*}}
// COMMONIR-NEXT: insertelement <2 x half> %{{.*}}, half {{.*}}, i64 0
return _mm_maskz_sqrt_sh(__U,__A,__B);
}
__m512h test_mm512_sqrt_ph(__m512h x) {
// COMMON-LABEL: test_mm512_sqrt_ph
// UNCONSTRAINED: call {{.*}}<32 x half> @llvm.sqrt.v32f16(<32 x half> {{.*}})
// CONSTRAINED: call {{.*}}<32 x half> @llvm.experimental.constrained.sqrt.v32f16(<32 x half> {{.*}}, metadata !{{.*}})
// CHECK-ASM: vsqrtph %zmm{{.*}},
return _mm512_sqrt_ph(x);
}
__m512h test_mm512_mask_sqrt_ph (__m512h __W, __mmask32 __U, __m512h __A)
{
// COMMON-LABEL: test_mm512_mask_sqrt_ph
// UNCONSTRAINED: call {{.*}}<32 x half> @llvm.sqrt.v32f16(<32 x half> %{{.*}})
// CONSTRAINED: call {{.*}}<32 x half> @llvm.experimental.constrained.sqrt.v32f16(<32 x half> %{{.*}}, metadata !{{.*}})
// CHECK-ASM: vsqrtph %zmm{{.*}},
// COMMONIR: bitcast i32 %{{.*}} to <32 x i1>
// COMMONIR: select <32 x i1> %{{.*}}, <32 x half> %{{.*}}, <32 x half> %{{.*}}
return _mm512_mask_sqrt_ph (__W,__U,__A);
}
__m512h test_mm512_maskz_sqrt_ph (__mmask32 __U, __m512h __A)
{
// COMMON-LABEL: test_mm512_maskz_sqrt_ph
// UNCONSTRAINED: call {{.*}}<32 x half> @llvm.sqrt.v32f16(<32 x half> %{{.*}})
// CONSTRAINED: call {{.*}}<32 x half> @llvm.experimental.constrained.sqrt.v32f16(<32 x half> %{{.*}}, metadata !{{.*}})
// CHECK-ASM: vsqrtph %zmm{{.*}},
// COMMONIR: bitcast i32 %{{.*}} to <32 x i1>
// COMMONIR: select <32 x i1> %{{.*}}, <32 x half> %{{.*}}, <32 x half> {{.*}}
return _mm512_maskz_sqrt_ph (__U,__A);
}