blob: f3649d52e0091154a9ce786e7daf8f1ab98a8154 [file] [log] [blame]
// RUN: %clang_cc1 %s -emit-llvm -o - -triple spir-unknown-unknown | FileCheck --check-prefix=CHECK --check-prefix=NODIVOPT %s
// RUN: %clang_cc1 %s -emit-llvm -o - -triple spir-unknown-unknown -cl-fp32-correctly-rounded-divide-sqrt | FileCheck --check-prefix=CHECK --check-prefix=DIVOPT %s
// RUN: %clang_cc1 %s -emit-llvm -o - -DNOFP64 -cl-std=CL1.2 -triple r600-unknown-unknown -target-cpu r600 -pedantic | FileCheck --check-prefix=CHECK-FLT %s
// RUN: %clang_cc1 %s -emit-llvm -o - -DFP64 -cl-std=CL1.2 -triple spir-unknown-unknown -pedantic | FileCheck --check-prefix=CHECK-DBL %s
typedef __attribute__(( ext_vector_type(4) )) float float4;
float spscalardiv(float a, float b) {
// CHECK: @spscalardiv
// CHECK: fdiv{{.*}},
// NODIVOPT: !fpmath ![[MD_FDIV:[0-9]+]]
// DIVOPT-NOT: !fpmath !{{[0-9]+}}
return a / b;
}
float4 spvectordiv(float4 a, float4 b) {
// CHECK: @spvectordiv
// CHECK: fdiv{{.*}},
// NODIVOPT: !fpmath ![[MD_FDIV]]
// DIVOPT-NOT: !fpmath !{{[0-9]+}}
return a / b;
}
float spscalarsqrt(float a) {
// CHECK-LABEL: @spscalarsqrt
// NODIVOPT: call float @llvm.sqrt.f32(float %{{.+}}), !fpmath ![[MD_SQRT:[0-9]+]]
// DIVOPT: call float @llvm.sqrt.f32(float %{{.+}}){{$}}
return __builtin_sqrtf(a);
}
float elementwise_sqrt_f32(float a) {
// CHECK-LABEL: @elementwise_sqrt_f32
// NODIVOPT: call float @llvm.sqrt.f32(float %{{.+}}), !fpmath ![[MD_SQRT:[0-9]+]]
// DIVOPT: call float @llvm.sqrt.f32(float %{{.+}}){{$}}
return __builtin_elementwise_sqrt(a);
}
float4 elementwise_sqrt_v4f32(float4 a) {
// CHECK-LABEL: @elementwise_sqrt_v4f32
// NODIVOPT: call <4 x float> @llvm.sqrt.v4f32(<4 x float> %{{.+}}), !fpmath ![[MD_SQRT:[0-9]+]]
// DIVOPT: call <4 x float> @llvm.sqrt.v4f32(<4 x float> %{{.+}}){{$}}
return __builtin_elementwise_sqrt(a);
}
#if __OPENCL_C_VERSION__ >=120
void printf(constant char* fmt, ...);
void testdbllit(long *val) {
// CHECK-FLT: float noundef 2.000000e+01
// CHECK-DBL: double noundef 2.000000e+01
printf("%f", 20.0);
}
#endif
#ifndef NOFP64
#pragma OPENCL EXTENSION cl_khr_fp64 : enable
typedef __attribute__(( ext_vector_type(4) )) double double4;
double dpscalardiv(double a, double b) {
// CHECK: @dpscalardiv
// CHECK-NOT: !fpmath
return a / b;
}
double4 dpvectordiv(double4 a, double4 b) {
// CHECK: @dpvectordiv
// CHECK-NOT: !fpmath
return a / b;
}
double dpscalarsqrt(double a) {
// CHECK-LABEL: @dpscalarsqrt
// CHECK: call double @llvm.sqrt.f64(double %{{.+}}){{$}}
return __builtin_sqrt(a);
}
double elementwise_sqrt_f64(double a) {
// CHECK-LABEL: @elementwise_sqrt_f64
// CHECK: call double @llvm.sqrt.f64(double %{{.+}}){{$}}
return __builtin_elementwise_sqrt(a);
}
double4 elementwise_sqrt_v4f64(double4 a) {
// CHECK-LABEL: @elementwise_sqrt_v4f64
// CHECK: call <4 x double> @llvm.sqrt.v4f64(<4 x double> %{{.+}}){{$}}
return __builtin_elementwise_sqrt(a);
}
#endif
// NODIVOPT: ![[MD_FDIV]] = !{float 2.500000e+00}
// NODIVOPT: ![[MD_SQRT]] = !{float 3.000000e+00}