| ; RUN: llc -O3 -mtriple=x86_64-pc-linux < %s | FileCheck --check-prefix=COMMON --check-prefix=NO-FMA --check-prefix=FMACALL64 --check-prefix=FMACALL32 %s |
| ; RUN: llc -O3 -mtriple=x86_64-pc-linux -mattr=+fma < %s | FileCheck -check-prefix=COMMON --check-prefix=HAS-FMA --check-prefix=FMA64 --check-prefix=FMA32 %s |
| |
| ; Verify that constants aren't folded to inexact results when the rounding mode |
| ; is unknown. |
| ; |
| ; double f1() { |
| ; // Because 0.1 cannot be represented exactly, this shouldn't be folded. |
| ; return 1.0/10.0; |
| ; } |
| ; |
| ; CHECK-LABEL: f1 |
| ; COMMON: divsd |
| define double @f1() #0 { |
| entry: |
| %div = call double @llvm.experimental.constrained.fdiv.f64( |
| double 1.000000e+00, |
| double 1.000000e+01, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %div |
| } |
| |
| ; Verify that 'a - 0' isn't simplified to 'a' when the rounding mode is unknown. |
| ; |
| ; double f2(double a) { |
| ; // Because the result of '0 - 0' is negative zero if rounding mode is |
| ; // downward, this shouldn't be simplified. |
| ; return a - 0; |
| ; } |
| ; |
| ; CHECK-LABEL: f2 |
| ; COMMON: subsd |
| define double @f2(double %a) #0 { |
| entry: |
| %sub = call double @llvm.experimental.constrained.fsub.f64( |
| double %a, |
| double 0.000000e+00, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %sub |
| } |
| |
| ; Verify that '-((-a)*b)' isn't simplified to 'a*b' when the rounding mode is |
| ; unknown. |
| ; |
| ; double f3(double a, double b) { |
| ; // Because the intermediate value involved in this calculation may require |
| ; // rounding, this shouldn't be simplified. |
| ; return -((-a)*b); |
| ; } |
| ; |
| ; CHECK-LABEL: f3: |
| ; COMMON: subsd |
| ; COMMON: mulsd |
| ; COMMON: subsd |
| define double @f3(double %a, double %b) #0 { |
| entry: |
| %sub = call double @llvm.experimental.constrained.fsub.f64( |
| double -0.000000e+00, double %a, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| %mul = call double @llvm.experimental.constrained.fmul.f64( |
| double %sub, double %b, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| %ret = call double @llvm.experimental.constrained.fsub.f64( |
| double -0.000000e+00, |
| double %mul, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %ret |
| } |
| |
| ; Verify that FP operations are not performed speculatively when FP exceptions |
| ; are not being ignored. |
| ; |
| ; double f4(int n, double a) { |
| ; // Because a + 1 may overflow, this should not be simplified. |
| ; if (n > 0) |
| ; return a + 1.0; |
| ; return a; |
| ; } |
| ; |
| ; |
| ; CHECK-LABEL: f4: |
| ; COMMON: testl |
| ; COMMON: jle |
| ; COMMON: addsd |
| define double @f4(i32 %n, double %a) #0 { |
| entry: |
| %cmp = icmp sgt i32 %n, 0 |
| br i1 %cmp, label %if.then, label %if.end |
| |
| if.then: |
| %add = call double @llvm.experimental.constrained.fadd.f64( |
| double 1.000000e+00, double %a, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| br label %if.end |
| |
| if.end: |
| %a.0 = phi double [%add, %if.then], [ %a, %entry ] |
| ret double %a.0 |
| } |
| |
| ; Verify that sqrt(42.0) isn't simplified when the rounding mode is unknown. |
| ; CHECK-LABEL: f5 |
| ; COMMON: sqrtsd |
| define double @f5() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.sqrt.f64(double 42.0, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that pow(42.1, 3.0) isn't simplified when the rounding mode is unknown. |
| ; CHECK-LABEL: f6 |
| ; COMMON: pow |
| define double @f6() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.pow.f64(double 42.1, |
| double 3.0, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that powi(42.1, 3) isn't simplified when the rounding mode is unknown. |
| ; CHECK-LABEL: f7 |
| ; COMMON: powi |
| define double @f7() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.powi.f64(double 42.1, |
| i32 3, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that sin(42.0) isn't simplified when the rounding mode is unknown. |
| ; CHECK-LABEL: f8 |
| ; COMMON: sin |
| define double @f8() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.sin.f64(double 42.0, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that cos(42.0) isn't simplified when the rounding mode is unknown. |
| ; CHECK-LABEL: f9 |
| ; COMMON: cos |
| define double @f9() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.cos.f64(double 42.0, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that exp(42.0) isn't simplified when the rounding mode is unknown. |
| ; CHECK-LABEL: f10 |
| ; COMMON: exp |
| define double @f10() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.exp.f64(double 42.0, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that exp2(42.1) isn't simplified when the rounding mode is unknown. |
| ; CHECK-LABEL: f11 |
| ; COMMON: exp2 |
| define double @f11() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.exp2.f64(double 42.1, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that log(42.0) isn't simplified when the rounding mode is unknown. |
| ; CHECK-LABEL: f12 |
| ; COMMON: log |
| define double @f12() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.log.f64(double 42.0, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that log10(42.0) isn't simplified when the rounding mode is unknown. |
| ; CHECK-LABEL: f13 |
| ; COMMON: log10 |
| define double @f13() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.log10.f64(double 42.0, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that log2(42.0) isn't simplified when the rounding mode is unknown. |
| ; CHECK-LABEL: f14 |
| ; COMMON: log2 |
| define double @f14() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.log2.f64(double 42.0, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that rint(42.1) isn't simplified when the rounding mode is unknown. |
| ; CHECK-LABEL: f15 |
| ; NO-FMA: rint |
| ; HAS-FMA: vroundsd |
| define double @f15() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.rint.f64(double 42.1, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that nearbyint(42.1) isn't simplified when the rounding mode is |
| ; unknown. |
| ; CHECK-LABEL: f16 |
| ; NO-FMA: nearbyint |
| ; HAS-FMA: vroundsd |
| define double @f16() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.nearbyint.f64( |
| double 42.1, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; Verify that fma(3.5) isn't simplified when the rounding mode is |
| ; unknown. |
| ; CHECK-LABEL: f17 |
| ; FMACALL32: jmp fmaf # TAILCALL |
| ; FMA32: vfmadd213ss |
| define float @f17() #0 { |
| entry: |
| %result = call float @llvm.experimental.constrained.fma.f32( |
| float 3.5, |
| float 3.5, |
| float 3.5, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret float %result |
| } |
| |
| ; Verify that fma(42.1) isn't simplified when the rounding mode is |
| ; unknown. |
| ; CHECK-LABEL: f18 |
| ; FMACALL64: jmp fma # TAILCALL |
| ; FMA64: vfmadd213sd |
| define double @f18() #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.fma.f64( |
| double 42.1, |
| double 42.1, |
| double 42.1, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; CHECK-LABEL: f19 |
| ; COMMON: fmod |
| define double @f19() #0 { |
| entry: |
| %rem = call double @llvm.experimental.constrained.frem.f64( |
| double 1.000000e+00, |
| double 1.000000e+01, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret double %rem |
| } |
| |
| ; Verify that fptoui(%x) isn't simplified when the rounding mode is |
| ; unknown. The expansion should have only one conversion instruction. |
| ; Verify that no gross errors happen. |
| ; CHECK-LABEL: @f20u |
| ; NO-FMA: cmpltsd |
| ; NO-FMA: movapd |
| ; NO-FMA: andpd |
| ; NO-FMA: xorl |
| ; NO-FMA: ucomisd |
| ; NO-FMA: subsd |
| ; NO-FMA: andnpd |
| ; NO-FMA: orpd |
| ; NO-FMA: cvttsd2si |
| ; NO-FMA: setae |
| ; NO-FMA: shll |
| ; NO-FMA: xorl |
| ; |
| ; HAS-FMA: vcmpltsd |
| ; HAS-FMA: vsubsd |
| ; HAS-FMA: vblendvpd |
| ; HAS-FMA: vcvttsd2si |
| ; HAS-FMA: xorl |
| ; HAS-FMA: vucomisd |
| ; HAS-FMA: setae |
| ; HAS-FMA: shll |
| ; HAS-FMA: xorl |
| define i32 @f20u(double %x) #0 { |
| entry: |
| %result = call i32 @llvm.experimental.constrained.fptoui.i32.f64(double %x, |
| metadata !"fpexcept.strict") #0 |
| ret i32 %result |
| } |
| |
| ; Verify that round(42.1) isn't simplified when the rounding mode is |
| ; unknown. |
| ; Verify that no gross errors happen. |
| ; CHECK-LABEL: @f21 |
| ; COMMON: cvtsd2ss |
| define float @f21() #0 { |
| entry: |
| %result = call float @llvm.experimental.constrained.fptrunc.f32.f64( |
| double 42.1, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret float %result |
| } |
| |
| ; CHECK-LABEL: @f22 |
| ; COMMON: cvtss2sd |
| define double @f22(float %x) #0 { |
| entry: |
| %result = call double @llvm.experimental.constrained.fpext.f64.f32(float %x, |
| metadata !"fpexcept.strict") #0 |
| ret double %result |
| } |
| |
| ; CHECK-LABEL: f23 |
| ; COMMON: jmp lrint |
| define i32 @f23(double %x) #0 { |
| entry: |
| %result = call i32 @llvm.experimental.constrained.lrint.i32.f64(double %x, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret i32 %result |
| } |
| |
| ; CHECK-LABEL: f24 |
| ; COMMON: jmp lrintf |
| define i32 @f24(float %x) #0 { |
| entry: |
| %result = call i32 @llvm.experimental.constrained.lrint.i32.f32(float %x, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret i32 %result |
| } |
| |
| ; CHECK-LABEL: f25 |
| ; COMMON: jmp llrint |
| define i64 @f25(double %x) #0 { |
| entry: |
| %result = call i64 @llvm.experimental.constrained.llrint.i64.f64(double %x, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret i64 %result |
| } |
| |
| ; CHECK-LABEL: f26 |
| ; COMMON: jmp llrintf |
| define i64 @f26(float %x) { |
| entry: |
| %result = call i64 @llvm.experimental.constrained.llrint.i64.f32(float %x, |
| metadata !"round.dynamic", |
| metadata !"fpexcept.strict") #0 |
| ret i64 %result |
| } |
| |
| ; CHECK-LABEL: f27 |
| ; COMMON: jmp lround |
| define i32 @f27(double %x) #0 { |
| entry: |
| %result = call i32 @llvm.experimental.constrained.lround.i32.f64(double %x, |
| metadata !"fpexcept.strict") #0 |
| ret i32 %result |
| } |
| |
| ; CHECK-LABEL: f28 |
| ; COMMON: jmp lroundf |
| define i32 @f28(float %x) #0 { |
| entry: |
| %result = call i32 @llvm.experimental.constrained.lround.i32.f32(float %x, |
| metadata !"fpexcept.strict") #0 |
| ret i32 %result |
| } |
| |
| ; CHECK-LABEL: f29 |
| ; COMMON: jmp llround |
| define i64 @f29(double %x) #0 { |
| entry: |
| %result = call i64 @llvm.experimental.constrained.llround.i64.f64(double %x, |
| metadata !"fpexcept.strict") #0 |
| ret i64 %result |
| } |
| |
| ; CHECK-LABEL: f30 |
| ; COMMON: jmp llroundf |
| define i64 @f30(float %x) #0 { |
| entry: |
| %result = call i64 @llvm.experimental.constrained.llround.i64.f32(float %x, |
| metadata !"fpexcept.strict") #0 |
| ret i64 %result |
| } |
| |
| attributes #0 = { strictfp } |
| |
| @llvm.fp.env = thread_local global i8 zeroinitializer, section "llvm.metadata" |
| declare double @llvm.experimental.constrained.fadd.f64(double, double, metadata, metadata) |
| declare double @llvm.experimental.constrained.fsub.f64(double, double, metadata, metadata) |
| declare double @llvm.experimental.constrained.fmul.f64(double, double, metadata, metadata) |
| declare double @llvm.experimental.constrained.fdiv.f64(double, double, metadata, metadata) |
| declare double @llvm.experimental.constrained.frem.f64(double, double, metadata, metadata) |
| declare double @llvm.experimental.constrained.sqrt.f64(double, metadata, metadata) |
| declare double @llvm.experimental.constrained.pow.f64(double, double, metadata, metadata) |
| declare double @llvm.experimental.constrained.powi.f64(double, i32, metadata, metadata) |
| declare double @llvm.experimental.constrained.sin.f64(double, metadata, metadata) |
| declare double @llvm.experimental.constrained.cos.f64(double, metadata, metadata) |
| declare double @llvm.experimental.constrained.exp.f64(double, metadata, metadata) |
| declare double @llvm.experimental.constrained.exp2.f64(double, metadata, metadata) |
| declare double @llvm.experimental.constrained.log.f64(double, metadata, metadata) |
| declare double @llvm.experimental.constrained.log10.f64(double, metadata, metadata) |
| declare double @llvm.experimental.constrained.log2.f64(double, metadata, metadata) |
| declare double @llvm.experimental.constrained.rint.f64(double, metadata, metadata) |
| declare double @llvm.experimental.constrained.nearbyint.f64(double, metadata, metadata) |
| declare float @llvm.experimental.constrained.fma.f32(float, float, float, metadata, metadata) |
| declare double @llvm.experimental.constrained.fma.f64(double, double, double, metadata, metadata) |
| declare i32 @llvm.experimental.constrained.fptosi.i32.f64(double, metadata) |
| declare i32 @llvm.experimental.constrained.fptoui.i32.f64(double, metadata) |
| declare float @llvm.experimental.constrained.fptrunc.f32.f64(double, metadata, metadata) |
| declare double @llvm.experimental.constrained.fpext.f64.f32(float, metadata) |
| declare i32 @llvm.experimental.constrained.lrint.i32.f64(double, metadata, metadata) |
| declare i32 @llvm.experimental.constrained.lrint.i32.f32(float, metadata, metadata) |
| declare i64 @llvm.experimental.constrained.llrint.i64.f64(double, metadata, metadata) |
| declare i64 @llvm.experimental.constrained.llrint.i64.f32(float, metadata, metadata) |
| declare i32 @llvm.experimental.constrained.lround.i32.f64(double, metadata) |
| declare i32 @llvm.experimental.constrained.lround.i32.f32(float, metadata) |
| declare i64 @llvm.experimental.constrained.llround.i64.f64(double, metadata) |
| declare i64 @llvm.experimental.constrained.llround.i64.f32(float, metadata) |