llvm/test/Transforms/InstSimplify/const-fold-nvvm-mul.ll - llvm-project - Git at Google

 ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
 ; RUN: opt < %s -passes=instsimplify -march=nvptx64 --mcpu=sm_86 --mattr=+ptx72 -S | FileCheck %s

 ; Check constant-folding for NVVM multiply intrinsics with different rounding modes

 ;###############################################################
 ;#                    Mul(1.25, 2.0)                           #
 ;###############################################################
 ; Tests multiplication of two normal numbers (1.25 and 2.0) where the result
 ; is exactly representable. All rounding modes should produce the same result.

 define double @test_1_25_times_2_rm_d() {
 ; CHECK-LABEL: define double @test_1_25_times_2_rm_d() {
 ; CHECK-NEXT:    ret double 2.500000e+00
 ;
   %res = call double @llvm.nvvm.mul.rm.d(double 1.25, double 2.0)
   ret double %res
 }

 define double @test_1_25_times_2_rn_d() {
 ; CHECK-LABEL: define double @test_1_25_times_2_rn_d() {
 ; CHECK-NEXT:    ret double 2.500000e+00
 ;
   %res = call double @llvm.nvvm.mul.rn.d(double 1.25, double 2.0)
   ret double %res
 }

 define double @test_1_25_times_2_rp_d() {
 ; CHECK-LABEL: define double @test_1_25_times_2_rp_d() {
 ; CHECK-NEXT:    ret double 2.500000e+00
 ;
   %res = call double @llvm.nvvm.mul.rp.d(double 1.25, double 2.0)
   ret double %res
 }

 define double @test_1_25_times_2_rz_d() {
 ; CHECK-LABEL: define double @test_1_25_times_2_rz_d() {
 ; CHECK-NEXT:    ret double 2.500000e+00
 ;
   %res = call double @llvm.nvvm.mul.rz.d(double 1.25, double 2.0)
   ret double %res
 }

 define float @test_1_25_times_2_rm_f() {
 ; CHECK-LABEL: define float @test_1_25_times_2_rm_f() {
 ; CHECK-NEXT:    ret float 2.500000e+00
 ;
   %res = call float @llvm.nvvm.mul.rm.f(float 1.25, float 2.0)
   ret float %res
 }

 define float @test_1_25_times_2_rn_f() {
 ; CHECK-LABEL: define float @test_1_25_times_2_rn_f() {
 ; CHECK-NEXT:    ret float 2.500000e+00
 ;
   %res = call float @llvm.nvvm.mul.rn.f(float 1.25, float 2.0)
   ret float %res
 }

 define float @test_1_25_times_2_rp_f() {
 ; CHECK-LABEL: define float @test_1_25_times_2_rp_f() {
 ; CHECK-NEXT:    ret float 2.500000e+00
 ;
   %res = call float @llvm.nvvm.mul.rp.f(float 1.25, float 2.0)
   ret float %res
 }

 define float @test_1_25_times_2_rz_f() {
 ; CHECK-LABEL: define float @test_1_25_times_2_rz_f() {
 ; CHECK-NEXT:    ret float 2.500000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.f(float 1.25, float 2.0)
   ret float %res
 }

 define float @test_1_25_times_2_rm_ftz_f() {
 ; CHECK-LABEL: define float @test_1_25_times_2_rm_ftz_f() {
 ; CHECK-NEXT:    ret float 2.500000e+00
 ;
   %res = call float @llvm.nvvm.mul.rm.ftz.f(float 1.25, float 2.0)
   ret float %res
 }

 define float @test_1_25_times_2_rn_ftz_f() {
 ; CHECK-LABEL: define float @test_1_25_times_2_rn_ftz_f() {
 ; CHECK-NEXT:    ret float 2.500000e+00
 ;
   %res = call float @llvm.nvvm.mul.rn.ftz.f(float 1.25, float 2.0)
   ret float %res
 }

 define float @test_1_25_times_2_rp_ftz_f() {
 ; CHECK-LABEL: define float @test_1_25_times_2_rp_ftz_f() {
 ; CHECK-NEXT:    ret float 2.500000e+00
 ;
   %res = call float @llvm.nvvm.mul.rp.ftz.f(float 1.25, float 2.0)
   ret float %res
 }

 define float @test_1_25_times_2_rz_ftz_f() {
 ; CHECK-LABEL: define float @test_1_25_times_2_rz_ftz_f() {
 ; CHECK-NEXT:    ret float 2.500000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.ftz.f(float 1.25, float 2.0)
   ret float %res
 }

 ;###############################################################
 ;#                    Mul(1.0, Subnormal)                      #
 ;###############################################################
 ; Tests multiplication of 1.0 by a subnormal number to verify FTZ behavior.
 ; For float, we use 2^-149 (smallest subnormal float).
 ; For double, we use 2^-1074 (smallest subnormal double).
 ; Without FTZ, the result should be the subnormal number.
 ; With FTZ, the result should be 0.0.

 define double @test_1_times_subnorm_rm_d() {
 ; CHECK-LABEL: define double @test_1_times_subnorm_rm_d() {
 ; CHECK-NEXT:    ret double 4.940660e-324
 ;
   %res = call double @llvm.nvvm.mul.rm.d(double 1.0, double 0x0000000000000001)
   ret double %res
 }

 define double @test_1_times_subnorm_rn_d() {
 ; CHECK-LABEL: define double @test_1_times_subnorm_rn_d() {
 ; CHECK-NEXT:    ret double 4.940660e-324
 ;
   %res = call double @llvm.nvvm.mul.rn.d(double 1.0, double 0x0000000000000001)
   ret double %res
 }

 define double @test_1_times_subnorm_rp_d() {
 ; CHECK-LABEL: define double @test_1_times_subnorm_rp_d() {
 ; CHECK-NEXT:    ret double 4.940660e-324
 ;
   %res = call double @llvm.nvvm.mul.rp.d(double 1.0, double 0x0000000000000001)
   ret double %res
 }

 define double @test_1_times_subnorm_rz_d() {
 ; CHECK-LABEL: define double @test_1_times_subnorm_rz_d() {
 ; CHECK-NEXT:    ret double 4.940660e-324
 ;
   %res = call double @llvm.nvvm.mul.rz.d(double 1.0, double 0x0000000000000001)
   ret double %res
 }

 define float @test_1_times_subnorm_rm_f() {
 ; CHECK-LABEL: define float @test_1_times_subnorm_rm_f() {
 ; CHECK-NEXT:    ret float 0x36A0000000000000
 ;
   %res = call float @llvm.nvvm.mul.rm.f(float 1.0, float 0x36A0000000000000)
   ret float %res
 }

 define float @test_1_times_subnorm_rn_f() {
 ; CHECK-LABEL: define float @test_1_times_subnorm_rn_f() {
 ; CHECK-NEXT:    ret float 0x36A0000000000000
 ;
   %res = call float @llvm.nvvm.mul.rn.f(float 1.0, float 0x36A0000000000000)
   ret float %res
 }

 define float @test_1_times_subnorm_rp_f() {
 ; CHECK-LABEL: define float @test_1_times_subnorm_rp_f() {
 ; CHECK-NEXT:    ret float 0x36A0000000000000
 ;
   %res = call float @llvm.nvvm.mul.rp.f(float 1.0, float 0x36A0000000000000)
   ret float %res
 }

 define float @test_1_times_subnorm_rz_f() {
 ; CHECK-LABEL: define float @test_1_times_subnorm_rz_f() {
 ; CHECK-NEXT:    ret float 0x36A0000000000000
 ;
   %res = call float @llvm.nvvm.mul.rz.f(float 1.0, float 0x36A0000000000000)
   ret float %res
 }

 define float @test_1_times_subnorm_rm_ftz_f() {
 ; CHECK-LABEL: define float @test_1_times_subnorm_rm_ftz_f() {
 ; CHECK-NEXT:    ret float 0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rm.ftz.f(float 1.0, float 0x36A0000000000000)
   ret float %res
 }

 define float @test_1_times_subnorm_rn_ftz_f() {
 ; CHECK-LABEL: define float @test_1_times_subnorm_rn_ftz_f() {
 ; CHECK-NEXT:    ret float 0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rn.ftz.f(float 1.0, float 0x36A0000000000000)
   ret float %res
 }

 define float @test_1_times_subnorm_rp_ftz_f() {
 ; CHECK-LABEL: define float @test_1_times_subnorm_rp_ftz_f() {
 ; CHECK-NEXT:    ret float 0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rp.ftz.f(float 1.0, float 0x36A0000000000000)
   ret float %res
 }

 define float @test_1_times_subnorm_rz_ftz_f() {
 ; CHECK-LABEL: define float @test_1_times_subnorm_rz_ftz_f() {
 ; CHECK-NEXT:    ret float 0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.ftz.f(float 1.0, float 0x36A0000000000000)
   ret float %res
 }

 ;###############################################################
 ;#                    Mul(1.0, -Subnormal)                     #
 ;###############################################################
 ; Tests multiplication of 1.0 by a negative subnormal number to verify FTZ behavior.
 ; For float, we use -2^-149 (negative smallest subnormal).
 ; For double, we use -2^-1074 (negative smallest subnormal).
 ; Without FTZ, the result should be the negative subnormal number.
 ; With FTZ, the result should be -0.0.

 define double @test_1_times_neg_subnorm_rm_d() {
 ; CHECK-LABEL: define double @test_1_times_neg_subnorm_rm_d() {
 ; CHECK-NEXT:    ret double -4.940660e-324
 ;
   %res = call double @llvm.nvvm.mul.rm.d(double 1.0, double 0x8000000000000001)
   ret double %res
 }

 define double @test_1_times_neg_subnorm_rn_d() {
 ; CHECK-LABEL: define double @test_1_times_neg_subnorm_rn_d() {
 ; CHECK-NEXT:    ret double -4.940660e-324
 ;
   %res = call double @llvm.nvvm.mul.rn.d(double 1.0, double 0x8000000000000001)
   ret double %res
 }

 define double @test_1_times_neg_subnorm_rp_d() {
 ; CHECK-LABEL: define double @test_1_times_neg_subnorm_rp_d() {
 ; CHECK-NEXT:    ret double -4.940660e-324
 ;
   %res = call double @llvm.nvvm.mul.rp.d(double 1.0, double 0x8000000000000001)
   ret double %res
 }

 define double @test_1_times_neg_subnorm_rz_d() {
 ; CHECK-LABEL: define double @test_1_times_neg_subnorm_rz_d() {
 ; CHECK-NEXT:    ret double -4.940660e-324
 ;
   %res = call double @llvm.nvvm.mul.rz.d(double 1.0, double 0x8000000000000001)
   ret double %res
 }

 define float @test_1_times_neg_subnorm_rm_f() {
 ; CHECK-LABEL: define float @test_1_times_neg_subnorm_rm_f() {
 ; CHECK-NEXT:    ret float 0xB6A0000000000000
 ;
   %res = call float @llvm.nvvm.mul.rm.f(float 1.0, float 0xB6A0000000000000)
   ret float %res
 }

 define float @test_1_times_neg_subnorm_rn_f() {
 ; CHECK-LABEL: define float @test_1_times_neg_subnorm_rn_f() {
 ; CHECK-NEXT:    ret float 0xB6A0000000000000
 ;
   %res = call float @llvm.nvvm.mul.rn.f(float 1.0, float 0xB6A0000000000000)
   ret float %res
 }

 define float @test_1_times_neg_subnorm_rp_f() {
 ; CHECK-LABEL: define float @test_1_times_neg_subnorm_rp_f() {
 ; CHECK-NEXT:    ret float 0xB6A0000000000000
 ;
   %res = call float @llvm.nvvm.mul.rp.f(float 1.0, float 0xB6A0000000000000)
   ret float %res
 }

 define float @test_1_times_neg_subnorm_rz_f() {
 ; CHECK-LABEL: define float @test_1_times_neg_subnorm_rz_f() {
 ; CHECK-NEXT:    ret float 0xB6A0000000000000
 ;
   %res = call float @llvm.nvvm.mul.rz.f(float 1.0, float 0xB6A0000000000000)
   ret float %res
 }

 define float @test_1_times_neg_subnorm_rm_ftz_f() {
 ; CHECK-LABEL: define float @test_1_times_neg_subnorm_rm_ftz_f() {
 ; CHECK-NEXT:    ret float -0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rm.ftz.f(float 1.0, float 0xB6A0000000000000)
   ret float %res
 }

 define float @test_1_times_neg_subnorm_rn_ftz_f() {
 ; CHECK-LABEL: define float @test_1_times_neg_subnorm_rn_ftz_f() {
 ; CHECK-NEXT:    ret float -0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rn.ftz.f(float 1.0, float 0xB6A0000000000000)
   ret float %res
 }

 define float @test_1_times_neg_subnorm_rp_ftz_f() {
 ; CHECK-LABEL: define float @test_1_times_neg_subnorm_rp_ftz_f() {
 ; CHECK-NEXT:    ret float -0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rp.ftz.f(float 1.0, float 0xB6A0000000000000)
   ret float %res
 }

 define float @test_1_times_neg_subnorm_rz_ftz_f() {
 ; CHECK-LABEL: define float @test_1_times_neg_subnorm_rz_ftz_f() {
 ; CHECK-NEXT:    ret float -0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.ftz.f(float 1.0, float 0xB6A0000000000000)
   ret float %res
 }

 ;###############################################################
 ;#                    Mul(Normal, Normal) -> Subnormal         #
 ;###############################################################
 ; Tests multiplication of two normal numbers that produces a subnormal result.
 ; We multiply the smallest normal float (2^-126 = 0x3810000000000000) by 0.5 to get 2^-127,
 ; which is subnormal. This tests the transition from normal to subnormal numbers.
 ; For double precision, we just use the same float value since there is no FTZ variant.

 define double @test_normal_times_normal_to_subnorm_rm_d() {
 ; CHECK-LABEL: define double @test_normal_times_normal_to_subnorm_rm_d() {
 ; CHECK-NEXT:    ret double 0x3800000000000000
 ;
   %res = call double @llvm.nvvm.mul.rm.d(double 0x3810000000000000, double 0.5)
   ret double %res
 }

 define double @test_normal_times_normal_to_subnorm_rn_d() {
 ; CHECK-LABEL: define double @test_normal_times_normal_to_subnorm_rn_d() {
 ; CHECK-NEXT:    ret double 0x3800000000000000
 ;
   %res = call double @llvm.nvvm.mul.rn.d(double 0x3810000000000000, double 0.5)
   ret double %res
 }

 define double @test_normal_times_normal_to_subnorm_rp_d() {
 ; CHECK-LABEL: define double @test_normal_times_normal_to_subnorm_rp_d() {
 ; CHECK-NEXT:    ret double 0x3800000000000000
 ;
   %res = call double @llvm.nvvm.mul.rp.d(double 0x3810000000000000, double 0.5)
   ret double %res
 }

 define double @test_normal_times_normal_to_subnorm_rz_d() {
 ; CHECK-LABEL: define double @test_normal_times_normal_to_subnorm_rz_d() {
 ; CHECK-NEXT:    ret double 0x3800000000000000
 ;
   %res = call double @llvm.nvvm.mul.rz.d(double 0x3810000000000000, double 0.5)
   ret double %res
 }

 define float @test_normal_times_normal_to_subnorm_rm_f() {
 ; CHECK-LABEL: define float @test_normal_times_normal_to_subnorm_rm_f() {
 ; CHECK-NEXT:    ret float 0x3800000000000000
 ;
   %res = call float @llvm.nvvm.mul.rm.f(float 0x3810000000000000, float 0.5)
   ret float %res
 }

 define float @test_normal_times_normal_to_subnorm_rn_f() {
 ; CHECK-LABEL: define float @test_normal_times_normal_to_subnorm_rn_f() {
 ; CHECK-NEXT:    ret float 0x3800000000000000
 ;
   %res = call float @llvm.nvvm.mul.rn.f(float 0x3810000000000000, float 0.5)
   ret float %res
 }

 define float @test_normal_times_normal_to_subnorm_rp_f() {
 ; CHECK-LABEL: define float @test_normal_times_normal_to_subnorm_rp_f() {
 ; CHECK-NEXT:    ret float 0x3800000000000000
 ;
   %res = call float @llvm.nvvm.mul.rp.f(float 0x3810000000000000, float 0.5)
   ret float %res
 }

 define float @test_normal_times_normal_to_subnorm_rz_f() {
 ; CHECK-LABEL: define float @test_normal_times_normal_to_subnorm_rz_f() {
 ; CHECK-NEXT:    ret float 0x3800000000000000
 ;
   %res = call float @llvm.nvvm.mul.rz.f(float 0x3810000000000000, float 0.5)
   ret float %res
 }

 define float @test_normal_times_normal_to_subnorm_rm_ftz_f() {
 ; CHECK-LABEL: define float @test_normal_times_normal_to_subnorm_rm_ftz_f() {
 ; CHECK-NEXT:    ret float 0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rm.ftz.f(float 0x3810000000000000, float 0.5)
   ret float %res
 }

 define float @test_normal_times_normal_to_subnorm_rn_ftz_f() {
 ; CHECK-LABEL: define float @test_normal_times_normal_to_subnorm_rn_ftz_f() {
 ; CHECK-NEXT:    ret float 0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rn.ftz.f(float 0x3810000000000000, float 0.5)
   ret float %res
 }

 define float @test_normal_times_normal_to_subnorm_rp_ftz_f() {
 ; CHECK-LABEL: define float @test_normal_times_normal_to_subnorm_rp_ftz_f() {
 ; CHECK-NEXT:    ret float 0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rp.ftz.f(float 0x3810000000000000, float 0.5)
   ret float %res
 }

 define float @test_normal_times_normal_to_subnorm_rz_ftz_f() {
 ; CHECK-LABEL: define float @test_normal_times_normal_to_subnorm_rz_ftz_f() {
 ; CHECK-NEXT:    ret float 0.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.ftz.f(float 0x3810000000000000, float 0.5)
   ret float %res
 }

 ;###############################################################
 ;#                    Mul(2.0, NaN)                            #
 ;###############################################################
 ; Tests multiplication with NaN to verify that we do not fold these,
 ; as host and device NaNs may be different.

 define double @test_2_times_nan_rm_d() {
 ; CHECK-LABEL: define double @test_2_times_nan_rm_d() {
 ; CHECK-NEXT:    [[RES:%.*]] = call double @llvm.nvvm.mul.rm.d(double 2.000000e+00, double 0x7FF4444400000000)
 ; CHECK-NEXT:    ret double [[RES]]
 ;
   %res = call double @llvm.nvvm.mul.rm.d(double 2.0, double 0x7FF4444400000000)
   ret double %res
 }

 define double @test_2_times_nan_rn_d() {
 ; CHECK-LABEL: define double @test_2_times_nan_rn_d() {
 ; CHECK-NEXT:    [[RES:%.*]] = call double @llvm.nvvm.mul.rn.d(double 2.000000e+00, double 0x7FF4444400000000)
 ; CHECK-NEXT:    ret double [[RES]]
 ;
   %res = call double @llvm.nvvm.mul.rn.d(double 2.0, double 0x7FF4444400000000)
   ret double %res
 }

 define double @test_2_times_nan_rp_d() {
 ; CHECK-LABEL: define double @test_2_times_nan_rp_d() {
 ; CHECK-NEXT:    [[RES:%.*]] = call double @llvm.nvvm.mul.rp.d(double 2.000000e+00, double 0x7FF4444400000000)
 ; CHECK-NEXT:    ret double [[RES]]
 ;
   %res = call double @llvm.nvvm.mul.rp.d(double 2.0, double 0x7FF4444400000000)
   ret double %res
 }

 define double @test_2_times_nan_rz_d() {
 ; CHECK-LABEL: define double @test_2_times_nan_rz_d() {
 ; CHECK-NEXT:    [[RES:%.*]] = call double @llvm.nvvm.mul.rz.d(double 2.000000e+00, double 0x7FF4444400000000)
 ; CHECK-NEXT:    ret double [[RES]]
 ;
   %res = call double @llvm.nvvm.mul.rz.d(double 2.0, double 0x7FF4444400000000)
   ret double %res
 }

 define float @test_2_times_nan_rm_f() {
 ; CHECK-LABEL: define float @test_2_times_nan_rm_f() {
 ; CHECK-NEXT:    [[RES:%.*]] = call float @llvm.nvvm.mul.rm.f(float 2.000000e+00, float 0x7FFF444400000000)
 ; CHECK-NEXT:    ret float [[RES]]
 ;
   %res = call float @llvm.nvvm.mul.rm.f(float 2.0, float 0x7FFF444400000000)
   ret float %res
 }

 define float @test_2_times_nan_rn_f() {
 ; CHECK-LABEL: define float @test_2_times_nan_rn_f() {
 ; CHECK-NEXT:    [[RES:%.*]] = call float @llvm.nvvm.mul.rn.f(float 2.000000e+00, float 0x7FFF444400000000)
 ; CHECK-NEXT:    ret float [[RES]]
 ;
   %res = call float @llvm.nvvm.mul.rn.f(float 2.0, float 0x7FFF444400000000)
   ret float %res
 }

 define float @test_2_times_nan_rp_f() {
 ; CHECK-LABEL: define float @test_2_times_nan_rp_f() {
 ; CHECK-NEXT:    [[RES:%.*]] = call float @llvm.nvvm.mul.rp.f(float 2.000000e+00, float 0x7FFF444400000000)
 ; CHECK-NEXT:    ret float [[RES]]
 ;
   %res = call float @llvm.nvvm.mul.rp.f(float 2.0, float 0x7FFF444400000000)
   ret float %res
 }

 define float @test_2_times_nan_rz_f() {
 ; CHECK-LABEL: define float @test_2_times_nan_rz_f() {
 ; CHECK-NEXT:    [[RES:%.*]] = call float @llvm.nvvm.mul.rz.f(float 2.000000e+00, float 0x7FFF444400000000)
 ; CHECK-NEXT:    ret float [[RES]]
 ;
   %res = call float @llvm.nvvm.mul.rz.f(float 2.0, float 0x7FFF444400000000)
   ret float %res
 }

 define float @test_2_times_nan_rm_ftz_f() {
 ; CHECK-LABEL: define float @test_2_times_nan_rm_ftz_f() {
 ; CHECK-NEXT:    [[RES:%.*]] = call float @llvm.nvvm.mul.rm.ftz.f(float 2.000000e+00, float 0x7FFF444400000000)
 ; CHECK-NEXT:    ret float [[RES]]
 ;
   %res = call float @llvm.nvvm.mul.rm.ftz.f(float 2.0, float 0x7FFF444400000000)
   ret float %res
 }

 define float @test_2_times_nan_rn_ftz_f() {
 ; CHECK-LABEL: define float @test_2_times_nan_rn_ftz_f() {
 ; CHECK-NEXT:    [[RES:%.*]] = call float @llvm.nvvm.mul.rn.ftz.f(float 2.000000e+00, float 0x7FFF444400000000)
 ; CHECK-NEXT:    ret float [[RES]]
 ;
   %res = call float @llvm.nvvm.mul.rn.ftz.f(float 2.0, float 0x7FFF444400000000)
   ret float %res
 }

 define float @test_2_times_nan_rp_ftz_f() {
 ; CHECK-LABEL: define float @test_2_times_nan_rp_ftz_f() {
 ; CHECK-NEXT:    [[RES:%.*]] = call float @llvm.nvvm.mul.rp.ftz.f(float 2.000000e+00, float 0x7FFF444400000000)
 ; CHECK-NEXT:    ret float [[RES]]
 ;
   %res = call float @llvm.nvvm.mul.rp.ftz.f(float 2.0, float 0x7FFF444400000000)
   ret float %res
 }

 define float @test_2_times_nan_rz_ftz_f() {
 ; CHECK-LABEL: define float @test_2_times_nan_rz_ftz_f() {
 ; CHECK-NEXT:    [[RES:%.*]] = call float @llvm.nvvm.mul.rz.ftz.f(float 2.000000e+00, float 0x7FFF444400000000)
 ; CHECK-NEXT:    ret float [[RES]]
 ;
   %res = call float @llvm.nvvm.mul.rz.ftz.f(float 2.0, float 0x7FFF444400000000)
   ret float %res
 }

 ;###############################################################
 ;#                    Mul(0.75, 4/3 + epsilon)                 #
 ;###############################################################
 ; Tests multiplication of 0.75 (3/4) by a value slightly above 4/3,
 ; where different rounding modes produce different results.
 ; The exact result would be 1.0, but since 4/3 cannot be exactly encoded
 ; as a float, the calculated result falls between 1.0 and 1.0 + 2^-23.
 ; - RN, RZ, RM round to 1.0 (rounding to nearest/zero/down)
 ; - RP rounds to 1.0 + 2^-23 (rounding up)

 define float @test_mul_just_above_1_rm_f() {
 ; CHECK-LABEL: define float @test_mul_just_above_1_rm_f() {
 ; CHECK-NEXT:    ret float 1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rm.f(float 0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_above_1_rn_f() {
 ; CHECK-LABEL: define float @test_mul_just_above_1_rn_f() {
 ; CHECK-NEXT:    ret float 1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rn.f(float 0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_above_1_rp_f() {
 ; CHECK-LABEL: define float @test_mul_just_above_1_rp_f() {
 ; CHECK-NEXT:    ret float 0x3FF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rp.f(float 0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_above_1_rz_f() {
 ; CHECK-LABEL: define float @test_mul_just_above_1_rz_f() {
 ; CHECK-NEXT:    ret float 1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.f(float 0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_above_1_rm_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_just_above_1_rm_ftz_f() {
 ; CHECK-NEXT:    ret float 1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rm.ftz.f(float 0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_above_1_rn_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_just_above_1_rn_ftz_f() {
 ; CHECK-NEXT:    ret float 1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rn.ftz.f(float 0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_above_1_rp_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_just_above_1_rp_ftz_f() {
 ; CHECK-NEXT:    ret float 0x3FF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rp.ftz.f(float 0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_above_1_rz_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_just_above_1_rz_ftz_f() {
 ; CHECK-NEXT:    ret float 1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.ftz.f(float 0.75, float 0x3FF5555560000000)
   ret float %res
 }

 ;###############################################################
 ;#                    Mul(0.75, 4/3 + epsilon)                 #
 ;###############################################################
 ; Tests multiplication of 0.75 by a value slightly above 4/3,
 ; where different rounding modes produce different results.
 ; The exact result would be 1.0, but since 4/3 cannot be exactly encoded
 ; as a double, the calculated result falls between 1.0 and 1.0 + 2^-52.
 ; - RN, RZ, RM round to 1.0 (rounding to nearest/zero/down)
 ; - RP rounds to 1.0 + 2^-52 (rounding up)

 define double @test_mul_just_above_1_rm_d() {
 ; CHECK-LABEL: define double @test_mul_just_above_1_rm_d() {
 ; CHECK-NEXT:    ret double 1.000000e+00
 ;
   %res = call double @llvm.nvvm.mul.rm.d(double 0.75, double 0x3FF5555555555556)
   ret double %res
 }

 define double @test_mul_just_above_1_rn_d() {
 ; CHECK-LABEL: define double @test_mul_just_above_1_rn_d() {
 ; CHECK-NEXT:    ret double 1.000000e+00
 ;
   %res = call double @llvm.nvvm.mul.rn.d(double 0.75, double 0x3FF5555555555556)
   ret double %res
 }

 define double @test_mul_just_above_1_rp_d() {
 ; CHECK-LABEL: define double @test_mul_just_above_1_rp_d() {
 ; CHECK-NEXT:    ret double 0x3FF0000000000001
 ;
   %res = call double @llvm.nvvm.mul.rp.d(double 0.75, double 0x3FF5555555555556)
   ret double %res
 }

 define double @test_mul_just_above_1_rz_d() {
 ; CHECK-LABEL: define double @test_mul_just_above_1_rz_d() {
 ; CHECK-NEXT:    ret double 1.000000e+00
 ;
   %res = call double @llvm.nvvm.mul.rz.d(double 0.75, double 0x3FF5555555555556)
   ret double %res
 }

 ;###############################################################
 ;#                    Mul(-0.75, 4/3 + epsilon)                #
 ;###############################################################
 ; Tests multiplication of -0.75 by a value slightly above 4/3,
 ; where different rounding modes produce different results.
 ; The exact result would be -1.0, but since 4/3 cannot be exactly encoded
 ; as a double, the calculated result falls between -1.0 and -1.0 - 2^-23.
 ; - RN, RZ, RP round to -1.0 (rounding to nearest/zero/up)
 ; - RM rounds to -1.0 - 2^-23 (rounding down)

 define float @test_mul_just_below_negative_1_rm_f() {
 ; CHECK-LABEL: define float @test_mul_just_below_negative_1_rm_f() {
 ; CHECK-NEXT:    ret float 0xBFF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rm.f(float -0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_below_negative_1_rn_f() {
 ; CHECK-LABEL: define float @test_mul_just_below_negative_1_rn_f() {
 ; CHECK-NEXT:    ret float -1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rn.f(float -0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_below_negative_1_rp_f() {
 ; CHECK-LABEL: define float @test_mul_just_below_negative_1_rp_f() {
 ; CHECK-NEXT:    ret float -1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rp.f(float -0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_below_negative_1_rz_f() {
 ; CHECK-LABEL: define float @test_mul_just_below_negative_1_rz_f() {
 ; CHECK-NEXT:    ret float -1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.f(float -0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_below_negative_1_rm_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_just_below_negative_1_rm_ftz_f() {
 ; CHECK-NEXT:    ret float 0xBFF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rm.ftz.f(float -0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_below_negative_1_rn_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_just_below_negative_1_rn_ftz_f() {
 ; CHECK-NEXT:    ret float -1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rn.ftz.f(float -0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_below_negative_1_rp_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_just_below_negative_1_rp_ftz_f() {
 ; CHECK-NEXT:    ret float -1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rp.ftz.f(float -0.75, float 0x3FF5555560000000)
   ret float %res
 }

 define float @test_mul_just_below_negative_1_rz_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_just_below_negative_1_rz_ftz_f() {
 ; CHECK-NEXT:    ret float -1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.ftz.f(float -0.75, float 0x3FF5555560000000)
   ret float %res
 }

 ;###############################################################
 ;#                    Mul(-0.75, 4/3 + epsilon)                #
 ;###############################################################
 ; Tests multiplication of -0.75 by a value slightly above 4/3,
 ; where different rounding modes produce different results.
 ; The exact result would be -1.0, but since 4/3 cannot be exactly encoded
 ; as a double, the calculated result falls between -1.0 and -1.0 - 2^-52.
 ; - RN, RZ, RP round to -1.0 (rounding to nearest/zero/up)
 ; - RM rounds to -1.0 - 2^-52 (rounding down)

 define double @test_mul_just_below_negative_1_rm_d() {
 ; CHECK-LABEL: define double @test_mul_just_below_negative_1_rm_d() {
 ; CHECK-NEXT:    ret double 0xBFF0000000000001
 ;
   %res = call double @llvm.nvvm.mul.rm.d(double -0.75, double 0x3FF5555555555556)
   ret double %res
 }

 define double @test_mul_just_below_negative_1_rn_d() {
 ; CHECK-LABEL: define double @test_mul_just_below_negative_1_rn_d() {
 ; CHECK-NEXT:    ret double -1.000000e+00
 ;
   %res = call double @llvm.nvvm.mul.rn.d(double -0.75, double 0x3FF5555555555556)
   ret double %res
 }

 define double @test_mul_just_below_negative_1_rp_d() {
 ; CHECK-LABEL: define double @test_mul_just_below_negative_1_rp_d() {
 ; CHECK-NEXT:    ret double -1.000000e+00
 ;
   %res = call double @llvm.nvvm.mul.rp.d(double -0.75, double 0x3FF5555555555556)
   ret double %res
 }

 define double @test_mul_just_below_negative_1_rz_d() {
 ; CHECK-LABEL: define double @test_mul_just_below_negative_1_rz_d() {
 ; CHECK-NEXT:    ret double -1.000000e+00
 ;
   %res = call double @llvm.nvvm.mul.rz.d(double -0.75, double 0x3FF5555555555556)
   ret double %res
 }

 ;###############################################################
 ;#                   Mul(0.625, 1.6 + epsilon)                 #
 ;###############################################################
 ; Tests multiplication of 5/8 * ~8/5 with different rounding modes.
 ; Multiply 0.625 (5/8) by a value very slightly above 8/5 = 1.6 + epsilon.
 ; The exact result is between 1.0 and 1.0 + 2^-23
 ; - RN, RP round to 1.0 + 2^-23 (rounding towards nearest/up)
 ; - RZ, RM round to 1.0 (rounding towards zero/down)

 define float @test_mul_slightly_more_above_1_rm_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_above_1_rm_f() {
 ; CHECK-NEXT:    ret float 1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rm.f(float 0x3FE4000000000000, float 0x3FF99999C0000000)
   ret float %res
 }

 define float @test_mul_slightly_more_above_1_rn_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_above_1_rn_f() {
 ; CHECK-NEXT:    ret float 0x3FF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rn.f(float 0x3FE4000000000000, float 0x3FF99999C0000000)
   ret float %res
 }

 define float @test_mul_slightly_more_above_1_rp_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_above_1_rp_f() {
 ; CHECK-NEXT:    ret float 0x3FF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rp.f(float 0x3FE4000000000000, float 0x3FF99999C0000000 )
   ret float %res
 }

 define float @test_mul_slightly_more_above_1_rz_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_above_1_rz_f() {
 ; CHECK-NEXT:    ret float 1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.f(float 0x3FE4000000000000, float 0x3FF99999C0000000 )
   ret float %res
 }

 define float @test_mul_slightly_more_above_1_rm_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_above_1_rm_ftz_f() {
 ; CHECK-NEXT:    ret float 1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rm.ftz.f(float 0x3FE4000000000000, float 0x3FF99999C0000000 )
   ret float %res
 }

 define float @test_mul_slightly_more_above_1_rn_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_above_1_rn_ftz_f() {
 ; CHECK-NEXT:    ret float 0x3FF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rn.ftz.f(float 0x3FE4000000000000, float 0x3FF99999C0000000 )
   ret float %res
 }

 define float @test_mul_slightly_more_above_1_rp_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_above_1_rp_ftz_f() {
 ; CHECK-NEXT:    ret float 0x3FF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rp.ftz.f(float 0x3FE4000000000000, float 0x3FF99999C0000000 )
   ret float %res
 }

 define float @test_mul_slightly_more_above_1_rz_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_above_1_rz_ftz_f() {
 ; CHECK-NEXT:    ret float 1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.ftz.f(float 0x3FE4000000000000, float 0x3FF99999C0000000 )
   ret float %res
 }

 ;###############################################################
 ;#                    Mul(0.625, 1.6 + epsilon)                #
 ;###############################################################
 ; Tests multiplication of 5/8 * ~8/5  with different rounding modes.
 ; Multiply 0.625 (5/8) by a value very slightly above 8/5 = 1.6 + epsilon.
 ; The exact result is between 1.0 and 1.0 + 2^-52
 ; - RN, RP round to 1.0 + 2^-52 (rounding towards nearest/up)
 ; - RZ, RM round to 1.0 (rounding towards zero/down)

 define double @test_mul_slightly_more_above_1_rm_d() {
 ; CHECK-LABEL: define double @test_mul_slightly_more_above_1_rm_d() {
 ; CHECK-NEXT:    ret double 1.000000e+00
 ;
   %res = call double @llvm.nvvm.mul.rm.d(double 0x3FE4000000000000, double 0x3FF999999999999B)
   ret double %res
 }

 define double @test_mul_slightly_more_above_1_rn_d() {
 ; CHECK-LABEL: define double @test_mul_slightly_more_above_1_rn_d() {
 ; CHECK-NEXT:    ret double 0x3FF0000000000001
 ;
   %res = call double @llvm.nvvm.mul.rn.d(double 0x3FE4000000000000, double 0x3FF999999999999B)
   ret double %res
 }

 define double @test_mul_slightly_more_above_1_rp_d() {
 ; CHECK-LABEL: define double @test_mul_slightly_more_above_1_rp_d() {
 ; CHECK-NEXT:    ret double 0x3FF0000000000001
 ;
   %res = call double @llvm.nvvm.mul.rp.d(double 0x3FE4000000000000, double 0x3FF999999999999B)
   ret double %res
 }

 define double @test_mul_slightly_more_above_1_rz_d() {
 ; CHECK-LABEL: define double @test_mul_slightly_more_above_1_rz_d() {
 ; CHECK-NEXT:    ret double 1.000000e+00
 ;
   %res = call double @llvm.nvvm.mul.rz.d(double 0x3FE4000000000000, double 0x3FF999999999999B)
   ret double %res
 }

 ;###############################################################
 ;#                    Mul(0.625, -(1.6 + epsilon)              #
 ;###############################################################
 ; Tests multiplication of 5/8 * ~-8/5 with different rounding modes.
 ; Multiply 0.625 (5/8) by a value very slightly below -8/5 = -(1.6 + epsilon).
 ; The exact result is between -1.0 and -1.0 + 2^-23
 ; - RN, RM round to -1.0 - 2^-23 (rounding towards nearest/down)
 ; - RZ, RP round to -1.0 (rounding towards zero/up)

 define float @test_mul_slightly_more_below_negative_1_rm_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_below_negative_1_rm_f() {
 ; CHECK-NEXT:    ret float 0xBFF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rm.f(float 0x3FE4000000000000, float 0xBFF99999C0000000)
   ret float %res
 }

 define float @test_mul_slightly_more_below_negative_1_rn_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_below_negative_1_rn_f() {
 ; CHECK-NEXT:    ret float 0xBFF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rn.f(float 0x3FE4000000000000, float 0xBFF99999C0000000)
   ret float %res
 }

 define float @test_mul_slightly_more_below_negative_1_rp_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_below_negative_1_rp_f() {
 ; CHECK-NEXT:    ret float -1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rp.f(float 0x3FE4000000000000, float 0xBFF99999C0000000)
   ret float %res
 }

 define float @test_mul_slightly_more_below_negative_1_rz_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_below_negative_1_rz_f() {
 ; CHECK-NEXT:    ret float -1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.f(float 0x3FE4000000000000, float 0xBFF99999C0000000)
   ret float %res
 }

 define float @test_mul_slightly_more_below_negative_1_rm_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_below_negative_1_rm_ftz_f() {
 ; CHECK-NEXT:    ret float 0xBFF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rm.ftz.f(float 0x3FE4000000000000, float 0xBFF99999C0000000)
   ret float %res
 }

 define float @test_mul_slightly_more_below_negative_1_rn_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_below_negative_1_rn_ftz_f() {
 ; CHECK-NEXT:    ret float 0xBFF0000020000000
 ;
   %res = call float @llvm.nvvm.mul.rn.ftz.f(float 0x3FE4000000000000, float 0xBFF99999C0000000)
   ret float %res
 }

 define float @test_mul_slightly_more_below_negative_1_rp_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_below_negative_1_rp_ftz_f() {
 ; CHECK-NEXT:    ret float -1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rp.ftz.f(float 0x3FE4000000000000, float 0xBFF99999C0000000)
   ret float %res
 }

 define float @test_mul_slightly_more_below_negative_1_rz_ftz_f() {
 ; CHECK-LABEL: define float @test_mul_slightly_more_below_negative_1_rz_ftz_f() {
 ; CHECK-NEXT:    ret float -1.000000e+00
 ;
   %res = call float @llvm.nvvm.mul.rz.ftz.f(float 0x3FE4000000000000, float 0xBFF99999C0000000)
   ret float %res
 }

 ;###############################################################
 ;#                    Mul(0.625, -(1.6 + epsilon)              #
 ;###############################################################
 ; Tests multiplication of 5/8 * ~-8/5 with different rounding modes.
 ; Multiply 0.625 (5/8) by a value very slightly below -8/5 = -(1.6 + epsilon).
 ; The exact result is between -1.0 and -1.0 + 2^-52
 ; - RN, RM round to -1.0 - 2^-52 (rounding towards nearest/down)
 ; - RZ, RP round to -1.0 (rounding towards zero/up)

 define double @test_mul_slightly_more_below_negative_1_rm_d() {
 ; CHECK-LABEL: define double @test_mul_slightly_more_below_negative_1_rm_d() {
 ; CHECK-NEXT:    ret double 0xBFF0000000000001
 ;
   %res = call double @llvm.nvvm.mul.rm.d(double 0x3FE4000000000000, double 0xBFF999999999999B)
   ret double %res
 }

 define double @test_mul_slightly_more_below_negative_1_rn_d() {
 ; CHECK-LABEL: define double @test_mul_slightly_more_below_negative_1_rn_d() {
 ; CHECK-NEXT:    ret double 0xBFF0000000000001
 ;
   %res = call double @llvm.nvvm.mul.rn.d(double 0x3FE4000000000000, double 0xBFF999999999999B)
   ret double %res
 }

 define double @test_mul_slightly_more_below_negative_1_rp_d() {
 ; CHECK-LABEL: define double @test_mul_slightly_more_below_negative_1_rp_d() {
 ; CHECK-NEXT:    ret double -1.000000e+00
 ;
   %res = call double @llvm.nvvm.mul.rp.d(double 0x3FE4000000000000, double 0xBFF999999999999B)
   ret double %res
 }

 define double @test_mul_slightly_more_below_negative_1_rz_d() {
 ; CHECK-LABEL: define double @test_mul_slightly_more_below_negative_1_rz_d() {
 ; CHECK-NEXT:    ret double -1.000000e+00
 ;
   %res = call double @llvm.nvvm.mul.rz.d(double 0x3FE4000000000000, double 0xBFF999999999999B)
   ret double %res
 }