blob: 9f002b1e0da55ea7d441898652c44c2bb376eb75 [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
; RUN: llc < %s -mtriple aarch64-unknown-unknown | FileCheck %s --check-prefixes=CHECK,CHECK-CVT
; RUN: llc < %s -mtriple aarch64-unknown-unknown -mattr=+bf16 | FileCheck %s --check-prefixes=CHECK,CHECK-BF16,CHECK-SD
; RUN: llc < %s -mtriple aarch64-unknown-unknown -mattr=+bf16,+fullfp16 -global-isel -global-isel-abort=2 2>&1 | FileCheck %s --check-prefixes=CHECK,CHECK-BF16,CHECK-GI
; CHECK-GI: warning: Instruction selection used fallback path for test_fadd
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fsub
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fmul
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fmadd
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fdiv
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_frem
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_call
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_call_flipped
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_tailcall_flipped
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_select_cc
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_select_cc_f32_f16
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_une
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_ueq
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_ugt
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_uge
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_ult
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_ule
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_uno
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_one
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_oeq
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_ogt
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_oge
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_olt
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_ole
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fcmp_ord
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fccmp
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_br_cc
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fptosi_i32
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fptosi_i64
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fptoui_i32
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fptoui_i64
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_uitofp_i32
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_uitofp_i64
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_sitofp_i32
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_sitofp_i64
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_uitofp_i32_fadd
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_sitofp_i32_fadd
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fptrunc_float
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fptrunc_double
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fpext_float
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fpext_double
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_sqrt
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_powi
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_sin
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_cos
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_tan
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_acos
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_asin
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_atan
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_atan2
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_cosh
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_sinh
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_tanh
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_pow
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_exp
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_exp2
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_log
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_log10
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_log2
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fma
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fabs
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_minnum
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_maxnum
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_copysign
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_copysign_f32
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_copysign_f64
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_copysign_extended
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_floor
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_ceil
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_trunc
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_rint
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_nearbyint
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_round
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_roundeven
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for test_fmuladd
define bfloat @test_fadd(bfloat %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_fadd:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fadd s0, s0, s1
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_fadd:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fadd s0, s0, s1
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = fadd bfloat %a, %b
ret bfloat %r
}
define bfloat @test_fsub(bfloat %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_fsub:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fsub s0, s0, s1
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_fsub:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fsub s0, s0, s1
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = fsub bfloat %a, %b
ret bfloat %r
}
define bfloat @test_fmul(bfloat %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_fmul:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fmul s0, s0, s1
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_fmul:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fmul s0, s0, s1
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = fmul bfloat %a, %b
ret bfloat %r
}
define bfloat @test_fmadd(bfloat %a, bfloat %b, bfloat %c) #0 {
; CHECK-CVT-LABEL: test_fmadd:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w10, #32767 // =0x7fff
; CHECK-CVT-NEXT: // kill: def $h2 killed $h2 def $d2
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fmul s0, s0, s1
; CHECK-CVT-NEXT: shll v1.4s, v2.4h, #16
; CHECK-CVT-NEXT: fmov w8, s0
; CHECK-CVT-NEXT: ubfx w9, w8, #16, #1
; CHECK-CVT-NEXT: add w8, w8, w10
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fadd s0, s0, s1
; CHECK-CVT-NEXT: fmov w8, s0
; CHECK-CVT-NEXT: ubfx w9, w8, #16, #1
; CHECK-CVT-NEXT: add w8, w8, w10
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_fmadd:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h2 killed $h2 def $d2
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: shll v2.4s, v2.4h, #16
; CHECK-BF16-NEXT: fmadd s0, s0, s1, s2
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%mul = fmul fast bfloat %a, %b
%r = fadd fast bfloat %mul, %c
ret bfloat %r
}
define bfloat @test_fdiv(bfloat %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_fdiv:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fdiv s0, s0, s1
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_fdiv:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fdiv s0, s0, s1
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = fdiv bfloat %a, %b
ret bfloat %r
}
define bfloat @test_frem(bfloat %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_frem:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: // kill: def $s1 killed $s1 killed $q1
; CHECK-CVT-NEXT: bl fmodf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_frem:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: // kill: def $s1 killed $s1 killed $q1
; CHECK-BF16-NEXT: bl fmodf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = frem bfloat %a, %b
ret bfloat %r
}
define void @test_store(bfloat %a, ptr %b) #0 {
; CHECK-LABEL: test_store:
; CHECK: // %bb.0:
; CHECK-NEXT: str h0, [x0]
; CHECK-NEXT: ret
store bfloat %a, ptr %b
ret void
}
define bfloat @test_load(ptr %a) #0 {
; CHECK-LABEL: test_load:
; CHECK: // %bb.0:
; CHECK-NEXT: ldr h0, [x0]
; CHECK-NEXT: ret
%r = load bfloat, ptr %a
ret bfloat %r
}
declare bfloat @test_callee(bfloat %a, bfloat %b) #0
define bfloat @test_call(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_call:
; CHECK: // %bb.0:
; CHECK-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-NEXT: bl test_callee
; CHECK-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-NEXT: ret
%r = call bfloat @test_callee(bfloat %a, bfloat %b)
ret bfloat %r
}
define bfloat @test_call_flipped(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_call_flipped:
; CHECK: // %bb.0:
; CHECK-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-NEXT: fmov s2, s0
; CHECK-NEXT: fmov s0, s1
; CHECK-NEXT: fmov s1, s2
; CHECK-NEXT: bl test_callee
; CHECK-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-NEXT: ret
%r = call bfloat @test_callee(bfloat %b, bfloat %a)
ret bfloat %r
}
define bfloat @test_tailcall_flipped(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_tailcall_flipped:
; CHECK: // %bb.0:
; CHECK-NEXT: fmov s2, s0
; CHECK-NEXT: fmov s0, s1
; CHECK-NEXT: fmov s1, s2
; CHECK-NEXT: b test_callee
%r = tail call bfloat @test_callee(bfloat %b, bfloat %a)
ret bfloat %r
}
define bfloat @test_select(bfloat %a, bfloat %b, i1 zeroext %c) #0 {
; CHECK-CVT-LABEL: test_select:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $s0
; CHECK-CVT-NEXT: cmp w0, #0
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $s1
; CHECK-CVT-NEXT: fcsel s0, s0, s1, ne
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-SD-LABEL: test_select:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: // kill: def $h0 killed $h0 def $s0
; CHECK-SD-NEXT: cmp w0, #0
; CHECK-SD-NEXT: // kill: def $h1 killed $h1 def $s1
; CHECK-SD-NEXT: fcsel s0, s0, s1, ne
; CHECK-SD-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: test_select:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 def $s0
; CHECK-GI-NEXT: // kill: def $h1 killed $h1 def $s1
; CHECK-GI-NEXT: fmov w8, s0
; CHECK-GI-NEXT: fmov w9, s1
; CHECK-GI-NEXT: tst w0, #0x1
; CHECK-GI-NEXT: csel w8, w8, w9, ne
; CHECK-GI-NEXT: fmov s0, w8
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-GI-NEXT: ret
%r = select i1 %c, bfloat %a, bfloat %b
ret bfloat %r
}
define bfloat @test_select_cc(bfloat %a, bfloat %b, bfloat %c, bfloat %d) #0 {
; CHECK-CVT-LABEL: test_select_cc:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h3 killed $h3 def $d3
; CHECK-CVT-NEXT: // kill: def $h2 killed $h2 def $d2
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $s0
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $s1
; CHECK-CVT-NEXT: shll v3.4s, v3.4h, #16
; CHECK-CVT-NEXT: shll v2.4s, v2.4h, #16
; CHECK-CVT-NEXT: fcmp s2, s3
; CHECK-CVT-NEXT: fcsel s0, s0, s1, ne
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-SD-LABEL: test_select_cc:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: // kill: def $h3 killed $h3 def $d3
; CHECK-SD-NEXT: // kill: def $h2 killed $h2 def $d2
; CHECK-SD-NEXT: // kill: def $h0 killed $h0 def $s0
; CHECK-SD-NEXT: // kill: def $h1 killed $h1 def $s1
; CHECK-SD-NEXT: shll v3.4s, v3.4h, #16
; CHECK-SD-NEXT: shll v2.4s, v2.4h, #16
; CHECK-SD-NEXT: fcmp s2, s3
; CHECK-SD-NEXT: fcsel s0, s0, s1, ne
; CHECK-SD-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: test_select_cc:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: // kill: def $h3 killed $h3 def $d3
; CHECK-GI-NEXT: // kill: def $h2 killed $h2 def $d2
; CHECK-GI-NEXT: shll v3.4s, v3.4h, #16
; CHECK-GI-NEXT: shll v2.4s, v2.4h, #16
; CHECK-GI-NEXT: fcmp s2, s3
; CHECK-GI-NEXT: fcsel h0, h0, h1, ne
; CHECK-GI-NEXT: ret
%cc = fcmp une bfloat %c, %d
%r = select i1 %cc, bfloat %a, bfloat %b
ret bfloat %r
}
define float @test_select_cc_f32_f16(float %a, float %b, bfloat %c, bfloat %d) #0 {
; CHECK-LABEL: test_select_cc_f32_f16:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h3 killed $h3 def $d3
; CHECK-NEXT: // kill: def $h2 killed $h2 def $d2
; CHECK-NEXT: shll v3.4s, v3.4h, #16
; CHECK-NEXT: shll v2.4s, v2.4h, #16
; CHECK-NEXT: fcmp s2, s3
; CHECK-NEXT: fcsel s0, s0, s1, ne
; CHECK-NEXT: ret
%cc = fcmp une bfloat %c, %d
%r = select i1 %cc, float %a, float %b
ret float %r
}
define bfloat @test_select_cc_f16_f32(bfloat %a, bfloat %b, float %c, float %d) #0 {
; CHECK-CVT-LABEL: test_select_cc_f16_f32:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: fcmp s2, s3
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $s0
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $s1
; CHECK-CVT-NEXT: fcsel s0, s0, s1, ne
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-SD-LABEL: test_select_cc_f16_f32:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: fcmp s2, s3
; CHECK-SD-NEXT: // kill: def $h0 killed $h0 def $s0
; CHECK-SD-NEXT: // kill: def $h1 killed $h1 def $s1
; CHECK-SD-NEXT: fcsel s0, s0, s1, ne
; CHECK-SD-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: test_select_cc_f16_f32:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 def $s0
; CHECK-GI-NEXT: // kill: def $h1 killed $h1 def $s1
; CHECK-GI-NEXT: fcmp s2, s3
; CHECK-GI-NEXT: fmov w8, s0
; CHECK-GI-NEXT: fmov w9, s1
; CHECK-GI-NEXT: csel w8, w8, w9, ne
; CHECK-GI-NEXT: fmov s0, w8
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-GI-NEXT: ret
%cc = fcmp une float %c, %d
%r = select i1 %cc, bfloat %a, bfloat %b
ret bfloat %r
}
define i1 @test_fcmp_une(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_une:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, ne
; CHECK-NEXT: ret
%r = fcmp une bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_ueq(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_ueq:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w8, eq
; CHECK-NEXT: csinc w0, w8, wzr, vc
; CHECK-NEXT: ret
%r = fcmp ueq bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_ugt(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_ugt:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, hi
; CHECK-NEXT: ret
%r = fcmp ugt bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_uge(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_uge:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, pl
; CHECK-NEXT: ret
%r = fcmp uge bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_ult(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_ult:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, lt
; CHECK-NEXT: ret
%r = fcmp ult bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_ule(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_ule:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, le
; CHECK-NEXT: ret
%r = fcmp ule bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_uno(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_uno:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, vs
; CHECK-NEXT: ret
%r = fcmp uno bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_one(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_one:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w8, mi
; CHECK-NEXT: csinc w0, w8, wzr, le
; CHECK-NEXT: ret
%r = fcmp one bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_oeq(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_oeq:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, eq
; CHECK-NEXT: ret
%r = fcmp oeq bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_ogt(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_ogt:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, gt
; CHECK-NEXT: ret
%r = fcmp ogt bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_oge(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_oge:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, ge
; CHECK-NEXT: ret
%r = fcmp oge bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_olt(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_olt:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, mi
; CHECK-NEXT: ret
%r = fcmp olt bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_ole(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_ole:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, ls
; CHECK-NEXT: ret
%r = fcmp ole bfloat %a, %b
ret i1 %r
}
define i1 @test_fcmp_ord(bfloat %a, bfloat %b) #0 {
; CHECK-LABEL: test_fcmp_ord:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: cset w0, vc
; CHECK-NEXT: ret
%r = fcmp ord bfloat %a, %b
ret i1 %r
}
define void @test_fccmp(bfloat %in, ptr %out) {
; CHECK-CVT-LABEL: test_fccmp:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: movi v1.2s, #69, lsl #24
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v2.4s, v0.4h, #16
; CHECK-CVT-NEXT: adrp x8, .LCPI29_0
; CHECK-CVT-NEXT: movi v3.2s, #72, lsl #24
; CHECK-CVT-NEXT: fcmp s2, s1
; CHECK-CVT-NEXT: ldr h1, [x8, :lo12:.LCPI29_0]
; CHECK-CVT-NEXT: fccmp s2, s3, #4, mi
; CHECK-CVT-NEXT: fcsel s0, s0, s1, gt
; CHECK-CVT-NEXT: str h0, [x0]
; CHECK-CVT-NEXT: ret
;
; CHECK-SD-LABEL: test_fccmp:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: movi v1.2s, #69, lsl #24
; CHECK-SD-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-SD-NEXT: shll v2.4s, v0.4h, #16
; CHECK-SD-NEXT: adrp x8, .LCPI29_0
; CHECK-SD-NEXT: movi v3.2s, #72, lsl #24
; CHECK-SD-NEXT: fcmp s2, s1
; CHECK-SD-NEXT: ldr h1, [x8, :lo12:.LCPI29_0]
; CHECK-SD-NEXT: fccmp s2, s3, #4, mi
; CHECK-SD-NEXT: fcsel s0, s0, s1, gt
; CHECK-SD-NEXT: str h0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: test_fccmp:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: movi v1.2s, #69, lsl #24
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-GI-NEXT: shll v2.4s, v0.4h, #16
; CHECK-GI-NEXT: movi v3.2s, #72, lsl #24
; CHECK-GI-NEXT: fcmp s2, s1
; CHECK-GI-NEXT: fmov h1, #5.00000000
; CHECK-GI-NEXT: fccmp s2, s3, #4, mi
; CHECK-GI-NEXT: fcsel h0, h0, h1, gt
; CHECK-GI-NEXT: str h0, [x0]
; CHECK-GI-NEXT: ret
%cmp1 = fcmp ogt bfloat %in, 0xR4800
%cmp2 = fcmp olt bfloat %in, 0xR4500
%cond = and i1 %cmp1, %cmp2
%result = select i1 %cond, bfloat %in, bfloat 0xR4500
store bfloat %result, ptr %out
ret void
}
define void @test_br_cc(bfloat %a, bfloat %b, ptr %p1, ptr %p2) #0 {
; CHECK-LABEL: test_br_cc:
; CHECK: // %bb.0: // %common.ret
; CHECK-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v1.4s, v1.4h, #16
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcmp s0, s1
; CHECK-NEXT: csel x8, x0, x1, pl
; CHECK-NEXT: str wzr, [x8]
; CHECK-NEXT: ret
%c = fcmp uge bfloat %a, %b
br i1 %c, label %then, label %else
then:
store i32 0, ptr %p1
ret void
else:
store i32 0, ptr %p2
ret void
}
define bfloat @test_phi(ptr %p1) #0 {
; CHECK-LABEL: test_phi:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: stp d9, d8, [sp, #-32]! // 16-byte Folded Spill
; CHECK-NEXT: ldr h9, [x0]
; CHECK-NEXT: stp x30, x19, [sp, #16] // 16-byte Folded Spill
; CHECK-NEXT: mov x19, x0
; CHECK-NEXT: .LBB31_1: // %loop
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
; CHECK-NEXT: fmov s8, s9
; CHECK-NEXT: ldr h9, [x19]
; CHECK-NEXT: mov x0, x19
; CHECK-NEXT: bl test_dummy
; CHECK-NEXT: tbnz w0, #0, .LBB31_1
; CHECK-NEXT: // %bb.2: // %return
; CHECK-NEXT: ldp x30, x19, [sp, #16] // 16-byte Folded Reload
; CHECK-NEXT: fmov s0, s8
; CHECK-NEXT: ldp d9, d8, [sp], #32 // 16-byte Folded Reload
; CHECK-NEXT: ret
entry:
%a = load bfloat, ptr %p1
br label %loop
loop:
%r = phi bfloat [%a, %entry], [%b, %loop]
%b = load bfloat, ptr %p1
%c = call i1 @test_dummy(ptr %p1)
br i1 %c, label %loop, label %return
return:
ret bfloat %r
}
declare i1 @test_dummy(ptr %p1) #0
define i32 @test_fptosi_i32(bfloat %a) #0 {
; CHECK-LABEL: test_fptosi_i32:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcvtzs w0, s0
; CHECK-NEXT: ret
%r = fptosi bfloat %a to i32
ret i32 %r
}
define i64 @test_fptosi_i64(bfloat %a) #0 {
; CHECK-LABEL: test_fptosi_i64:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcvtzs x0, s0
; CHECK-NEXT: ret
%r = fptosi bfloat %a to i64
ret i64 %r
}
define i32 @test_fptoui_i32(bfloat %a) #0 {
; CHECK-LABEL: test_fptoui_i32:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcvtzu w0, s0
; CHECK-NEXT: ret
%r = fptoui bfloat %a to i32
ret i32 %r
}
define i64 @test_fptoui_i64(bfloat %a) #0 {
; CHECK-LABEL: test_fptoui_i64:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcvtzu x0, s0
; CHECK-NEXT: ret
%r = fptoui bfloat %a to i64
ret i64 %r
}
define bfloat @test_uitofp_i32(i32 %a) #0 {
; CHECK-CVT-LABEL: test_uitofp_i32:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: ucvtf d0, w0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: fcvtxn s0, d0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_uitofp_i32:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: ucvtf d0, w0
; CHECK-BF16-NEXT: fcvtxn s0, d0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = uitofp i32 %a to bfloat
ret bfloat %r
}
define bfloat @test_uitofp_i64(i64 %a) #0 {
; CHECK-CVT-LABEL: test_uitofp_i64:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: lsr x9, x0, #53
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: cmp x9, #0
; CHECK-CVT-NEXT: and x9, x0, #0xfffffffffffff000
; CHECK-CVT-NEXT: csel x9, x9, x0, ne
; CHECK-CVT-NEXT: ucvtf d0, x9
; CHECK-CVT-NEXT: cset w9, ne
; CHECK-CVT-NEXT: tst x0, #0xfff
; CHECK-CVT-NEXT: csel w9, wzr, w9, eq
; CHECK-CVT-NEXT: fmov x10, d0
; CHECK-CVT-NEXT: orr x9, x10, x9
; CHECK-CVT-NEXT: fmov d0, x9
; CHECK-CVT-NEXT: fcvtxn s0, d0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_uitofp_i64:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: lsr x8, x0, #53
; CHECK-BF16-NEXT: and x9, x0, #0xfffffffffffff000
; CHECK-BF16-NEXT: cmp x8, #0
; CHECK-BF16-NEXT: csel x8, x9, x0, ne
; CHECK-BF16-NEXT: ucvtf d0, x8
; CHECK-BF16-NEXT: cset w8, ne
; CHECK-BF16-NEXT: tst x0, #0xfff
; CHECK-BF16-NEXT: csel w8, wzr, w8, eq
; CHECK-BF16-NEXT: fmov x9, d0
; CHECK-BF16-NEXT: orr x8, x9, x8
; CHECK-BF16-NEXT: fmov d0, x8
; CHECK-BF16-NEXT: fcvtxn s0, d0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = uitofp i64 %a to bfloat
ret bfloat %r
}
define bfloat @test_sitofp_i32(i32 %a) #0 {
; CHECK-CVT-LABEL: test_sitofp_i32:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: scvtf d0, w0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: fcvtxn s0, d0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_sitofp_i32:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: scvtf d0, w0
; CHECK-BF16-NEXT: fcvtxn s0, d0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = sitofp i32 %a to bfloat
ret bfloat %r
}
define bfloat @test_sitofp_i64(i64 %a) #0 {
; CHECK-CVT-LABEL: test_sitofp_i64:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: cmp x0, #0
; CHECK-CVT-NEXT: and x11, x0, #0x8000000000000000
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: cneg x9, x0, mi
; CHECK-CVT-NEXT: lsr x10, x9, #53
; CHECK-CVT-NEXT: cmp x10, #0
; CHECK-CVT-NEXT: and x10, x9, #0xfffffffffffff000
; CHECK-CVT-NEXT: csel x10, x10, x9, ne
; CHECK-CVT-NEXT: scvtf d0, x10
; CHECK-CVT-NEXT: cset w10, ne
; CHECK-CVT-NEXT: tst x9, #0xfff
; CHECK-CVT-NEXT: csel w10, wzr, w10, eq
; CHECK-CVT-NEXT: fmov x9, d0
; CHECK-CVT-NEXT: orr x9, x9, x11
; CHECK-CVT-NEXT: orr x9, x9, x10
; CHECK-CVT-NEXT: fmov d0, x9
; CHECK-CVT-NEXT: fcvtxn s0, d0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_sitofp_i64:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: cmp x0, #0
; CHECK-BF16-NEXT: cneg x8, x0, mi
; CHECK-BF16-NEXT: lsr x9, x8, #53
; CHECK-BF16-NEXT: and x10, x8, #0xfffffffffffff000
; CHECK-BF16-NEXT: cmp x9, #0
; CHECK-BF16-NEXT: csel x9, x10, x8, ne
; CHECK-BF16-NEXT: and x10, x0, #0x8000000000000000
; CHECK-BF16-NEXT: cset w11, ne
; CHECK-BF16-NEXT: scvtf d0, x9
; CHECK-BF16-NEXT: tst x8, #0xfff
; CHECK-BF16-NEXT: fmov x9, d0
; CHECK-BF16-NEXT: orr x8, x9, x10
; CHECK-BF16-NEXT: csel w9, wzr, w11, eq
; CHECK-BF16-NEXT: orr x8, x8, x9
; CHECK-BF16-NEXT: fmov d0, x8
; CHECK-BF16-NEXT: fcvtxn s0, d0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = sitofp i64 %a to bfloat
ret bfloat %r
}
define bfloat @test_uitofp_i32_fadd(i32 %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_uitofp_i32_fadd:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: ucvtf d1, w0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fcvtxn s1, d1
; CHECK-CVT-NEXT: fmov w9, s1
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w9, w9, w8
; CHECK-CVT-NEXT: add w9, w10, w9
; CHECK-CVT-NEXT: lsr w9, w9, #16
; CHECK-CVT-NEXT: fmov s1, w9
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: fadd s0, s0, s1
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_uitofp_i32_fadd:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: ucvtf d1, w0
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fcvtxn s1, d1
; CHECK-BF16-NEXT: bfcvt h1, s1
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: fadd s0, s0, s1
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%c = uitofp i32 %a to bfloat
%r = fadd bfloat %b, %c
ret bfloat %r
}
define bfloat @test_sitofp_i32_fadd(i32 %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_sitofp_i32_fadd:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: scvtf d1, w0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fcvtxn s1, d1
; CHECK-CVT-NEXT: fmov w9, s1
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w9, w9, w8
; CHECK-CVT-NEXT: add w9, w10, w9
; CHECK-CVT-NEXT: lsr w9, w9, #16
; CHECK-CVT-NEXT: fmov s1, w9
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: fadd s0, s0, s1
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_sitofp_i32_fadd:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: scvtf d1, w0
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fcvtxn s1, d1
; CHECK-BF16-NEXT: bfcvt h1, s1
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: fadd s0, s0, s1
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%c = sitofp i32 %a to bfloat
%r = fadd bfloat %b, %c
ret bfloat %r
}
define bfloat @test_fptrunc_float(float %a) #0 {
; CHECK-CVT-LABEL: test_fptrunc_float:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: fcmp s0, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: orr w9, w9, #0x400000
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: csel w8, w9, w8, vs
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_fptrunc_float:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = fptrunc float %a to bfloat
ret bfloat %r
}
define bfloat @test_fptrunc_double(double %a) #0 {
; CHECK-CVT-LABEL: test_fptrunc_double:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: fcvtxn s0, d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_fptrunc_double:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: fcvtxn s0, d0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = fptrunc double %a to bfloat
ret bfloat %r
}
define float @test_fpext_float(bfloat %a) #0 {
; CHECK-LABEL: test_fpext_float:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-NEXT: ret
%r = fpext bfloat %a to float
ret float %r
}
define double @test_fpext_double(bfloat %a) #0 {
; CHECK-LABEL: test_fpext_double:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-NEXT: shll v0.4s, v0.4h, #16
; CHECK-NEXT: fcvt d0, s0
; CHECK-NEXT: ret
%r = fpext bfloat %a to double
ret double %r
}
define i16 @test_bitcast_bfloattoi16(bfloat %a) #0 {
; CHECK-LABEL: test_bitcast_bfloattoi16:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h0 killed $h0 def $s0
; CHECK-NEXT: fmov w0, s0
; CHECK-NEXT: ret
%r = bitcast bfloat %a to i16
ret i16 %r
}
define bfloat @test_bitcast_i16tobfloat(i16 %a) #0 {
; CHECK-LABEL: test_bitcast_i16tobfloat:
; CHECK: // %bb.0:
; CHECK-NEXT: fmov s0, w0
; CHECK-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-NEXT: ret
%r = bitcast i16 %a to bfloat
ret bfloat %r
}
declare bfloat @llvm.sqrt.f16(bfloat %a) #0
declare bfloat @llvm.powi.f16.i32(bfloat %a, i32 %b) #0
declare bfloat @llvm.sin.f16(bfloat %a) #0
declare bfloat @llvm.cos.f16(bfloat %a) #0
declare bfloat @llvm.tan.f16(bfloat %a) #0
declare bfloat @llvm.asin.f16(bfloat %a) #0
declare bfloat @llvm.acos.f16(bfloat %a) #0
declare bfloat @llvm.atan.f16(bfloat %a) #0
declare bfloat @llvm.atan2.f16(bfloat %a, bfloat %b) #0
declare bfloat @llvm.sinh.f16(bfloat %a) #0
declare bfloat @llvm.cosh.f16(bfloat %a) #0
declare bfloat @llvm.tanh.f16(bfloat %a) #0
declare bfloat @llvm.pow.f16(bfloat %a, bfloat %b) #0
declare bfloat @llvm.exp.f16(bfloat %a) #0
declare bfloat @llvm.exp2.f16(bfloat %a) #0
declare bfloat @llvm.log.f16(bfloat %a) #0
declare bfloat @llvm.log10.f16(bfloat %a) #0
declare bfloat @llvm.log2.f16(bfloat %a) #0
declare bfloat @llvm.fma.f16(bfloat %a, bfloat %b, bfloat %c) #0
declare bfloat @llvm.fabs.f16(bfloat %a) #0
declare bfloat @llvm.minnum.f16(bfloat %a, bfloat %b) #0
declare bfloat @llvm.maxnum.f16(bfloat %a, bfloat %b) #0
declare bfloat @llvm.copysign.f16(bfloat %a, bfloat %b) #0
declare bfloat @llvm.floor.f16(bfloat %a) #0
declare bfloat @llvm.ceil.f16(bfloat %a) #0
declare bfloat @llvm.trunc.f16(bfloat %a) #0
declare bfloat @llvm.rint.f16(bfloat %a) #0
declare bfloat @llvm.nearbyint.f16(bfloat %a) #0
declare bfloat @llvm.round.f16(bfloat %a) #0
declare bfloat @llvm.roundeven.f16(bfloat %a) #0
declare bfloat @llvm.fmuladd.f16(bfloat %a, bfloat %b, bfloat %c) #0
define bfloat @test_sqrt(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_sqrt:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fsqrt s0, s0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_sqrt:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fsqrt s0, s0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.sqrt.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_powi(bfloat %a, i32 %b) #0 {
; CHECK-CVT-LABEL: test_powi:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl __powisf2
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_powi:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl __powisf2
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.powi.f16.i32(bfloat %a, i32 %b)
ret bfloat %r
}
define bfloat @test_sin(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_sin:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl sinf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_sin:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl sinf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.sin.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_cos(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_cos:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl cosf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_cos:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl cosf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.cos.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_tan(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_tan:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl tanf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_tan:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl tanf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.tan.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_acos(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_acos:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl acosf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_acos:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl acosf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.acos.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_asin(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_asin:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl asinf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_asin:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl asinf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.asin.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_atan(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_atan:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl atanf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_atan:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl atanf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.atan.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_atan2(bfloat %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_atan2:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: // kill: def $s1 killed $s1 killed $q1
; CHECK-CVT-NEXT: bl atan2f
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_atan2:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: // kill: def $s1 killed $s1 killed $q1
; CHECK-BF16-NEXT: bl atan2f
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.atan2.f16(bfloat %a, bfloat %b)
ret bfloat %r
}
define bfloat @test_cosh(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_cosh:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl coshf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_cosh:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl coshf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.cosh.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_sinh(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_sinh:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl sinhf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_sinh:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl sinhf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.sinh.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_tanh(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_tanh:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl tanhf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_tanh:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl tanhf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.tanh.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_pow(bfloat %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_pow:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: // kill: def $s1 killed $s1 killed $q1
; CHECK-CVT-NEXT: bl powf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_pow:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: // kill: def $s1 killed $s1 killed $q1
; CHECK-BF16-NEXT: bl powf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.pow.f16(bfloat %a, bfloat %b)
ret bfloat %r
}
define bfloat @test_exp(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_exp:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl expf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_exp:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl expf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.exp.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_exp2(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_exp2:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl exp2f
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_exp2:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl exp2f
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.exp2.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_log(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_log:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl logf
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_log:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl logf
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.log.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_log10(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_log10:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl log10f
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_log10:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl log10f
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.log10.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_log2(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_log2:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: bl log2f
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_log2:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: str x30, [sp, #-16]! // 8-byte Folded Spill
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-BF16-NEXT: bl log2f
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ldr x30, [sp], #16 // 8-byte Folded Reload
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.log2.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_fma(bfloat %a, bfloat %b, bfloat %c) #0 {
; CHECK-CVT-LABEL: test_fma:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h2 killed $h2 def $d2
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w10, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v2.4s, v2.4h, #16
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fmadd s0, s0, s1, s2
; CHECK-CVT-NEXT: fmov w8, s0
; CHECK-CVT-NEXT: ubfx w9, w8, #16, #1
; CHECK-CVT-NEXT: add w8, w8, w10
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_fma:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h2 killed $h2 def $d2
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v2.4s, v2.4h, #16
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fmadd s0, s0, s1, s2
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.fma.f16(bfloat %a, bfloat %b, bfloat %c)
ret bfloat %r
}
define bfloat @test_fabs(bfloat %a) #0 {
; CHECK-LABEL: test_fabs:
; CHECK: // %bb.0:
; CHECK-NEXT: // kill: def $h0 killed $h0 def $s0
; CHECK-NEXT: fmov w8, s0
; CHECK-NEXT: and w8, w8, #0x7fff
; CHECK-NEXT: fmov s0, w8
; CHECK-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-NEXT: ret
%r = call bfloat @llvm.fabs.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_minnum(bfloat %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_minnum:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fminnm s0, s0, s1
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_minnum:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fminnm s0, s0, s1
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.minnum.f16(bfloat %a, bfloat %b)
ret bfloat %r
}
define bfloat @test_maxnum(bfloat %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_maxnum:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fmaxnm s0, s0, s1
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_maxnum:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fmaxnm s0, s0, s1
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.maxnum.f16(bfloat %a, bfloat %b)
ret bfloat %r
}
define bfloat @test_copysign(bfloat %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_copysign:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mvni v2.4s, #128, lsl #24
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-CVT-NEXT: fmov w8, s0
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-SD-LABEL: test_copysign:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-SD-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-SD-NEXT: mvni v2.4s, #128, lsl #24
; CHECK-SD-NEXT: shll v1.4s, v1.4h, #16
; CHECK-SD-NEXT: shll v0.4s, v0.4h, #16
; CHECK-SD-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-SD-NEXT: bfcvt h0, s0
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: test_copysign:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: mvni v2.8h, #128, lsl #8
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 def $q0
; CHECK-GI-NEXT: // kill: def $h1 killed $h1 def $q1
; CHECK-GI-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 killed $q0
; CHECK-GI-NEXT: ret
%r = call bfloat @llvm.copysign.f16(bfloat %a, bfloat %b)
ret bfloat %r
}
define bfloat @test_copysign_f32(bfloat %a, float %b) #0 {
; CHECK-CVT-LABEL: test_copysign_f32:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mvni v2.4s, #128, lsl #24
; CHECK-CVT-NEXT: // kill: def $s1 killed $s1 def $q1
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-CVT-NEXT: fmov w8, s0
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-SD-LABEL: test_copysign_f32:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-SD-NEXT: mvni v2.4s, #128, lsl #24
; CHECK-SD-NEXT: // kill: def $s1 killed $s1 def $q1
; CHECK-SD-NEXT: shll v0.4s, v0.4h, #16
; CHECK-SD-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-SD-NEXT: bfcvt h0, s0
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: test_copysign_f32:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: bfcvt h1, s1
; CHECK-GI-NEXT: mvni v2.8h, #128, lsl #8
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 def $q0
; CHECK-GI-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 killed $q0
; CHECK-GI-NEXT: ret
%tb = fptrunc float %b to bfloat
%r = call bfloat @llvm.copysign.f16(bfloat %a, bfloat %tb)
ret bfloat %r
}
define bfloat @test_copysign_f64(bfloat %a, double %b) #0 {
; CHECK-CVT-LABEL: test_copysign_f64:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: fcvt s1, d1
; CHECK-CVT-NEXT: mvni v2.4s, #128, lsl #24
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-CVT-NEXT: fmov w8, s0
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-SD-LABEL: test_copysign_f64:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-SD-NEXT: fcvt s1, d1
; CHECK-SD-NEXT: mvni v2.4s, #128, lsl #24
; CHECK-SD-NEXT: shll v0.4s, v0.4h, #16
; CHECK-SD-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-SD-NEXT: bfcvt h0, s0
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: test_copysign_f64:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: fcvtxn s1, d1
; CHECK-GI-NEXT: mvni v2.8h, #128, lsl #8
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 def $q0
; CHECK-GI-NEXT: bfcvt h1, s1
; CHECK-GI-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 killed $q0
; CHECK-GI-NEXT: ret
%tb = fptrunc double %b to bfloat
%r = call bfloat @llvm.copysign.f16(bfloat %a, bfloat %tb)
ret bfloat %r
}
; away the (fpext (fp_round <result>)) here.
define float @test_copysign_extended(bfloat %a, bfloat %b) #0 {
; CHECK-CVT-LABEL: test_copysign_extended:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mvni v2.4s, #128, lsl #24
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-CVT-NEXT: fmov w8, s0
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-CVT-NEXT: ret
;
; CHECK-SD-LABEL: test_copysign_extended:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-SD-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-SD-NEXT: mvni v2.4s, #128, lsl #24
; CHECK-SD-NEXT: shll v1.4s, v1.4h, #16
; CHECK-SD-NEXT: shll v0.4s, v0.4h, #16
; CHECK-SD-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-SD-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: test_copysign_extended:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: mvni v2.8h, #128, lsl #8
; CHECK-GI-NEXT: // kill: def $h0 killed $h0 def $q0
; CHECK-GI-NEXT: // kill: def $h1 killed $h1 def $q1
; CHECK-GI-NEXT: bif v0.16b, v1.16b, v2.16b
; CHECK-GI-NEXT: shll v0.4s, v0.4h, #16
; CHECK-GI-NEXT: // kill: def $s0 killed $s0 killed $q0
; CHECK-GI-NEXT: ret
%r = call bfloat @llvm.copysign.f16(bfloat %a, bfloat %b)
%xr = fpext bfloat %r to float
ret float %xr
}
define bfloat @test_floor(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_floor:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: frintm s0, s0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_floor:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: frintm s0, s0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.floor.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_ceil(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_ceil:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: frintp s0, s0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_ceil:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: frintp s0, s0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.ceil.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_trunc(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_trunc:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: frintz s0, s0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_trunc:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: frintz s0, s0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.trunc.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_rint(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_rint:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: frintx s0, s0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_rint:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: frintx s0, s0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.rint.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_nearbyint(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_nearbyint:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: frinti s0, s0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_nearbyint:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: frinti s0, s0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.nearbyint.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_round(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_round:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: frinta s0, s0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_round:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: frinta s0, s0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.round.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_roundeven(bfloat %a) #0 {
; CHECK-CVT-LABEL: test_roundeven:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w8, #32767 // =0x7fff
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: frintn s0, s0
; CHECK-CVT-NEXT: fmov w9, s0
; CHECK-CVT-NEXT: ubfx w10, w9, #16, #1
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: add w8, w10, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_roundeven:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: frintn s0, s0
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.roundeven.f16(bfloat %a)
ret bfloat %r
}
define bfloat @test_fmuladd(bfloat %a, bfloat %b, bfloat %c) #0 {
; CHECK-CVT-LABEL: test_fmuladd:
; CHECK-CVT: // %bb.0:
; CHECK-CVT-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-CVT-NEXT: mov w10, #32767 // =0x7fff
; CHECK-CVT-NEXT: // kill: def $h2 killed $h2 def $d2
; CHECK-CVT-NEXT: shll v1.4s, v1.4h, #16
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fmul s0, s0, s1
; CHECK-CVT-NEXT: shll v1.4s, v2.4h, #16
; CHECK-CVT-NEXT: fmov w8, s0
; CHECK-CVT-NEXT: ubfx w9, w8, #16, #1
; CHECK-CVT-NEXT: add w8, w8, w10
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: shll v0.4s, v0.4h, #16
; CHECK-CVT-NEXT: fadd s0, s0, s1
; CHECK-CVT-NEXT: fmov w8, s0
; CHECK-CVT-NEXT: ubfx w9, w8, #16, #1
; CHECK-CVT-NEXT: add w8, w8, w10
; CHECK-CVT-NEXT: add w8, w9, w8
; CHECK-CVT-NEXT: lsr w8, w8, #16
; CHECK-CVT-NEXT: fmov s0, w8
; CHECK-CVT-NEXT: // kill: def $h0 killed $h0 killed $s0
; CHECK-CVT-NEXT: ret
;
; CHECK-BF16-LABEL: test_fmuladd:
; CHECK-BF16: // %bb.0:
; CHECK-BF16-NEXT: // kill: def $h1 killed $h1 def $d1
; CHECK-BF16-NEXT: // kill: def $h0 killed $h0 def $d0
; CHECK-BF16-NEXT: // kill: def $h2 killed $h2 def $d2
; CHECK-BF16-NEXT: shll v1.4s, v1.4h, #16
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fmul s0, s0, s1
; CHECK-BF16-NEXT: shll v1.4s, v2.4h, #16
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: shll v0.4s, v0.4h, #16
; CHECK-BF16-NEXT: fadd s0, s0, s1
; CHECK-BF16-NEXT: bfcvt h0, s0
; CHECK-BF16-NEXT: ret
%r = call bfloat @llvm.fmuladd.f16(bfloat %a, bfloat %b, bfloat %c)
ret bfloat %r
}
attributes #0 = { nounwind }