blob: 4bf2b8c7e6a578f7bdf51065c24c21e634f03db2 [file] [edit]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
; RUN: llc --mtriple=aarch64-unknown-linux-gnu < %s | FileCheck %s --check-prefixes=CHECK,CHECK-SD
; RUN: llc --mtriple=aarch64-unknown-linux-gnu < %s -global-isel | FileCheck %s --check-prefixes=CHECK,CHECK-GI
; Check that llc does not crash when compiling the following function.
; See https://github.com/llvm/llvm-project/issues/123029 for details.
; @fn - reproducer that mixes a <4 x half> and a scalar half "is ordered and
; non-zero" computation, the scalar one followed by llvm.copysign.f16.
;   %in  : source pointer; a <4 x half> is read at offset 0 and a half at
;          byte offset 8.
;   %out : destination pointer; results are written at the same offsets.
;   Returns a null pointer unconditionally.
; The assertion lines directly below the signature are autogenerated (see the
; NOTE at the top of the file); regenerate them with
; utils/update_llc_test_checks.py instead of editing them by hand.
define ptr @fn(ptr %in, ptr %out) {
; CHECK-SD-LABEL: fn:
; CHECK-SD: // %bb.0: // %fn
; CHECK-SD-NEXT: ldr d1, [x0]
; CHECK-SD-NEXT: movi v0.4h, #60, lsl #8
; CHECK-SD-NEXT: adrp x8, .LCPI0_0
; CHECK-SD-NEXT: fcvtl v1.4s, v1.4h
; CHECK-SD-NEXT: fcmgt v2.4s, v1.4s, #0.0
; CHECK-SD-NEXT: fcmlt v1.4s, v1.4s, #0.0
; CHECK-SD-NEXT: orr v1.16b, v1.16b, v2.16b
; CHECK-SD-NEXT: ldr h2, [x8, :lo12:.LCPI0_0]
; CHECK-SD-NEXT: xtn v1.4h, v1.4s
; CHECK-SD-NEXT: and v0.8b, v1.8b, v0.8b
; CHECK-SD-NEXT: movi d1, #0000000000000000
; CHECK-SD-NEXT: str d0, [x1]
; CHECK-SD-NEXT: ldr h0, [x0, #8]
; CHECK-SD-NEXT: mov x0, xzr
; CHECK-SD-NEXT: fcvt s0, h0
; CHECK-SD-NEXT: fcmp s0, #0.0
; CHECK-SD-NEXT: fcsel s1, s2, s1, mi
; CHECK-SD-NEXT: fcsel s1, s2, s1, gt
; CHECK-SD-NEXT: mvni v2.4s, #128, lsl #24
; CHECK-SD-NEXT: fcvt s1, h1
; CHECK-SD-NEXT: bit v0.16b, v1.16b, v2.16b
; CHECK-SD-NEXT: fcvt h0, s0
; CHECK-SD-NEXT: str h0, [x1, #8]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: fn:
; CHECK-GI: // %bb.0: // %fn
; CHECK-GI-NEXT: movi v0.2d, #0000000000000000
; CHECK-GI-NEXT: ldr d1, [x0]
; CHECK-GI-NEXT: fcvtl v1.4s, v1.4h
; CHECK-GI-NEXT: fcvtl v0.4s, v0.4h
; CHECK-GI-NEXT: fcmgt v2.4s, v1.4s, v0.4s
; CHECK-GI-NEXT: fcmgt v0.4s, v0.4s, v1.4s
; CHECK-GI-NEXT: movi v1.4s, #1
; CHECK-GI-NEXT: orr v0.16b, v0.16b, v2.16b
; CHECK-GI-NEXT: and v0.16b, v0.16b, v1.16b
; CHECK-GI-NEXT: mvni v1.4h, #128, lsl #8
; CHECK-GI-NEXT: ucvtf v0.4s, v0.4s
; CHECK-GI-NEXT: fcvtn v0.4h, v0.4s
; CHECK-GI-NEXT: str d0, [x1]
; CHECK-GI-NEXT: ldr h0, [x0, #8]
; CHECK-GI-NEXT: ldr h2, [x0, #8]
; CHECK-GI-NEXT: mov x0, xzr
; CHECK-GI-NEXT: fcvt s0, h0
; CHECK-GI-NEXT: fcmp s0, #0.0
; CHECK-GI-NEXT: cset w8, mi
; CHECK-GI-NEXT: cset w9, gt
; CHECK-GI-NEXT: orr w8, w8, w9
; CHECK-GI-NEXT: ucvtf s0, w8
; CHECK-GI-NEXT: fcvt h0, s0
; CHECK-GI-NEXT: bif v0.8b, v2.8b, v1.8b
; CHECK-GI-NEXT: str h0, [x1, #8]
; CHECK-GI-NEXT: ret
fn:
; Vector part: each lane of the <4 x half> at %in that is ordered and not equal
; to zero ("fcmp one") yields true; uitofp turns the i1 lanes into 1.0 / 0.0,
; so NaN and zero lanes become 0.0. The result is stored at %out.
%1 = load <4 x half>, ptr %in
%2 = fcmp one <4 x half> %1, zeroinitializer
%3 = uitofp <4 x i1> %2 to <4 x half>
store <4 x half> %3, ptr %out
; Scalar part: the half located 8 bytes past %in, i.e. right after the vector.
%4 = getelementptr inbounds nuw i8, ptr %in, i64 8
%5 = load half, ptr %4
; Same ordered-and-non-zero test as above, converted to 1.0 / 0.0.
%6 = fcmp one half %5, 0xH0000
%7 = uitofp i1 %6 to half
; Keep the 0.0 / 1.0 magnitude but take the sign bit from the loaded value %5.
%8 = call half @llvm.copysign.f16(half %7, half %5)
; Store the scalar result 8 bytes past %out, mirroring the input layout.
%9 = getelementptr inbounds nuw i8, ptr %out, i64 8
store half %8, ptr %9
; The returned pointer carries no information; it is always null.
ret ptr null
}
;; NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line:
; CHECK: {{.*}}