blob: 1d9414f9f40f344cadf3a7ac2ee329e6b9141018 [file] [edit]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 6
; RUN: llc -mtriple=amdgcn < %s | FileCheck %s
define i32 @v1i1(<1 x i1> %x) {
; CHECK-LABEL: v1i1:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: v_mov_b32_e32 v0, 0
; CHECK-NEXT: s_setpc_b64 s[30:31]
%y = call i32 @llvm.experimental.cttz.elts(<1 x i1> %x, i1 true)
ret i32 %y
}
define i32 @v4i1(<4 x i1> %x) {
; CHECK-LABEL: v4i1:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: v_and_b32_e32 v2, 1, v2
; CHECK-NEXT: v_and_b32_e32 v0, 1, v0
; CHECK-NEXT: v_and_b32_e32 v1, 1, v1
; CHECK-NEXT: v_cmp_eq_u32_e32 vcc, 1, v2
; CHECK-NEXT: v_cmp_ne_u32_e64 s[4:5], 1, v1
; CHECK-NEXT: v_cndmask_b32_e64 v1, 0, 1, s[4:5]
; CHECK-NEXT: v_add_i32_e64 v1, s[4:5], 1, v1
; CHECK-NEXT: v_cmp_eq_u32_e64 s[4:5], 1, v0
; CHECK-NEXT: s_xor_b64 s[6:7], vcc, -1
; CHECK-NEXT: v_cndmask_b32_e64 v0, 0, 1, s[6:7]
; CHECK-NEXT: s_xor_b64 s[6:7], s[4:5], -1
; CHECK-NEXT: v_cndmask_b32_e64 v2, 0, 1, s[6:7]
; CHECK-NEXT: v_cndmask_b32_e32 v0, 1, v0, vcc
; CHECK-NEXT: v_cndmask_b32_e64 v1, v1, v2, s[4:5]
; CHECK-NEXT: v_or_b32_e32 v0, 2, v0
; CHECK-NEXT: v_cmp_ne_u32_e32 vcc, 2, v1
; CHECK-NEXT: v_cndmask_b32_e32 v0, v0, v1, vcc
; CHECK-NEXT: s_setpc_b64 s[30:31]
%y = call i32 @llvm.experimental.cttz.elts(<4 x i1> %x, i1 true)
ret i32 %y
}
define i32 @v1i8(<1 x i8> %x) {
; CHECK-LABEL: v1i8:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: v_mov_b32_e32 v0, 0
; CHECK-NEXT: s_setpc_b64 s[30:31]
%y = call i32 @llvm.experimental.cttz.elts(<1 x i8> %x, i1 true)
ret i32 %y
}
define i32 @v4i8(<4 x i8> %x) {
; CHECK-LABEL: v4i8:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: v_and_b32_e32 v2, 0xff, v2
; CHECK-NEXT: v_and_b32_e32 v0, 0xff, v0
; CHECK-NEXT: v_and_b32_e32 v1, 0xff, v1
; CHECK-NEXT: v_cmp_eq_u32_e32 vcc, 0, v1
; CHECK-NEXT: v_addc_u32_e64 v1, s[4:5], 1, 0, vcc
; CHECK-NEXT: v_cmp_eq_u32_e32 vcc, 0, v0
; CHECK-NEXT: v_cndmask_b32_e64 v3, 0, 1, vcc
; CHECK-NEXT: v_cmp_eq_u32_e32 vcc, 0, v2
; CHECK-NEXT: v_cndmask_b32_e64 v4, 0, 1, vcc
; CHECK-NEXT: v_cmp_ne_u32_e32 vcc, 0, v0
; CHECK-NEXT: v_cndmask_b32_e32 v0, v1, v3, vcc
; CHECK-NEXT: v_cmp_ne_u32_e32 vcc, 0, v2
; CHECK-NEXT: v_cndmask_b32_e32 v1, 1, v4, vcc
; CHECK-NEXT: v_or_b32_e32 v1, 2, v1
; CHECK-NEXT: v_cmp_ne_u32_e32 vcc, 2, v0
; CHECK-NEXT: v_cndmask_b32_e32 v0, v1, v0, vcc
; CHECK-NEXT: s_setpc_b64 s[30:31]
%y = call i32 @llvm.experimental.cttz.elts(<4 x i8> %x, i1 true)
ret i32 %y
}