blob: 5ea55ef81d650be7eab541198e098d4944ca6cb3 [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
; RUN: llc -mcpu=v2 -mtriple=bpf < %s | FileCheck %s --check-prefixes=CHECK-V2
; RUN: llc -mcpu=v4 -mtriple=bpf < %s | FileCheck %s --check-prefixes=CHECK-V4
; Zero extension instructions should be eliminated at instruction
; selection phase for all test cases below.
; In BPF zero extension is implemented as &= or a pair of <<=/>>=
; instructions, hence simply check that &= and >>= do not exist in
; generated code (<<= remains because %c is used by both call and
; lshr in a few test cases).
define void @shl_lshr_same_bb(ptr %p) {
; CHECK-V2-LABEL: shl_lshr_same_bb:
; CHECK-V2: # %bb.0: # %entry
; CHECK-V2-NEXT: r1 = *(u8 *)(r1 + 0)
; CHECK-V2-NEXT: r5 = 1
; CHECK-V2-NEXT: if r1 == 0 goto LBB0_2
; CHECK-V2-NEXT: # %bb.1: # %entry
; CHECK-V2-NEXT: r5 = 0
; CHECK-V2-NEXT: LBB0_2: # %entry
; CHECK-V2-NEXT: r3 = r1
; CHECK-V2-NEXT: r3 <<= 56
; CHECK-V2-NEXT: r2 = r1
; CHECK-V2-NEXT: r4 = r1
; CHECK-V2-NEXT: call sink1
; CHECK-V2-NEXT: exit
;
; CHECK-V4-LABEL: shl_lshr_same_bb:
; CHECK-V4: # %bb.0: # %entry
; CHECK-V4-NEXT: w1 = *(u8 *)(r1 + 0)
; CHECK-V4-NEXT: w5 = 1
; CHECK-V4-NEXT: if w1 == 0 goto LBB0_2
; CHECK-V4-NEXT: # %bb.1: # %entry
; CHECK-V4-NEXT: w5 = 0
; CHECK-V4-NEXT: LBB0_2: # %entry
; CHECK-V4-NEXT: r3 = r1
; CHECK-V4-NEXT: r3 <<= 56
; CHECK-V4-NEXT: r2 = r1
; CHECK-V4-NEXT: r4 = r1
; CHECK-V4-NEXT: call sink1
; CHECK-V4-NEXT: exit
entry:
%a = load i8, ptr %p, align 1
%b = zext i8 %a to i64
%c = shl i64 %b, 56
%d = lshr i64 %c, 56
%e = icmp eq i64 %d, 0
; hasOneUse() is a common requirement for many CombineDAG
; transofmations, make sure that it does not matter in this case.
call void @sink1(i8 %a, i64 %b, i64 %c, i64 %d, i1 %e)
ret void
}
define void @shl_lshr_diff_bb(ptr %p) {
; CHECK-V2-LABEL: shl_lshr_diff_bb:
; CHECK-V2: # %bb.0: # %entry
; CHECK-V2-NEXT: r1 = *(u16 *)(r1 + 0)
; CHECK-V2-NEXT: r5 = 1
; CHECK-V2-NEXT: if r1 == 0 goto LBB1_2
; CHECK-V2-NEXT: # %bb.1: # %entry
; CHECK-V2-NEXT: r5 = 0
; CHECK-V2-NEXT: LBB1_2: # %entry
; CHECK-V2-NEXT: r3 = r1
; CHECK-V2-NEXT: r3 <<= 48
; CHECK-V2-NEXT: r2 = r1
; CHECK-V2-NEXT: r4 = r1
; CHECK-V2-NEXT: call sink2
; CHECK-V2-NEXT: exit
;
; CHECK-V4-LABEL: shl_lshr_diff_bb:
; CHECK-V4: # %bb.0: # %entry
; CHECK-V4-NEXT: w1 = *(u16 *)(r1 + 0)
; CHECK-V4-NEXT: w5 = 1
; CHECK-V4-NEXT: if w1 == 0 goto LBB1_2
; CHECK-V4-NEXT: # %bb.1: # %entry
; CHECK-V4-NEXT: w5 = 0
; CHECK-V4-NEXT: LBB1_2: # %entry
; CHECK-V4-NEXT: r3 = r1
; CHECK-V4-NEXT: r3 <<= 48
; CHECK-V4-NEXT: r2 = r1
; CHECK-V4-NEXT: r4 = r1
; CHECK-V4-NEXT: call sink2
; CHECK-V4-NEXT: exit
entry:
%a = load i16, ptr %p, align 2
%b = zext i16 %a to i64
%c = shl i64 %b, 48
%d = lshr i64 %c, 48
br label %next
; Jump to the new basic block creates a COPY instruction for %d, which
; might be materialized as noop or as AND_ri (zero extension) at the
; start of the basic block. The decision depends on TLI.isZExtFree()
; results, see RegsForValue::getCopyToRegs(). Check below verifies
; that COPY is materialized as noop.
next:
%e = icmp eq i64 %d, 0
call void @sink2(i16 %a, i64 %b, i64 %c, i64 %d, i1 %e)
ret void
}
define void @load_zext_same_bb(ptr %p) {
; CHECK-V2-LABEL: load_zext_same_bb:
; CHECK-V2: # %bb.0: # %entry
; CHECK-V2-NEXT: r1 = *(u8 *)(r1 + 0)
; CHECK-V2-NEXT: r2 = 1
; CHECK-V2-NEXT: if r1 == 0 goto LBB2_2
; CHECK-V2-NEXT: # %bb.1: # %entry
; CHECK-V2-NEXT: r2 = 0
; CHECK-V2-NEXT: LBB2_2: # %entry
; CHECK-V2-NEXT: call sink3
; CHECK-V2-NEXT: exit
;
; CHECK-V4-LABEL: load_zext_same_bb:
; CHECK-V4: # %bb.0: # %entry
; CHECK-V4-NEXT: w1 = *(u8 *)(r1 + 0)
; CHECK-V4-NEXT: w2 = 1
; CHECK-V4-NEXT: if w1 == 0 goto LBB2_2
; CHECK-V4-NEXT: # %bb.1: # %entry
; CHECK-V4-NEXT: w2 = 0
; CHECK-V4-NEXT: LBB2_2: # %entry
; CHECK-V4-NEXT: call sink3
; CHECK-V4-NEXT: exit
entry:
%a = load i8, ptr %p, align 1
; zext is implicit in this context
%b = icmp eq i8 %a, 0
call void @sink3(i8 %a, i1 %b)
ret void
}
define void @load_zext_diff_bb(ptr %p) {
; CHECK-V2-LABEL: load_zext_diff_bb:
; CHECK-V2: # %bb.0: # %entry
; CHECK-V2-NEXT: r1 = *(u8 *)(r1 + 0)
; CHECK-V2-NEXT: r2 = 1
; CHECK-V2-NEXT: if r1 == 0 goto LBB3_2
; CHECK-V2-NEXT: # %bb.1: # %next
; CHECK-V2-NEXT: r2 = 0
; CHECK-V2-NEXT: LBB3_2: # %next
; CHECK-V2-NEXT: call sink3
; CHECK-V2-NEXT: exit
;
; CHECK-V4-LABEL: load_zext_diff_bb:
; CHECK-V4: # %bb.0: # %entry
; CHECK-V4-NEXT: w1 = *(u8 *)(r1 + 0)
; CHECK-V4-NEXT: w2 = 1
; CHECK-V4-NEXT: if w1 == 0 goto LBB3_2
; CHECK-V4-NEXT: # %bb.1: # %next
; CHECK-V4-NEXT: w2 = 0
; CHECK-V4-NEXT: LBB3_2: # %next
; CHECK-V4-NEXT: call sink3
; CHECK-V4-NEXT: exit
entry:
%a = load i8, ptr %p, align 1
br label %next
next:
%b = icmp eq i8 %a, 0
call void @sink3(i8 %a, i1 %b)
ret void
}
define void @load_zext_diff_bb_2(ptr %p) {
; CHECK-V2-LABEL: load_zext_diff_bb_2:
; CHECK-V2: # %bb.0: # %entry
; CHECK-V2-NEXT: r1 = *(u32 *)(r1 + 0)
; CHECK-V2-NEXT: r2 = 1
; CHECK-V2-NEXT: if r1 == 0 goto LBB4_2
; CHECK-V2-NEXT: # %bb.1: # %next
; CHECK-V2-NEXT: r2 = 0
; CHECK-V2-NEXT: LBB4_2: # %next
; CHECK-V2-NEXT: call sink4
; CHECK-V2-NEXT: exit
;
; CHECK-V4-LABEL: load_zext_diff_bb_2:
; CHECK-V4: # %bb.0: # %entry
; CHECK-V4-NEXT: w1 = *(u32 *)(r1 + 0)
; CHECK-V4-NEXT: w2 = 1
; CHECK-V4-NEXT: if w1 == 0 goto LBB4_2
; CHECK-V4-NEXT: # %bb.1: # %next
; CHECK-V4-NEXT: w2 = 0
; CHECK-V4-NEXT: LBB4_2: # %next
; CHECK-V4-NEXT: call sink4
; CHECK-V4-NEXT: exit
entry:
%a = load i32, ptr %p, align 4
br label %next
next:
%b = icmp eq i32 %a, 0
call void @sink4(i32 %a, i1 %b)
ret void
}
declare void @sink1(i8, i64, i64, i64, i1);
declare void @sink2(i16, i64, i64, i64, i1);
declare void @sink3(i8, i1);
declare void @sink4(i32, i1);