| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 |
| ; RUN: llc -mcpu=v2 -mtriple=bpf < %s | FileCheck %s --check-prefixes=CHECK-V2 |
| ; RUN: llc -mcpu=v4 -mtriple=bpf < %s | FileCheck %s --check-prefixes=CHECK-V4 |
| |
| ; Zero extension instructions should be eliminated at instruction |
| ; selection phase for all test cases below. |
| |
| ; In BPF zero extension is implemented as &= or a pair of <<=/>>= |
| ; instructions, hence simply check that &= and >>= do not exist in |
| ; generated code (<<= remains because %c is used by both call and |
| ; lshr in a few test cases). |
| |
| define void @shl_lshr_same_bb(ptr %p) { |
| ; CHECK-V2-LABEL: shl_lshr_same_bb: |
| ; CHECK-V2: # %bb.0: # %entry |
| ; CHECK-V2-NEXT: r1 = *(u8 *)(r1 + 0) |
| ; CHECK-V2-NEXT: r5 = 1 |
| ; CHECK-V2-NEXT: if r1 == 0 goto LBB0_2 |
| ; CHECK-V2-NEXT: # %bb.1: # %entry |
| ; CHECK-V2-NEXT: r5 = 0 |
| ; CHECK-V2-NEXT: LBB0_2: # %entry |
| ; CHECK-V2-NEXT: r3 = r1 |
| ; CHECK-V2-NEXT: r3 <<= 56 |
| ; CHECK-V2-NEXT: r2 = r1 |
| ; CHECK-V2-NEXT: r4 = r1 |
| ; CHECK-V2-NEXT: call sink1 |
| ; CHECK-V2-NEXT: exit |
| ; |
| ; CHECK-V4-LABEL: shl_lshr_same_bb: |
| ; CHECK-V4: # %bb.0: # %entry |
| ; CHECK-V4-NEXT: w1 = *(u8 *)(r1 + 0) |
| ; CHECK-V4-NEXT: w5 = 1 |
| ; CHECK-V4-NEXT: if w1 == 0 goto LBB0_2 |
| ; CHECK-V4-NEXT: # %bb.1: # %entry |
| ; CHECK-V4-NEXT: w5 = 0 |
| ; CHECK-V4-NEXT: LBB0_2: # %entry |
| ; CHECK-V4-NEXT: r3 = r1 |
| ; CHECK-V4-NEXT: r3 <<= 56 |
| ; CHECK-V4-NEXT: r2 = r1 |
| ; CHECK-V4-NEXT: r4 = r1 |
| ; CHECK-V4-NEXT: call sink1 |
| ; CHECK-V4-NEXT: exit |
| entry: |
| %a = load i8, ptr %p, align 1 |
| %b = zext i8 %a to i64 |
| %c = shl i64 %b, 56 |
| %d = lshr i64 %c, 56 |
| %e = icmp eq i64 %d, 0 |
| ; hasOneUse() is a common requirement for many CombineDAG |
| ; transofmations, make sure that it does not matter in this case. |
| call void @sink1(i8 %a, i64 %b, i64 %c, i64 %d, i1 %e) |
| ret void |
| } |
| |
| define void @shl_lshr_diff_bb(ptr %p) { |
| ; CHECK-V2-LABEL: shl_lshr_diff_bb: |
| ; CHECK-V2: # %bb.0: # %entry |
| ; CHECK-V2-NEXT: r1 = *(u16 *)(r1 + 0) |
| ; CHECK-V2-NEXT: r5 = 1 |
| ; CHECK-V2-NEXT: if r1 == 0 goto LBB1_2 |
| ; CHECK-V2-NEXT: # %bb.1: # %entry |
| ; CHECK-V2-NEXT: r5 = 0 |
| ; CHECK-V2-NEXT: LBB1_2: # %entry |
| ; CHECK-V2-NEXT: r3 = r1 |
| ; CHECK-V2-NEXT: r3 <<= 48 |
| ; CHECK-V2-NEXT: r2 = r1 |
| ; CHECK-V2-NEXT: r4 = r1 |
| ; CHECK-V2-NEXT: call sink2 |
| ; CHECK-V2-NEXT: exit |
| ; |
| ; CHECK-V4-LABEL: shl_lshr_diff_bb: |
| ; CHECK-V4: # %bb.0: # %entry |
| ; CHECK-V4-NEXT: w1 = *(u16 *)(r1 + 0) |
| ; CHECK-V4-NEXT: w5 = 1 |
| ; CHECK-V4-NEXT: if w1 == 0 goto LBB1_2 |
| ; CHECK-V4-NEXT: # %bb.1: # %entry |
| ; CHECK-V4-NEXT: w5 = 0 |
| ; CHECK-V4-NEXT: LBB1_2: # %entry |
| ; CHECK-V4-NEXT: r3 = r1 |
| ; CHECK-V4-NEXT: r3 <<= 48 |
| ; CHECK-V4-NEXT: r2 = r1 |
| ; CHECK-V4-NEXT: r4 = r1 |
| ; CHECK-V4-NEXT: call sink2 |
| ; CHECK-V4-NEXT: exit |
| entry: |
| %a = load i16, ptr %p, align 2 |
| %b = zext i16 %a to i64 |
| %c = shl i64 %b, 48 |
| %d = lshr i64 %c, 48 |
| br label %next |
| |
| ; Jump to the new basic block creates a COPY instruction for %d, which |
| ; might be materialized as noop or as AND_ri (zero extension) at the |
| ; start of the basic block. The decision depends on TLI.isZExtFree() |
| ; results, see RegsForValue::getCopyToRegs(). Check below verifies |
| ; that COPY is materialized as noop. |
| next: |
| %e = icmp eq i64 %d, 0 |
| call void @sink2(i16 %a, i64 %b, i64 %c, i64 %d, i1 %e) |
| ret void |
| } |
| |
| define void @load_zext_same_bb(ptr %p) { |
| ; CHECK-V2-LABEL: load_zext_same_bb: |
| ; CHECK-V2: # %bb.0: # %entry |
| ; CHECK-V2-NEXT: r1 = *(u8 *)(r1 + 0) |
| ; CHECK-V2-NEXT: r2 = 1 |
| ; CHECK-V2-NEXT: if r1 == 0 goto LBB2_2 |
| ; CHECK-V2-NEXT: # %bb.1: # %entry |
| ; CHECK-V2-NEXT: r2 = 0 |
| ; CHECK-V2-NEXT: LBB2_2: # %entry |
| ; CHECK-V2-NEXT: call sink3 |
| ; CHECK-V2-NEXT: exit |
| ; |
| ; CHECK-V4-LABEL: load_zext_same_bb: |
| ; CHECK-V4: # %bb.0: # %entry |
| ; CHECK-V4-NEXT: w1 = *(u8 *)(r1 + 0) |
| ; CHECK-V4-NEXT: w2 = 1 |
| ; CHECK-V4-NEXT: if w1 == 0 goto LBB2_2 |
| ; CHECK-V4-NEXT: # %bb.1: # %entry |
| ; CHECK-V4-NEXT: w2 = 0 |
| ; CHECK-V4-NEXT: LBB2_2: # %entry |
| ; CHECK-V4-NEXT: call sink3 |
| ; CHECK-V4-NEXT: exit |
| entry: |
| %a = load i8, ptr %p, align 1 |
| ; zext is implicit in this context |
| %b = icmp eq i8 %a, 0 |
| call void @sink3(i8 %a, i1 %b) |
| ret void |
| } |
| |
| define void @load_zext_diff_bb(ptr %p) { |
| ; CHECK-V2-LABEL: load_zext_diff_bb: |
| ; CHECK-V2: # %bb.0: # %entry |
| ; CHECK-V2-NEXT: r1 = *(u8 *)(r1 + 0) |
| ; CHECK-V2-NEXT: r2 = 1 |
| ; CHECK-V2-NEXT: if r1 == 0 goto LBB3_2 |
| ; CHECK-V2-NEXT: # %bb.1: # %next |
| ; CHECK-V2-NEXT: r2 = 0 |
| ; CHECK-V2-NEXT: LBB3_2: # %next |
| ; CHECK-V2-NEXT: call sink3 |
| ; CHECK-V2-NEXT: exit |
| ; |
| ; CHECK-V4-LABEL: load_zext_diff_bb: |
| ; CHECK-V4: # %bb.0: # %entry |
| ; CHECK-V4-NEXT: w1 = *(u8 *)(r1 + 0) |
| ; CHECK-V4-NEXT: w2 = 1 |
| ; CHECK-V4-NEXT: if w1 == 0 goto LBB3_2 |
| ; CHECK-V4-NEXT: # %bb.1: # %next |
| ; CHECK-V4-NEXT: w2 = 0 |
| ; CHECK-V4-NEXT: LBB3_2: # %next |
| ; CHECK-V4-NEXT: call sink3 |
| ; CHECK-V4-NEXT: exit |
| entry: |
| %a = load i8, ptr %p, align 1 |
| br label %next |
| |
| next: |
| %b = icmp eq i8 %a, 0 |
| call void @sink3(i8 %a, i1 %b) |
| ret void |
| } |
| |
| define void @load_zext_diff_bb_2(ptr %p) { |
| ; CHECK-V2-LABEL: load_zext_diff_bb_2: |
| ; CHECK-V2: # %bb.0: # %entry |
| ; CHECK-V2-NEXT: r1 = *(u32 *)(r1 + 0) |
| ; CHECK-V2-NEXT: r2 = 1 |
| ; CHECK-V2-NEXT: if r1 == 0 goto LBB4_2 |
| ; CHECK-V2-NEXT: # %bb.1: # %next |
| ; CHECK-V2-NEXT: r2 = 0 |
| ; CHECK-V2-NEXT: LBB4_2: # %next |
| ; CHECK-V2-NEXT: call sink4 |
| ; CHECK-V2-NEXT: exit |
| ; |
| ; CHECK-V4-LABEL: load_zext_diff_bb_2: |
| ; CHECK-V4: # %bb.0: # %entry |
| ; CHECK-V4-NEXT: w1 = *(u32 *)(r1 + 0) |
| ; CHECK-V4-NEXT: w2 = 1 |
| ; CHECK-V4-NEXT: if w1 == 0 goto LBB4_2 |
| ; CHECK-V4-NEXT: # %bb.1: # %next |
| ; CHECK-V4-NEXT: w2 = 0 |
| ; CHECK-V4-NEXT: LBB4_2: # %next |
| ; CHECK-V4-NEXT: call sink4 |
| ; CHECK-V4-NEXT: exit |
| entry: |
| %a = load i32, ptr %p, align 4 |
| br label %next |
| |
| next: |
| %b = icmp eq i32 %a, 0 |
| call void @sink4(i32 %a, i1 %b) |
| ret void |
| } |
| |
| declare void @sink1(i8, i64, i64, i64, i1); |
| declare void @sink2(i16, i64, i64, i64, i1); |
| declare void @sink3(i8, i1); |
| declare void @sink4(i32, i1); |