| ; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -O3 | FileCheck %s |
| |
| ; Checks that block placement tail-duplicates only partially. Function Attrs: uwtable; profile data is in !1-!3. |
| ; When tail-duplicating during placement, we work backward from blocks with multiple successors. |
| ; In this case, the block dup1 gets duplicated into dup2 and if.then64, and then the block dup2 (which now |
| ; ends in the copied test and branches) only gets duplicated into land.lhs.true; if.end70 keeps a jne to dup2. |
| |
| define void @partial_tail_dup(i1 %a1, i1 %a2, i32* %a4, i32* %a5, i8* %a6, i32 %a7) #0 align 2 !prof !1 { |
| ; CHECK-LABEL: partial_tail_dup: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: .p2align 4, 0x90 |
| ; CHECK-NEXT: .LBB0_1: # %for.cond |
| ; CHECK-NEXT: # =>This Inner Loop Header: Depth=1 |
| ; CHECK-NEXT: testb $1, %dil |
| ; CHECK-NEXT: je .LBB0_3 |
| ; CHECK-NEXT: # %bb.2: # %land.lhs.true |
| ; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1 |
| ; CHECK-NEXT: movl $10, (%rdx) |
| ; CHECK-NEXT: movl $2, (%rcx) |
| ; CHECK-NEXT: testl %r9d, %r9d |
| ; CHECK-NEXT: je .LBB0_1 |
| ; CHECK-NEXT: jmp .LBB0_8 |
| ; CHECK-NEXT: .p2align 4, 0x90 |
| ; CHECK-NEXT: .LBB0_6: # %dup2 |
| ; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1 |
| ; CHECK-NEXT: movl $2, (%rcx) |
| ; CHECK-NEXT: testl %r9d, %r9d |
| ; CHECK-NEXT: je .LBB0_1 |
| ; CHECK-NEXT: jmp .LBB0_8 |
| ; CHECK-NEXT: .p2align 4, 0x90 |
| ; CHECK-NEXT: .LBB0_3: # %if.end56 |
| ; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1 |
| ; CHECK-NEXT: testb $1, %sil |
| ; CHECK-NEXT: je .LBB0_5 |
| ; CHECK-NEXT: # %bb.4: # %if.then64 |
| ; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1 |
| ; CHECK-NEXT: movb $1, (%r8) |
| ; CHECK-NEXT: testl %r9d, %r9d |
| ; CHECK-NEXT: je .LBB0_1 |
| ; CHECK-NEXT: jmp .LBB0_8 |
| ; CHECK-NEXT: .LBB0_5: # %if.end70 |
| ; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1 |
| ; CHECK-NEXT: movl $12, (%rdx) |
| ; CHECK-NEXT: jne .LBB0_6 |
| ; CHECK-NEXT: .LBB0_8: # %for.end |
| ; CHECK-NEXT: retq |
| entry: |
| br label %for.cond |
| |
| for.cond: |
| br i1 %a1, label %land.lhs.true, label %if.end56 |
| |
| land.lhs.true: |
| store i32 10, i32* %a4, align 8 |
| br label %dup2 |
| |
| if.end56: |
| br i1 %a2, label %if.then64, label %if.end70, !prof !2 |
| |
| if.then64: |
| store i8 1, i8* %a6, align 1 |
| br label %dup1 |
| |
| if.end70: |
| store i32 12, i32* %a4, align 8 |
| br i1 %a2, label %dup2, label %for.end |
| |
| dup2: |
| store i32 2, i32* %a5, align 4 |
| br label %dup1 |
| |
| dup1: |
| %val = load i32, i32* %a4, align 8 |
| %switch = icmp ult i32 %a7, 1 |
| br i1 %switch, label %for.cond, label %for.end, !prof !3 |
| |
| for.end: |
| ret void |
| } |
| |
| attributes #0 = { uwtable } |
| |
| !1 = !{!"function_entry_count", i64 2} |
| !2 = !{!"branch_weights", i32 5, i32 1} |
| !3 = !{!"branch_weights", i32 5, i32 1} |