| ; RUN: opt < %s -S -passes=loop-unroll -unroll-runtime=true -unroll-count=4 | FileCheck %s |
| |
| ;; Check that the remainder loop is properly assigned a branch weight for its latch branch. |
| ; CHECK-LABEL: @test( |
| ; CHECK-LABEL: entry: |
| ; CHECK: [[FOR_BODY_PREHEADER:.*]]: |
| ; CHECK: br i1 %{{.*}}, label %[[FOR_BODY_EPIL_PREHEADER:.*]], label %[[FOR_BODY_PREHEADER_NEW:.*]], !prof ![[#PROF_UR_GUARD:]] |
| ; CHECK: [[FOR_BODY_PREHEADER_NEW]]: |
| ; CHECK: br label %for.body |
| ; CHECK: for.body: |
| ; CHECK: %add = add |
| ; CHECK: %add.1 = add |
| ; CHECK: %add.2 = add |
| ; CHECK: %add.3 = add |
| ; CHECK-NOT: %add.4 = add |
| ; CHECK: br i1 %{{.*}}, label %[[FOR_END_LOOPEXIT_UNR_LCSSA:.*]], label %for.body, !prof ![[#PROF_UR_LATCH:]], !llvm.loop ![[#LOOP_UR_LATCH:]] |
| ; CHECK: [[FOR_END_LOOPEXIT_UNR_LCSSA]]: |
| ; CHECK: br i1 %{{.*}}, label %[[FOR_BODY_EPIL_PREHEADER]], label %[[FOR_END_LOOPEXIT:.*]], !prof ![[#PROF_RM_GUARD:]] |
| ; CHECK: [[FOR_BODY_EPIL_PREHEADER]]: |
| ; CHECK: br label %[[FOR_BODY_EPIL:.*]] |
| ; CHECK: [[FOR_BODY_EPIL]]: |
| ; CHECK: br i1 {{.*}}, label %[[FOR_BODY_EPIL]], label %[[FOR_END_LOOPEXIT_EPILOG_LCSSA:.*]], !prof ![[#PROF_RM_LATCH:]], !llvm.loop ![[#LOOP_RM_LATCH:]] |
| |
| define i3 @test(ptr %a, i3 %n) { |
| entry: |
| %cmp1 = icmp eq i3 %n, 0 |
| br i1 %cmp1, label %for.end, label %for.body |
| |
| for.body: |
| %indvars.iv = phi i64 [ %indvars.iv.next, %for.body ], [ 0, %entry ] |
| %sum.02 = phi i3 [ %add, %for.body ], [ 0, %entry ] |
| %arrayidx = getelementptr inbounds i3, ptr %a, i64 %indvars.iv |
| %0 = load i3, ptr %arrayidx |
| %add = add nsw i3 %0, %sum.02 |
| %indvars.iv.next = add i64 %indvars.iv, 1 |
| %lftr.wideiv = trunc i64 %indvars.iv.next to i3 |
| %exitcond = icmp eq i3 %lftr.wideiv, %n |
| br i1 %exitcond, label %for.end, label %for.body, !prof !0 |
| |
| for.end: |
| %sum.0.lcssa = phi i3 [ 0, %entry ], [ %add, %for.body ] |
| ret i3 %sum.0.lcssa |
| } |
| |
| !0 = !{!"branch_weights", i32 1, i32 9999} |
| |
| ; Original loop probability: p = 9999/(1+9999) = 0.9999 |
| ; Original estimated trip count: (1+9999)/1 = 10000 |
| ; Unroll count: 4 |
| |
| ; Probability of >=3 iterations after first: p^3 = 0.9970003 =~ |
| ; 2146839468 / (644180 + 2146839468). |
| ; CHECK: ![[#PROF_UR_GUARD]] = !{!"branch_weights", i32 644180, i32 2146839468} |
| |
| ; Probability of >=4 more iterations: p^4 = 0.99960006 =~ |
| ; 2146624784 / (858864 + 2146624784). |
| ; CHECK: ![[#PROF_UR_LATCH]] = !{!"branch_weights", i32 858864, i32 2146624784} |
| |
| ; 10000//4 = 2500 |
| ; CHECK: ![[#LOOP_UR_LATCH]] = distinct !{![[#LOOP_UR_LATCH]], ![[#LOOP_UR_TC:]], ![[#DISABLE:]]} |
| ; CHECK: ![[#LOOP_UR_TC]] = !{!"llvm.loop.estimated_trip_count", i32 2500} |
| ; |
| ; CHECK: ![[#DISABLE]] = !{!"llvm.loop.unroll.disable"} |
| |
| ; Probability of 1 to 3 more of 3 more remainder iterations: |
| ; (p-p^4)/(1-p^4) = 0.749962497 =~ 1610532724 / (1610532724 + 536950924). |
| ; CHECK: ![[#PROF_RM_GUARD]] = !{!"branch_weights", i32 1610532724, i32 536950924} |
| |
| ; Frequency of first remainder iter: r1 = 1 |
| ; Frequency of second remainder iter: r2 = r1*(p-p^3)/(1-p^3) = 0.666633331 |
| ; Frequency of third remainder iter: r3 = r2*(p-p^2)/(1-p^2) = 0.333299999 |
| ; Solve for loop probability that produces that frequency: f = 1/(1-p') => |
| ; p' = 1-1/f = 1-1/(r1+r2+r3) = 0.499983332 =~ |
| ; 1073706403 / (1073706403 + 1073777245). |
| ; CHECK: ![[#PROF_RM_LATCH]] = !{!"branch_weights", i32 1073706403, i32 1073777245} |
| |
| ; 10000%4 = 0 |
| ; CHECK: ![[#LOOP_RM_LATCH]] = distinct !{![[#LOOP_RM_LATCH]], ![[#LOOP_RM_TC:]], ![[#DISABLE:]]} |
| ; CHECK: ![[#LOOP_RM_TC]] = !{!"llvm.loop.estimated_trip_count", i32 0} |