| ; RUN: opt < %s -basicaa -loop-interchange -pass-remarks-missed='loop-interchange' -verify-loop-lcssa -pass-remarks-output=%t -S |
| ; RUN: FileCheck --input-file %t --check-prefix REMARK %s |
| |
| target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128" |
| target triple = "x86_64-unknown-linux-gnu" |
| |
| @A = common global [100 x [100 x i32]] zeroinitializer |
| @C = common global [100 x [100 x i32]] zeroinitializer |
| @X = common global i32 0 |
| @Y = common global i64 0 |
| @F = common global float 0.0 |
| |
| ; We cannot interchange this loop at the moment, because iv.outer.next is |
| ; produced in the outer loop latch and used in the loop exit block. If the inner |
| ; loop body is not executed, the outer loop latch won't be executed either |
| ; after interchanging. |
| ; REMARK: UnsupportedExitPHI |
| ; REMARK-NEXT: lcssa_01 |
| |
| define void @lcssa_01() { |
| entry: |
| %cmp21 = icmp sgt i64 100, 1 |
| br i1 %cmp21, label %outer.ph, label %for.end16 |
| |
| outer.ph: ; preds = %entry |
| %cmp218 = icmp sgt i64 100, 1 |
| br label %outer.header |
| |
| outer.header: ; preds = %outer.inc, %outer.ph |
| %iv.outer = phi i64 [ 1, %outer.ph ], [ %iv.outer.next, %outer.inc ] |
| br i1 %cmp218, label %for.body3, label %outer.inc |
| |
| for.body3: ; preds = %for.body3, %outer.header |
| %iv.inner = phi i64 [ %iv.inner.next, %for.body3 ], [ 1, %outer.header ] |
| %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vA = load i32, i32* %arrayidx5 |
| %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @C, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vC = load i32, i32* %arrayidx9 |
| %add = add nsw i32 %vA, %vC |
| store i32 %add, i32* %arrayidx5 |
| %iv.inner.next = add nuw nsw i64 %iv.inner, 1 |
| %exitcond = icmp eq i64 %iv.inner.next, 100 |
| br i1 %exitcond, label %outer.inc, label %for.body3 |
| |
| outer.inc: ; preds = %for.body3, %outer.header |
| %iv.outer.next = add nsw i64 %iv.outer, 1 |
| %cmp = icmp eq i64 %iv.outer.next, 100 |
| br i1 %cmp, label %outer.header, label %for.exit |
| |
| for.exit: ; preds = %outer.inc |
| %iv.outer.next.lcssa = phi i64 [ %iv.outer.next, %outer.inc ] |
| store i64 %iv.outer.next.lcssa, i64* @Y |
| br label %for.end16 |
| |
| for.end16: ; preds = %for.exit, %entry |
| ret void |
| } |
| |
| ; REMARK: UnsupportedExitPHI |
| ; REMARK-NEXT: lcssa_02 |
| define void @lcssa_02() { |
| entry: |
| %cmp21 = icmp sgt i64 100, 1 |
| br i1 %cmp21, label %outer.ph, label %for.end16 |
| |
| outer.ph: ; preds = %entry |
| %cmp218 = icmp sgt i64 100, 1 |
| br label %outer.header |
| |
| outer.header: ; preds = %outer.inc, %outer.ph |
| %iv.outer = phi i64 [ 1, %outer.ph ], [ %iv.outer.next, %outer.inc ] |
| br i1 %cmp218, label %for.body3, label %outer.inc |
| |
| for.body3: ; preds = %for.body3, %outer.header |
| %iv.inner = phi i64 [ %iv.inner.next, %for.body3 ], [ 1, %outer.header ] |
| %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vA = load i32, i32* %arrayidx5 |
| %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @C, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vC = load i32, i32* %arrayidx9 |
| %add = add nsw i32 %vA, %vC |
| store i32 %add, i32* %arrayidx5 |
| %iv.inner.next = add nuw nsw i64 %iv.inner, 1 |
| %exitcond = icmp eq i64 %iv.inner.next, 100 |
| br i1 %exitcond, label %outer.inc, label %for.body3 |
| |
| outer.inc: ; preds = %for.body3, %outer.header |
| %iv.inner.end = phi i64 [ 0, %outer.header ], [ %iv.inner.next, %for.body3 ] |
| %iv.outer.next = add nsw i64 %iv.outer, 1 |
| %cmp = icmp eq i64 %iv.outer.next, 100 |
| br i1 %cmp, label %outer.header, label %for.exit |
| |
| for.exit: ; preds = %outer.inc |
| %iv.inner.end.lcssa = phi i64 [ %iv.inner.end, %outer.inc ] |
| store i64 %iv.inner.end.lcssa, i64* @Y |
| br label %for.end16 |
| |
| for.end16: ; preds = %for.exit, %entry |
| ret void |
| } |
| |
| ; REMARK: Interchanged |
| ; REMARK-NEXT: lcssa_03 |
| define void @lcssa_03() { |
| entry: |
| br label %outer.header |
| |
| outer.header: ; preds = %outer.inc, %entry |
| %iv.outer = phi i64 [ 1, %entry ], [ %iv.outer.next, %outer.inc ] |
| br label %for.body3 |
| |
| for.body3: ; preds = %for.body3, %outer.header |
| %iv.inner = phi i64 [ %iv.inner.next, %for.body3 ], [ 1, %outer.header ] |
| %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vA = load i32, i32* %arrayidx5 |
| %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @C, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vC = load i32, i32* %arrayidx9 |
| %add = add nsw i32 %vA, %vC |
| store i32 %add, i32* %arrayidx5 |
| %iv.inner.next = add nuw nsw i64 %iv.inner, 1 |
| %exitcond = icmp eq i64 %iv.inner.next, 100 |
| br i1 %exitcond, label %outer.inc, label %for.body3 |
| |
| outer.inc: ; preds = %for.body3 |
| %iv.inner.lcssa = phi i64 [ %iv.inner, %for.body3 ] |
| %iv.outer.next = add nsw i64 %iv.outer, 1 |
| %cmp = icmp eq i64 %iv.outer.next, 100 |
| br i1 %cmp, label %outer.header, label %for.exit |
| |
| for.exit: ; preds = %outer.inc |
| %iv.inner.lcssa.lcssa = phi i64 [ %iv.inner.lcssa, %outer.inc ] |
| store i64 %iv.inner.lcssa.lcssa, i64* @Y |
| br label %for.end16 |
| |
| for.end16: ; preds = %for.exit |
| ret void |
| } |
| |
| ; FIXME: We currently do not support LCSSA phi nodes involving floating point |
| ; types, as we fail to detect floating point reductions for now. |
| ; REMARK: UnsupportedPHIOuter |
| ; REMARK-NEXT: lcssa_04 |
| |
| define void @lcssa_04() { |
| entry: |
| br label %outer.header |
| |
| outer.header: ; preds = %outer.inc, %entry |
| %iv.outer = phi i64 [ 1, %entry ], [ %iv.outer.next, %outer.inc ] |
| %float.outer = phi float [ 1.000000e+00, %entry ], [ 2.000000e+00, %outer.inc ] |
| br label %for.body3 |
| |
| for.body3: ; preds = %for.body3, %outer.header |
| %iv.inner = phi i64 [ %iv.inner.next, %for.body3 ], [ 1, %outer.header ] |
| %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vA = load i32, i32* %arrayidx5 |
| %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @C, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vC = load i32, i32* %arrayidx9 |
| %add = add nsw i32 %vA, %vC |
| store i32 %add, i32* %arrayidx5 |
| %iv.inner.next = add nuw nsw i64 %iv.inner, 1 |
| %exitcond = icmp eq i64 %iv.inner.next, 100 |
| br i1 %exitcond, label %outer.inc, label %for.body3 |
| |
| outer.inc: ; preds = %for.body3 |
| %iv.outer.next = add nsw i64 %iv.outer, 1 |
| %cmp = icmp eq i64 %iv.outer.next, 100 |
| br i1 %cmp, label %outer.header, label %for.exit |
| |
| for.exit: ; preds = %outer.inc |
| %float.outer.lcssa = phi float [ %float.outer, %outer.inc ] |
| store float %float.outer.lcssa, float* @F |
| br label %for.end16 |
| |
| for.end16: ; preds = %for.exit |
| ret void |
| } |
| |
| ; PHI node in inner latch with multiple predecessors. |
| ; REMARK: Interchanged |
| ; REMARK-NEXT: lcssa_05 |
| |
| define void @lcssa_05(i32* %ptr) { |
| entry: |
| br label %outer.header |
| |
| outer.header: ; preds = %outer.inc, %entry |
| %iv.outer = phi i64 [ 1, %entry ], [ %iv.outer.next, %outer.inc ] |
| br label %for.body3 |
| |
| for.body3: ; preds = %bb3, %outer.header |
| %iv.inner = phi i64 [ %iv.inner.next, %bb3 ], [ 1, %outer.header ] |
| br i1 undef, label %bb2, label %bb3 |
| |
| bb2: ; preds = %for.body3 |
| %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vA = load i32, i32* %arrayidx5 |
| %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @C, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vC = load i32, i32* %arrayidx9 |
| %add = add nsw i32 %vA, %vC |
| br label %bb3 |
| |
| bb3: ; preds = %bb2, %for.body3 |
| %addp = phi i32 [ %add, %bb2 ], [ 0, %for.body3 ] |
| store i32 %addp, i32* %ptr |
| %iv.inner.next = add nuw nsw i64 %iv.inner, 1 |
| %exitcond = icmp eq i64 %iv.inner.next, 100 |
| br i1 %exitcond, label %outer.inc, label %for.body3 |
| |
| outer.inc: ; preds = %bb3 |
| %iv.inner.lcssa = phi i64 [ %iv.inner, %bb3 ] |
| %iv.outer.next = add nsw i64 %iv.outer, 1 |
| %cmp = icmp eq i64 %iv.outer.next, 100 |
| br i1 %cmp, label %outer.header, label %for.exit |
| |
| for.exit: ; preds = %outer.inc |
| %iv.inner.lcssa.lcssa = phi i64 [ %iv.inner.lcssa, %outer.inc ] |
| store i64 %iv.inner.lcssa.lcssa, i64* @Y |
| br label %for.end16 |
| |
| for.end16: ; preds = %for.exit |
| ret void |
| } |
| |
| ; REMARK: UnsupportedExitPHI |
| ; REMARK-NEXT: lcssa_06 |
| |
| define void @lcssa_06(i64* %ptr, i32* %ptr1) { |
| entry: |
| br label %outer.header |
| |
| outer.header: ; preds = %outer.inc, %entry |
| %iv.outer = phi i64 [ 1, %entry ], [ %iv.outer.next, %outer.inc ] |
| br i1 undef, label %for.body3, label %outer.inc |
| |
| for.body3: ; preds = %for.body3, %outer.header |
| %iv.inner = phi i64 [ %iv.inner.next, %for.body3 ], [ 1, %outer.header ] |
| %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vA = load i32, i32* %arrayidx5 |
| %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @C, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vC = load i32, i32* %arrayidx9 |
| %add = add nsw i32 %vA, %vC |
| store i32 %add, i32* %ptr1 |
| %iv.inner.next = add nuw nsw i64 %iv.inner, 1 |
| %exitcond = icmp eq i64 %iv.inner.next, 100 |
| br i1 %exitcond, label %outer.inc, label %for.body3 |
| |
| outer.inc: ; preds = %for.body3, %outer.header |
| %sv = phi i64 [ 0, %outer.header ], [ 1, %for.body3 ] |
| %iv.outer.next = add nsw i64 %iv.outer, 1 |
| %cmp = icmp eq i64 %iv.outer.next, 100 |
| br i1 %cmp, label %outer.header, label %for.exit |
| |
| for.exit: ; preds = %outer.inc |
| %sv.lcssa = phi i64 [ %sv, %outer.inc ] |
| store i64 %sv.lcssa, i64* @Y |
| br label %for.end16 |
| |
| for.end16: ; preds = %for.exit |
| ret void |
| } |
| |
| ; REMARK: Interchanged |
| ; REMARK-NEXT: lcssa_07 |
| define void @lcssa_07() { |
| entry: |
| br label %outer.header |
| |
| outer.header: ; preds = %outer.inc, %entry |
| %iv.outer = phi i64 [ 1, %entry ], [ %iv.outer.next, %outer.inc ] |
| br label %for.body3 |
| |
| for.body3: ; preds = %for.body3, %outer.header |
| %iv.inner = phi i64 [ %iv.inner.next, %for.body3 ], [ 1, %outer.header ] |
| %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vA = load i32, i32* %arrayidx5 |
| %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @C, i64 0, i64 %iv.inner, i64 %iv.outer |
| %vC = load i32, i32* %arrayidx9 |
| %add = add nsw i32 %vA, %vC |
| store i32 %add, i32* %arrayidx5 |
| %iv.inner.next = add nuw nsw i64 %iv.inner, 1 |
| %exitcond = icmp eq i64 %iv.inner.next, 100 |
| br i1 %exitcond, label %outer.bb, label %for.body3 |
| |
| outer.bb: ; preds = %for.body3 |
| %iv.inner.lcssa = phi i64 [ %iv.inner, %for.body3 ] |
| br label %outer.inc |
| |
| outer.inc: ; preds = %outer.bb |
| %iv.outer.next = add nsw i64 %iv.outer, 1 |
| %cmp = icmp eq i64 %iv.outer.next, 100 |
| br i1 %cmp, label %outer.header, label %for.exit |
| |
| for.exit: ; preds = %outer.inc |
| %iv.inner.lcssa.lcssa = phi i64 [ %iv.inner.lcssa, %outer.inc ] |
| store i64 %iv.inner.lcssa.lcssa, i64* @Y |
| br label %for.end16 |
| |
| for.end16: ; preds = %for.exit |
| ret void |
| } |