| ; RUN: opt < %s -basicaa -loop-interchange -S | FileCheck %s |
| ;; We verify the complete output .ll: the adjusted outer-loop header/latch and inner-loop header/latch after interchange. NOTE(review): @A below is not referenced by anything visible in this file (the test function uses @A10) -- confirm whether it is still needed. |
| |
| target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128" |
| target triple = "x86_64-unknown-linux-gnu" |
| |
| @A = common global [100 x [100 x i32]] zeroinitializer |
| |
| ;; Test that loop-interchange handles output dependencies: the second store at iteration i and the first store at iteration i+1 write the same element of @A10. |
| ;; Equivalent C (A is @A10 in the IR; i is %indvars.iv26, j is %indvars.iv): |
| ;; for (int i = 0; i < 2; ++i) |
| ;;   for (int j = 0; j < 3; ++j) { |
| ;;     A[j][i] = i; |
| ;;     A[j][i+1] = j; |
| ;;   } |
| |
| @A10 = local_unnamed_addr global [3 x [3 x i32]] zeroinitializer, align 16 |
| |
| define void @interchange_10() { |
| entry: |
| br label %for.cond1.preheader |
| |
| for.cond.loopexit: ; preds = %for.body4 -- outer-loop latch: branches back to the outer header while %indvars.iv.next27 != 2, otherwise exits |
| %exitcond28 = icmp ne i64 %indvars.iv.next27, 2 |
| br i1 %exitcond28, label %for.cond1.preheader, label %for.cond.cleanup |
| |
| for.cond1.preheader: ; preds = %for.cond.loopexit, %entry -- outer-loop header (i = %indvars.iv26, starting at 0); computes i+1 and falls straight into the inner loop |
| %indvars.iv26 = phi i64 [ 0, %entry ], [ %indvars.iv.next27, %for.cond.loopexit ] |
| %indvars.iv.next27 = add nuw nsw i64 %indvars.iv26, 1 |
| br label %for.body4 |
| |
| for.cond.cleanup: ; preds = %for.cond.loopexit -- function exit, reached once the outer loop finishes |
| ret void |
| |
| for.body4: ; preds = %for.body4, %for.cond1.preheader -- inner loop (j = %indvars.iv, starting at 0): one block acting as header, body and latch; stores i to A10[j][i] and j to A10[j][i+1], repeating while %indvars.iv.next != 3 |
| %indvars.iv = phi i64 [ 0, %for.cond1.preheader ], [ %indvars.iv.next, %for.body4 ] |
| %arrayidx6 = getelementptr inbounds [3 x [3 x i32]], [3 x [3 x i32]]* @A10, i64 0, i64 %indvars.iv, i64 %indvars.iv26 |
| %tmp = trunc i64 %indvars.iv26 to i32 |
| store i32 %tmp, i32* %arrayidx6, align 4 |
| %arrayidx10 = getelementptr inbounds [3 x [3 x i32]], [3 x [3 x i32]]* @A10, i64 0, i64 %indvars.iv, i64 %indvars.iv.next27 |
| %tmp1 = trunc i64 %indvars.iv to i32 |
| store i32 %tmp1, i32* %arrayidx10, align 4 |
| %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1 |
| %exitcond = icmp ne i64 %indvars.iv.next, 3 |
| br i1 %exitcond, label %for.body4, label %for.cond.loopexit |
| } |
| |
| ; CHECK-LABEL: @interchange_10 |
| ; CHECK: entry: |
| ; CHECK: br label %for.body4.preheader |
| |
| ; CHECK: for.cond1.preheader.preheader: |
| ; CHECK: br label %for.cond1.preheader |
| |
| ; CHECK: for.cond.loopexit: |
| ; CHECK: %exitcond28 = icmp ne i64 %indvars.iv.next27, 2 |
| ; CHECK: br i1 %exitcond28, label %for.cond1.preheader, label %for.body4.split |
| |
| ; CHECK: for.cond1.preheader: |
| ; CHECK: %indvars.iv26 = phi i64 [ %indvars.iv.next27, %for.cond.loopexit ], [ 0, %for.cond1.preheader.preheader ] |
| ; CHECK: %indvars.iv.next27 = add nuw nsw i64 %indvars.iv26, 1 |
| ; CHECK: br label %for.body4.split1 |
| |
| ; CHECK: for.body4.preheader: |
| ; CHECK: br label %for.body4 |
| |
| ; CHECK: for.cond.cleanup: |
| ; CHECK: ret void |
| |
| ; CHECK: for.body4: |
| ; CHECK: %indvars.iv = phi i64 [ %indvars.iv.next, %for.body4.split ], [ 0, %for.body4.preheader ] |
| ; CHECK: br label %for.cond1.preheader.preheader |
| |
| ; CHECK: for.body4.split1: |
| ; CHECK: %arrayidx6 = getelementptr inbounds [3 x [3 x i32]], [3 x [3 x i32]]* @A10, i64 0, i64 %indvars.iv, i64 %indvars.iv26 |
| ; CHECK: %tmp = trunc i64 %indvars.iv26 to i32 |
| ; CHECK: store i32 %tmp, i32* %arrayidx6, align 4 |
| ; CHECK: %arrayidx10 = getelementptr inbounds [3 x [3 x i32]], [3 x [3 x i32]]* @A10, i64 0, i64 %indvars.iv, i64 %indvars.iv.next27 |
| ; CHECK: %tmp1 = trunc i64 %indvars.iv to i32 |
| ; CHECK: store i32 %tmp1, i32* %arrayidx10, align 4 |
| ; CHECK: br label %for.cond.loopexit |
| |
| ; CHECK: for.body4.split: |
| ; CHECK: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1 |
| ; CHECK: %exitcond = icmp ne i64 %indvars.iv.next, 3 |
| ; CHECK: br i1 %exitcond, label %for.body4, label %for.cond.cleanup |