blob: 82ba8e234c5daad6e3dd45069c1531a3dc6231c2 [file] [edit]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 6
; RUN: opt < %s -passes=loop-interchange -loop-interchange-profitabilities=ignore -S | FileCheck %s
; sum = 0;
; for (i = 0, sum_i = sum; i < 2; i++)
; for (j = 0; j < 2; j++) {
; sum += A[j][i];
; B[j][i] = sum_i;
; }
;
; Interchanging the loops will become as follows:
;
; sum = 0;
; for (j = 0, sum_j = sum; j < 2; j++)
; for (i = 0; i < 2; i++) {
; sum += A[j][i];
; B[j][i] = sum_j;
; }
;
; This is invalid transformation. Consider the case when `A` is as follows:
;
; A = {{ 0, 0 }, { 1, 1 }}
;
; In this case, `sum_i` evolves 0 -> 1, while `sum_j` evolves 0 -> 0.
;
define i8 @extra_reduction_use_in_inner0(ptr noalias %A, ptr noalias %B) {
; CHECK-LABEL: define i8 @extra_reduction_use_in_inner0(
; CHECK-SAME: ptr noalias [[A:%.*]], ptr noalias [[B:%.*]]) {
; CHECK-NEXT: [[INNER_PREHEADER:.*]]:
; CHECK-NEXT: br label %[[INNER:.*]]
; CHECK: [[INNER]]:
; CHECK-NEXT: [[I:%.*]] = phi i64 [ 0, %[[INNER_PREHEADER]] ], [ [[I_NEXT:%.*]], %[[OUTER_LATCH:.*]] ]
; CHECK-NEXT: [[SUM_OUTER:%.*]] = phi i8 [ 0, %[[INNER_PREHEADER]] ], [ [[SUM_LCSSA:%.*]], %[[OUTER_LATCH]] ]
; CHECK-NEXT: br label %[[OUTER_HEADER_PREHEADER:.*]]
; CHECK: [[OUTER_HEADER_PREHEADER]]:
; CHECK-NEXT: [[J:%.*]] = phi i64 [ 0, %[[INNER]] ], [ [[TMP0:%.*]], %[[OUTER_HEADER_PREHEADER]] ]
; CHECK-NEXT: [[SUM_INNER:%.*]] = phi i8 [ [[SUM_OUTER]], %[[INNER]] ], [ [[SUM_INNER_NEXT:%.*]], %[[OUTER_HEADER_PREHEADER]] ]
; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr [2 x i8], ptr [[A]], i64 [[J]], i64 [[I]]
; CHECK-NEXT: [[A:%.*]] = load i8, ptr [[GEP_A]], align 1
; CHECK-NEXT: [[SUM_INNER_NEXT]] = add i8 [[SUM_INNER]], [[A]]
; CHECK-NEXT: [[GEP_B:%.*]] = getelementptr [2 x i8], ptr [[B]], i64 [[J]], i64 [[I]]
; CHECK-NEXT: store i8 [[SUM_OUTER]], ptr [[GEP_B]], align 1
; CHECK-NEXT: [[TMP0]] = add i64 [[J]], 1
; CHECK-NEXT: [[TMP1:%.*]] = icmp eq i64 [[TMP0]], 2
; CHECK-NEXT: br i1 [[TMP1]], label %[[OUTER_LATCH]], label %[[OUTER_HEADER_PREHEADER]]
; CHECK: [[OUTER_LATCH]]:
; CHECK-NEXT: [[SUM_LCSSA]] = phi i8 [ [[SUM_INNER_NEXT]], %[[OUTER_HEADER_PREHEADER]] ]
; CHECK-NEXT: [[I_NEXT]] = add i64 [[I]], 1
; CHECK-NEXT: [[EC_I:%.*]] = icmp eq i64 [[I_NEXT]], 2
; CHECK-NEXT: br i1 [[EC_I]], label %[[EXIT:.*]], label %[[INNER]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i8 [ [[SUM_LCSSA]], %[[OUTER_LATCH]] ]
; CHECK-NEXT: ret i8 [[RES]]
;
entry:
br label %outer.header
outer.header:
%i = phi i64 [ 0, %entry ], [ %i.next, %outer.latch ]
%sum.outer = phi i8 [ 0, %entry ], [ %sum.lcssa, %outer.latch ]
br label %inner
inner:
%j = phi i64 [ 0, %outer.header ], [ %j.next, %inner ]
%sum.inner = phi i8 [ %sum.outer, %outer.header ], [ %sum.inner.next, %inner ]
%gep.A = getelementptr [2 x i8], ptr %A, i64 %j, i64 %i
%a = load i8, ptr %gep.A
%sum.inner.next = add i8 %sum.inner, %a
%gep.B = getelementptr [2 x i8], ptr %B, i64 %j, i64 %i
store i8 %sum.outer, ptr %gep.B
%j.next = add i64 %j, 1
%ec.j = icmp eq i64 %j.next, 2
br i1 %ec.j, label %outer.latch, label %inner
outer.latch:
%sum.lcssa = phi i8 [ %sum.inner.next, %inner ]
%i.next = add i64 %i, 1
%ec.i = icmp eq i64 %i.next, 2
br i1 %ec.i, label %exit, label %outer.header
exit:
%res = phi i8 [ %sum.lcssa, %outer.latch ]
ret i8 %res
}
; sum = 0;
; for (i = 0; i < 2; i++)
; for (j = 0; j < 2; j++) {
; sum += A[j][i];
; B[j][i] = sum;
; }
;
; Interchanging the loops will become as follows:
;
; sum = 0;
; for (j = 0; j < 2; j++)
; for (i = 0; i < 2; i++) {
; sum += A[j][i];
; B[j][i] = sum;
; }
;
; This is invalid transformation. Consider the case when `A` is as follows:
;
; A = {{ 0, 1 }, { 0, 0 }}
;
; In this case, in the original loops, `sum` evolves 0 -> 0 -> 1 -> 1, while in
; the interchanged loops, `sum` evolves 0 -> 1 -> 1 -> 1
;
define i8 @extra_reduction_use_in_inner1(ptr noalias %A, ptr noalias %B) {
; CHECK-LABEL: define i8 @extra_reduction_use_in_inner1(
; CHECK-SAME: ptr noalias [[A:%.*]], ptr noalias [[B:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[OUTER_HEADER:.*]]
; CHECK: [[OUTER_HEADER]]:
; CHECK-NEXT: [[I:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[I_NEXT:%.*]], %[[OUTER_LATCH:.*]] ]
; CHECK-NEXT: [[SUM_OUTER:%.*]] = phi i8 [ 0, %[[ENTRY]] ], [ [[SUM_LCSSA:%.*]], %[[OUTER_LATCH]] ]
; CHECK-NEXT: br label %[[INNER:.*]]
; CHECK: [[INNER]]:
; CHECK-NEXT: [[J:%.*]] = phi i64 [ 0, %[[OUTER_HEADER]] ], [ [[J_NEXT:%.*]], %[[INNER]] ]
; CHECK-NEXT: [[SUM_INNER:%.*]] = phi i8 [ [[SUM_OUTER]], %[[OUTER_HEADER]] ], [ [[SUM_NEXT:%.*]], %[[INNER]] ]
; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr [2 x i8], ptr [[A]], i64 [[J]], i64 [[I]]
; CHECK-NEXT: [[A:%.*]] = load i8, ptr [[GEP_A]], align 1
; CHECK-NEXT: [[SUM_NEXT]] = add i8 [[SUM_INNER]], [[A]]
; CHECK-NEXT: [[GEP_B:%.*]] = getelementptr [2 x i8], ptr [[B]], i64 [[J]], i64 [[I]]
; CHECK-NEXT: store i8 [[SUM_NEXT]], ptr [[GEP_B]], align 1
; CHECK-NEXT: [[J_NEXT]] = add i64 [[J]], 1
; CHECK-NEXT: [[EC_J:%.*]] = icmp eq i64 [[J_NEXT]], 2
; CHECK-NEXT: br i1 [[EC_J]], label %[[OUTER_LATCH]], label %[[INNER]]
; CHECK: [[OUTER_LATCH]]:
; CHECK-NEXT: [[SUM_LCSSA]] = phi i8 [ [[SUM_NEXT]], %[[INNER]] ]
; CHECK-NEXT: [[I_NEXT]] = add i64 [[I]], 1
; CHECK-NEXT: [[EC_I:%.*]] = icmp eq i64 [[I_NEXT]], 2
; CHECK-NEXT: br i1 [[EC_I]], label %[[EXIT:.*]], label %[[OUTER_HEADER]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i8 [ [[SUM_LCSSA]], %[[OUTER_LATCH]] ]
; CHECK-NEXT: ret i8 [[RES]]
;
entry:
br label %outer.header
outer.header:
%i = phi i64 [ 0, %entry ], [ %i.next, %outer.latch ]
%sum.outer = phi i8 [ 0, %entry ], [ %sum.lcssa, %outer.latch ]
br label %inner
inner:
%j = phi i64 [ 0, %outer.header ], [ %j.next, %inner ]
%sum.inner = phi i8 [ %sum.outer, %outer.header ], [ %sum.inner.next, %inner ]
%gep.A = getelementptr [2 x i8], ptr %A, i64 %j, i64 %i
%a = load i8, ptr %gep.A
%sum.inner.next = add i8 %sum.inner, %a
%gep.B = getelementptr [2 x i8], ptr %B, i64 %j, i64 %i
store i8 %sum.inner.next, ptr %gep.B
%j.next = add i64 %j, 1
%ec.j = icmp eq i64 %j.next, 2
br i1 %ec.j, label %outer.latch, label %inner
outer.latch:
%sum.lcssa = phi i8 [ %sum.inner.next, %inner ]
%i.next = add i64 %i, 1
%ec.i = icmp eq i64 %i.next, 2
br i1 %ec.i, label %exit, label %outer.header
exit:
%res = phi i8 [ %sum.lcssa, %outer.latch ]
ret i8 %res
}
; sum = 0;
; for (i = 0, sum_i = sum; i < 2; i++)
; for (j = 0; j < 2; j++)
; for (k = 0; k < 2; k++) {
; sum += A[j][i];
; B[j][i] = sum_i;
; }
;
; In this case, interchanging the j-loop and the k-loop is legal.
;
define i8 @extra_reduction_use_in_inner2(ptr noalias %A, ptr noalias %B) {
; CHECK-LABEL: define i8 @extra_reduction_use_in_inner2(
; CHECK-SAME: ptr noalias [[A:%.*]], ptr noalias [[B:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[OUTER_HEADER:.*]]
; CHECK: [[OUTER_HEADER]]:
; CHECK-NEXT: [[I:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[I_NEXT:%.*]], %[[OUTER_LATCH:.*]] ]
; CHECK-NEXT: [[SUM_OUTER:%.*]] = phi i8 [ 0, %[[ENTRY]] ], [ [[SUM_OUTER_LCSSA:%.*]], %[[OUTER_LATCH]] ]
; CHECK-NEXT: br label %[[MIDDLE_HEADER_PREHEADER:.*]]
; CHECK: [[MIDDLE_HEADER_PREHEADER]]:
; CHECK-NEXT: br label %[[MIDDLE_HEADER:.*]]
; CHECK: [[MIDDLE_HEADER]]:
; CHECK-NEXT: [[J:%.*]] = phi i64 [ [[TMP2:%.*]], %[[MIDDLE_LATCH_SPLIT:.*]] ], [ 0, %[[MIDDLE_HEADER_PREHEADER]] ]
; CHECK-NEXT: [[SUM_MIDDLE:%.*]] = phi i8 [ [[SUM_MIDDLE_LCSSA:%.*]], %[[MIDDLE_LATCH_SPLIT]] ], [ [[SUM_OUTER]], %[[MIDDLE_HEADER_PREHEADER]] ]
; CHECK-NEXT: br label %[[INNER_PREHEADER:.*]]
; CHECK: [[INNER_PREHEADER]]:
; CHECK-NEXT: br label %[[INNER:.*]]
; CHECK: [[INNER]]:
; CHECK-NEXT: [[K:%.*]] = phi i64 [ [[TMP0:%.*]], %[[INNER_SPLIT:.*]] ], [ 0, %[[INNER_PREHEADER]] ]
; CHECK-NEXT: [[SUM_INNER:%.*]] = phi i8 [ [[SUM_INNER_NEXT:%.*]], %[[INNER_SPLIT]] ], [ [[SUM_MIDDLE]], %[[INNER_PREHEADER]] ]
; CHECK-NEXT: br label %[[INNER_SPLIT1:.*]]
; CHECK: [[INNER_SPLIT1]]:
; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr [2 x [2 x i8]], ptr [[A]], i64 [[K]], i64 [[J]], i64 [[I]]
; CHECK-NEXT: [[A:%.*]] = load i8, ptr [[GEP_A]], align 1
; CHECK-NEXT: [[SUM_INNER_NEXT]] = add i8 [[SUM_INNER]], [[A]]
; CHECK-NEXT: [[GEP_B:%.*]] = getelementptr [2 x [2 x i8]], ptr [[B]], i64 [[K]], i64 [[J]], i64 [[I]]
; CHECK-NEXT: store i8 [[SUM_OUTER]], ptr [[GEP_B]], align 1
; CHECK-NEXT: [[K_NEXT:%.*]] = add i64 [[K]], 1
; CHECK-NEXT: [[EC_K:%.*]] = icmp eq i64 [[K_NEXT]], 2
; CHECK-NEXT: br label %[[MIDDLE_LATCH:.*]]
; CHECK: [[INNER_SPLIT]]:
; CHECK-NEXT: [[TMP0]] = add i64 [[K]], 1
; CHECK-NEXT: [[TMP1:%.*]] = icmp eq i64 [[TMP0]], 2
; CHECK-NEXT: br i1 [[TMP1]], label %[[MIDDLE_LATCH_SPLIT]], label %[[INNER]]
; CHECK: [[MIDDLE_LATCH]]:
; CHECK-NEXT: [[J_NEXT:%.*]] = add i64 [[J]], 1
; CHECK-NEXT: [[EC_J:%.*]] = icmp eq i64 [[J_NEXT]], 2
; CHECK-NEXT: br label %[[INNER_SPLIT]]
; CHECK: [[MIDDLE_LATCH_SPLIT]]:
; CHECK-NEXT: [[SUM_MIDDLE_LCSSA]] = phi i8 [ [[SUM_INNER_NEXT]], %[[INNER_SPLIT]] ]
; CHECK-NEXT: [[TMP2]] = add i64 [[J]], 1
; CHECK-NEXT: [[TMP3:%.*]] = icmp eq i64 [[TMP2]], 2
; CHECK-NEXT: br i1 [[TMP3]], label %[[OUTER_LATCH]], label %[[MIDDLE_HEADER]]
; CHECK: [[OUTER_LATCH]]:
; CHECK-NEXT: [[SUM_OUTER_LCSSA]] = phi i8 [ [[SUM_MIDDLE_LCSSA]], %[[MIDDLE_LATCH_SPLIT]] ]
; CHECK-NEXT: [[I_NEXT]] = add i64 [[I]], 1
; CHECK-NEXT: [[EC_I:%.*]] = icmp eq i64 [[I_NEXT]], 2
; CHECK-NEXT: br i1 [[EC_I]], label %[[EXIT:.*]], label %[[OUTER_HEADER]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i8 [ [[SUM_OUTER_LCSSA]], %[[OUTER_LATCH]] ]
; CHECK-NEXT: ret i8 [[RES]]
;
entry:
br label %outer.header
outer.header:
%i = phi i64 [ 0, %entry ], [ %i.next, %outer.latch ]
%sum.outer = phi i8 [ 0, %entry ], [ %sum.outer.lcssa, %outer.latch ]
br label %middle.header
middle.header:
%j = phi i64 [ 0, %outer.header ], [ %j.next, %middle.latch ]
%sum.middle = phi i8 [ %sum.outer, %outer.header ], [ %sum.middle.lcssa, %middle.latch ]
br label %inner
inner:
%k = phi i64 [ 0, %middle.header ], [ %k.next, %inner ]
%sum.inner = phi i8 [ %sum.middle, %middle.header ], [ %sum.inner.next, %inner ]
%gep.A = getelementptr [2 x [2 x i8]], ptr %A, i64 %k, i64 %j, i64 %i
%a = load i8, ptr %gep.A
%sum.inner.next = add i8 %sum.inner, %a
%gep.B = getelementptr [2 x [2 x i8]], ptr %B, i64 %k, i64 %j, i64 %i
store i8 %sum.outer, ptr %gep.B
%k.next = add i64 %k, 1
%ec.k = icmp eq i64 %k.next, 2
br i1 %ec.k, label %middle.latch, label %inner
middle.latch:
%sum.middle.lcssa = phi i8 [ %sum.inner.next, %inner ]
%j.next = add i64 %j, 1
%ec.j = icmp eq i64 %j.next, 2
br i1 %ec.j, label %outer.latch, label %middle.header
outer.latch:
%sum.outer.lcssa = phi i8 [ %sum.middle.lcssa, %middle.latch ]
%i.next = add i64 %i, 1
%ec.i = icmp eq i64 %i.next, 2
br i1 %ec.i, label %exit, label %outer.header
exit:
%res = phi i8 [ %sum.outer.lcssa, %outer.latch ]
ret i8 %res
}