blob: 6f1d275f6a385a87d63b33cfb731cd99fcb4bad7 [file] [edit]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 6
; RUN: opt < %s -passes=loop-interchange -loop-interchange-profitabilities=ignore -S | FileCheck %s
; sum = 0.0;
; for (i = 0; i < 2; i++)
; for (j = 0; j < 2; j++)
; sum += A[i][j];
;
; The fadd instruction has reassoc flag, so it's legal to interchange the
; loops. However, it also has ninf flag, which means the transformation
; potentially produces a poison due to the change of the order of evaluation.
; For example, consider the case where
; A[2][2] = {{FLT_MAX, -FLT_MAX}, {FLT_MAX, -FLT_MAX}}.
;
; FIXME: The ninf flag should be dropped when the loop interchange is applied.
;
define noundef float @reduction_reassoc_ninf(ptr %A) {
; CHECK-LABEL: define noundef float @reduction_reassoc_ninf(
; CHECK-SAME: ptr [[A:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*:]]
; CHECK-NEXT: br label %[[FOR_J_PREHEADER:.*]]
; CHECK: [[FOR_I_HEADER_PREHEADER:.*]]:
; CHECK-NEXT: br label %[[FOR_I_HEADER:.*]]
; CHECK: [[FOR_I_HEADER]]:
; CHECK-NEXT: [[I:%.*]] = phi i64 [ [[I_INC:%.*]], %[[FOR_I_LATCH:.*]] ], [ 0, %[[FOR_I_HEADER_PREHEADER]] ]
; CHECK-NEXT: [[SUM_J:%.*]] = phi float [ [[SUM_J_NEXT:%.*]], %[[FOR_I_LATCH]] ], [ [[SUM_I:%.*]], %[[FOR_I_HEADER_PREHEADER]] ]
; CHECK-NEXT: br label %[[FOR_J_SPLIT1:.*]]
; CHECK: [[FOR_J_PREHEADER]]:
; CHECK-NEXT: br label %[[FOR_J:.*]]
; CHECK: [[FOR_J]]:
; CHECK-NEXT: [[J:%.*]] = phi i64 [ [[TMP0:%.*]], %[[FOR_J_SPLIT:.*]] ], [ 0, %[[FOR_J_PREHEADER]] ]
; CHECK-NEXT: [[SUM_I]] = phi float [ [[SUM_I_NEXT:%.*]], %[[FOR_J_SPLIT]] ], [ 0.000000e+00, %[[FOR_J_PREHEADER]] ]
; CHECK-NEXT: br label %[[FOR_I_HEADER_PREHEADER]]
; CHECK: [[FOR_J_SPLIT1]]:
; CHECK-NEXT: [[GEP:%.*]] = getelementptr [2 x float], ptr [[A]], i64 [[I]], i64 [[J]]
; CHECK-NEXT: [[VAL:%.*]] = load float, ptr [[GEP]], align 4
; CHECK-NEXT: [[SUM_J_NEXT]] = fadd reassoc float [[SUM_J]], [[VAL]]
; CHECK-NEXT: [[J_INC:%.*]] = add i64 [[J]], 1
; CHECK-NEXT: [[EC_J:%.*]] = icmp eq i64 [[J_INC]], 2
; CHECK-NEXT: br label %[[FOR_I_LATCH]]
; CHECK: [[FOR_J_SPLIT]]:
; CHECK-NEXT: [[SUM_I_NEXT]] = phi float [ [[SUM_J_NEXT]], %[[FOR_I_LATCH]] ]
; CHECK-NEXT: [[TMP0]] = add i64 [[J]], 1
; CHECK-NEXT: [[TMP1:%.*]] = icmp eq i64 [[TMP0]], 2
; CHECK-NEXT: br i1 [[TMP1]], label %[[EXIT:.*]], label %[[FOR_J]]
; CHECK: [[FOR_I_LATCH]]:
; CHECK-NEXT: [[I_INC]] = add i64 [[I]], 1
; CHECK-NEXT: [[EC_I:%.*]] = icmp eq i64 [[I_INC]], 2
; CHECK-NEXT: br i1 [[EC_I]], label %[[FOR_J_SPLIT]], label %[[FOR_I_HEADER]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[SUM_I_NEXT_LCSSA:%.*]] = phi float [ [[SUM_I_NEXT]], %[[FOR_J_SPLIT]] ]
; CHECK-NEXT: ret float [[SUM_I_NEXT_LCSSA]]
;
entry:
br label %for.i.header
for.i.header:
%i = phi i64 [ 0, %entry ], [ %i.inc, %for.i.latch ]
%sum.i = phi float [ 0.0, %entry ], [ %sum.i.next, %for.i.latch ]
br label %for.j
for.j:
%j = phi i64 [ 0, %for.i.header ], [ %j.inc, %for.j ]
%sum.j = phi float [ %sum.i, %for.i.header ], [ %sum.j.next, %for.j ]
%gep = getelementptr [2 x float], ptr %A, i64 %i, i64 %j
%val = load float, ptr %gep
%sum.j.next = fadd reassoc ninf float %sum.j, %val
%j.inc = add i64 %j, 1
%ec.j = icmp eq i64 %j.inc, 2
br i1 %ec.j, label %for.i.latch, label %for.j
for.i.latch:
%sum.i.next = phi float [ %sum.j.next, %for.j ]
%i.inc = add i64 %i, 1
%ec.i = icmp eq i64 %i.inc, 2
br i1 %ec.i, label %exit, label %for.i.header
exit:
ret float %sum.i.next
}
; for (i = 0; i < 2; i++)
; for (j = 0; j < 2; j++)
; C[i][j] = A[i][j] + B[i][j];
;
; The fadd instruction has ninf flag, but different from the above example,
; it's not a reduction so interchanging the loops shouldn't result in a poison
; value.
;
define void @non_reduction_ninf(ptr %A, ptr %B, ptr noalias %C) {
; CHECK-LABEL: define void @non_reduction_ninf(
; CHECK-SAME: ptr [[A:%.*]], ptr [[B:%.*]], ptr noalias [[C:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*:]]
; CHECK-NEXT: br label %[[FOR_J_PREHEADER:.*]]
; CHECK: [[FOR_I_HEADER_PREHEADER:.*]]:
; CHECK-NEXT: br label %[[FOR_I_HEADER:.*]]
; CHECK: [[FOR_I_HEADER]]:
; CHECK-NEXT: [[I:%.*]] = phi i64 [ [[I_INC:%.*]], %[[FOR_I_LATCH:.*]] ], [ 0, %[[FOR_I_HEADER_PREHEADER]] ]
; CHECK-NEXT: br label %[[FOR_J_SPLIT1:.*]]
; CHECK: [[FOR_J_PREHEADER]]:
; CHECK-NEXT: br label %[[FOR_J:.*]]
; CHECK: [[FOR_J]]:
; CHECK-NEXT: [[J:%.*]] = phi i64 [ [[TMP0:%.*]], %[[FOR_J_SPLIT:.*]] ], [ 0, %[[FOR_J_PREHEADER]] ]
; CHECK-NEXT: br label %[[FOR_I_HEADER_PREHEADER]]
; CHECK: [[FOR_J_SPLIT1]]:
; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr [2 x float], ptr [[A]], i64 [[I]], i64 [[J]]
; CHECK-NEXT: [[VAL_A:%.*]] = load float, ptr [[GEP_A]], align 4
; CHECK-NEXT: [[GEP_B:%.*]] = getelementptr [2 x float], ptr [[B]], i64 [[I]], i64 [[J]]
; CHECK-NEXT: [[VAL_B:%.*]] = load float, ptr [[GEP_B]], align 4
; CHECK-NEXT: [[SUM:%.*]] = fadd ninf float [[VAL_A]], [[VAL_B]]
; CHECK-NEXT: [[GEP_C:%.*]] = getelementptr [2 x float], ptr [[C]], i64 [[I]], i64 [[J]]
; CHECK-NEXT: store float [[SUM]], ptr [[GEP_C]], align 4
; CHECK-NEXT: [[J_INC:%.*]] = add i64 [[J]], 1
; CHECK-NEXT: [[EC_J:%.*]] = icmp eq i64 [[J_INC]], 2
; CHECK-NEXT: br label %[[FOR_I_LATCH]]
; CHECK: [[FOR_J_SPLIT]]:
; CHECK-NEXT: [[TMP0]] = add i64 [[J]], 1
; CHECK-NEXT: [[TMP1:%.*]] = icmp eq i64 [[TMP0]], 2
; CHECK-NEXT: br i1 [[TMP1]], label %[[EXIT:.*]], label %[[FOR_J]]
; CHECK: [[FOR_I_LATCH]]:
; CHECK-NEXT: [[I_INC]] = add i64 [[I]], 1
; CHECK-NEXT: [[EC_I:%.*]] = icmp eq i64 [[I_INC]], 2
; CHECK-NEXT: br i1 [[EC_I]], label %[[FOR_J_SPLIT]], label %[[FOR_I_HEADER]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: ret void
;
entry:
br label %for.i.header
for.i.header:
%i = phi i64 [ 0, %entry ], [ %i.inc, %for.i.latch ]
br label %for.j
for.j:
%j = phi i64 [ 0, %for.i.header ], [ %j.inc, %for.j ]
%gep.A = getelementptr [2 x float], ptr %A, i64 %i, i64 %j
%val.A = load float, ptr %gep.A
%gep.B = getelementptr [2 x float], ptr %B, i64 %i, i64 %j
%val.B = load float, ptr %gep.B
%sum = fadd ninf float %val.A, %val.B
%gep.C = getelementptr [2 x float], ptr %C, i64 %i, i64 %j
store float %sum, ptr %gep.C
%j.inc = add i64 %j, 1
%ec.j = icmp eq i64 %j.inc, 2
br i1 %ec.j, label %for.i.latch, label %for.j
for.i.latch:
%i.inc = add i64 %i, 1
%ec.i = icmp eq i64 %i.inc, 2
br i1 %ec.i, label %exit, label %for.i.header
exit:
ret void
}