| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 6 |
| ; RUN: opt -aa-pipeline=basic-aa -passes=loop-distribute -enable-loop-distribute -verify-loop-info -verify-dom-info -S \ |
| ; RUN: < %s | FileCheck %s |
| |
| ; Doubly nested loop with two statements in the innermost loop. |
| ; Statement S2 can be put into a separate loop because there is no dependence between S1 and S2. |
| ; |
| ; for (int i = 0; i < N; i++) { |
| ; for (int j = 0; j < M; j++) { |
| ; S1: A[i][j+1] = A[i][j] + B[i][j] + C[i][j] // Statement S1 |
| ; ================================ |
| ; S2: D[i][j] = E[i][j] * F[i][j]; // Statement 2 |
| ; } |
| ; } |
| |
| define void @doubly_nested_distributable(ptr noalias %A, ptr noalias %B, ptr noalias %C, |
| ptr noalias %D, ptr noalias %E, ptr noalias %F, |
| i64 %N, i64 %M) { |
| ; CHECK-LABEL: define void @doubly_nested_distributable( |
| ; CHECK-SAME: ptr noalias [[A:%.*]], ptr noalias [[B:%.*]], ptr noalias [[C:%.*]], ptr noalias [[D:%.*]], ptr noalias [[E:%.*]], ptr noalias [[F:%.*]], i64 [[N:%.*]], i64 [[M:%.*]]) { |
| ; CHECK-NEXT: [[ENTRY:.*]]: |
| ; CHECK-NEXT: br label %[[FOR_I_HEADER:.*]] |
| ; CHECK: [[FOR_I_HEADER]]: |
| ; CHECK-NEXT: [[I:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[I_NEXT:%.*]], %[[FOR_I_INC:.*]] ] |
| ; CHECK-NEXT: [[I_CMP:%.*]] = icmp slt i64 [[I]], [[N]] |
| ; CHECK-NEXT: br i1 [[I_CMP]], label %[[FOR_J_PREHEADER_LDIST1:.*]], label %[[FOR_END:.*]] |
| ; CHECK: [[FOR_J_PREHEADER_LDIST1]]: |
| ; CHECK-NEXT: br label %[[FOR_J_BODY_LDIST1:.*]] |
| ; CHECK: [[FOR_J_BODY_LDIST1]]: |
| ; CHECK-NEXT: [[J_LDIST1:%.*]] = phi i64 [ 0, %[[FOR_J_PREHEADER_LDIST1]] ], [ [[J_NEXT_LDIST1:%.*]], %[[FOR_J_BODY_LDIST1]] ] |
| ; CHECK-NEXT: [[IDX_I_LDIST1:%.*]] = mul i64 [[I]], [[M]] |
| ; CHECK-NEXT: [[IDX_LDIST1:%.*]] = add i64 [[IDX_I_LDIST1]], [[J_LDIST1]] |
| ; CHECK-NEXT: [[ARRAYIDXA_LDIST1:%.*]] = getelementptr inbounds i32, ptr [[A]], i64 [[IDX_LDIST1]] |
| ; CHECK-NEXT: [[LOADA_LDIST1:%.*]] = load i32, ptr [[ARRAYIDXA_LDIST1]], align 4 |
| ; CHECK-NEXT: [[ARRAYIDXB_LDIST1:%.*]] = getelementptr inbounds i32, ptr [[B]], i64 [[IDX_LDIST1]] |
| ; CHECK-NEXT: [[LOADB_LDIST1:%.*]] = load i32, ptr [[ARRAYIDXB_LDIST1]], align 4 |
| ; CHECK-NEXT: [[ARRAYIDXC_LDIST1:%.*]] = getelementptr inbounds i32, ptr [[C]], i64 [[IDX_LDIST1]] |
| ; CHECK-NEXT: [[LOADC_LDIST1:%.*]] = load i32, ptr [[ARRAYIDXC_LDIST1]], align 4 |
| ; CHECK-NEXT: [[ADDS1_LDIST1:%.*]] = add i32 [[LOADB_LDIST1]], [[LOADC_LDIST1]] |
| ; CHECK-NEXT: [[ADDWITHDEP_LDIST1:%.*]] = add i32 [[ADDS1_LDIST1]], [[LOADA_LDIST1]] |
| ; CHECK-NEXT: [[J_NEXT_LDIST1]] = add nuw nsw i64 [[J_LDIST1]], 1 |
| ; CHECK-NEXT: [[IDX_NEXT_LDIST1:%.*]] = add i64 [[IDX_LDIST1]], 1 |
| ; CHECK-NEXT: [[ARRAYIDXA_NEXT_LDIST1:%.*]] = getelementptr inbounds i32, ptr [[A]], i64 [[IDX_NEXT_LDIST1]] |
| ; CHECK-NEXT: store i32 [[ADDWITHDEP_LDIST1]], ptr [[ARRAYIDXA_NEXT_LDIST1]], align 4 |
| ; CHECK-NEXT: [[EXITCOND_J_LDIST1:%.*]] = icmp eq i64 [[J_NEXT_LDIST1]], [[M]] |
| ; CHECK-NEXT: br i1 [[EXITCOND_J_LDIST1]], label %[[FOR_J_PREHEADER:.*]], label %[[FOR_J_BODY_LDIST1]] |
| ; CHECK: [[FOR_J_PREHEADER]]: |
| ; CHECK-NEXT: br label %[[FOR_J_BODY:.*]] |
| ; CHECK: [[FOR_J_BODY]]: |
| ; CHECK-NEXT: [[J:%.*]] = phi i64 [ 0, %[[FOR_J_PREHEADER]] ], [ [[J_NEXT:%.*]], %[[FOR_J_BODY]] ] |
| ; CHECK-NEXT: [[IDX_I:%.*]] = mul i64 [[I]], [[M]] |
| ; CHECK-NEXT: [[IDX:%.*]] = add i64 [[IDX_I]], [[J]] |
| ; CHECK-NEXT: [[J_NEXT]] = add nuw nsw i64 [[J]], 1 |
| ; CHECK-NEXT: [[ARRAYIDXD:%.*]] = getelementptr inbounds i32, ptr [[D]], i64 [[IDX]] |
| ; CHECK-NEXT: [[ARRAYIDXE:%.*]] = getelementptr inbounds i32, ptr [[E]], i64 [[IDX]] |
| ; CHECK-NEXT: [[LOADE:%.*]] = load i32, ptr [[ARRAYIDXE]], align 4 |
| ; CHECK-NEXT: [[ARRAYIDXF:%.*]] = getelementptr inbounds i32, ptr [[F]], i64 [[IDX]] |
| ; CHECK-NEXT: [[LOADF:%.*]] = load i32, ptr [[ARRAYIDXF]], align 4 |
| ; CHECK-NEXT: [[MULS2:%.*]] = mul i32 [[LOADE]], [[LOADF]] |
| ; CHECK-NEXT: store i32 [[MULS2]], ptr [[ARRAYIDXD]], align 4 |
| ; CHECK-NEXT: [[EXITCOND_J:%.*]] = icmp eq i64 [[J_NEXT]], [[M]] |
| ; CHECK-NEXT: br i1 [[EXITCOND_J]], label %[[FOR_J_END:.*]], label %[[FOR_J_BODY]] |
| ; CHECK: [[FOR_J_END]]: |
| ; CHECK-NEXT: br label %[[FOR_I_INC]] |
| ; CHECK: [[FOR_I_INC]]: |
| ; CHECK-NEXT: [[I_NEXT]] = add nuw nsw i64 [[I]], 1 |
| ; CHECK-NEXT: br label %[[FOR_I_HEADER]] |
| ; CHECK: [[FOR_END]]: |
| ; CHECK-NEXT: ret void |
| ; |
| entry: |
| br label %for.i.header |
| |
| for.i.header: ; preds = %for.i.inc, %entry |
| %i = phi i64 [ 0, %entry ], [ %i.next, %for.i.inc ] |
| %i.cmp = icmp slt i64 %i, %N |
| br i1 %i.cmp, label %for.j.preheader, label %for.end |
| |
| for.j.preheader: ; preds = %for.i.header |
| br label %for.j.body |
| |
| for.j.body: ; preds = %for.j.body, %for.j.preheader |
| %j = phi i64 [ 0, %for.j.preheader ], [ %j.next, %for.j.body ] |
| |
| %idx.i = mul i64 %i, %M |
| %idx = add i64 %idx.i, %j |
| |
| ; Statement 1: A[i][j+1] = A[i][j] + B[i][j] + C[i][j] |
| %arrayidxA = getelementptr inbounds i32, ptr %A, i64 %idx |
| %loadA = load i32, ptr %arrayidxA, align 4 |
| |
| %arrayidxB = getelementptr inbounds i32, ptr %B, i64 %idx |
| %loadB = load i32, ptr %arrayidxB, align 4 |
| |
| %arrayidxC = getelementptr inbounds i32, ptr %C, i64 %idx |
| %loadC = load i32, ptr %arrayidxC, align 4 |
| |
| %addS1 = add i32 %loadB, %loadC |
| %addWithDep = add i32 %addS1, %loadA |
| |
| %j.next = add nuw nsw i64 %j, 1 |
| %idx.next = add i64 %idx, 1 |
| %arrayidxA_next = getelementptr inbounds i32, ptr %A, i64 %idx.next |
| store i32 %addWithDep, ptr %arrayidxA_next, align 4 |
| |
| ; Statement 2: D[i][j] = E[i][j] * F[i][j] |
| %arrayidxD = getelementptr inbounds i32, ptr %D, i64 %idx |
| %arrayidxE = getelementptr inbounds i32, ptr %E, i64 %idx |
| %loadE = load i32, ptr %arrayidxE, align 4 |
| |
| %arrayidxF = getelementptr inbounds i32, ptr %F, i64 %idx |
| %loadF = load i32, ptr %arrayidxF, align 4 |
| |
| %mulS2 = mul i32 %loadE, %loadF |
| store i32 %mulS2, ptr %arrayidxD, align 4 |
| |
| %exitcond.j = icmp eq i64 %j.next, %M |
| br i1 %exitcond.j, label %for.j.end, label %for.j.body |
| |
| for.j.end: ; preds = %for.j.body |
| br label %for.i.inc |
| |
| for.i.inc: ; preds = %for.j.end |
| %i.next = add nuw nsw i64 %i, 1 |
| br label %for.i.header |
| |
| for.end: ; preds = %for.i.header |
| ret void |
| } |