| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py |
| ; RUN: opt -passes=loop-vectorize -force-vector-width=4 -force-vector-interleave=1 -S %s | FileCheck %s |
| |
| define void @test1_pr58811() { |
| ; CHECK-LABEL: @test1_pr58811( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: br label [[LOOP_1_PREHEADER:%.*]] |
| ; CHECK: loop.1.preheader: |
| ; CHECK-NEXT: [[IV_1_PH:%.*]] = phi i32 [ [[SUB93_2:%.*]], [[UNREACHABLE_BB:%.*]] ], [ 0, [[ENTRY:%.*]] ] |
| ; CHECK-NEXT: [[TMP0:%.*]] = sub i32 0, [[IV_1_PH]] |
| ; CHECK-NEXT: br label [[LOOP_1:%.*]] |
| ; CHECK: loop.1: |
| ; CHECK-NEXT: [[INDUCTION_IV:%.*]] = phi i32 [ [[INDUCTION_IV_NEXT:%.*]], [[LOOP_1]] ], [ [[TMP0]], [[LOOP_1_PREHEADER]] ] |
| ; CHECK-NEXT: [[IV_1:%.*]] = phi i32 [ [[IV_1_NEXT:%.*]], [[LOOP_1]] ], [ [[IV_1_PH]], [[LOOP_1_PREHEADER]] ] |
| ; CHECK-NEXT: [[IV_2:%.*]] = phi i32 [ [[IV_2_NEXT:%.*]], [[LOOP_1]] ], [ 0, [[LOOP_1_PREHEADER]] ] |
| ; CHECK-NEXT: [[TMP1:%.*]] = mul nuw nsw i32 [[IV_2]], -1 |
| ; CHECK-NEXT: [[IV_2_NEXT]] = add i32 [[IV_2]], 1 |
| ; CHECK-NEXT: [[IV_1_NEXT]] = add i32 [[IV_2]], [[IV_1]] |
| ; CHECK-NEXT: [[INDUCTION_IV_NEXT]] = add i32 [[INDUCTION_IV]], [[TMP1]] |
| ; CHECK-NEXT: br i1 false, label [[LOOP_1]], label [[LOOP_2_PREHEADER:%.*]] |
| ; CHECK: loop.2.preheader: |
| ; CHECK-NEXT: [[INDUCTION_IV_LCSSA:%.*]] = phi i32 [ [[INDUCTION_IV]], [[LOOP_1]] ] |
| ; CHECK-NEXT: [[IV_1_LCSSA:%.*]] = phi i32 [ [[IV_1]], [[LOOP_1]] ] |
| ; CHECK-NEXT: br i1 false, label [[SCALAR_PH:%.*]], label [[VECTOR_PH:%.*]] |
| ; CHECK: vector.ph: |
| ; CHECK-NEXT: [[IND_END:%.*]] = mul i32 196, [[INDUCTION_IV_LCSSA]] |
| ; CHECK-NEXT: br label [[VECTOR_BODY:%.*]] |
| ; CHECK: vector.body: |
| ; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ] |
| ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 4 |
| ; CHECK-NEXT: [[TMP2:%.*]] = icmp eq i32 [[INDEX_NEXT]], 196 |
| ; CHECK-NEXT: br i1 [[TMP2]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]] |
| ; CHECK: middle.block: |
| ; CHECK-NEXT: [[IND_ESCAPE:%.*]] = sub i32 [[IND_END]], [[INDUCTION_IV_LCSSA]] |
| ; CHECK-NEXT: br i1 false, label [[LOOP_3_PREHEADER:%.*]], label [[SCALAR_PH]] |
| ; CHECK: scalar.ph: |
| ; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i16 [ 196, [[MIDDLE_BLOCK]] ], [ 0, [[LOOP_2_PREHEADER]] ] |
| ; CHECK-NEXT: [[BC_RESUME_VAL1:%.*]] = phi i32 [ [[IND_END]], [[MIDDLE_BLOCK]] ], [ 0, [[LOOP_2_PREHEADER]] ] |
| ; CHECK-NEXT: br label [[LOOP_2:%.*]] |
| ; CHECK: loop.2: |
| ; CHECK-NEXT: [[IV_3:%.*]] = phi i16 [ [[IV_3_NEXT:%.*]], [[LOOP_2]] ], [ [[BC_RESUME_VAL]], [[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[IV_4:%.*]] = phi i32 [ [[IV_4_NEXT:%.*]], [[LOOP_2]] ], [ [[BC_RESUME_VAL1]], [[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[IV_4_NEXT]] = sub i32 [[IV_4]], [[IV_1_LCSSA]] |
| ; CHECK-NEXT: [[IV_3_NEXT]] = add i16 [[IV_3]], 1 |
| ; CHECK-NEXT: [[CMP88_1:%.*]] = icmp ult i16 [[IV_3]], 198 |
| ; CHECK-NEXT: br i1 [[CMP88_1]], label [[LOOP_2]], label [[LOOP_3_PREHEADER]], !llvm.loop [[LOOP3:![0-9]+]] |
| ; CHECK: loop.3.preheader: |
| ; CHECK-NEXT: [[IV_4_LCSSA:%.*]] = phi i32 [ [[IV_4]], [[LOOP_2]] ], [ [[IND_ESCAPE]], [[MIDDLE_BLOCK]] ] |
| ; CHECK-NEXT: br label [[LOOP_3:%.*]] |
| ; CHECK: loop.3: |
| ; CHECK-NEXT: [[IV_5:%.*]] = phi i32 [ [[SUB93_2]], [[LOOP_3]] ], [ 0, [[LOOP_3_PREHEADER]] ] |
| ; CHECK-NEXT: [[SUB93_2]] = sub i32 [[IV_5]], [[IV_4_LCSSA]] |
| ; CHECK-NEXT: br label [[LOOP_3]] |
| ; CHECK: unreachable.bb: |
| ; CHECK-NEXT: br label [[LOOP_1_PREHEADER]] |
| ; |
| entry: |
| br label %loop.1.preheader |
| |
| loop.1.preheader: |
| %iv.1.ph = phi i32 [ %sub93.2, %unreachable.bb ], [ 0, %entry ] |
| br label %loop.1 |
| |
| loop.1: |
| %iv.1 = phi i32 [ %iv.1.next, %loop.1 ], [ %iv.1.ph, %loop.1.preheader ] |
| %iv.2 = phi i32 [ %iv.2.next, %loop.1 ], [ 0, %loop.1.preheader ] |
| %iv.2.next = add i32 %iv.2, 1 |
| %iv.1.next = add i32 %iv.2, %iv.1 |
| br i1 false, label %loop.1, label %loop.2.preheader |
| |
| loop.2.preheader: |
| %iv.1.lcssa = phi i32 [ %iv.1, %loop.1 ] |
| br label %loop.2 |
| |
| loop.2: |
| %iv.3 = phi i16 [ %iv.3.next, %loop.2 ], [ 0, %loop.2.preheader ] |
| %iv.4 = phi i32 [ %iv.4.next, %loop.2 ], [ 0, %loop.2.preheader ] |
| %iv.4.next = sub i32 %iv.4, %iv.1.lcssa |
| %iv.3.next = add i16 %iv.3, 1 |
| %cmp88.1 = icmp ult i16 %iv.3, 198 |
| br i1 %cmp88.1, label %loop.2, label %loop.3.preheader |
| |
| loop.3.preheader: |
| %iv.4.lcssa = phi i32 [ %iv.4, %loop.2 ] |
| br label %loop.3 |
| |
| loop.3: |
| %iv.5 = phi i32 [ %sub93.2, %loop.3 ], [ 0, %loop.3.preheader ] |
| %sub93.2 = sub i32 %iv.5, %iv.4.lcssa |
| br label %loop.3 |
| |
| unreachable.bb: ; No predecessors! |
| br label %loop.1.preheader |
| } |
| |
| define void @test2_pr58811() { |
| ; CHECK-LABEL: @test2_pr58811( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: br label [[LOOP_1_HEADER:%.*]] |
| ; CHECK: loop.1.header.loopexit: |
| ; CHECK-NEXT: [[SUB93_2_LCSSA:%.*]] = phi i32 [ [[SUB93_2:%.*]], [[LOOP_4:%.*]] ] |
| ; CHECK-NEXT: br label [[LOOP_1_HEADER]] |
| ; CHECK: loop.1.header: |
| ; CHECK-NEXT: [[P_1:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[SUB93_2_LCSSA]], [[LOOP_1_HEADER_LOOPEXIT:%.*]] ] |
| ; CHECK-NEXT: [[TMP0:%.*]] = mul i32 [[P_1]], -1 |
| ; CHECK-NEXT: br label [[LOOP_2:%.*]] |
| ; CHECK: loop.2: |
| ; CHECK-NEXT: [[INDUCTION_IV:%.*]] = phi i32 [ [[INDUCTION_IV_NEXT:%.*]], [[LOOP_2]] ], [ [[TMP0]], [[LOOP_1_HEADER]] ] |
| ; CHECK-NEXT: [[IV_2:%.*]] = phi i32 [ [[P_1]], [[LOOP_1_HEADER]] ], [ [[ADD101:%.*]], [[LOOP_2]] ] |
| ; CHECK-NEXT: [[IV_3:%.*]] = phi i32 [ 0, [[LOOP_1_HEADER]] ], [ [[SUB93:%.*]], [[LOOP_2]] ] |
| ; CHECK-NEXT: [[TMP1:%.*]] = mul nuw nsw i32 [[IV_3]], -1 |
| ; CHECK-NEXT: [[SUB93]] = add i32 [[IV_3]], 1 |
| ; CHECK-NEXT: [[ADD101]] = add i32 [[IV_3]], [[IV_2]] |
| ; CHECK-NEXT: [[INDUCTION_IV_NEXT]] = add i32 [[INDUCTION_IV]], [[TMP1]] |
| ; CHECK-NEXT: br i1 false, label [[LOOP_2]], label [[LOOP_3_PREHEADER:%.*]] |
| ; CHECK: loop.3.preheader: |
| ; CHECK-NEXT: [[IV_2_LCSSA:%.*]] = phi i32 [ [[IV_2]], [[LOOP_2]] ] |
| ; CHECK-NEXT: [[INDUCTION_IV_LCSSA:%.*]] = phi i32 [ [[INDUCTION_IV]], [[LOOP_2]] ] |
| ; CHECK-NEXT: br i1 false, label [[SCALAR_PH:%.*]], label [[VECTOR_PH:%.*]] |
| ; CHECK: vector.ph: |
| ; CHECK-NEXT: [[IND_END:%.*]] = mul i32 196, [[INDUCTION_IV_LCSSA]] |
| ; CHECK-NEXT: br label [[VECTOR_BODY:%.*]] |
| ; CHECK: vector.body: |
| ; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ] |
| ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 4 |
| ; CHECK-NEXT: [[TMP2:%.*]] = icmp eq i32 [[INDEX_NEXT]], 196 |
| ; CHECK-NEXT: br i1 [[TMP2]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP4:![0-9]+]] |
| ; CHECK: middle.block: |
| ; CHECK-NEXT: [[IND_ESCAPE:%.*]] = sub i32 [[IND_END]], [[INDUCTION_IV_LCSSA]] |
| ; CHECK-NEXT: br i1 false, label [[LOOP_4_PREHEADER:%.*]], label [[SCALAR_PH]] |
| ; CHECK: scalar.ph: |
| ; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i16 [ 196, [[MIDDLE_BLOCK]] ], [ 0, [[LOOP_3_PREHEADER]] ] |
| ; CHECK-NEXT: [[BC_RESUME_VAL1:%.*]] = phi i32 [ [[IND_END]], [[MIDDLE_BLOCK]] ], [ 0, [[LOOP_3_PREHEADER]] ] |
| ; CHECK-NEXT: br label [[LOOP_3:%.*]] |
| ; CHECK: loop.3: |
| ; CHECK-NEXT: [[IV_4:%.*]] = phi i16 [ [[INC_1:%.*]], [[LOOP_3]] ], [ [[BC_RESUME_VAL]], [[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[IV_5:%.*]] = phi i32 [ [[SUB93_1:%.*]], [[LOOP_3]] ], [ [[BC_RESUME_VAL1]], [[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[SUB93_1]] = sub i32 [[IV_5]], [[IV_2_LCSSA]] |
| ; CHECK-NEXT: [[INC_1]] = add i16 [[IV_4]], 1 |
| ; CHECK-NEXT: [[CMP88_1:%.*]] = icmp ult i16 [[IV_4]], 198 |
| ; CHECK-NEXT: br i1 [[CMP88_1]], label [[LOOP_3]], label [[LOOP_4_PREHEADER]], !llvm.loop [[LOOP5:![0-9]+]] |
| ; CHECK: loop.4.preheader: |
| ; CHECK-NEXT: [[IV_5_LCSSA:%.*]] = phi i32 [ [[IV_5]], [[LOOP_3]] ], [ [[IND_ESCAPE]], [[MIDDLE_BLOCK]] ] |
| ; CHECK-NEXT: br label [[LOOP_4]] |
| ; CHECK: loop.4: |
| ; CHECK-NEXT: [[IV_6:%.*]] = phi i32 [ [[SUB93_2]], [[LOOP_4]] ], [ 0, [[LOOP_4_PREHEADER]] ] |
| ; CHECK-NEXT: [[SUB93_2]] = sub i32 [[IV_6]], [[IV_5_LCSSA]] |
| ; CHECK-NEXT: br i1 false, label [[LOOP_4]], label [[LOOP_1_HEADER_LOOPEXIT]] |
| ; |
| entry: |
| br label %loop.1.header |
| |
| loop.1.header: |
| %p.1 = phi i32 [ 0, %entry ], [ %sub93.2, %loop.4 ] |
| br label %loop.2 |
| |
| loop.2: |
| %iv.2 = phi i32 [ %p.1, %loop.1.header ], [ %add101, %loop.2 ] |
| %iv.3 = phi i32 [ 0, %loop.1.header ], [ %sub93, %loop.2 ] |
| %sub93 = add i32 %iv.3, 1 |
| %add101 = add i32 %iv.3, %iv.2 |
| br i1 false, label %loop.2, label %loop.3 |
| |
| loop.3: |
| %iv.4 = phi i16 [ 0, %loop.2 ], [ %inc.1, %loop.3 ] |
| %iv.5 = phi i32 [ 0, %loop.2 ], [ %sub93.1, %loop.3 ] |
| %sub93.1 = sub i32 %iv.5, %iv.2 |
| %inc.1 = add i16 %iv.4, 1 |
| %cmp88.1 = icmp ult i16 %iv.4, 198 |
| br i1 %cmp88.1, label %loop.3, label %loop.4 |
| |
| loop.4: |
| %iv.6 = phi i32 [ 0, %loop.3 ], [ %sub93.2, %loop.4 ] |
| %sub93.2 = sub i32 %iv.6, %iv.5 |
| br i1 false, label %loop.4, label %loop.1.header |
| } |
| |
| define void @test3_pr58811() { |
| ; CHECK-LABEL: @test3_pr58811( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: br label [[LOOP_1_HEADER:%.*]] |
| ; CHECK: loop.1.header: |
| ; CHECK-NEXT: [[P_1:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[SUB93_2:%.*]], [[LOOP_1_LATCH:%.*]] ] |
| ; CHECK-NEXT: [[REM85:%.*]] = urem i32 1, [[P_1]] |
| ; CHECK-NEXT: br label [[LOOP_2:%.*]] |
| ; CHECK: loop.2: |
| ; CHECK-NEXT: [[P_2:%.*]] = phi i32 [ 1, [[LOOP_1_HEADER]] ], [ 0, [[LOOP_2]] ] |
| ; CHECK-NEXT: [[ADD101:%.*]] = add i32 [[REM85]], [[P_2]] |
| ; CHECK-NEXT: br i1 false, label [[LOOP_2]], label [[LOOP_3_PREHEADER:%.*]] |
| ; CHECK: loop.3.preheader: |
| ; CHECK-NEXT: [[P_2_LCSSA:%.*]] = phi i32 [ [[P_2]], [[LOOP_2]] ] |
| ; CHECK-NEXT: [[ADD101_LCSSA:%.*]] = phi i32 [ [[ADD101]], [[LOOP_2]] ] |
| ; CHECK-NEXT: [[TMP0:%.*]] = udiv i32 1, [[P_1]] |
| ; CHECK-NEXT: [[TMP1:%.*]] = mul nuw i32 [[P_1]], [[TMP0]] |
| ; CHECK-NEXT: [[TMP2:%.*]] = add i32 [[TMP1]], -1 |
| ; CHECK-NEXT: [[TMP3:%.*]] = sub i32 [[TMP2]], [[P_2_LCSSA]] |
| ; CHECK-NEXT: br i1 false, label [[SCALAR_PH:%.*]], label [[VECTOR_PH:%.*]] |
| ; CHECK: vector.ph: |
| ; CHECK-NEXT: [[IND_END:%.*]] = mul i32 196, [[TMP3]] |
| ; CHECK-NEXT: br label [[VECTOR_BODY:%.*]] |
| ; CHECK: vector.body: |
| ; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ] |
| ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 4 |
| ; CHECK-NEXT: [[TMP4:%.*]] = icmp eq i32 [[INDEX_NEXT]], 196 |
| ; CHECK-NEXT: br i1 [[TMP4]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP6:![0-9]+]] |
| ; CHECK: middle.block: |
| ; CHECK-NEXT: [[IND_ESCAPE:%.*]] = sub i32 [[IND_END]], [[TMP3]] |
| ; CHECK-NEXT: br i1 false, label [[LOOP_4_PREHEADER:%.*]], label [[SCALAR_PH]] |
| ; CHECK: scalar.ph: |
| ; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i16 [ 196, [[MIDDLE_BLOCK]] ], [ 0, [[LOOP_3_PREHEADER]] ] |
| ; CHECK-NEXT: [[BC_RESUME_VAL1:%.*]] = phi i32 [ [[IND_END]], [[MIDDLE_BLOCK]] ], [ 0, [[LOOP_3_PREHEADER]] ] |
| ; CHECK-NEXT: br label [[LOOP_3:%.*]] |
| ; CHECK: loop.3: |
| ; CHECK-NEXT: [[IV_3:%.*]] = phi i16 [ [[INC_1:%.*]], [[LOOP_3]] ], [ [[BC_RESUME_VAL]], [[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[IV_4:%.*]] = phi i32 [ [[SUB93_1:%.*]], [[LOOP_3]] ], [ [[BC_RESUME_VAL1]], [[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[SUB93_1]] = sub i32 [[IV_4]], [[ADD101_LCSSA]] |
| ; CHECK-NEXT: [[INC_1]] = add i16 [[IV_3]], 1 |
| ; CHECK-NEXT: [[CMP88_1:%.*]] = icmp ult i16 [[IV_3]], 198 |
| ; CHECK-NEXT: br i1 [[CMP88_1]], label [[LOOP_3]], label [[LOOP_4_PREHEADER]], !llvm.loop [[LOOP7:![0-9]+]] |
| ; CHECK: loop.4.preheader: |
| ; CHECK-NEXT: [[IV_4_LCSSA:%.*]] = phi i32 [ [[IV_4]], [[LOOP_3]] ], [ [[IND_ESCAPE]], [[MIDDLE_BLOCK]] ] |
| ; CHECK-NEXT: br label [[LOOP_4:%.*]] |
| ; CHECK: loop.4: |
| ; CHECK-NEXT: [[IV_5:%.*]] = phi i32 [ [[SUB93_2]], [[LOOP_4]] ], [ 0, [[LOOP_4_PREHEADER]] ] |
| ; CHECK-NEXT: [[SUB93_2]] = sub i32 [[IV_5]], [[IV_4_LCSSA]] |
| ; CHECK-NEXT: br label [[LOOP_4]] |
| ; CHECK: loop.1.latch: |
| ; CHECK-NEXT: br label [[LOOP_1_HEADER]] |
| ; |
| entry: |
| br label %loop.1.header |
| |
| loop.1.header: |
| %p.1 = phi i32 [ 0, %entry ], [ %sub93.2, %loop.1.latch ] |
| %rem85 = urem i32 1, %p.1 |
| br label %loop.2 |
| |
| loop.2: |
| %p.2 = phi i32 [ 1, %loop.1.header ], [ 0, %loop.2 ] |
| %add101 = add i32 %rem85, %p.2 |
| br i1 false, label %loop.2, label %loop.3 |
| |
| loop.3: |
| %iv.3 = phi i16 [ 0, %loop.2 ], [ %inc.1, %loop.3 ] |
| %iv.4 = phi i32 [ 0, %loop.2 ], [ %sub93.1, %loop.3 ] |
| %sub93.1 = sub i32 %iv.4, %add101 |
| %inc.1 = add i16 %iv.3, 1 |
| %cmp88.1 = icmp ult i16 %iv.3, 198 |
| br i1 %cmp88.1, label %loop.3, label %loop.4 |
| |
| loop.4: |
| %iv.5 = phi i32 [ 0, %loop.3 ], [ %sub93.2, %loop.4 ] |
| %sub93.2 = sub i32 %iv.5, %iv.4 |
| br label %loop.4 |
| |
| loop.1.latch: ; No predecessors! |
| br label %loop.1.header |
| } |