| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals none --version 6 |
| ; RUN: opt -passes=loop-vectorize -force-vector-width=2 -force-vector-interleave=1 -S %s | FileCheck --check-prefix=VF2 %s |
| ; RUN: opt -passes=loop-vectorize -force-vector-width=4 -force-vector-interleave=1 -S %s | FileCheck %s |
| |
| define void @test1_pr58811(ptr %dst) { |
| ; VF2-LABEL: define void @test1_pr58811( |
| ; VF2-SAME: ptr [[DST:%.*]]) { |
| ; VF2-NEXT: [[ENTRY:.*]]: |
| ; VF2-NEXT: br label %[[LOOP_1_PREHEADER:.*]] |
| ; VF2: [[LOOP_1_PREHEADER]]: |
| ; VF2-NEXT: [[IV_1_PH:%.*]] = phi i32 [ [[SUB93_2:%.*]], %[[UNREACHABLE_BB:.*]] ], [ 0, %[[ENTRY]] ] |
| ; VF2-NEXT: [[TMP0:%.*]] = sub i32 0, [[IV_1_PH]] |
| ; VF2-NEXT: br label %[[LOOP_1:.*]] |
| ; VF2: [[LOOP_1]]: |
| ; VF2-NEXT: [[INDUCTION_IV:%.*]] = phi i32 [ [[INDUCTION_IV_NEXT:%.*]], %[[LOOP_1]] ], [ [[TMP0]], %[[LOOP_1_PREHEADER]] ] |
| ; VF2-NEXT: [[IV_1:%.*]] = phi i32 [ [[IV_1_NEXT:%.*]], %[[LOOP_1]] ], [ [[IV_1_PH]], %[[LOOP_1_PREHEADER]] ] |
| ; VF2-NEXT: [[IV_2:%.*]] = phi i32 [ [[IV_2_NEXT:%.*]], %[[LOOP_1]] ], [ 0, %[[LOOP_1_PREHEADER]] ] |
| ; VF2-NEXT: [[TMP1:%.*]] = mul nuw nsw i32 [[IV_2]], -1 |
| ; VF2-NEXT: [[IV_2_NEXT]] = add i32 [[IV_2]], 1 |
| ; VF2-NEXT: [[IV_1_NEXT]] = add i32 [[IV_2]], [[IV_1]] |
| ; VF2-NEXT: [[INDUCTION_IV_NEXT]] = add i32 [[INDUCTION_IV]], [[TMP1]] |
| ; VF2-NEXT: br i1 false, label %[[LOOP_1]], label %[[LOOP_2_PREHEADER:.*]] |
| ; VF2: [[LOOP_2_PREHEADER]]: |
| ; VF2-NEXT: [[IV_1_LCSSA:%.*]] = phi i32 [ [[IV_1]], %[[LOOP_1]] ] |
| ; VF2-NEXT: br label %[[VECTOR_PH:.*]] |
| ; VF2: [[VECTOR_PH]]: |
| ; VF2-NEXT: [[TMP2:%.*]] = mul i32 198, [[INDUCTION_IV]] |
| ; VF2-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <2 x i32> poison, i32 [[INDUCTION_IV]], i64 0 |
| ; VF2-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <2 x i32> [[BROADCAST_SPLATINSERT]], <2 x i32> poison, <2 x i32> zeroinitializer |
| ; VF2-NEXT: [[TMP3:%.*]] = mul <2 x i32> <i32 0, i32 1>, [[BROADCAST_SPLAT]] |
| ; VF2-NEXT: [[INDUCTION:%.*]] = add <2 x i32> zeroinitializer, [[TMP3]] |
| ; VF2-NEXT: [[TMP4:%.*]] = mul i32 [[INDUCTION_IV]], 2 |
| ; VF2-NEXT: [[BROADCAST_SPLATINSERT1:%.*]] = insertelement <2 x i32> poison, i32 [[TMP4]], i64 0 |
| ; VF2-NEXT: [[BROADCAST_SPLAT2:%.*]] = shufflevector <2 x i32> [[BROADCAST_SPLATINSERT1]], <2 x i32> poison, <2 x i32> zeroinitializer |
| ; VF2-NEXT: br label %[[VECTOR_BODY:.*]] |
| ; VF2: [[VECTOR_BODY]]: |
| ; VF2-NEXT: [[INDEX:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; VF2-NEXT: [[VEC_IND:%.*]] = phi <2 x i32> [ [[INDUCTION]], %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; VF2-NEXT: [[OFFSET_IDX:%.*]] = trunc i32 [[INDEX]] to i16 |
| ; VF2-NEXT: [[TMP5:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[OFFSET_IDX]] |
| ; VF2-NEXT: store <2 x i32> [[VEC_IND]], ptr [[TMP5]], align 4 |
| ; VF2-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 2 |
| ; VF2-NEXT: [[VEC_IND_NEXT]] = add <2 x i32> [[VEC_IND]], [[BROADCAST_SPLAT2]] |
| ; VF2-NEXT: [[TMP6:%.*]] = icmp eq i32 [[INDEX_NEXT]], 198 |
| ; VF2-NEXT: br i1 [[TMP6]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]] |
| ; VF2: [[MIDDLE_BLOCK]]: |
| ; VF2-NEXT: br label %[[SCALAR_PH:.*]] |
| ; VF2: [[SCALAR_PH]]: |
| ; VF2-NEXT: br label %[[LOOP_2:.*]] |
| ; VF2: [[LOOP_2]]: |
| ; VF2-NEXT: [[IV_3:%.*]] = phi i16 [ [[IV_3_NEXT:%.*]], %[[LOOP_2]] ], [ 198, %[[SCALAR_PH]] ] |
| ; VF2-NEXT: [[IV_4:%.*]] = phi i32 [ [[IV_4_NEXT:%.*]], %[[LOOP_2]] ], [ [[TMP2]], %[[SCALAR_PH]] ] |
| ; VF2-NEXT: [[GEP_DST:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[IV_3]] |
| ; VF2-NEXT: store i32 [[IV_4]], ptr [[GEP_DST]], align 4 |
| ; VF2-NEXT: [[IV_4_NEXT]] = sub i32 [[IV_4]], [[IV_1_LCSSA]] |
| ; VF2-NEXT: [[IV_3_NEXT]] = add i16 [[IV_3]], 1 |
| ; VF2-NEXT: [[CMP88_1:%.*]] = icmp ult i16 [[IV_3]], 198 |
| ; VF2-NEXT: br i1 [[CMP88_1]], label %[[LOOP_2]], label %[[LOOP_3_PREHEADER:.*]], !llvm.loop [[LOOP3:![0-9]+]] |
| ; VF2: [[LOOP_3_PREHEADER]]: |
| ; VF2-NEXT: [[IV_4_LCSSA:%.*]] = phi i32 [ [[IV_4]], %[[LOOP_2]] ] |
| ; VF2-NEXT: br label %[[LOOP_3:.*]] |
| ; VF2: [[LOOP_3]]: |
| ; VF2-NEXT: [[IV_5:%.*]] = phi i32 [ [[SUB93_2]], %[[LOOP_3]] ], [ 0, %[[LOOP_3_PREHEADER]] ] |
| ; VF2-NEXT: [[SUB93_2]] = sub i32 [[IV_5]], [[IV_4_LCSSA]] |
| ; VF2-NEXT: br label %[[LOOP_3]] |
| ; VF2: [[UNREACHABLE_BB]]: |
| ; VF2-NEXT: br label %[[LOOP_1_PREHEADER]] |
| ; |
| ; CHECK-LABEL: define void @test1_pr58811( |
| ; CHECK-SAME: ptr [[DST:%.*]]) { |
| ; CHECK-NEXT: [[ENTRY:.*]]: |
| ; CHECK-NEXT: br label %[[LOOP_1_PREHEADER:.*]] |
| ; CHECK: [[LOOP_1_PREHEADER]]: |
| ; CHECK-NEXT: [[IV_1_PH:%.*]] = phi i32 [ [[SUB93_2:%.*]], %[[UNREACHABLE_BB:.*]] ], [ 0, %[[ENTRY]] ] |
| ; CHECK-NEXT: [[TMP0:%.*]] = sub i32 0, [[IV_1_PH]] |
| ; CHECK-NEXT: br label %[[LOOP_1:.*]] |
| ; CHECK: [[LOOP_1]]: |
| ; CHECK-NEXT: [[INDUCTION_IV:%.*]] = phi i32 [ [[INDUCTION_IV_NEXT:%.*]], %[[LOOP_1]] ], [ [[TMP0]], %[[LOOP_1_PREHEADER]] ] |
| ; CHECK-NEXT: [[IV_1:%.*]] = phi i32 [ [[IV_1_NEXT:%.*]], %[[LOOP_1]] ], [ [[IV_1_PH]], %[[LOOP_1_PREHEADER]] ] |
| ; CHECK-NEXT: [[IV_2:%.*]] = phi i32 [ [[IV_2_NEXT:%.*]], %[[LOOP_1]] ], [ 0, %[[LOOP_1_PREHEADER]] ] |
| ; CHECK-NEXT: [[TMP1:%.*]] = mul nuw nsw i32 [[IV_2]], -1 |
| ; CHECK-NEXT: [[IV_2_NEXT]] = add i32 [[IV_2]], 1 |
| ; CHECK-NEXT: [[IV_1_NEXT]] = add i32 [[IV_2]], [[IV_1]] |
| ; CHECK-NEXT: [[INDUCTION_IV_NEXT]] = add i32 [[INDUCTION_IV]], [[TMP1]] |
| ; CHECK-NEXT: br i1 false, label %[[LOOP_1]], label %[[LOOP_2_PREHEADER:.*]] |
| ; CHECK: [[LOOP_2_PREHEADER]]: |
| ; CHECK-NEXT: [[IV_1_LCSSA:%.*]] = phi i32 [ [[IV_1]], %[[LOOP_1]] ] |
| ; CHECK-NEXT: br label %[[VECTOR_PH:.*]] |
| ; CHECK: [[VECTOR_PH]]: |
| ; CHECK-NEXT: [[IND_END:%.*]] = mul i32 196, [[INDUCTION_IV]] |
| ; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <4 x i32> poison, i32 [[INDUCTION_IV]], i64 0 |
| ; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <4 x i32> [[BROADCAST_SPLATINSERT]], <4 x i32> poison, <4 x i32> zeroinitializer |
| ; CHECK-NEXT: [[TMP3:%.*]] = mul <4 x i32> <i32 0, i32 1, i32 2, i32 3>, [[BROADCAST_SPLAT]] |
| ; CHECK-NEXT: [[INDUCTION:%.*]] = add <4 x i32> zeroinitializer, [[TMP3]] |
| ; CHECK-NEXT: [[TMP4:%.*]] = mul i32 [[INDUCTION_IV]], 4 |
| ; CHECK-NEXT: [[BROADCAST_SPLATINSERT1:%.*]] = insertelement <4 x i32> poison, i32 [[TMP4]], i64 0 |
| ; CHECK-NEXT: [[BROADCAST_SPLAT2:%.*]] = shufflevector <4 x i32> [[BROADCAST_SPLATINSERT1]], <4 x i32> poison, <4 x i32> zeroinitializer |
| ; CHECK-NEXT: br label %[[VECTOR_BODY:.*]] |
| ; CHECK: [[VECTOR_BODY]]: |
| ; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; CHECK-NEXT: [[VEC_IND:%.*]] = phi <4 x i32> [ [[INDUCTION]], %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; CHECK-NEXT: [[OFFSET_IDX:%.*]] = trunc i32 [[INDEX]] to i16 |
| ; CHECK-NEXT: [[TMP5:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[OFFSET_IDX]] |
| ; CHECK-NEXT: store <4 x i32> [[VEC_IND]], ptr [[TMP5]], align 4 |
| ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 4 |
| ; CHECK-NEXT: [[VEC_IND_NEXT]] = add <4 x i32> [[VEC_IND]], [[BROADCAST_SPLAT2]] |
| ; CHECK-NEXT: [[TMP2:%.*]] = icmp eq i32 [[INDEX_NEXT]], 196 |
| ; CHECK-NEXT: br i1 [[TMP2]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]] |
| ; CHECK: [[MIDDLE_BLOCK]]: |
| ; CHECK-NEXT: br label %[[SCALAR_PH:.*]] |
| ; CHECK: [[SCALAR_PH]]: |
| ; CHECK-NEXT: br label %[[LOOP_2:.*]] |
| ; CHECK: [[LOOP_2]]: |
| ; CHECK-NEXT: [[IV_3:%.*]] = phi i16 [ [[IV_3_NEXT:%.*]], %[[LOOP_2]] ], [ 196, %[[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[IV_4:%.*]] = phi i32 [ [[IV_4_NEXT:%.*]], %[[LOOP_2]] ], [ [[IND_END]], %[[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[GEP_DST:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[IV_3]] |
| ; CHECK-NEXT: store i32 [[IV_4]], ptr [[GEP_DST]], align 4 |
| ; CHECK-NEXT: [[IV_4_NEXT]] = sub i32 [[IV_4]], [[IV_1_LCSSA]] |
| ; CHECK-NEXT: [[IV_3_NEXT]] = add i16 [[IV_3]], 1 |
| ; CHECK-NEXT: [[CMP88_1:%.*]] = icmp ult i16 [[IV_3]], 198 |
| ; CHECK-NEXT: br i1 [[CMP88_1]], label %[[LOOP_2]], label %[[LOOP_3_PREHEADER:.*]], !llvm.loop [[LOOP3:![0-9]+]] |
| ; CHECK: [[LOOP_3_PREHEADER]]: |
| ; CHECK-NEXT: [[IV_4_LCSSA:%.*]] = phi i32 [ [[IV_4]], %[[LOOP_2]] ] |
| ; CHECK-NEXT: br label %[[LOOP_3:.*]] |
| ; CHECK: [[LOOP_3]]: |
| ; CHECK-NEXT: [[IV_5:%.*]] = phi i32 [ [[SUB93_2]], %[[LOOP_3]] ], [ 0, %[[LOOP_3_PREHEADER]] ] |
| ; CHECK-NEXT: [[SUB93_2]] = sub i32 [[IV_5]], [[IV_4_LCSSA]] |
| ; CHECK-NEXT: br label %[[LOOP_3]] |
| ; CHECK: [[UNREACHABLE_BB]]: |
| ; CHECK-NEXT: br label %[[LOOP_1_PREHEADER]] |
| ; |
| entry: |
| br label %loop.1.preheader |
| |
| loop.1.preheader: |
| %iv.1.ph = phi i32 [ %sub93.2, %unreachable.bb ], [ 0, %entry ] |
| br label %loop.1 |
| |
| loop.1: |
| %iv.1 = phi i32 [ %iv.1.next, %loop.1 ], [ %iv.1.ph, %loop.1.preheader ] |
| %iv.2 = phi i32 [ %iv.2.next, %loop.1 ], [ 0, %loop.1.preheader ] |
| %iv.2.next = add i32 %iv.2, 1 |
| %iv.1.next = add i32 %iv.2, %iv.1 |
| br i1 false, label %loop.1, label %loop.2.preheader |
| |
| loop.2.preheader: |
| %iv.1.lcssa = phi i32 [ %iv.1, %loop.1 ] |
| br label %loop.2 |
| |
| loop.2: |
| %iv.3 = phi i16 [ %iv.3.next, %loop.2 ], [ 0, %loop.2.preheader ] |
| %iv.4 = phi i32 [ %iv.4.next, %loop.2 ], [ 0, %loop.2.preheader ] |
| %gep.dst = getelementptr inbounds i32, ptr %dst, i16 %iv.3 |
| store i32 %iv.4, ptr %gep.dst |
| %iv.4.next = sub i32 %iv.4, %iv.1.lcssa |
| %iv.3.next = add i16 %iv.3, 1 |
| %cmp88.1 = icmp ult i16 %iv.3, 198 |
| br i1 %cmp88.1, label %loop.2, label %loop.3.preheader |
| |
| loop.3.preheader: |
| %iv.4.lcssa = phi i32 [ %iv.4, %loop.2 ] |
| br label %loop.3 |
| |
| loop.3: |
| %iv.5 = phi i32 [ %sub93.2, %loop.3 ], [ 0, %loop.3.preheader ] |
| %sub93.2 = sub i32 %iv.5, %iv.4.lcssa |
| br label %loop.3 |
| |
| unreachable.bb: ; No predecessors! |
| br label %loop.1.preheader |
| } |
| |
| define void @test2_pr58811(ptr %dst) { |
| ; VF2-LABEL: define void @test2_pr58811( |
| ; VF2-SAME: ptr [[DST:%.*]]) { |
| ; VF2-NEXT: [[ENTRY:.*]]: |
| ; VF2-NEXT: br label %[[LOOP_1_HEADER:.*]] |
| ; VF2: [[LOOP_1_HEADER_LOOPEXIT:.*]]: |
| ; VF2-NEXT: [[SUB93_2_LCSSA:%.*]] = phi i32 [ [[SUB93_2:%.*]], %[[LOOP_4:.*]] ] |
| ; VF2-NEXT: br label %[[LOOP_1_HEADER]] |
| ; VF2: [[LOOP_1_HEADER]]: |
| ; VF2-NEXT: [[P_1:%.*]] = phi i32 [ 0, %[[ENTRY]] ], [ [[SUB93_2_LCSSA]], %[[LOOP_1_HEADER_LOOPEXIT]] ] |
| ; VF2-NEXT: [[TMP0:%.*]] = mul i32 [[P_1]], -1 |
| ; VF2-NEXT: br label %[[LOOP_2:.*]] |
| ; VF2: [[LOOP_2]]: |
| ; VF2-NEXT: [[INDUCTION_IV:%.*]] = phi i32 [ [[INDUCTION_IV_NEXT:%.*]], %[[LOOP_2]] ], [ [[TMP0]], %[[LOOP_1_HEADER]] ] |
| ; VF2-NEXT: [[IV_2:%.*]] = phi i32 [ [[P_1]], %[[LOOP_1_HEADER]] ], [ [[ADD101:%.*]], %[[LOOP_2]] ] |
| ; VF2-NEXT: [[IV_3:%.*]] = phi i32 [ 0, %[[LOOP_1_HEADER]] ], [ [[SUB93:%.*]], %[[LOOP_2]] ] |
| ; VF2-NEXT: [[TMP1:%.*]] = mul nuw nsw i32 [[IV_3]], -1 |
| ; VF2-NEXT: [[SUB93]] = add i32 [[IV_3]], 1 |
| ; VF2-NEXT: [[ADD101]] = add i32 [[IV_3]], [[IV_2]] |
| ; VF2-NEXT: [[INDUCTION_IV_NEXT]] = add i32 [[INDUCTION_IV]], [[TMP1]] |
| ; VF2-NEXT: br i1 false, label %[[LOOP_2]], label %[[LOOP_3_PREHEADER:.*]] |
| ; VF2: [[LOOP_3_PREHEADER]]: |
| ; VF2-NEXT: [[INDUCTION_IV_LCSSA:%.*]] = phi i32 [ [[INDUCTION_IV]], %[[LOOP_2]] ] |
| ; VF2-NEXT: [[IV_2_LCSSA:%.*]] = phi i32 [ [[IV_2]], %[[LOOP_2]] ] |
| ; VF2-NEXT: br label %[[VECTOR_PH:.*]] |
| ; VF2: [[VECTOR_PH]]: |
| ; VF2-NEXT: [[TMP2:%.*]] = mul i32 198, [[INDUCTION_IV_LCSSA]] |
| ; VF2-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <2 x i32> poison, i32 [[INDUCTION_IV_LCSSA]], i64 0 |
| ; VF2-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <2 x i32> [[BROADCAST_SPLATINSERT]], <2 x i32> poison, <2 x i32> zeroinitializer |
| ; VF2-NEXT: [[TMP3:%.*]] = mul <2 x i32> <i32 0, i32 1>, [[BROADCAST_SPLAT]] |
| ; VF2-NEXT: [[INDUCTION:%.*]] = add <2 x i32> zeroinitializer, [[TMP3]] |
| ; VF2-NEXT: [[TMP4:%.*]] = mul i32 [[INDUCTION_IV_LCSSA]], 2 |
| ; VF2-NEXT: [[BROADCAST_SPLATINSERT1:%.*]] = insertelement <2 x i32> poison, i32 [[TMP4]], i64 0 |
| ; VF2-NEXT: [[BROADCAST_SPLAT2:%.*]] = shufflevector <2 x i32> [[BROADCAST_SPLATINSERT1]], <2 x i32> poison, <2 x i32> zeroinitializer |
| ; VF2-NEXT: br label %[[VECTOR_BODY:.*]] |
| ; VF2: [[VECTOR_BODY]]: |
| ; VF2-NEXT: [[INDEX:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; VF2-NEXT: [[VEC_IND:%.*]] = phi <2 x i32> [ [[INDUCTION]], %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; VF2-NEXT: [[OFFSET_IDX:%.*]] = trunc i32 [[INDEX]] to i16 |
| ; VF2-NEXT: [[TMP5:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[OFFSET_IDX]] |
| ; VF2-NEXT: store <2 x i32> [[VEC_IND]], ptr [[TMP5]], align 4 |
| ; VF2-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 2 |
| ; VF2-NEXT: [[VEC_IND_NEXT]] = add <2 x i32> [[VEC_IND]], [[BROADCAST_SPLAT2]] |
| ; VF2-NEXT: [[TMP6:%.*]] = icmp eq i32 [[INDEX_NEXT]], 198 |
| ; VF2-NEXT: br i1 [[TMP6]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP4:![0-9]+]] |
| ; VF2: [[MIDDLE_BLOCK]]: |
| ; VF2-NEXT: br label %[[SCALAR_PH:.*]] |
| ; VF2: [[SCALAR_PH]]: |
| ; VF2-NEXT: br label %[[LOOP_3:.*]] |
| ; VF2: [[LOOP_3]]: |
| ; VF2-NEXT: [[IV_4:%.*]] = phi i16 [ [[INC_1:%.*]], %[[LOOP_3]] ], [ 198, %[[SCALAR_PH]] ] |
| ; VF2-NEXT: [[IV_5:%.*]] = phi i32 [ [[SUB93_1:%.*]], %[[LOOP_3]] ], [ [[TMP2]], %[[SCALAR_PH]] ] |
| ; VF2-NEXT: [[GEP_DST:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[IV_4]] |
| ; VF2-NEXT: store i32 [[IV_5]], ptr [[GEP_DST]], align 4 |
| ; VF2-NEXT: [[SUB93_1]] = sub i32 [[IV_5]], [[IV_2_LCSSA]] |
| ; VF2-NEXT: [[INC_1]] = add i16 [[IV_4]], 1 |
| ; VF2-NEXT: [[CMP88_1:%.*]] = icmp ult i16 [[IV_4]], 198 |
| ; VF2-NEXT: br i1 [[CMP88_1]], label %[[LOOP_3]], label %[[LOOP_4_PREHEADER:.*]], !llvm.loop [[LOOP5:![0-9]+]] |
| ; VF2: [[LOOP_4_PREHEADER]]: |
| ; VF2-NEXT: [[IV_5_LCSSA:%.*]] = phi i32 [ [[IV_5]], %[[LOOP_3]] ] |
| ; VF2-NEXT: br label %[[LOOP_4]] |
| ; VF2: [[LOOP_4]]: |
| ; VF2-NEXT: [[IV_6:%.*]] = phi i32 [ [[SUB93_2]], %[[LOOP_4]] ], [ 0, %[[LOOP_4_PREHEADER]] ] |
| ; VF2-NEXT: [[SUB93_2]] = sub i32 [[IV_6]], [[IV_5_LCSSA]] |
| ; VF2-NEXT: br i1 false, label %[[LOOP_4]], label %[[LOOP_1_HEADER_LOOPEXIT]] |
| ; |
| ; CHECK-LABEL: define void @test2_pr58811( |
| ; CHECK-SAME: ptr [[DST:%.*]]) { |
| ; CHECK-NEXT: [[ENTRY:.*]]: |
| ; CHECK-NEXT: br label %[[LOOP_1_HEADER:.*]] |
| ; CHECK: [[LOOP_1_HEADER_LOOPEXIT:.*]]: |
| ; CHECK-NEXT: [[SUB93_2_LCSSA:%.*]] = phi i32 [ [[SUB93_2:%.*]], %[[LOOP_4:.*]] ] |
| ; CHECK-NEXT: br label %[[LOOP_1_HEADER]] |
| ; CHECK: [[LOOP_1_HEADER]]: |
| ; CHECK-NEXT: [[P_1:%.*]] = phi i32 [ 0, %[[ENTRY]] ], [ [[SUB93_2_LCSSA]], %[[LOOP_1_HEADER_LOOPEXIT]] ] |
| ; CHECK-NEXT: [[TMP0:%.*]] = mul i32 [[P_1]], -1 |
| ; CHECK-NEXT: br label %[[LOOP_2:.*]] |
| ; CHECK: [[LOOP_2]]: |
| ; CHECK-NEXT: [[INDUCTION_IV:%.*]] = phi i32 [ [[INDUCTION_IV_NEXT:%.*]], %[[LOOP_2]] ], [ [[TMP0]], %[[LOOP_1_HEADER]] ] |
| ; CHECK-NEXT: [[IV_2:%.*]] = phi i32 [ [[P_1]], %[[LOOP_1_HEADER]] ], [ [[ADD101:%.*]], %[[LOOP_2]] ] |
| ; CHECK-NEXT: [[IV_3:%.*]] = phi i32 [ 0, %[[LOOP_1_HEADER]] ], [ [[SUB93:%.*]], %[[LOOP_2]] ] |
| ; CHECK-NEXT: [[TMP1:%.*]] = mul nuw nsw i32 [[IV_3]], -1 |
| ; CHECK-NEXT: [[SUB93]] = add i32 [[IV_3]], 1 |
| ; CHECK-NEXT: [[ADD101]] = add i32 [[IV_3]], [[IV_2]] |
| ; CHECK-NEXT: [[INDUCTION_IV_NEXT]] = add i32 [[INDUCTION_IV]], [[TMP1]] |
| ; CHECK-NEXT: br i1 false, label %[[LOOP_2]], label %[[LOOP_3_PREHEADER:.*]] |
| ; CHECK: [[LOOP_3_PREHEADER]]: |
| ; CHECK-NEXT: [[INDUCTION_IV_LCSSA:%.*]] = phi i32 [ [[INDUCTION_IV]], %[[LOOP_2]] ] |
| ; CHECK-NEXT: [[IV_2_LCSSA:%.*]] = phi i32 [ [[IV_2]], %[[LOOP_2]] ] |
| ; CHECK-NEXT: br label %[[VECTOR_PH:.*]] |
| ; CHECK: [[VECTOR_PH]]: |
| ; CHECK-NEXT: [[IND_END:%.*]] = mul i32 196, [[INDUCTION_IV_LCSSA]] |
| ; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <4 x i32> poison, i32 [[INDUCTION_IV_LCSSA]], i64 0 |
| ; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <4 x i32> [[BROADCAST_SPLATINSERT]], <4 x i32> poison, <4 x i32> zeroinitializer |
| ; CHECK-NEXT: [[TMP3:%.*]] = mul <4 x i32> <i32 0, i32 1, i32 2, i32 3>, [[BROADCAST_SPLAT]] |
| ; CHECK-NEXT: [[INDUCTION:%.*]] = add <4 x i32> zeroinitializer, [[TMP3]] |
| ; CHECK-NEXT: [[TMP4:%.*]] = mul i32 [[INDUCTION_IV_LCSSA]], 4 |
| ; CHECK-NEXT: [[BROADCAST_SPLATINSERT1:%.*]] = insertelement <4 x i32> poison, i32 [[TMP4]], i64 0 |
| ; CHECK-NEXT: [[BROADCAST_SPLAT2:%.*]] = shufflevector <4 x i32> [[BROADCAST_SPLATINSERT1]], <4 x i32> poison, <4 x i32> zeroinitializer |
| ; CHECK-NEXT: br label %[[VECTOR_BODY:.*]] |
| ; CHECK: [[VECTOR_BODY]]: |
| ; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; CHECK-NEXT: [[VEC_IND:%.*]] = phi <4 x i32> [ [[INDUCTION]], %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; CHECK-NEXT: [[OFFSET_IDX:%.*]] = trunc i32 [[INDEX]] to i16 |
| ; CHECK-NEXT: [[TMP5:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[OFFSET_IDX]] |
| ; CHECK-NEXT: store <4 x i32> [[VEC_IND]], ptr [[TMP5]], align 4 |
| ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 4 |
| ; CHECK-NEXT: [[VEC_IND_NEXT]] = add <4 x i32> [[VEC_IND]], [[BROADCAST_SPLAT2]] |
| ; CHECK-NEXT: [[TMP2:%.*]] = icmp eq i32 [[INDEX_NEXT]], 196 |
| ; CHECK-NEXT: br i1 [[TMP2]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP4:![0-9]+]] |
| ; CHECK: [[MIDDLE_BLOCK]]: |
| ; CHECK-NEXT: br label %[[SCALAR_PH:.*]] |
| ; CHECK: [[SCALAR_PH]]: |
| ; CHECK-NEXT: br label %[[LOOP_3:.*]] |
| ; CHECK: [[LOOP_3]]: |
| ; CHECK-NEXT: [[IV_4:%.*]] = phi i16 [ [[INC_1:%.*]], %[[LOOP_3]] ], [ 196, %[[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[IV_5:%.*]] = phi i32 [ [[SUB93_1:%.*]], %[[LOOP_3]] ], [ [[IND_END]], %[[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[GEP_DST:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[IV_4]] |
| ; CHECK-NEXT: store i32 [[IV_5]], ptr [[GEP_DST]], align 4 |
| ; CHECK-NEXT: [[SUB93_1]] = sub i32 [[IV_5]], [[IV_2_LCSSA]] |
| ; CHECK-NEXT: [[INC_1]] = add i16 [[IV_4]], 1 |
| ; CHECK-NEXT: [[CMP88_1:%.*]] = icmp ult i16 [[IV_4]], 198 |
| ; CHECK-NEXT: br i1 [[CMP88_1]], label %[[LOOP_3]], label %[[LOOP_4_PREHEADER:.*]], !llvm.loop [[LOOP5:![0-9]+]] |
| ; CHECK: [[LOOP_4_PREHEADER]]: |
| ; CHECK-NEXT: [[IV_5_LCSSA:%.*]] = phi i32 [ [[IV_5]], %[[LOOP_3]] ] |
| ; CHECK-NEXT: br label %[[LOOP_4]] |
| ; CHECK: [[LOOP_4]]: |
| ; CHECK-NEXT: [[IV_6:%.*]] = phi i32 [ [[SUB93_2]], %[[LOOP_4]] ], [ 0, %[[LOOP_4_PREHEADER]] ] |
| ; CHECK-NEXT: [[SUB93_2]] = sub i32 [[IV_6]], [[IV_5_LCSSA]] |
| ; CHECK-NEXT: br i1 false, label %[[LOOP_4]], label %[[LOOP_1_HEADER_LOOPEXIT]] |
| ; |
| entry: |
| br label %loop.1.header |
| |
| loop.1.header: |
| %p.1 = phi i32 [ 0, %entry ], [ %sub93.2, %loop.4 ] |
| br label %loop.2 |
| |
| loop.2: |
| %iv.2 = phi i32 [ %p.1, %loop.1.header ], [ %add101, %loop.2 ] |
| %iv.3 = phi i32 [ 0, %loop.1.header ], [ %sub93, %loop.2 ] |
| %sub93 = add i32 %iv.3, 1 |
| %add101 = add i32 %iv.3, %iv.2 |
| br i1 false, label %loop.2, label %loop.3 |
| |
| loop.3: |
| %iv.4 = phi i16 [ 0, %loop.2 ], [ %inc.1, %loop.3 ] |
| %iv.5 = phi i32 [ 0, %loop.2 ], [ %sub93.1, %loop.3 ] |
| %gep.dst = getelementptr inbounds i32, ptr %dst, i16 %iv.4 |
| store i32 %iv.5, ptr %gep.dst |
| %sub93.1 = sub i32 %iv.5, %iv.2 |
| %inc.1 = add i16 %iv.4, 1 |
| %cmp88.1 = icmp ult i16 %iv.4, 198 |
| br i1 %cmp88.1, label %loop.3, label %loop.4 |
| |
| loop.4: |
| %iv.6 = phi i32 [ 0, %loop.3 ], [ %sub93.2, %loop.4 ] |
| %sub93.2 = sub i32 %iv.6, %iv.5 |
| br i1 false, label %loop.4, label %loop.1.header |
| } |
| |
| define void @test3_pr58811(ptr %dst) { |
| ; VF2-LABEL: define void @test3_pr58811( |
| ; VF2-SAME: ptr [[DST:%.*]]) { |
| ; VF2-NEXT: [[ENTRY:.*]]: |
| ; VF2-NEXT: br label %[[LOOP_1_HEADER:.*]] |
| ; VF2: [[LOOP_1_HEADER]]: |
| ; VF2-NEXT: [[P_1:%.*]] = phi i32 [ 0, %[[ENTRY]] ], [ [[SUB93_2:%.*]], %[[LOOP_1_LATCH:.*]] ] |
| ; VF2-NEXT: [[REM85:%.*]] = urem i32 1, [[P_1]] |
| ; VF2-NEXT: br label %[[LOOP_2:.*]] |
| ; VF2: [[LOOP_2]]: |
| ; VF2-NEXT: [[P_2:%.*]] = phi i32 [ 1, %[[LOOP_1_HEADER]] ], [ 0, %[[LOOP_2]] ] |
| ; VF2-NEXT: [[ADD101:%.*]] = add i32 [[REM85]], [[P_2]] |
| ; VF2-NEXT: br i1 false, label %[[LOOP_2]], label %[[LOOP_3_PREHEADER:.*]] |
| ; VF2: [[LOOP_3_PREHEADER]]: |
| ; VF2-NEXT: [[ADD101_LCSSA:%.*]] = phi i32 [ [[ADD101]], %[[LOOP_2]] ] |
| ; VF2-NEXT: [[TMP0:%.*]] = udiv i32 1, [[P_1]] |
| ; VF2-NEXT: [[TMP1:%.*]] = mul nuw i32 [[P_1]], [[TMP0]] |
| ; VF2-NEXT: [[TMP2:%.*]] = add i32 [[TMP1]], -1 |
| ; VF2-NEXT: [[TMP3:%.*]] = sub i32 [[TMP2]], [[P_2]] |
| ; VF2-NEXT: br label %[[VECTOR_PH:.*]] |
| ; VF2: [[VECTOR_PH]]: |
| ; VF2-NEXT: [[TMP15:%.*]] = mul i32 198, [[TMP3]] |
| ; VF2-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <2 x i32> poison, i32 [[TMP3]], i64 0 |
| ; VF2-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <2 x i32> [[BROADCAST_SPLATINSERT]], <2 x i32> poison, <2 x i32> zeroinitializer |
| ; VF2-NEXT: [[TMP5:%.*]] = mul <2 x i32> <i32 0, i32 1>, [[BROADCAST_SPLAT]] |
| ; VF2-NEXT: [[INDUCTION:%.*]] = add <2 x i32> zeroinitializer, [[TMP5]] |
| ; VF2-NEXT: [[TMP6:%.*]] = mul i32 [[TMP3]], 2 |
| ; VF2-NEXT: [[BROADCAST_SPLATINSERT1:%.*]] = insertelement <2 x i32> poison, i32 [[TMP6]], i64 0 |
| ; VF2-NEXT: [[BROADCAST_SPLAT2:%.*]] = shufflevector <2 x i32> [[BROADCAST_SPLATINSERT1]], <2 x i32> poison, <2 x i32> zeroinitializer |
| ; VF2-NEXT: br label %[[VECTOR_BODY:.*]] |
| ; VF2: [[VECTOR_BODY]]: |
| ; VF2-NEXT: [[INDEX:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; VF2-NEXT: [[VEC_IND:%.*]] = phi <2 x i32> [ [[INDUCTION]], %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; VF2-NEXT: [[OFFSET_IDX:%.*]] = trunc i32 [[INDEX]] to i16 |
| ; VF2-NEXT: [[TMP7:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[OFFSET_IDX]] |
| ; VF2-NEXT: store <2 x i32> [[VEC_IND]], ptr [[TMP7]], align 4 |
| ; VF2-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 2 |
| ; VF2-NEXT: [[VEC_IND_NEXT]] = add <2 x i32> [[VEC_IND]], [[BROADCAST_SPLAT2]] |
| ; VF2-NEXT: [[TMP22:%.*]] = icmp eq i32 [[INDEX_NEXT]], 198 |
| ; VF2-NEXT: br i1 [[TMP22]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP6:![0-9]+]] |
| ; VF2: [[MIDDLE_BLOCK]]: |
| ; VF2-NEXT: br label %[[SCALAR_PH:.*]] |
| ; VF2: [[SCALAR_PH]]: |
| ; VF2-NEXT: br label %[[LOOP_3:.*]] |
| ; VF2: [[LOOP_3]]: |
| ; VF2-NEXT: [[IV_3:%.*]] = phi i16 [ [[INC_1:%.*]], %[[LOOP_3]] ], [ 198, %[[SCALAR_PH]] ] |
| ; VF2-NEXT: [[IV_4:%.*]] = phi i32 [ [[SUB93_1:%.*]], %[[LOOP_3]] ], [ [[TMP15]], %[[SCALAR_PH]] ] |
| ; VF2-NEXT: [[GEP_DST:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[IV_3]] |
| ; VF2-NEXT: store i32 [[IV_4]], ptr [[GEP_DST]], align 4 |
| ; VF2-NEXT: [[SUB93_1]] = sub i32 [[IV_4]], [[ADD101_LCSSA]] |
| ; VF2-NEXT: [[INC_1]] = add i16 [[IV_3]], 1 |
| ; VF2-NEXT: [[CMP88_1:%.*]] = icmp ult i16 [[IV_3]], 198 |
| ; VF2-NEXT: br i1 [[CMP88_1]], label %[[LOOP_3]], label %[[LOOP_4_PREHEADER:.*]], !llvm.loop [[LOOP7:![0-9]+]] |
| ; VF2: [[LOOP_4_PREHEADER]]: |
| ; VF2-NEXT: [[IV_4_LCSSA:%.*]] = phi i32 [ [[IV_4]], %[[LOOP_3]] ] |
| ; VF2-NEXT: br label %[[LOOP_4:.*]] |
| ; VF2: [[LOOP_4]]: |
| ; VF2-NEXT: [[IV_5:%.*]] = phi i32 [ [[SUB93_2]], %[[LOOP_4]] ], [ 0, %[[LOOP_4_PREHEADER]] ] |
| ; VF2-NEXT: [[SUB93_2]] = sub i32 [[IV_5]], [[IV_4_LCSSA]] |
| ; VF2-NEXT: br label %[[LOOP_4]] |
| ; VF2: [[LOOP_1_LATCH]]: |
| ; VF2-NEXT: br label %[[LOOP_1_HEADER]] |
| ; |
| ; CHECK-LABEL: define void @test3_pr58811( |
| ; CHECK-SAME: ptr [[DST:%.*]]) { |
| ; CHECK-NEXT: [[ENTRY:.*]]: |
| ; CHECK-NEXT: br label %[[LOOP_1_HEADER:.*]] |
| ; CHECK: [[LOOP_1_HEADER]]: |
| ; CHECK-NEXT: [[P_1:%.*]] = phi i32 [ 0, %[[ENTRY]] ], [ [[SUB93_2:%.*]], %[[LOOP_1_LATCH:.*]] ] |
| ; CHECK-NEXT: [[REM85:%.*]] = urem i32 1, [[P_1]] |
| ; CHECK-NEXT: br label %[[LOOP_2:.*]] |
| ; CHECK: [[LOOP_2]]: |
| ; CHECK-NEXT: [[P_2:%.*]] = phi i32 [ 1, %[[LOOP_1_HEADER]] ], [ 0, %[[LOOP_2]] ] |
| ; CHECK-NEXT: [[ADD101:%.*]] = add i32 [[REM85]], [[P_2]] |
| ; CHECK-NEXT: br i1 false, label %[[LOOP_2]], label %[[LOOP_3_PREHEADER:.*]] |
| ; CHECK: [[LOOP_3_PREHEADER]]: |
| ; CHECK-NEXT: [[ADD101_LCSSA:%.*]] = phi i32 [ [[ADD101]], %[[LOOP_2]] ] |
| ; CHECK-NEXT: [[TMP0:%.*]] = udiv i32 1, [[P_1]] |
| ; CHECK-NEXT: [[TMP1:%.*]] = mul nuw i32 [[P_1]], [[TMP0]] |
| ; CHECK-NEXT: [[TMP2:%.*]] = add i32 [[TMP1]], -1 |
| ; CHECK-NEXT: [[TMP3:%.*]] = sub i32 [[TMP2]], [[P_2]] |
| ; CHECK-NEXT: br label %[[VECTOR_PH:.*]] |
| ; CHECK: [[VECTOR_PH]]: |
| ; CHECK-NEXT: [[IND_END:%.*]] = mul i32 196, [[TMP3]] |
| ; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <4 x i32> poison, i32 [[TMP3]], i64 0 |
| ; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <4 x i32> [[BROADCAST_SPLATINSERT]], <4 x i32> poison, <4 x i32> zeroinitializer |
| ; CHECK-NEXT: [[TMP5:%.*]] = mul <4 x i32> <i32 0, i32 1, i32 2, i32 3>, [[BROADCAST_SPLAT]] |
| ; CHECK-NEXT: [[INDUCTION:%.*]] = add <4 x i32> zeroinitializer, [[TMP5]] |
| ; CHECK-NEXT: [[TMP6:%.*]] = mul i32 [[TMP3]], 4 |
| ; CHECK-NEXT: [[BROADCAST_SPLATINSERT1:%.*]] = insertelement <4 x i32> poison, i32 [[TMP6]], i64 0 |
| ; CHECK-NEXT: [[BROADCAST_SPLAT2:%.*]] = shufflevector <4 x i32> [[BROADCAST_SPLATINSERT1]], <4 x i32> poison, <4 x i32> zeroinitializer |
| ; CHECK-NEXT: br label %[[VECTOR_BODY:.*]] |
| ; CHECK: [[VECTOR_BODY]]: |
| ; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; CHECK-NEXT: [[VEC_IND:%.*]] = phi <4 x i32> [ [[INDUCTION]], %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; CHECK-NEXT: [[OFFSET_IDX:%.*]] = trunc i32 [[INDEX]] to i16 |
| ; CHECK-NEXT: [[TMP7:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[OFFSET_IDX]] |
| ; CHECK-NEXT: store <4 x i32> [[VEC_IND]], ptr [[TMP7]], align 4 |
| ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 4 |
| ; CHECK-NEXT: [[VEC_IND_NEXT]] = add <4 x i32> [[VEC_IND]], [[BROADCAST_SPLAT2]] |
| ; CHECK-NEXT: [[TMP4:%.*]] = icmp eq i32 [[INDEX_NEXT]], 196 |
| ; CHECK-NEXT: br i1 [[TMP4]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP6:![0-9]+]] |
| ; CHECK: [[MIDDLE_BLOCK]]: |
| ; CHECK-NEXT: br label %[[SCALAR_PH:.*]] |
| ; CHECK: [[SCALAR_PH]]: |
| ; CHECK-NEXT: br label %[[LOOP_3:.*]] |
| ; CHECK: [[LOOP_3]]: |
| ; CHECK-NEXT: [[IV_3:%.*]] = phi i16 [ [[INC_1:%.*]], %[[LOOP_3]] ], [ 196, %[[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[IV_4:%.*]] = phi i32 [ [[SUB93_1:%.*]], %[[LOOP_3]] ], [ [[IND_END]], %[[SCALAR_PH]] ] |
| ; CHECK-NEXT: [[GEP_DST:%.*]] = getelementptr inbounds i32, ptr [[DST]], i16 [[IV_3]] |
| ; CHECK-NEXT: store i32 [[IV_4]], ptr [[GEP_DST]], align 4 |
| ; CHECK-NEXT: [[SUB93_1]] = sub i32 [[IV_4]], [[ADD101_LCSSA]] |
| ; CHECK-NEXT: [[INC_1]] = add i16 [[IV_3]], 1 |
| ; CHECK-NEXT: [[CMP88_1:%.*]] = icmp ult i16 [[IV_3]], 198 |
| ; CHECK-NEXT: br i1 [[CMP88_1]], label %[[LOOP_3]], label %[[LOOP_4_PREHEADER:.*]], !llvm.loop [[LOOP7:![0-9]+]] |
| ; CHECK: [[LOOP_4_PREHEADER]]: |
| ; CHECK-NEXT: [[IV_4_LCSSA:%.*]] = phi i32 [ [[IV_4]], %[[LOOP_3]] ] |
| ; CHECK-NEXT: br label %[[LOOP_4:.*]] |
| ; CHECK: [[LOOP_4]]: |
| ; CHECK-NEXT: [[IV_5:%.*]] = phi i32 [ [[SUB93_2]], %[[LOOP_4]] ], [ 0, %[[LOOP_4_PREHEADER]] ] |
| ; CHECK-NEXT: [[SUB93_2]] = sub i32 [[IV_5]], [[IV_4_LCSSA]] |
| ; CHECK-NEXT: br label %[[LOOP_4]] |
| ; CHECK: [[LOOP_1_LATCH]]: |
| ; CHECK-NEXT: br label %[[LOOP_1_HEADER]] |
| ; |
| entry: |
| br label %loop.1.header |
| |
| loop.1.header: |
| %p.1 = phi i32 [ 0, %entry ], [ %sub93.2, %loop.1.latch ] |
| %rem85 = urem i32 1, %p.1 |
| br label %loop.2 |
| |
| loop.2: |
| %p.2 = phi i32 [ 1, %loop.1.header ], [ 0, %loop.2 ] |
| %add101 = add i32 %rem85, %p.2 |
| br i1 false, label %loop.2, label %loop.3 |
| |
| loop.3: |
| %iv.3 = phi i16 [ 0, %loop.2 ], [ %inc.1, %loop.3 ] |
| %iv.4 = phi i32 [ 0, %loop.2 ], [ %sub93.1, %loop.3 ] |
| %gep.dst = getelementptr inbounds i32, ptr %dst, i16 %iv.3 |
| store i32 %iv.4, ptr %gep.dst |
| %sub93.1 = sub i32 %iv.4, %add101 |
| %inc.1 = add i16 %iv.3, 1 |
| %cmp88.1 = icmp ult i16 %iv.3, 198 |
| br i1 %cmp88.1, label %loop.3, label %loop.4 |
| |
| loop.4: |
| %iv.5 = phi i32 [ 0, %loop.3 ], [ %sub93.2, %loop.4 ] |
| %sub93.2 = sub i32 %iv.5, %iv.4 |
| br label %loop.4 |
| |
| loop.1.latch: ; No predecessors! |
| br label %loop.1.header |
| } |
| |
| define void @iv_start_from_shl_of_previous_iv(ptr %dst) { |
| ; VF2-LABEL: define void @iv_start_from_shl_of_previous_iv( |
| ; VF2-SAME: ptr [[DST:%.*]]) { |
| ; VF2-NEXT: [[ENTRY:.*:]] |
| ; VF2-NEXT: br label %[[VECTOR_PH:.*]] |
| ; VF2: [[VECTOR_PH]]: |
| ; VF2-NEXT: br label %[[VECTOR_BODY:.*]] |
| ; VF2: [[VECTOR_BODY]]: |
| ; VF2-NEXT: store <2 x i8> zeroinitializer, ptr [[DST]], align 1 |
| ; VF2-NEXT: br label %[[MIDDLE_BLOCK:.*]] |
| ; VF2: [[MIDDLE_BLOCK]]: |
| ; VF2-NEXT: br label %[[LOOP_1_EXIT:.*]] |
| ; VF2: [[LOOP_1_EXIT]]: |
| ; VF2-NEXT: [[IV_1_SHL:%.*]] = shl i64 1, 1 |
| ; VF2-NEXT: br label %[[VECTOR_PH1:.*]] |
| ; VF2: [[VECTOR_PH1]]: |
| ; VF2-NEXT: br label %[[VECTOR_BODY2:.*]] |
| ; VF2: [[VECTOR_BODY2]]: |
| ; VF2-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH1]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY2]] ] |
| ; VF2-NEXT: [[OFFSET_IDX:%.*]] = add i64 2, [[INDEX]] |
| ; VF2-NEXT: [[TMP1:%.*]] = getelementptr i8, ptr [[DST]], i64 [[OFFSET_IDX]] |
| ; VF2-NEXT: store <2 x i8> splat (i8 1), ptr [[TMP1]], align 1 |
| ; VF2-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 2 |
| ; VF2-NEXT: [[TMP2:%.*]] = icmp eq i64 [[INDEX_NEXT]], 98 |
| ; VF2-NEXT: br i1 [[TMP2]], label %[[MIDDLE_BLOCK3:.*]], label %[[VECTOR_BODY2]], !llvm.loop [[LOOP8:![0-9]+]] |
| ; VF2: [[MIDDLE_BLOCK3]]: |
| ; VF2-NEXT: br label %[[SCALAR_PH:.*]] |
| ; VF2: [[SCALAR_PH]]: |
| ; VF2-NEXT: br label %[[LOOP_2:.*]] |
| ; VF2: [[LOOP_2]]: |
| ; VF2-NEXT: [[IV_2:%.*]] = phi i64 [ 100, %[[SCALAR_PH]] ], [ [[IV_2_NEXT:%.*]], %[[LOOP_2]] ] |
| ; VF2-NEXT: [[GEP_2:%.*]] = getelementptr i8, ptr [[DST]], i64 [[IV_2]] |
| ; VF2-NEXT: store i8 1, ptr [[GEP_2]], align 1 |
| ; VF2-NEXT: [[IV_2_NEXT]] = add i64 [[IV_2]], 1 |
| ; VF2-NEXT: [[CMP_2:%.*]] = icmp eq i64 [[IV_2]], 100 |
| ; VF2-NEXT: br i1 [[CMP_2]], label %[[EXIT:.*]], label %[[LOOP_2]], !llvm.loop [[LOOP9:![0-9]+]] |
| ; VF2: [[EXIT]]: |
| ; VF2-NEXT: ret void |
| ; |
| ; CHECK-LABEL: define void @iv_start_from_shl_of_previous_iv( |
| ; CHECK-SAME: ptr [[DST:%.*]]) { |
| ; CHECK-NEXT: [[ENTRY:.*]]: |
| ; CHECK-NEXT: br label %[[LOOP_1:.*]] |
| ; CHECK: [[LOOP_1]]: |
| ; CHECK-NEXT: [[IV_1:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_1_NEXT:%.*]], %[[LOOP_1]] ] |
| ; CHECK-NEXT: [[GEP_1:%.*]] = getelementptr i8, ptr [[DST]], i64 [[IV_1]] |
| ; CHECK-NEXT: store i8 0, ptr [[GEP_1]], align 1 |
| ; CHECK-NEXT: [[IV_1_NEXT]] = add i64 [[IV_1]], 1 |
| ; CHECK-NEXT: [[CMP_1:%.*]] = icmp eq i64 [[IV_1]], 0 |
| ; CHECK-NEXT: br i1 [[CMP_1]], label %[[LOOP_1]], label %[[LOOP_1_EXIT:.*]] |
| ; CHECK: [[LOOP_1_EXIT]]: |
| ; CHECK-NEXT: [[IV_1_LCSSA:%.*]] = phi i64 [ [[IV_1]], %[[LOOP_1]] ] |
| ; CHECK-NEXT: [[IV_1_SHL:%.*]] = shl i64 [[IV_1_LCSSA]], 1 |
| ; CHECK-NEXT: br label %[[VECTOR_PH:.*]] |
| ; CHECK: [[VECTOR_PH]]: |
| ; CHECK-NEXT: [[TMP2:%.*]] = add i64 [[IV_1_SHL]], 96 |
| ; CHECK-NEXT: br label %[[VECTOR_BODY:.*]] |
| ; CHECK: [[VECTOR_BODY]]: |
| ; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ] |
| ; CHECK-NEXT: [[OFFSET_IDX:%.*]] = add i64 [[IV_1_SHL]], [[INDEX]] |
| ; CHECK-NEXT: [[TMP0:%.*]] = getelementptr i8, ptr [[DST]], i64 [[OFFSET_IDX]] |
| ; CHECK-NEXT: store <4 x i8> splat (i8 1), ptr [[TMP0]], align 1 |
| ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 4 |
| ; CHECK-NEXT: [[TMP1:%.*]] = icmp eq i64 [[INDEX_NEXT]], 96 |
| ; CHECK-NEXT: br i1 [[TMP1]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP8:![0-9]+]] |
| ; CHECK: [[MIDDLE_BLOCK]]: |
| ; CHECK-NEXT: br label %[[SCALAR_PH:.*]] |
| ; CHECK: [[SCALAR_PH]]: |
| ; CHECK-NEXT: br label %[[LOOP_2:.*]] |
| ; CHECK: [[LOOP_2]]: |
| ; CHECK-NEXT: [[IV_2:%.*]] = phi i64 [ [[TMP2]], %[[SCALAR_PH]] ], [ [[IV_2_NEXT:%.*]], %[[LOOP_2]] ] |
| ; CHECK-NEXT: [[GEP_2:%.*]] = getelementptr i8, ptr [[DST]], i64 [[IV_2]] |
| ; CHECK-NEXT: store i8 1, ptr [[GEP_2]], align 1 |
| ; CHECK-NEXT: [[IV_2_NEXT]] = add i64 [[IV_2]], 1 |
| ; CHECK-NEXT: [[CMP_2:%.*]] = icmp eq i64 [[IV_2]], 100 |
| ; CHECK-NEXT: br i1 [[CMP_2]], label %[[EXIT:.*]], label %[[LOOP_2]], !llvm.loop [[LOOP9:![0-9]+]] |
| ; CHECK: [[EXIT]]: |
| ; CHECK-NEXT: ret void |
| ; |
| entry: |
| br label %loop.1 |
| |
| loop.1: |
| %iv.1 = phi i64 [ 0, %entry ], [ %iv.1.next, %loop.1 ] |
| %gep.1 = getelementptr i8, ptr %dst, i64 %iv.1 |
| store i8 0, ptr %gep.1, align 1 |
| %iv.1.next = add i64 %iv.1, 1 |
| %cmp.1 = icmp eq i64 %iv.1, 0 |
| br i1 %cmp.1, label %loop.1, label %loop.1.exit |
| |
| loop.1.exit: |
| %iv.1.shl = shl i64 %iv.1, 1 |
| br label %loop.2 |
| |
| loop.2: |
| %iv.2 = phi i64 [ %iv.1.shl, %loop.1.exit ], [ %iv.2.next, %loop.2 ] |
| %gep.2 = getelementptr i8, ptr %dst, i64 %iv.2 |
| store i8 1, ptr %gep.2, align 1 |
| %iv.2.next = add i64 %iv.2, 1 |
| %cmp.2 = icmp eq i64 %iv.2, 100 |
| br i1 %cmp.2, label %exit, label %loop.2 |
| |
| exit: |
| ret void |
| } |