| ; RUN: opt < %s -passes=loop-vectorize,transform-warning -S 2>&1 | FileCheck %s |
| |
| ; Like no_array_bounds.ll, this test verifies that warnings are generated when vectorization/interleaving |
| ; is explicitly requested but fails to occur, for both fixed and scalable vectorize.width loop hints. |
| |
| ; #pragma clang loop vectorize(enable) |
| ; for (int i = 0; i < number; i++) { |
| ; A[B[i]]++; |
| ; } |
| |
| ; CHECK: warning: <unknown>:0:0: loop not interleaved: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering |
| ; @foo: fixed-width case. The loop increments A[B[i]] for i in [0, N) and its |
| ; back-edge carries !llvm.loop !0. The expected-warning directive preceding this |
| ; function looks for the "loop not interleaved" diagnostic. |
| define dso_local void @foo(ptr nocapture %A, ptr nocapture readonly %B, i32 %N) { |
| entry: |
| ; Guard: enter the loop only when N > 0 (signed compare). |
| %cmp7 = icmp sgt i32 %N, 0 |
| br i1 %cmp7, label %for.body.preheader, label %for.end |
| |
| for.body.preheader: ; preds = %entry |
| ; Zero-extend N to i64 once; it is the loop's exit bound. |
| %wide.trip.count = zext i32 %N to i64 |
| br label %for.body |
| |
| for.body: ; preds = %for.body.preheader, %for.body |
| ; i64 induction variable, starting at 0 and stepping by 1. |
| %indvars.iv = phi i64 [ 0, %for.body.preheader ], [ %indvars.iv.next, %for.body ] |
| ; Load the index B[i] ... |
| %arrayidx = getelementptr inbounds i32, ptr %B, i64 %indvars.iv |
| %0 = load i32, ptr %arrayidx, align 4 |
| ; ... sign-extend it and use it to address A, i.e. an indirect access A[B[i]]. |
| %idxprom1 = sext i32 %0 to i64 |
| %arrayidx2 = getelementptr inbounds i32, ptr %A, i64 %idxprom1 |
| ; Read-modify-write of A[B[i]]: load, add 1, store back to the same address. |
| ; NOTE(review): presumably this data-dependent store address is what prevents the |
| ; requested transformation -- confirm against the loop vectorizer's legality checks. |
| %1 = load i32, ptr %arrayidx2, align 4 |
| %inc = add nsw i32 %1, 1 |
| store i32 %inc, ptr %arrayidx2, align 4 |
| ; Advance the induction variable and exit once it equals the trip count. |
| %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1 |
| %exitcond.not = icmp eq i64 %indvars.iv.next, %wide.trip.count |
| ; The loop hints are attached to the back-edge branch via !llvm.loop !0. |
| br i1 %exitcond.not, label %for.end, label %for.body, !llvm.loop !0 |
| |
| for.end: ; preds = %for.body, %entry |
| ret void |
| } |
| |
| ; CHECK: warning: <unknown>:0:0: loop not vectorized: the optimizer was unable to perform the requested transformation; the transformation might be disabled or specified as part of an unsupported transformation ordering |
| ; @foo2: scalable case. The body is the same A[B[i]]++ loop as @foo, but the |
| ; back-edge carries !llvm.loop !3, which adds the scalable.enable hint. The |
| ; expected-warning directive preceding this function looks for the |
| ; "loop not vectorized" diagnostic. |
| define dso_local void @foo2(ptr nocapture %A, ptr nocapture readonly %B, i32 %N) { |
| entry: |
| ; Guard: enter the loop only when N > 0 (signed compare). |
| %cmp7 = icmp sgt i32 %N, 0 |
| br i1 %cmp7, label %for.body.preheader, label %for.end |
| |
| for.body.preheader: ; preds = %entry |
| ; Zero-extend N to i64 once; it is the loop's exit bound. |
| %wide.trip.count = zext i32 %N to i64 |
| br label %for.body |
| |
| for.body: ; preds = %for.body.preheader, %for.body |
| ; i64 induction variable, starting at 0 and stepping by 1. |
| %indvars.iv = phi i64 [ 0, %for.body.preheader ], [ %indvars.iv.next, %for.body ] |
| ; Load the index B[i] ... |
| %arrayidx = getelementptr inbounds i32, ptr %B, i64 %indvars.iv |
| %0 = load i32, ptr %arrayidx, align 4 |
| ; ... sign-extend it and use it to address A, i.e. an indirect access A[B[i]]. |
| %idxprom1 = sext i32 %0 to i64 |
| %arrayidx2 = getelementptr inbounds i32, ptr %A, i64 %idxprom1 |
| ; Read-modify-write of A[B[i]]: load, add 1, store back to the same address. |
| %1 = load i32, ptr %arrayidx2, align 4 |
| %inc = add nsw i32 %1, 1 |
| store i32 %inc, ptr %arrayidx2, align 4 |
| ; Advance the induction variable and exit once it equals the trip count. |
| %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1 |
| %exitcond.not = icmp eq i64 %indvars.iv.next, %wide.trip.count |
| ; The loop hints (including the scalable one) are attached via !llvm.loop !3. |
| br i1 %exitcond.not, label %for.end, label %for.body, !llvm.loop !3 |
| |
| for.end: ; preds = %for.body, %entry |
| ret void |
| } |
| |
| ; Loop-hint metadata. !0 is the loop ID used by @foo, !3 the one used by @foo2. |
| ; Each loop ID is a distinct, self-referential node followed by its hint operands. |
| ; !0: vectorize.enable = true, vectorize.width = 1 (fixed-width hints only). |
| !0 = distinct !{!0, !1, !2} |
| !1 = !{!"llvm.loop.vectorize.enable", i1 true} |
| !2 = !{!"llvm.loop.vectorize.width", i32 1} |
| ; !3: the same two hints as !0 plus vectorize.scalable.enable = true. |
| !3 = distinct !{!3, !1, !2, !4} |
| !4 = !{!"llvm.loop.vectorize.scalable.enable", i1 true} |