blob: 36936ec9832a4ec343518080cdc4edfd8137c18f [file] [edit]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 6
; RUN: opt -S -passes=loop-vectorize %s | FileCheck %s
; TODO: The loop should be vectorized. The vectorizer needs to prove
; (A umin B) u<= A to establish memory safety from the dereferenceable
; assumption.
;
; long n = umin(count, length);
; for (long i = 0; i < n; i++)
; if (ptr[i] == 0) return null;
; ...
define ptr @main(i32 %length, ptr %ptr, i64 %0) #0 {
; CHECK-LABEL: define ptr @main(
; CHECK-SAME: i32 [[LENGTH:%.*]], ptr [[PTR:%.*]], i64 [[TMP0:%.*]]) #[[ATTR0:[0-9]+]] {
; CHECK-NEXT: [[ENTRY:.*:]]
; CHECK-NEXT: [[NULL_CHECK0:%.*]] = icmp eq i64 [[TMP0]], 0
; CHECK-NEXT: br i1 [[NULL_CHECK0]], label %[[DEOPT:.*]], label %[[PREHEADER:.*]]
; CHECK: [[PREHEADER]]:
; CHECK-NEXT: [[LENGTH_64:%.*]] = zext i32 [[LENGTH]] to i64
; CHECK-NEXT: [[EXIT:%.*]] = call i64 @llvm.umin.i64(i64 [[TMP0]], i64 [[LENGTH_64]])
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[PTR]], i64 8), "dereferenceable"(ptr [[PTR]], i64 [[LENGTH_64]]) ]
; CHECK-NEXT: [[NULL_CHECK:%.*]] = icmp eq i32 [[LENGTH]], 0
; CHECK-NEXT: br i1 [[NULL_CHECK]], label %[[DEOPT]], label %[[SCALAR_PH:.*]]
; CHECK: [[SCALAR_PH]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ [[IV_NEXT:%.*]], %[[LATCH:.*]] ], [ 0, %[[SCALAR_PH]] ]
; CHECK-NEXT: [[ELEMENT_GEP:%.*]] = getelementptr i8, ptr [[PTR]], i64 [[IV]]
; CHECK-NEXT: [[ELEMENT:%.*]] = load i8, ptr [[ELEMENT_GEP]], align 1
; CHECK-NEXT: [[FOUND_CHECK:%.*]] = icmp eq i8 [[ELEMENT]], 0
; CHECK-NEXT: br i1 [[FOUND_CHECK]], label %[[FOUND:.*]], label %[[LATCH]]
; CHECK: [[LATCH]]:
; CHECK-NEXT: [[IV_NEXT]] = add i64 [[IV]], 1
; CHECK-NEXT: [[RANGE_CHECK:%.*]] = icmp ult i64 [[IV_NEXT]], [[EXIT]]
; CHECK-NEXT: br i1 [[RANGE_CHECK]], label %[[LOOP]], label %[[DEOPT_LOOPEXIT:.*]]
; CHECK: [[FOUND]]:
; CHECK-NEXT: ret ptr null
; CHECK: [[DEOPT_LOOPEXIT]]:
; CHECK-NEXT: br label %[[DEOPT]]
; CHECK: [[DEOPT]]:
; CHECK-NEXT: unreachable
;
entry:
%null_check0 = icmp eq i64 %0, 0
br i1 %null_check0, label %deopt, label %preheader
preheader: ; preds = %entry
%length.64 = zext i32 %length to i64
%exit = call i64 @llvm.umin.i64(i64 %0, i64 %length.64)
call void @llvm.assume(i1 true) [ "align"(ptr %ptr, i64 8), "dereferenceable"(ptr %ptr, i64 %length.64) ]
%null_check = icmp eq i32 %length, 0
br i1 %null_check, label %deopt, label %loop
loop: ; preds = %latch, %preheader
%iv = phi i64 [ %iv.next, %latch ], [ 0, %preheader ]
%element_gep = getelementptr i8, ptr %ptr, i64 %iv
%element = load i8, ptr %element_gep, align 1
%found_check = icmp eq i8 %element, 0
br i1 %found_check, label %found, label %latch
latch: ; preds = %loop
%iv.next = add i64 %iv, 1
%range_check = icmp ult i64 %iv.next, %exit
br i1 %range_check, label %loop, label %deopt
found: ; preds = %loop
ret ptr null
deopt: ; preds = %latch, %preheader
unreachable
}
declare i64 @llvm.umin.i64(i64, i64)
declare void @llvm.assume(i1 noundef)
attributes #0 = { nofree nosync }