; blob: ac82e47633d5a914a0a9b4f0f31e5a4f9a81cba9 [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt < %s -slp-vectorizer -S -mtriple=x86_64-- -mcpu=skylake-avx512 | FileCheck %s
; This code should be fully vectorized by the D57059 patch.
; @foo processes eight consecutive bytes, one independent scalar chain per byte.
; For each index i in 0..7 it loads %t1[i], keeps the value when it is
; unsigned-less-than 64 and otherwise replaces it with (0 - value), then stores
; the result to %t0[i].
;   %t0 - destination pointer (noalias, nocapture); written at offsets 0..7.
;   %t1 - source pointer (noalias, nocapture, readonly); read at offsets 0..7.
; Every load and store uses align 1 and the same !tbaa tag (!3).
; The autogenerated assertions below match a purely scalar instruction
; sequence (no vector types appear in them).
define void @foo(i8* noalias nocapture %t0, i8* noalias nocapture readonly %t1) {
; CHECK-LABEL: @foo(
; CHECK-NEXT: [[T3:%.*]] = load i8, i8* [[T1:%.*]], align 1, !tbaa [[TBAA0:![0-9]+]]
; CHECK-NEXT: [[T4:%.*]] = icmp ult i8 [[T3]], 64
; CHECK-NEXT: [[T5:%.*]] = sub i8 0, [[T3]]
; CHECK-NEXT: [[T6:%.*]] = select i1 [[T4]], i8 [[T3]], i8 [[T5]]
; CHECK-NEXT: store i8 [[T6]], i8* [[T0:%.*]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T7:%.*]] = getelementptr inbounds i8, i8* [[T1]], i64 1
; CHECK-NEXT: [[T8:%.*]] = load i8, i8* [[T7]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T9:%.*]] = icmp ult i8 [[T8]], 64
; CHECK-NEXT: [[T10:%.*]] = sub i8 0, [[T8]]
; CHECK-NEXT: [[T11:%.*]] = select i1 [[T9]], i8 [[T8]], i8 [[T10]]
; CHECK-NEXT: [[T12:%.*]] = getelementptr inbounds i8, i8* [[T0]], i64 1
; CHECK-NEXT: store i8 [[T11]], i8* [[T12]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T13:%.*]] = getelementptr inbounds i8, i8* [[T1]], i64 2
; CHECK-NEXT: [[T14:%.*]] = load i8, i8* [[T13]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T15:%.*]] = icmp ult i8 [[T14]], 64
; CHECK-NEXT: [[T16:%.*]] = sub i8 0, [[T14]]
; CHECK-NEXT: [[T17:%.*]] = select i1 [[T15]], i8 [[T14]], i8 [[T16]]
; CHECK-NEXT: [[T18:%.*]] = getelementptr inbounds i8, i8* [[T0]], i64 2
; CHECK-NEXT: store i8 [[T17]], i8* [[T18]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T19:%.*]] = getelementptr inbounds i8, i8* [[T1]], i64 3
; CHECK-NEXT: [[T20:%.*]] = load i8, i8* [[T19]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T21:%.*]] = icmp ult i8 [[T20]], 64
; CHECK-NEXT: [[T22:%.*]] = sub i8 0, [[T20]]
; CHECK-NEXT: [[T23:%.*]] = select i1 [[T21]], i8 [[T20]], i8 [[T22]]
; CHECK-NEXT: [[T24:%.*]] = getelementptr inbounds i8, i8* [[T0]], i64 3
; CHECK-NEXT: store i8 [[T23]], i8* [[T24]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T25:%.*]] = getelementptr inbounds i8, i8* [[T1]], i64 4
; CHECK-NEXT: [[T26:%.*]] = load i8, i8* [[T25]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T27:%.*]] = icmp ult i8 [[T26]], 64
; CHECK-NEXT: [[T28:%.*]] = sub i8 0, [[T26]]
; CHECK-NEXT: [[T29:%.*]] = select i1 [[T27]], i8 [[T26]], i8 [[T28]]
; CHECK-NEXT: [[T30:%.*]] = getelementptr inbounds i8, i8* [[T0]], i64 4
; CHECK-NEXT: store i8 [[T29]], i8* [[T30]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T31:%.*]] = getelementptr inbounds i8, i8* [[T1]], i64 5
; CHECK-NEXT: [[T32:%.*]] = load i8, i8* [[T31]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T33:%.*]] = icmp ult i8 [[T32]], 64
; CHECK-NEXT: [[T34:%.*]] = sub i8 0, [[T32]]
; CHECK-NEXT: [[T35:%.*]] = select i1 [[T33]], i8 [[T32]], i8 [[T34]]
; CHECK-NEXT: [[T36:%.*]] = getelementptr inbounds i8, i8* [[T0]], i64 5
; CHECK-NEXT: store i8 [[T35]], i8* [[T36]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T37:%.*]] = getelementptr inbounds i8, i8* [[T1]], i64 6
; CHECK-NEXT: [[T38:%.*]] = load i8, i8* [[T37]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T39:%.*]] = icmp ult i8 [[T38]], 64
; CHECK-NEXT: [[T40:%.*]] = sub i8 0, [[T38]]
; CHECK-NEXT: [[T41:%.*]] = select i1 [[T39]], i8 [[T38]], i8 [[T40]]
; CHECK-NEXT: [[T42:%.*]] = getelementptr inbounds i8, i8* [[T0]], i64 6
; CHECK-NEXT: store i8 [[T41]], i8* [[T42]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T43:%.*]] = getelementptr inbounds i8, i8* [[T1]], i64 7
; CHECK-NEXT: [[T44:%.*]] = load i8, i8* [[T43]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: [[T45:%.*]] = icmp ult i8 [[T44]], 64
; CHECK-NEXT: [[T46:%.*]] = sub i8 0, [[T44]]
; CHECK-NEXT: [[T47:%.*]] = select i1 [[T45]], i8 [[T44]], i8 [[T46]]
; CHECK-NEXT: [[T48:%.*]] = getelementptr inbounds i8, i8* [[T0]], i64 7
; CHECK-NEXT: store i8 [[T47]], i8* [[T48]], align 1, !tbaa [[TBAA0]]
; CHECK-NEXT: ret void
;
; Byte 0 - %t1 and %t0 are used directly, so no getelementptr is needed.
%t3 = load i8, i8* %t1, align 1, !tbaa !3
%t4 = icmp ult i8 %t3, 64
%t5 = sub i8 0, %t3
%t6 = select i1 %t4, i8 %t3, i8 %t5
store i8 %t6, i8* %t0, align 1, !tbaa !3
; Byte 1 - same load / compare / negate / select / store chain at offset 1.
%t7 = getelementptr inbounds i8, i8* %t1, i64 1
%t8 = load i8, i8* %t7, align 1, !tbaa !3
%t9 = icmp ult i8 %t8, 64
%t10 = sub i8 0, %t8
%t11 = select i1 %t9, i8 %t8, i8 %t10
%t12 = getelementptr inbounds i8, i8* %t0, i64 1
store i8 %t11, i8* %t12, align 1, !tbaa !3
; Byte 2
%t13 = getelementptr inbounds i8, i8* %t1, i64 2
%t14 = load i8, i8* %t13, align 1, !tbaa !3
%t15 = icmp ult i8 %t14, 64
%t16 = sub i8 0, %t14
%t17 = select i1 %t15, i8 %t14, i8 %t16
%t18 = getelementptr inbounds i8, i8* %t0, i64 2
store i8 %t17, i8* %t18, align 1, !tbaa !3
; Byte 3
%t19 = getelementptr inbounds i8, i8* %t1, i64 3
%t20 = load i8, i8* %t19, align 1, !tbaa !3
%t21 = icmp ult i8 %t20, 64
%t22 = sub i8 0, %t20
%t23 = select i1 %t21, i8 %t20, i8 %t22
%t24 = getelementptr inbounds i8, i8* %t0, i64 3
store i8 %t23, i8* %t24, align 1, !tbaa !3
; Byte 4
%t25 = getelementptr inbounds i8, i8* %t1, i64 4
%t26 = load i8, i8* %t25, align 1, !tbaa !3
%t27 = icmp ult i8 %t26, 64
%t28 = sub i8 0, %t26
%t29 = select i1 %t27, i8 %t26, i8 %t28
%t30 = getelementptr inbounds i8, i8* %t0, i64 4
store i8 %t29, i8* %t30, align 1, !tbaa !3
; Byte 5
%t31 = getelementptr inbounds i8, i8* %t1, i64 5
%t32 = load i8, i8* %t31, align 1, !tbaa !3
%t33 = icmp ult i8 %t32, 64
%t34 = sub i8 0, %t32
%t35 = select i1 %t33, i8 %t32, i8 %t34
%t36 = getelementptr inbounds i8, i8* %t0, i64 5
store i8 %t35, i8* %t36, align 1, !tbaa !3
; Byte 6
%t37 = getelementptr inbounds i8, i8* %t1, i64 6
%t38 = load i8, i8* %t37, align 1, !tbaa !3
%t39 = icmp ult i8 %t38, 64
%t40 = sub i8 0, %t38
%t41 = select i1 %t39, i8 %t38, i8 %t40
%t42 = getelementptr inbounds i8, i8* %t0, i64 6
store i8 %t41, i8* %t42, align 1, !tbaa !3
; Byte 7 - last of the eight chains.
%t43 = getelementptr inbounds i8, i8* %t1, i64 7
%t44 = load i8, i8* %t43, align 1, !tbaa !3
%t45 = icmp ult i8 %t44, 64
%t46 = sub i8 0, %t44
%t47 = select i1 %t45, i8 %t44, i8 %t46
%t48 = getelementptr inbounds i8, i8* %t0, i64 7
store i8 %t47, i8* %t48, align 1, !tbaa !3
ret void
}
; TBAA metadata referenced by every load and store in @foo via !tbaa !3.
; !3 is the access tag, laid out as (base type, access type, offset); here both
; types are !4 and the offset is 0.
!3 = !{!4, !4, i64 0}
; !4 is the type node named "omnipotent char"; its parent is !5, at offset 0.
!4 = !{!"omnipotent char", !5, i64 0}
; !5 is the root of the TBAA tree, identified only by its name.
!5 = !{!"Simple C++ TBAA"}