blob: 374f240a1ac2d5f4e3078c40a4a918507e068878 [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt -slp-vectorizer -S %s | FileCheck %s
; RUN: opt -aa-pipeline=basic-aa -passes='slp-vectorizer' -S %s | FileCheck %s
target datalayout = "e-m:o-i64:64-i128:128-n32:64-S128"
target triple = "arm64-apple-ios5.0.0"
; Some negative tests first.
; We need selects with a uniform predicate to lower effectively to vector
; instructions.
define void @select_mixed_predicates_8xi16(i16* %ptr, i16 %x) {
; CHECK-LABEL: @select_mixed_predicates_8xi16(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[L_0:%.*]] = load i16, i16* [[PTR:%.*]], align 2
; CHECK-NEXT: [[CMP_0:%.*]] = icmp ult i16 [[L_0]], 16383
; CHECK-NEXT: [[S_0:%.*]] = select i1 [[CMP_0]], i16 [[L_0]], i16 [[X:%.*]]
; CHECK-NEXT: store i16 [[S_0]], i16* [[PTR]], align 2
; CHECK-NEXT: [[GEP_1:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 1
; CHECK-NEXT: [[L_1:%.*]] = load i16, i16* [[GEP_1]], align 2
; CHECK-NEXT: [[CMP_1:%.*]] = icmp sgt i16 [[L_1]], 16383
; CHECK-NEXT: [[S_1:%.*]] = select i1 [[CMP_1]], i16 [[L_1]], i16 [[X]]
; CHECK-NEXT: store i16 [[S_1]], i16* [[GEP_1]], align 2
; CHECK-NEXT: [[GEP_2:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 2
; CHECK-NEXT: [[L_2:%.*]] = load i16, i16* [[GEP_2]], align 2
; CHECK-NEXT: [[CMP_2:%.*]] = icmp eq i16 [[L_2]], 16383
; CHECK-NEXT: [[S_2:%.*]] = select i1 [[CMP_2]], i16 [[L_2]], i16 [[X]]
; CHECK-NEXT: store i16 [[S_2]], i16* [[GEP_2]], align 2
; CHECK-NEXT: [[GEP_3:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 3
; CHECK-NEXT: [[L_3:%.*]] = load i16, i16* [[GEP_3]], align 2
; CHECK-NEXT: [[CMP_3:%.*]] = icmp ne i16 [[L_3]], 16383
; CHECK-NEXT: [[S_3:%.*]] = select i1 [[CMP_3]], i16 [[L_3]], i16 [[X]]
; CHECK-NEXT: store i16 [[S_3]], i16* [[GEP_3]], align 2
; CHECK-NEXT: [[GEP_4:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 4
; CHECK-NEXT: [[L_4:%.*]] = load i16, i16* [[GEP_4]], align 2
; CHECK-NEXT: [[CMP_4:%.*]] = icmp eq i16 [[L_4]], 16383
; CHECK-NEXT: [[S_4:%.*]] = select i1 [[CMP_4]], i16 [[L_4]], i16 [[X]]
; CHECK-NEXT: store i16 [[S_4]], i16* [[GEP_4]], align 2
; CHECK-NEXT: [[GEP_5:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 5
; CHECK-NEXT: [[L_5:%.*]] = load i16, i16* [[GEP_5]], align 2
; CHECK-NEXT: [[CMP_5:%.*]] = icmp ule i16 [[L_5]], 16383
; CHECK-NEXT: [[S_5:%.*]] = select i1 [[CMP_5]], i16 [[L_5]], i16 [[X]]
; CHECK-NEXT: store i16 [[S_5]], i16* [[GEP_5]], align 2
; CHECK-NEXT: [[GEP_6:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 6
; CHECK-NEXT: [[L_6:%.*]] = load i16, i16* [[GEP_6]], align 2
; CHECK-NEXT: [[CMP_6:%.*]] = icmp ult i16 [[L_6]], 16383
; CHECK-NEXT: [[S_6:%.*]] = select i1 [[CMP_6]], i16 [[L_6]], i16 [[X]]
; CHECK-NEXT: store i16 [[S_6]], i16* [[GEP_6]], align 2
; CHECK-NEXT: [[GEP_7:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 7
; CHECK-NEXT: [[L_7:%.*]] = load i16, i16* [[GEP_7]], align 2
; CHECK-NEXT: [[CMP_7:%.*]] = icmp ult i16 [[L_7]], 16383
; CHECK-NEXT: [[S_7:%.*]] = select i1 [[CMP_7]], i16 [[L_7]], i16 [[X]]
; CHECK-NEXT: store i16 [[S_7]], i16* [[GEP_7]], align 2
; CHECK-NEXT: ret void
;
entry:
%l.0 = load i16, i16* %ptr
%cmp.0 = icmp ult i16 %l.0, 16383
%s.0 = select i1 %cmp.0, i16 %l.0, i16 %x
store i16 %s.0, i16* %ptr, align 2
%gep.1 = getelementptr inbounds i16, i16* %ptr, i16 1
%l.1 = load i16, i16* %gep.1
%cmp.1 = icmp sgt i16 %l.1, 16383
%s.1 = select i1 %cmp.1, i16 %l.1, i16 %x
store i16 %s.1, i16* %gep.1, align 2
%gep.2 = getelementptr inbounds i16, i16* %ptr, i16 2
%l.2 = load i16, i16* %gep.2
%cmp.2 = icmp eq i16 %l.2, 16383
%s.2 = select i1 %cmp.2, i16 %l.2, i16 %x
store i16 %s.2, i16* %gep.2, align 2
%gep.3 = getelementptr inbounds i16, i16* %ptr, i16 3
%l.3 = load i16, i16* %gep.3
%cmp.3 = icmp ne i16 %l.3, 16383
%s.3 = select i1 %cmp.3, i16 %l.3, i16 %x
store i16 %s.3, i16* %gep.3, align 2
%gep.4 = getelementptr inbounds i16, i16* %ptr, i16 4
%l.4 = load i16, i16* %gep.4
%cmp.4 = icmp eq i16 %l.4, 16383
%s.4 = select i1 %cmp.4, i16 %l.4, i16 %x
store i16 %s.4, i16* %gep.4, align 2
%gep.5 = getelementptr inbounds i16, i16* %ptr, i16 5
%l.5 = load i16, i16* %gep.5
%cmp.5 = icmp ule i16 %l.5, 16383
%s.5 = select i1 %cmp.5, i16 %l.5, i16 %x
store i16 %s.5, i16* %gep.5, align 2
%gep.6 = getelementptr inbounds i16, i16* %ptr, i16 6
%l.6 = load i16, i16* %gep.6
%cmp.6 = icmp ult i16 %l.6, 16383
%s.6 = select i1 %cmp.6, i16 %l.6, i16 %x
store i16 %s.6, i16* %gep.6, align 2
%gep.7 = getelementptr inbounds i16, i16* %ptr, i16 7
%l.7 = load i16, i16* %gep.7
%cmp.7 = icmp ult i16 %l.7, 16383
%s.7 = select i1 %cmp.7, i16 %l.7, i16 %x
store i16 %s.7, i16* %gep.7, align 2
ret void
}
define void @select_uniform_ugt_7xi8(i8* %ptr, i8 %x) {
; CHECK-LABEL: @select_uniform_ugt_7xi8(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[L_0:%.*]] = load i8, i8* [[PTR:%.*]], align 1
; CHECK-NEXT: [[CMP_0:%.*]] = icmp ugt i8 [[L_0]], -1
; CHECK-NEXT: [[S_0:%.*]] = select i1 [[CMP_0]], i8 [[L_0]], i8 [[X:%.*]]
; CHECK-NEXT: store i8 [[S_0]], i8* [[PTR]], align 2
; CHECK-NEXT: [[GEP_1:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 1
; CHECK-NEXT: [[L_1:%.*]] = load i8, i8* [[GEP_1]], align 1
; CHECK-NEXT: [[CMP_1:%.*]] = icmp ugt i8 [[L_1]], -1
; CHECK-NEXT: [[S_1:%.*]] = select i1 [[CMP_1]], i8 [[L_1]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_1]], i8* [[GEP_1]], align 2
; CHECK-NEXT: [[GEP_2:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 2
; CHECK-NEXT: [[L_2:%.*]] = load i8, i8* [[GEP_2]], align 1
; CHECK-NEXT: [[CMP_2:%.*]] = icmp ugt i8 [[L_2]], -1
; CHECK-NEXT: [[S_2:%.*]] = select i1 [[CMP_2]], i8 [[L_2]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_2]], i8* [[GEP_2]], align 2
; CHECK-NEXT: [[GEP_3:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 3
; CHECK-NEXT: [[L_3:%.*]] = load i8, i8* [[GEP_3]], align 1
; CHECK-NEXT: [[CMP_3:%.*]] = icmp ugt i8 [[L_3]], -1
; CHECK-NEXT: [[S_3:%.*]] = select i1 [[CMP_3]], i8 [[L_3]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_3]], i8* [[GEP_3]], align 2
; CHECK-NEXT: [[GEP_4:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 4
; CHECK-NEXT: [[L_4:%.*]] = load i8, i8* [[GEP_4]], align 1
; CHECK-NEXT: [[CMP_4:%.*]] = icmp ugt i8 [[L_4]], -1
; CHECK-NEXT: [[S_4:%.*]] = select i1 [[CMP_4]], i8 [[L_4]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_4]], i8* [[GEP_4]], align 2
; CHECK-NEXT: [[GEP_5:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 5
; CHECK-NEXT: [[L_5:%.*]] = load i8, i8* [[GEP_5]], align 1
; CHECK-NEXT: [[CMP_5:%.*]] = icmp ugt i8 [[L_5]], -1
; CHECK-NEXT: [[S_5:%.*]] = select i1 [[CMP_5]], i8 [[L_5]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_5]], i8* [[GEP_5]], align 2
; CHECK-NEXT: [[GEP_6:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 6
; CHECK-NEXT: [[L_6:%.*]] = load i8, i8* [[GEP_6]], align 1
; CHECK-NEXT: [[CMP_6:%.*]] = icmp ugt i8 [[L_6]], -1
; CHECK-NEXT: [[S_6:%.*]] = select i1 [[CMP_6]], i8 [[L_6]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_6]], i8* [[GEP_6]], align 2
; CHECK-NEXT: ret void
;
entry:
%l.0 = load i8, i8* %ptr
%cmp.0 = icmp ugt i8 %l.0, 16383
%s.0 = select i1 %cmp.0, i8 %l.0, i8 %x
store i8 %s.0, i8* %ptr, align 2
%gep.1 = getelementptr inbounds i8, i8* %ptr, i8 1
%l.1 = load i8, i8* %gep.1
%cmp.1 = icmp ugt i8 %l.1, 16383
%s.1 = select i1 %cmp.1, i8 %l.1, i8 %x
store i8 %s.1, i8* %gep.1, align 2
%gep.2 = getelementptr inbounds i8, i8* %ptr, i8 2
%l.2 = load i8, i8* %gep.2
%cmp.2 = icmp ugt i8 %l.2, 16383
%s.2 = select i1 %cmp.2, i8 %l.2, i8 %x
store i8 %s.2, i8* %gep.2, align 2
%gep.3 = getelementptr inbounds i8, i8* %ptr, i8 3
%l.3 = load i8, i8* %gep.3
%cmp.3 = icmp ugt i8 %l.3, 16383
%s.3 = select i1 %cmp.3, i8 %l.3, i8 %x
store i8 %s.3, i8* %gep.3, align 2
%gep.4 = getelementptr inbounds i8, i8* %ptr, i8 4
%l.4 = load i8, i8* %gep.4
%cmp.4 = icmp ugt i8 %l.4, 16383
%s.4 = select i1 %cmp.4, i8 %l.4, i8 %x
store i8 %s.4, i8* %gep.4, align 2
%gep.5 = getelementptr inbounds i8, i8* %ptr, i8 5
%l.5 = load i8, i8* %gep.5
%cmp.5 = icmp ugt i8 %l.5, 16383
%s.5 = select i1 %cmp.5, i8 %l.5, i8 %x
store i8 %s.5, i8* %gep.5, align 2
%gep.6 = getelementptr inbounds i8, i8* %ptr, i8 6
%l.6 = load i8, i8* %gep.6
%cmp.6 = icmp ugt i8 %l.6, 16383
%s.6 = select i1 %cmp.6, i8 %l.6, i8 %x
store i8 %s.6, i8* %gep.6, align 2
ret void
}
; Positive tests.
define void @select_uniform_ugt_8xi8(i8* %ptr, i8 %x) {
; CHECK-LABEL: @select_uniform_ugt_8xi8(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[GEP_1:%.*]] = getelementptr inbounds i8, i8* [[PTR:%.*]], i8 1
; CHECK-NEXT: [[GEP_2:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 2
; CHECK-NEXT: [[GEP_3:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 3
; CHECK-NEXT: [[GEP_4:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 4
; CHECK-NEXT: [[GEP_5:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 5
; CHECK-NEXT: [[GEP_6:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 6
; CHECK-NEXT: [[GEP_7:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 7
; CHECK-NEXT: [[TMP0:%.*]] = bitcast i8* [[PTR]] to <8 x i8>*
; CHECK-NEXT: [[TMP1:%.*]] = load <8 x i8>, <8 x i8>* [[TMP0]], align 1
; CHECK-NEXT: [[TMP2:%.*]] = icmp ugt <8 x i8> [[TMP1]], <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
; CHECK-NEXT: [[TMP3:%.*]] = insertelement <8 x i8> poison, i8 [[X:%.*]], i32 0
; CHECK-NEXT: [[TMP4:%.*]] = insertelement <8 x i8> [[TMP3]], i8 [[X]], i32 1
; CHECK-NEXT: [[TMP5:%.*]] = insertelement <8 x i8> [[TMP4]], i8 [[X]], i32 2
; CHECK-NEXT: [[TMP6:%.*]] = insertelement <8 x i8> [[TMP5]], i8 [[X]], i32 3
; CHECK-NEXT: [[TMP7:%.*]] = insertelement <8 x i8> [[TMP6]], i8 [[X]], i32 4
; CHECK-NEXT: [[TMP8:%.*]] = insertelement <8 x i8> [[TMP7]], i8 [[X]], i32 5
; CHECK-NEXT: [[TMP9:%.*]] = insertelement <8 x i8> [[TMP8]], i8 [[X]], i32 6
; CHECK-NEXT: [[TMP10:%.*]] = insertelement <8 x i8> [[TMP9]], i8 [[X]], i32 7
; CHECK-NEXT: [[TMP11:%.*]] = select <8 x i1> [[TMP2]], <8 x i8> [[TMP1]], <8 x i8> [[TMP10]]
; CHECK-NEXT: [[TMP12:%.*]] = bitcast i8* [[PTR]] to <8 x i8>*
; CHECK-NEXT: store <8 x i8> [[TMP11]], <8 x i8>* [[TMP12]], align 2
; CHECK-NEXT: ret void
;
entry:
%l.0 = load i8, i8* %ptr
%cmp.0 = icmp ugt i8 %l.0, 16383
%s.0 = select i1 %cmp.0, i8 %l.0, i8 %x
store i8 %s.0, i8* %ptr, align 2
%gep.1 = getelementptr inbounds i8, i8* %ptr, i8 1
%l.1 = load i8, i8* %gep.1
%cmp.1 = icmp ugt i8 %l.1, 16383
%s.1 = select i1 %cmp.1, i8 %l.1, i8 %x
store i8 %s.1, i8* %gep.1, align 2
%gep.2 = getelementptr inbounds i8, i8* %ptr, i8 2
%l.2 = load i8, i8* %gep.2
%cmp.2 = icmp ugt i8 %l.2, 16383
%s.2 = select i1 %cmp.2, i8 %l.2, i8 %x
store i8 %s.2, i8* %gep.2, align 2
%gep.3 = getelementptr inbounds i8, i8* %ptr, i8 3
%l.3 = load i8, i8* %gep.3
%cmp.3 = icmp ugt i8 %l.3, 16383
%s.3 = select i1 %cmp.3, i8 %l.3, i8 %x
store i8 %s.3, i8* %gep.3, align 2
%gep.4 = getelementptr inbounds i8, i8* %ptr, i8 4
%l.4 = load i8, i8* %gep.4
%cmp.4 = icmp ugt i8 %l.4, 16383
%s.4 = select i1 %cmp.4, i8 %l.4, i8 %x
store i8 %s.4, i8* %gep.4, align 2
%gep.5 = getelementptr inbounds i8, i8* %ptr, i8 5
%l.5 = load i8, i8* %gep.5
%cmp.5 = icmp ugt i8 %l.5, 16383
%s.5 = select i1 %cmp.5, i8 %l.5, i8 %x
store i8 %s.5, i8* %gep.5, align 2
%gep.6 = getelementptr inbounds i8, i8* %ptr, i8 6
%l.6 = load i8, i8* %gep.6
%cmp.6 = icmp ugt i8 %l.6, 16383
%s.6 = select i1 %cmp.6, i8 %l.6, i8 %x
store i8 %s.6, i8* %gep.6, align 2
%gep.7 = getelementptr inbounds i8, i8* %ptr, i8 7
%l.7 = load i8, i8* %gep.7
%cmp.7 = icmp ugt i8 %l.7, 16383
%s.7 = select i1 %cmp.7, i8 %l.7, i8 %x
store i8 %s.7, i8* %gep.7, align 2
ret void
}
define void @select_uniform_ugt_16xi8(i8* %ptr, i8 %x) {
; CHECK-LABEL: @select_uniform_ugt_16xi8(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[GEP_1:%.*]] = getelementptr inbounds i8, i8* [[PTR:%.*]], i8 1
; CHECK-NEXT: [[GEP_2:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 2
; CHECK-NEXT: [[GEP_3:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 3
; CHECK-NEXT: [[GEP_4:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 4
; CHECK-NEXT: [[GEP_5:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 5
; CHECK-NEXT: [[GEP_6:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 6
; CHECK-NEXT: [[GEP_7:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 7
; CHECK-NEXT: [[TMP0:%.*]] = bitcast i8* [[PTR]] to <8 x i8>*
; CHECK-NEXT: [[TMP1:%.*]] = load <8 x i8>, <8 x i8>* [[TMP0]], align 1
; CHECK-NEXT: [[TMP2:%.*]] = icmp ugt <8 x i8> [[TMP1]], <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
; CHECK-NEXT: [[TMP3:%.*]] = insertelement <8 x i8> poison, i8 [[X:%.*]], i32 0
; CHECK-NEXT: [[TMP4:%.*]] = insertelement <8 x i8> [[TMP3]], i8 [[X]], i32 1
; CHECK-NEXT: [[TMP5:%.*]] = insertelement <8 x i8> [[TMP4]], i8 [[X]], i32 2
; CHECK-NEXT: [[TMP6:%.*]] = insertelement <8 x i8> [[TMP5]], i8 [[X]], i32 3
; CHECK-NEXT: [[TMP7:%.*]] = insertelement <8 x i8> [[TMP6]], i8 [[X]], i32 4
; CHECK-NEXT: [[TMP8:%.*]] = insertelement <8 x i8> [[TMP7]], i8 [[X]], i32 5
; CHECK-NEXT: [[TMP9:%.*]] = insertelement <8 x i8> [[TMP8]], i8 [[X]], i32 6
; CHECK-NEXT: [[TMP10:%.*]] = insertelement <8 x i8> [[TMP9]], i8 [[X]], i32 7
; CHECK-NEXT: [[TMP11:%.*]] = select <8 x i1> [[TMP2]], <8 x i8> [[TMP1]], <8 x i8> [[TMP10]]
; CHECK-NEXT: [[TMP12:%.*]] = bitcast i8* [[PTR]] to <8 x i8>*
; CHECK-NEXT: store <8 x i8> [[TMP11]], <8 x i8>* [[TMP12]], align 2
; CHECK-NEXT: [[GEP_8:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 8
; CHECK-NEXT: [[L_8:%.*]] = load i8, i8* [[GEP_8]], align 1
; CHECK-NEXT: [[CMP_8:%.*]] = icmp ugt i8 [[L_8]], -1
; CHECK-NEXT: [[TMP13:%.*]] = extractelement <8 x i8> [[TMP1]], i32 0
; CHECK-NEXT: [[S_8:%.*]] = select i1 [[CMP_8]], i8 [[TMP13]], i8 [[X]]
; CHECK-NEXT: [[TMP14:%.*]] = extractelement <8 x i8> [[TMP11]], i32 0
; CHECK-NEXT: store i8 [[TMP14]], i8* [[GEP_8]], align 2
; CHECK-NEXT: [[GEP_9:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 9
; CHECK-NEXT: [[L_9:%.*]] = load i8, i8* [[GEP_9]], align 1
; CHECK-NEXT: [[CMP_9:%.*]] = icmp ugt i8 [[L_9]], -1
; CHECK-NEXT: [[S_9:%.*]] = select i1 [[CMP_9]], i8 [[L_9]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_9]], i8* [[GEP_9]], align 2
; CHECK-NEXT: [[GEP_10:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 10
; CHECK-NEXT: [[L_10:%.*]] = load i8, i8* [[GEP_10]], align 1
; CHECK-NEXT: [[CMP_10:%.*]] = icmp ugt i8 [[L_10]], -1
; CHECK-NEXT: [[S_10:%.*]] = select i1 [[CMP_10]], i8 [[L_10]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_10]], i8* [[GEP_10]], align 2
; CHECK-NEXT: [[GEP_11:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 11
; CHECK-NEXT: [[L_11:%.*]] = load i8, i8* [[GEP_11]], align 1
; CHECK-NEXT: [[CMP_11:%.*]] = icmp ugt i8 [[L_11]], -1
; CHECK-NEXT: [[S_11:%.*]] = select i1 [[CMP_11]], i8 [[L_11]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_11]], i8* [[GEP_11]], align 2
; CHECK-NEXT: [[GEP_12:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 12
; CHECK-NEXT: [[L_12:%.*]] = load i8, i8* [[GEP_12]], align 1
; CHECK-NEXT: [[CMP_12:%.*]] = icmp ugt i8 [[L_12]], -1
; CHECK-NEXT: [[S_12:%.*]] = select i1 [[CMP_12]], i8 [[L_12]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_12]], i8* [[GEP_12]], align 2
; CHECK-NEXT: [[GEP_13:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 13
; CHECK-NEXT: [[L_13:%.*]] = load i8, i8* [[GEP_13]], align 1
; CHECK-NEXT: [[CMP_13:%.*]] = icmp ugt i8 [[L_13]], -1
; CHECK-NEXT: [[S_13:%.*]] = select i1 [[CMP_13]], i8 [[L_13]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_13]], i8* [[GEP_13]], align 2
; CHECK-NEXT: [[GEP_14:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 14
; CHECK-NEXT: [[L_14:%.*]] = load i8, i8* [[GEP_14]], align 1
; CHECK-NEXT: [[CMP_14:%.*]] = icmp ugt i8 [[L_14]], -1
; CHECK-NEXT: [[S_14:%.*]] = select i1 [[CMP_14]], i8 [[L_14]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_14]], i8* [[GEP_14]], align 2
; CHECK-NEXT: [[GEP_15:%.*]] = getelementptr inbounds i8, i8* [[PTR]], i8 15
; CHECK-NEXT: [[L_15:%.*]] = load i8, i8* [[GEP_15]], align 1
; CHECK-NEXT: [[CMP_15:%.*]] = icmp ugt i8 [[L_15]], -1
; CHECK-NEXT: [[S_15:%.*]] = select i1 [[CMP_15]], i8 [[L_15]], i8 [[X]]
; CHECK-NEXT: store i8 [[S_15]], i8* [[GEP_15]], align 2
; CHECK-NEXT: ret void
;
entry:
%l.0 = load i8, i8* %ptr
%cmp.0 = icmp ugt i8 %l.0, 16383
%s.0 = select i1 %cmp.0, i8 %l.0, i8 %x
store i8 %s.0, i8* %ptr, align 2
%gep.1 = getelementptr inbounds i8, i8* %ptr, i8 1
%l.1 = load i8, i8* %gep.1
%cmp.1 = icmp ugt i8 %l.1, 16383
%s.1 = select i1 %cmp.1, i8 %l.1, i8 %x
store i8 %s.1, i8* %gep.1, align 2
%gep.2 = getelementptr inbounds i8, i8* %ptr, i8 2
%l.2 = load i8, i8* %gep.2
%cmp.2 = icmp ugt i8 %l.2, 16383
%s.2 = select i1 %cmp.2, i8 %l.2, i8 %x
store i8 %s.2, i8* %gep.2, align 2
%gep.3 = getelementptr inbounds i8, i8* %ptr, i8 3
%l.3 = load i8, i8* %gep.3
%cmp.3 = icmp ugt i8 %l.3, 16383
%s.3 = select i1 %cmp.3, i8 %l.3, i8 %x
store i8 %s.3, i8* %gep.3, align 2
%gep.4 = getelementptr inbounds i8, i8* %ptr, i8 4
%l.4 = load i8, i8* %gep.4
%cmp.4 = icmp ugt i8 %l.4, 16383
%s.4 = select i1 %cmp.4, i8 %l.4, i8 %x
store i8 %s.4, i8* %gep.4, align 2
%gep.5 = getelementptr inbounds i8, i8* %ptr, i8 5
%l.5 = load i8, i8* %gep.5
%cmp.5 = icmp ugt i8 %l.5, 16383
%s.5 = select i1 %cmp.5, i8 %l.5, i8 %x
store i8 %s.5, i8* %gep.5, align 2
%gep.6 = getelementptr inbounds i8, i8* %ptr, i8 6
%l.6 = load i8, i8* %gep.6
%cmp.6 = icmp ugt i8 %l.6, 16383
%s.6 = select i1 %cmp.6, i8 %l.6, i8 %x
store i8 %s.6, i8* %gep.6, align 2
%gep.7 = getelementptr inbounds i8, i8* %ptr, i8 7
%l.7 = load i8, i8* %gep.7
%cmp.7 = icmp ugt i8 %l.7, 16383
%s.7 = select i1 %cmp.7, i8 %l.7, i8 %x
store i8 %s.7, i8* %gep.7, align 2
%gep.8 = getelementptr inbounds i8, i8* %ptr, i8 8
%l.8 = load i8, i8* %gep.8
%cmp.8 = icmp ugt i8 %l.8, 16383
%s.8 = select i1 %cmp.8, i8 %l.0, i8 %x
store i8 %s.0, i8* %gep.8, align 2
%gep.9 = getelementptr inbounds i8, i8* %ptr, i8 9
%l.9 = load i8, i8* %gep.9
%cmp.9 = icmp ugt i8 %l.9, 16383
%s.9 = select i1 %cmp.9, i8 %l.9, i8 %x
store i8 %s.9, i8* %gep.9, align 2
%gep.10 = getelementptr inbounds i8, i8* %ptr, i8 10
%l.10 = load i8, i8* %gep.10
%cmp.10 = icmp ugt i8 %l.10, 16383
%s.10 = select i1 %cmp.10, i8 %l.10, i8 %x
store i8 %s.10, i8* %gep.10, align 2
%gep.11 = getelementptr inbounds i8, i8* %ptr, i8 11
%l.11 = load i8, i8* %gep.11
%cmp.11 = icmp ugt i8 %l.11, 16383
%s.11 = select i1 %cmp.11, i8 %l.11, i8 %x
store i8 %s.11, i8* %gep.11, align 2
%gep.12 = getelementptr inbounds i8, i8* %ptr, i8 12
%l.12 = load i8, i8* %gep.12
%cmp.12 = icmp ugt i8 %l.12, 16383
%s.12 = select i1 %cmp.12, i8 %l.12, i8 %x
store i8 %s.12, i8* %gep.12, align 2
%gep.13 = getelementptr inbounds i8, i8* %ptr, i8 13
%l.13 = load i8, i8* %gep.13
%cmp.13 = icmp ugt i8 %l.13, 16383
%s.13 = select i1 %cmp.13, i8 %l.13, i8 %x
store i8 %s.13, i8* %gep.13, align 2
%gep.14 = getelementptr inbounds i8, i8* %ptr, i8 14
%l.14 = load i8, i8* %gep.14
%cmp.14 = icmp ugt i8 %l.14, 16383
%s.14 = select i1 %cmp.14, i8 %l.14, i8 %x
store i8 %s.14, i8* %gep.14, align 2
%gep.15 = getelementptr inbounds i8, i8* %ptr, i8 15
%l.15 = load i8, i8* %gep.15
%cmp.15 = icmp ugt i8 %l.15, 16383
%s.15 = select i1 %cmp.15, i8 %l.15, i8 %x
store i8 %s.15, i8* %gep.15, align 2
ret void
}
define void @select_uniform_ugt_4xi16(i16* %ptr, i16 %x) {
; CHECK-LABEL: @select_uniform_ugt_4xi16(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[GEP_1:%.*]] = getelementptr inbounds i16, i16* [[PTR:%.*]], i16 1
; CHECK-NEXT: [[GEP_2:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 2
; CHECK-NEXT: [[GEP_3:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 3
; CHECK-NEXT: [[TMP0:%.*]] = bitcast i16* [[PTR]] to <4 x i16>*
; CHECK-NEXT: [[TMP1:%.*]] = load <4 x i16>, <4 x i16>* [[TMP0]], align 2
; CHECK-NEXT: [[TMP2:%.*]] = icmp ugt <4 x i16> [[TMP1]], <i16 16383, i16 16383, i16 16383, i16 16383>
; CHECK-NEXT: [[TMP3:%.*]] = insertelement <4 x i16> poison, i16 [[X:%.*]], i32 0
; CHECK-NEXT: [[TMP4:%.*]] = insertelement <4 x i16> [[TMP3]], i16 [[X]], i32 1
; CHECK-NEXT: [[TMP5:%.*]] = insertelement <4 x i16> [[TMP4]], i16 [[X]], i32 2
; CHECK-NEXT: [[TMP6:%.*]] = insertelement <4 x i16> [[TMP5]], i16 [[X]], i32 3
; CHECK-NEXT: [[TMP7:%.*]] = select <4 x i1> [[TMP2]], <4 x i16> [[TMP1]], <4 x i16> [[TMP6]]
; CHECK-NEXT: [[TMP8:%.*]] = bitcast i16* [[PTR]] to <4 x i16>*
; CHECK-NEXT: store <4 x i16> [[TMP7]], <4 x i16>* [[TMP8]], align 2
; CHECK-NEXT: ret void
;
entry:
%l.0 = load i16, i16* %ptr
%cmp.0 = icmp ugt i16 %l.0, 16383
%s.0 = select i1 %cmp.0, i16 %l.0, i16 %x
store i16 %s.0, i16* %ptr, align 2
%gep.1 = getelementptr inbounds i16, i16* %ptr, i16 1
%l.1 = load i16, i16* %gep.1
%cmp.1 = icmp ugt i16 %l.1, 16383
%s.1 = select i1 %cmp.1, i16 %l.1, i16 %x
store i16 %s.1, i16* %gep.1, align 2
%gep.2 = getelementptr inbounds i16, i16* %ptr, i16 2
%l.2 = load i16, i16* %gep.2
%cmp.2 = icmp ugt i16 %l.2, 16383
%s.2 = select i1 %cmp.2, i16 %l.2, i16 %x
store i16 %s.2, i16* %gep.2, align 2
%gep.3 = getelementptr inbounds i16, i16* %ptr, i16 3
%l.3 = load i16, i16* %gep.3
%cmp.3 = icmp ugt i16 %l.3, 16383
%s.3 = select i1 %cmp.3, i16 %l.3, i16 %x
store i16 %s.3, i16* %gep.3, align 2
ret void
}
define void @select_uniform_ult_8xi16(i16* %ptr, i16 %x) {
; CHECK-LABEL: @select_uniform_ult_8xi16(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[GEP_1:%.*]] = getelementptr inbounds i16, i16* [[PTR:%.*]], i16 1
; CHECK-NEXT: [[GEP_2:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 2
; CHECK-NEXT: [[GEP_3:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 3
; CHECK-NEXT: [[GEP_4:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 4
; CHECK-NEXT: [[GEP_5:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 5
; CHECK-NEXT: [[GEP_6:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 6
; CHECK-NEXT: [[GEP_7:%.*]] = getelementptr inbounds i16, i16* [[PTR]], i16 7
; CHECK-NEXT: [[TMP0:%.*]] = bitcast i16* [[PTR]] to <8 x i16>*
; CHECK-NEXT: [[TMP1:%.*]] = load <8 x i16>, <8 x i16>* [[TMP0]], align 2
; CHECK-NEXT: [[TMP2:%.*]] = icmp ult <8 x i16> [[TMP1]], <i16 16383, i16 16383, i16 16383, i16 16383, i16 16383, i16 16383, i16 16383, i16 16383>
; CHECK-NEXT: [[TMP3:%.*]] = insertelement <8 x i16> poison, i16 [[X:%.*]], i32 0
; CHECK-NEXT: [[TMP4:%.*]] = insertelement <8 x i16> [[TMP3]], i16 [[X]], i32 1
; CHECK-NEXT: [[TMP5:%.*]] = insertelement <8 x i16> [[TMP4]], i16 [[X]], i32 2
; CHECK-NEXT: [[TMP6:%.*]] = insertelement <8 x i16> [[TMP5]], i16 [[X]], i32 3
; CHECK-NEXT: [[TMP7:%.*]] = insertelement <8 x i16> [[TMP6]], i16 [[X]], i32 4
; CHECK-NEXT: [[TMP8:%.*]] = insertelement <8 x i16> [[TMP7]], i16 [[X]], i32 5
; CHECK-NEXT: [[TMP9:%.*]] = insertelement <8 x i16> [[TMP8]], i16 [[X]], i32 6
; CHECK-NEXT: [[TMP10:%.*]] = insertelement <8 x i16> [[TMP9]], i16 [[X]], i32 7
; CHECK-NEXT: [[TMP11:%.*]] = select <8 x i1> [[TMP2]], <8 x i16> [[TMP1]], <8 x i16> [[TMP10]]
; CHECK-NEXT: [[TMP12:%.*]] = bitcast i16* [[PTR]] to <8 x i16>*
; CHECK-NEXT: store <8 x i16> [[TMP11]], <8 x i16>* [[TMP12]], align 2
; CHECK-NEXT: ret void
;
entry:
%l.0 = load i16, i16* %ptr
%cmp.0 = icmp ult i16 %l.0, 16383
%s.0 = select i1 %cmp.0, i16 %l.0, i16 %x
store i16 %s.0, i16* %ptr, align 2
%gep.1 = getelementptr inbounds i16, i16* %ptr, i16 1
%l.1 = load i16, i16* %gep.1
%cmp.1 = icmp ult i16 %l.1, 16383
%s.1 = select i1 %cmp.1, i16 %l.1, i16 %x
store i16 %s.1, i16* %gep.1, align 2
%gep.2 = getelementptr inbounds i16, i16* %ptr, i16 2
%l.2 = load i16, i16* %gep.2
%cmp.2 = icmp ult i16 %l.2, 16383
%s.2 = select i1 %cmp.2, i16 %l.2, i16 %x
store i16 %s.2, i16* %gep.2, align 2
%gep.3 = getelementptr inbounds i16, i16* %ptr, i16 3
%l.3 = load i16, i16* %gep.3
%cmp.3 = icmp ult i16 %l.3, 16383
%s.3 = select i1 %cmp.3, i16 %l.3, i16 %x
store i16 %s.3, i16* %gep.3, align 2
%gep.4 = getelementptr inbounds i16, i16* %ptr, i16 4
%l.4 = load i16, i16* %gep.4
%cmp.4 = icmp ult i16 %l.4, 16383
%s.4 = select i1 %cmp.4, i16 %l.4, i16 %x
store i16 %s.4, i16* %gep.4, align 2
%gep.5 = getelementptr inbounds i16, i16* %ptr, i16 5
%l.5 = load i16, i16* %gep.5
%cmp.5 = icmp ult i16 %l.5, 16383
%s.5 = select i1 %cmp.5, i16 %l.5, i16 %x
store i16 %s.5, i16* %gep.5, align 2
%gep.6 = getelementptr inbounds i16, i16* %ptr, i16 6
%l.6 = load i16, i16* %gep.6
%cmp.6 = icmp ult i16 %l.6, 16383
%s.6 = select i1 %cmp.6, i16 %l.6, i16 %x
store i16 %s.6, i16* %gep.6, align 2
%gep.7 = getelementptr inbounds i16, i16* %ptr, i16 7
%l.7 = load i16, i16* %gep.7
%cmp.7 = icmp ult i16 %l.7, 16383
%s.7 = select i1 %cmp.7, i16 %l.7, i16 %x
store i16 %s.7, i16* %gep.7, align 2
ret void
}
define void @select_uniform_eq_2xi32(i32* %ptr, i32 %x) {
; CHECK-LABEL: @select_uniform_eq_2xi32(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[GEP_1:%.*]] = getelementptr inbounds i32, i32* [[PTR:%.*]], i32 1
; CHECK-NEXT: [[TMP0:%.*]] = bitcast i32* [[PTR]] to <2 x i32>*
; CHECK-NEXT: [[TMP1:%.*]] = load <2 x i32>, <2 x i32>* [[TMP0]], align 4
; CHECK-NEXT: [[TMP2:%.*]] = icmp eq <2 x i32> [[TMP1]], <i32 16383, i32 16383>
; CHECK-NEXT: [[TMP3:%.*]] = insertelement <2 x i32> poison, i32 [[X:%.*]], i32 0
; CHECK-NEXT: [[TMP4:%.*]] = insertelement <2 x i32> [[TMP3]], i32 [[X]], i32 1
; CHECK-NEXT: [[TMP5:%.*]] = select <2 x i1> [[TMP2]], <2 x i32> [[TMP1]], <2 x i32> [[TMP4]]
; CHECK-NEXT: [[TMP6:%.*]] = bitcast i32* [[PTR]] to <2 x i32>*
; CHECK-NEXT: store <2 x i32> [[TMP5]], <2 x i32>* [[TMP6]], align 2
; CHECK-NEXT: ret void
;
entry:
%l.0 = load i32, i32* %ptr
%cmp.0 = icmp eq i32 %l.0, 16383
%s.0 = select i1 %cmp.0, i32 %l.0, i32 %x
store i32 %s.0, i32* %ptr, align 2
%gep.1 = getelementptr inbounds i32, i32* %ptr, i32 1
%l.1 = load i32, i32* %gep.1
%cmp.1 = icmp eq i32 %l.1, 16383
%s.1 = select i1 %cmp.1, i32 %l.1, i32 %x
store i32 %s.1, i32* %gep.1, align 2
ret void
}
define void @select_uniform_eq_4xi32(i32* %ptr, i32 %x) {
; CHECK-LABEL: @select_uniform_eq_4xi32(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[GEP_1:%.*]] = getelementptr inbounds i32, i32* [[PTR:%.*]], i32 1
; CHECK-NEXT: [[GEP_2:%.*]] = getelementptr inbounds i32, i32* [[PTR]], i32 2
; CHECK-NEXT: [[GEP_3:%.*]] = getelementptr inbounds i32, i32* [[PTR]], i32 3
; CHECK-NEXT: [[TMP0:%.*]] = bitcast i32* [[PTR]] to <4 x i32>*
; CHECK-NEXT: [[TMP1:%.*]] = load <4 x i32>, <4 x i32>* [[TMP0]], align 4
; CHECK-NEXT: [[TMP2:%.*]] = icmp eq <4 x i32> [[TMP1]], <i32 16383, i32 16383, i32 16383, i32 16383>
; CHECK-NEXT: [[TMP3:%.*]] = insertelement <4 x i32> poison, i32 [[X:%.*]], i32 0
; CHECK-NEXT: [[TMP4:%.*]] = insertelement <4 x i32> [[TMP3]], i32 [[X]], i32 1
; CHECK-NEXT: [[TMP5:%.*]] = insertelement <4 x i32> [[TMP4]], i32 [[X]], i32 2
; CHECK-NEXT: [[TMP6:%.*]] = insertelement <4 x i32> [[TMP5]], i32 [[X]], i32 3
; CHECK-NEXT: [[TMP7:%.*]] = select <4 x i1> [[TMP2]], <4 x i32> [[TMP1]], <4 x i32> [[TMP6]]
; CHECK-NEXT: [[TMP8:%.*]] = bitcast i32* [[PTR]] to <4 x i32>*
; CHECK-NEXT: store <4 x i32> [[TMP7]], <4 x i32>* [[TMP8]], align 2
; CHECK-NEXT: ret void
;
entry:
%l.0 = load i32, i32* %ptr
%cmp.0 = icmp eq i32 %l.0, 16383
%s.0 = select i1 %cmp.0, i32 %l.0, i32 %x
store i32 %s.0, i32* %ptr, align 2
%gep.1 = getelementptr inbounds i32, i32* %ptr, i32 1
%l.1 = load i32, i32* %gep.1
%cmp.1 = icmp eq i32 %l.1, 16383
%s.1 = select i1 %cmp.1, i32 %l.1, i32 %x
store i32 %s.1, i32* %gep.1, align 2
%gep.2 = getelementptr inbounds i32, i32* %ptr, i32 2
%l.2 = load i32, i32* %gep.2
%cmp.2 = icmp eq i32 %l.2, 16383
%s.2 = select i1 %cmp.2, i32 %l.2, i32 %x
store i32 %s.2, i32* %gep.2, align 2
%gep.3 = getelementptr inbounds i32, i32* %ptr, i32 3
%l.3 = load i32, i32* %gep.3
%cmp.3 = icmp eq i32 %l.3, 16383
%s.3 = select i1 %cmp.3, i32 %l.3, i32 %x
store i32 %s.3, i32* %gep.3, align 2
ret void
}
define void @select_uniform_ne_2xi64(i64* %ptr, i64 %x) {
; CHECK-LABEL: @select_uniform_ne_2xi64(
; CHECK-NEXT: entry:
; CHECK-NEXT: [[GEP_1:%.*]] = getelementptr inbounds i64, i64* [[PTR:%.*]], i64 1
; CHECK-NEXT: [[TMP0:%.*]] = bitcast i64* [[PTR]] to <2 x i64>*
; CHECK-NEXT: [[TMP1:%.*]] = load <2 x i64>, <2 x i64>* [[TMP0]], align 8
; CHECK-NEXT: [[TMP2:%.*]] = icmp ne <2 x i64> [[TMP1]], <i64 16383, i64 16383>
; CHECK-NEXT: [[TMP3:%.*]] = insertelement <2 x i64> poison, i64 [[X:%.*]], i32 0
; CHECK-NEXT: [[TMP4:%.*]] = insertelement <2 x i64> [[TMP3]], i64 [[X]], i32 1
; CHECK-NEXT: [[TMP5:%.*]] = select <2 x i1> [[TMP2]], <2 x i64> [[TMP1]], <2 x i64> [[TMP4]]
; CHECK-NEXT: [[TMP6:%.*]] = bitcast i64* [[PTR]] to <2 x i64>*
; CHECK-NEXT: store <2 x i64> [[TMP5]], <2 x i64>* [[TMP6]], align 2
; CHECK-NEXT: ret void
;
entry:
%l.0 = load i64, i64* %ptr
%cmp.0 = icmp ne i64 %l.0, 16383
%s.0 = select i1 %cmp.0, i64 %l.0, i64 %x
store i64 %s.0, i64* %ptr, align 2
%gep.1 = getelementptr inbounds i64, i64* %ptr, i64 1
%l.1 = load i64, i64* %gep.1
%cmp.1 = icmp ne i64 %l.1, 16383
%s.1 = select i1 %cmp.1, i64 %l.1, i64 %x
store i64 %s.1, i64* %gep.1, align 2
ret void
}