blob: f7811aba5ab5f17983aee0b2e7366ec8f99c4f03 [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
; RUN: opt -S -passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu -slp-revec -slp-max-reg-size=1024 -slp-threshold=-100 < %s | FileCheck %s
define <4 x i16> @test() {
; CHECK-LABEL: define <4 x i16> @test() {
; CHECK-NEXT: [[ENTRY:.*:]]
; CHECK-NEXT: [[TMP0:%.*]] = shufflevector <4 x i16> zeroinitializer, <4 x i16> poison, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3>
; CHECK-NEXT: [[TMP1:%.*]] = add <16 x i16> [[TMP0]], zeroinitializer
; CHECK-NEXT: [[RDX_OP:%.*]] = or <16 x i16> zeroinitializer, [[TMP1]]
; CHECK-NEXT: [[TMP36:%.*]] = shufflevector <16 x i16> [[RDX_OP]], <16 x i16> poison, <4 x i32> <i32 0, i32 4, i32 8, i32 12>
; CHECK-NEXT: [[TMP37:%.*]] = call i16 @llvm.vector.reduce.or.v4i16(<4 x i16> [[TMP36]])
; CHECK-NEXT: [[TMP38:%.*]] = insertelement <4 x i16> poison, i16 [[TMP37]], i64 0
; CHECK-NEXT: [[TMP39:%.*]] = shufflevector <16 x i16> [[RDX_OP]], <16 x i16> poison, <4 x i32> <i32 1, i32 5, i32 9, i32 13>
; CHECK-NEXT: [[TMP40:%.*]] = call i16 @llvm.vector.reduce.or.v4i16(<4 x i16> [[TMP39]])
; CHECK-NEXT: [[TMP41:%.*]] = insertelement <4 x i16> [[TMP38]], i16 [[TMP40]], i64 1
; CHECK-NEXT: [[TMP42:%.*]] = shufflevector <16 x i16> [[RDX_OP]], <16 x i16> poison, <4 x i32> <i32 2, i32 6, i32 10, i32 14>
; CHECK-NEXT: [[TMP43:%.*]] = call i16 @llvm.vector.reduce.or.v4i16(<4 x i16> [[TMP42]])
; CHECK-NEXT: [[TMP44:%.*]] = insertelement <4 x i16> [[TMP41]], i16 [[TMP43]], i64 2
; CHECK-NEXT: [[TMP45:%.*]] = shufflevector <16 x i16> [[RDX_OP]], <16 x i16> poison, <4 x i32> <i32 3, i32 7, i32 11, i32 15>
; CHECK-NEXT: [[TMP46:%.*]] = call i16 @llvm.vector.reduce.or.v4i16(<4 x i16> [[TMP45]])
; CHECK-NEXT: [[TMP47:%.*]] = insertelement <4 x i16> [[TMP44]], i16 [[TMP46]], i64 3
; CHECK-NEXT: [[OP_RDX9:%.*]] = or <4 x i16> [[TMP47]], zeroinitializer
; CHECK-NEXT: ret <4 x i16> [[OP_RDX9]]
;
entry:
%subi = add <4 x i16> zeroinitializer, zeroinitializer
%sub40.i = add <4 x i16> %subi, zeroinitializer
%sub41.i = add <4 x i16> %subi, zeroinitializer
%sub42.i = add <4 x i16> %subi, zeroinitializer
%sub43.i = add <4 x i16> %subi, zeroinitializer
%sub44.i = add <4 x i16> %subi, zeroinitializer
%sub45.i = add <4 x i16> %subi, zeroinitializer
%sub46.i = add <4 x i16> zeroinitializer, zeroinitializer
%sub47.i = add <4 x i16> zeroinitializer, zeroinitializer
%sub48.i = add <4 x i16> zeroinitializer, zeroinitializer
%sub49.i = add <4 x i16> zeroinitializer, zeroinitializer
%or40.i = or <4 x i16> %sub40.i, %sub41.i
%or41.i = or <4 x i16> %or40.i, %sub42.i
%or42.i = or <4 x i16> %or41.i, %sub43.i
%or43.i = or <4 x i16> %or42.i, %sub44.i
%or44.i = or <4 x i16> %or43.i, %sub45.i
%or45.i = or <4 x i16> %or44.i, %sub46.i
%or46.i = or <4 x i16> %or45.i, %sub47.i
%or47.i = or <4 x i16> %or46.i, %sub48.i
%or48.i = or <4 x i16> %or47.i, %sub49.i
%or50.i = or <4 x i16> %or48.i, %subi
%subii = add <4 x i16> zeroinitializer, zeroinitializer
%subi16.i = add <4 x i16> %subii, zeroinitializer
%subi17.i = add <4 x i16> %subii, zeroinitializer
%0 = or <4 x i16> %subi16.i, %subi17.i
%1 = or <4 x i16> %0, %or50.i
ret <4 x i16> %1
}