| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 6 |
| ; RUN: opt -passes=slp-vectorizer -S -mtriple=riscv64 -mattr=+m,+v -riscv-v-vector-bits-min=-1 -riscv-v-slp-max-vf=0 < %s | FileCheck %s |
| |
| ; @test: four i16 values are loaded from consecutive slots of %p, but only |
| ; %e0 (offset 0) and %e2 (offset 2) feed the arithmetic. Lane 0 stores |
| ; %e0 + %e0 and lanes 1-3 all store %e2 + %e2 into four consecutive i16 slots |
| ; of %dest. |
| ; The assertions below expect a single <3 x i16> masked load from %p with mask |
| ; <true, false, true>, a shuffle to lanes <0, 2, 2, 2>, one <4 x i16> add and |
| ; one <4 x i16> store. The scalar loads of %e1 and %e3 are expected to remain. |
| define void @test(ptr %dest, ptr %p) { |
| ; CHECK-LABEL: define void @test( |
| ; CHECK-SAME: ptr [[DEST:%.*]], ptr [[P:%.*]]) #[[ATTR0:[0-9]+]] { |
| ; CHECK-NEXT: [[ENTRY:.*:]] |
| ; CHECK-NEXT: [[INC0:%.*]] = getelementptr inbounds i16, ptr [[P]], i64 1 |
| ; CHECK-NEXT: [[INC2:%.*]] = getelementptr inbounds i16, ptr [[P]], i64 3 |
| ; CHECK-NEXT: [[E1:%.*]] = load i16, ptr [[INC0]], align 2 |
| ; CHECK-NEXT: [[E3:%.*]] = load i16, ptr [[INC2]], align 2 |
| ; CHECK-NEXT: [[TMP0:%.*]] = call <3 x i16> @llvm.masked.load.v3i16.p0(ptr align 4 [[P]], <3 x i1> <i1 true, i1 false, i1 true>, <3 x i16> poison) |
| ; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <3 x i16> [[TMP0]], <3 x i16> poison, <2 x i32> <i32 0, i32 2> |
| ; CHECK-NEXT: [[TMP2:%.*]] = shufflevector <3 x i16> [[TMP0]], <3 x i16> poison, <4 x i32> <i32 0, i32 2, i32 2, i32 2> |
| ; CHECK-NEXT: [[TMP3:%.*]] = add <4 x i16> [[TMP2]], [[TMP2]] |
| ; CHECK-NEXT: store <4 x i16> [[TMP3]], ptr [[DEST]], align 4 |
| ; CHECK-NEXT: ret void |
| ; |
| entry: |
| ; Addresses of the i16 elements at offsets 1, 2 and 3 from %p. |
| %inc0 = getelementptr inbounds i16, ptr %p, i64 1 |
| %inc1 = getelementptr inbounds i16, ptr %p, i64 2 |
| %inc2 = getelementptr inbounds i16, ptr %p, i64 3 |
| ; Four consecutive scalar loads; %e1 and %e3 have no users in this function. |
| %e0 = load i16, ptr %p, align 4 |
| %e1 = load i16, ptr %inc0, align 2 |
| %e2 = load i16, ptr %inc1, align 2 |
| %e3 = load i16, ptr %inc2, align 2 |

| ; Lane 0 doubles %e0; lanes 1-3 are three identical doublings of %e2. |
| %a0 = add i16 %e0, %e0 |
| %a1 = add i16 %e2, %e2 |
| %a2 = add i16 %e2, %e2 |
| %a3 = add i16 %e2, %e2 |

| ; Addresses of the i16 elements at offsets 1, 2 and 3 from %dest. |
| %inc4 = getelementptr inbounds i16, ptr %dest, i64 1 |
| %inc5 = getelementptr inbounds i16, ptr %dest, i64 2 |
| %inc6 = getelementptr inbounds i16, ptr %dest, i64 3 |

| ; Four consecutive scalar stores to %dest[0..3]. |
| store i16 %a0, ptr %dest, align 4 |
| store i16 %a1, ptr %inc4, align 2 |
| store i16 %a2, ptr %inc5, align 2 |
| store i16 %a3, ptr %inc6, align 2 |
| ret void |
| } |
| |
| ; @test1: four i16 values are loaded from consecutive slots of %p, but only |
| ; %e0 and %e2 are used. Lane 0 stores %e0 + %e0 (an add), while lanes 1-3 |
| ; store %e2 shifted left by 1 (a shl), into four consecutive i16 slots of |
| ; %dest. |
| ; The assertions below expect the output to stay fully scalar: every load, |
| ; add/shl and store appears unchanged and no vector instruction is emitted. |
| ; NOTE(review): shl by 1 computes the same value as x + x, so this presumably |
| ; exercises mixed add/shl lanes in one store chain - confirm against the |
| ; commit that introduced the test. |
| define void @test1(ptr %dest, ptr %p) { |
| ; CHECK-LABEL: define void @test1( |
| ; CHECK-SAME: ptr [[DEST:%.*]], ptr [[P:%.*]]) #[[ATTR0]] { |
| ; CHECK-NEXT: [[ENTRY:.*:]] |
| ; CHECK-NEXT: [[INC0:%.*]] = getelementptr inbounds i16, ptr [[P]], i64 1 |
| ; CHECK-NEXT: [[INC1:%.*]] = getelementptr inbounds i16, ptr [[P]], i64 2 |
| ; CHECK-NEXT: [[INC2:%.*]] = getelementptr inbounds i16, ptr [[P]], i64 3 |
| ; CHECK-NEXT: [[E0:%.*]] = load i16, ptr [[P]], align 4 |
| ; CHECK-NEXT: [[E1:%.*]] = load i16, ptr [[INC0]], align 2 |
| ; CHECK-NEXT: [[E2:%.*]] = load i16, ptr [[INC1]], align 2 |
| ; CHECK-NEXT: [[E3:%.*]] = load i16, ptr [[INC2]], align 2 |
| ; CHECK-NEXT: [[A0:%.*]] = add i16 [[E0]], [[E0]] |
| ; CHECK-NEXT: [[A1:%.*]] = shl i16 [[E2]], 1 |
| ; CHECK-NEXT: [[A2:%.*]] = shl i16 [[E2]], 1 |
| ; CHECK-NEXT: [[A3:%.*]] = shl i16 [[E2]], 1 |
| ; CHECK-NEXT: [[INC4:%.*]] = getelementptr inbounds i16, ptr [[DEST]], i64 1 |
| ; CHECK-NEXT: [[INC5:%.*]] = getelementptr inbounds i16, ptr [[DEST]], i64 2 |
| ; CHECK-NEXT: [[INC6:%.*]] = getelementptr inbounds i16, ptr [[DEST]], i64 3 |
| ; CHECK-NEXT: store i16 [[A0]], ptr [[DEST]], align 4 |
| ; CHECK-NEXT: store i16 [[A1]], ptr [[INC4]], align 2 |
| ; CHECK-NEXT: store i16 [[A2]], ptr [[INC5]], align 2 |
| ; CHECK-NEXT: store i16 [[A3]], ptr [[INC6]], align 2 |
| ; CHECK-NEXT: ret void |
| ; |
| entry: |
| ; Addresses of the i16 elements at offsets 1, 2 and 3 from %p. |
| %inc0 = getelementptr inbounds i16, ptr %p, i64 1 |
| %inc1 = getelementptr inbounds i16, ptr %p, i64 2 |
| %inc2 = getelementptr inbounds i16, ptr %p, i64 3 |
| ; Four consecutive scalar loads; %e1 and %e3 have no users in this function. |
| %e0 = load i16, ptr %p, align 4 |
| %e1 = load i16, ptr %inc0, align 2 |
| %e2 = load i16, ptr %inc1, align 2 |
| %e3 = load i16, ptr %inc2, align 2 |

| ; Lane 0 uses add on %e0; lanes 1-3 use shl by 1 on %e2 (different opcode). |
| %a0 = add i16 %e0, %e0 |
| %a1 = shl i16 %e2, 1 |
| %a2 = shl i16 %e2, 1 |
| %a3 = shl i16 %e2, 1 |

| ; Addresses of the i16 elements at offsets 1, 2 and 3 from %dest. |
| %inc4 = getelementptr inbounds i16, ptr %dest, i64 1 |
| %inc5 = getelementptr inbounds i16, ptr %dest, i64 2 |
| %inc6 = getelementptr inbounds i16, ptr %dest, i64 3 |

| ; Four consecutive scalar stores to %dest[0..3]. |
| store i16 %a0, ptr %dest, align 4 |
| store i16 %a1, ptr %inc4, align 2 |
| store i16 %a2, ptr %inc5, align 2 |
| store i16 %a3, ptr %inc6, align 2 |
| ret void |
| } |