| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2 |
| ; Test vector intrinsics added with z15. |
| ; |
| ; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z15 | FileCheck %s |
| |
| ; VSLD / VSRD: two <16 x i8> operands plus an i32 operand, returning <16 x i8>. |
| declare <16 x i8> @llvm.s390.vsld(<16 x i8>, <16 x i8>, i32) |
| declare <16 x i8> @llvm.s390.vsrd(<16 x i8>, <16 x i8>, i32) |
| |
| ; VSTRS* / VSTRSZ*: three vector operands, returning a { <16 x i8>, i32 } pair. |
| ; The first two operands vary by element width (b/h/f); the third is always |
| ; <16 x i8>. |
| declare { <16 x i8>, i32 } @llvm.s390.vstrsb(<16 x i8>, <16 x i8>, <16 x i8>) |
| declare { <16 x i8>, i32 } @llvm.s390.vstrsh(<8 x i16>, <8 x i16>, <16 x i8>) |
| declare { <16 x i8>, i32 } @llvm.s390.vstrsf(<4 x i32>, <4 x i32>, <16 x i8>) |
| declare { <16 x i8>, i32 } @llvm.s390.vstrszb(<16 x i8>, <16 x i8>, <16 x i8>) |
| declare { <16 x i8>, i32 } @llvm.s390.vstrszh(<8 x i16>, <8 x i16>, <16 x i8>) |
| declare { <16 x i8>, i32 } @llvm.s390.vstrszf(<4 x i32>, <4 x i32>, <16 x i8>) |
| |
| |
| ; VSLD with the minimum useful value. |
| define <16 x i8> @test_vsld_1(<16 x i8> %a, <16 x i8> %b) { |
| ; CHECK-LABEL: test_vsld_1: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: vsld %v24, %v24, %v26, 1 |
| ; CHECK-NEXT: br %r14 |
|   ; The i32 operand 1 is expected to show up as the last operand of the |
|   ; emitted vsld instruction. |
|   %shifted = call <16 x i8> @llvm.s390.vsld(<16 x i8> %a, <16 x i8> %b, i32 1) |
|   ret <16 x i8> %shifted |
| } |
| |
| ; VSLD with the maximum value. |
| define <16 x i8> @test_vsld_7(<16 x i8> %a, <16 x i8> %b) { |
| ; CHECK-LABEL: test_vsld_7: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: vsld %v24, %v24, %v26, 7 |
| ; CHECK-NEXT: br %r14 |
|   ; Same call shape as test_vsld_1, with the i32 operand set to 7. |
|   %shifted = call <16 x i8> @llvm.s390.vsld(<16 x i8> %a, <16 x i8> %b, i32 7) |
|   ret <16 x i8> %shifted |
| } |
| |
| ; VSRD with the minimum useful value. |
| define <16 x i8> @test_vsrd_1(<16 x i8> %a, <16 x i8> %b) { |
| ; CHECK-LABEL: test_vsrd_1: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: vsrd %v24, %v24, %v26, 1 |
| ; CHECK-NEXT: br %r14 |
|   ; The i32 operand 1 is expected to show up as the last operand of the |
|   ; emitted vsrd instruction. |
|   %shifted = call <16 x i8> @llvm.s390.vsrd(<16 x i8> %a, <16 x i8> %b, i32 1) |
|   ret <16 x i8> %shifted |
| } |
| |
| ; VSRD with the maximum value. |
| define <16 x i8> @test_vsrd_7(<16 x i8> %a, <16 x i8> %b) { |
| ; CHECK-LABEL: test_vsrd_7: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: vsrd %v24, %v24, %v26, 7 |
| ; CHECK-NEXT: br %r14 |
|   ; Same call shape as test_vsrd_1, with the i32 operand set to 7. |
|   %shifted = call <16 x i8> @llvm.s390.vsrd(<16 x i8> %a, <16 x i8> %b, i32 7) |
|   ret <16 x i8> %shifted |
| } |
| |
| |
| ; VSTRSB. |
| define <16 x i8> @test_vstrsb(<16 x i8> %a, <16 x i8> %b, <16 x i8> %c, ptr %ccptr) { |
| ; CHECK-LABEL: test_vstrsb: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: vstrsb %v24, %v24, %v26, %v28, 0 |
| ; CHECK-NEXT: ipm %r0 |
| ; CHECK-NEXT: srl %r0, 28 |
| ; CHECK-NEXT: st %r0, 0(%r2) |
| ; CHECK-NEXT: br %r14 |
|   ; Call the intrinsic, then split its { vector, i32 } result: the i32 member |
|   ; is stored through %ccptr and the vector member is returned. |
|   %pair = call { <16 x i8>, i32 } @llvm.s390.vstrsb(<16 x i8> %a, <16 x i8> %b, <16 x i8> %c) |
|   %vec = extractvalue { <16 x i8>, i32 } %pair, 0 |
|   %status = extractvalue { <16 x i8>, i32 } %pair, 1 |
|   store i32 %status, ptr %ccptr |
|   ret <16 x i8> %vec |
| } |
| |
| ; VSTRSH. |
| define <16 x i8> @test_vstrsh(<8 x i16> %a, <8 x i16> %b, <16 x i8> %c, ptr %ccptr) { |
| ; CHECK-LABEL: test_vstrsh: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: vstrsh %v24, %v24, %v26, %v28, 0 |
| ; CHECK-NEXT: ipm %r0 |
| ; CHECK-NEXT: srl %r0, 28 |
| ; CHECK-NEXT: st %r0, 0(%r2) |
| ; CHECK-NEXT: br %r14 |
|   ; Halfword-element variant: %a and %b are <8 x i16>, %c stays <16 x i8>. |
|   ; The i32 member of the result is stored through %ccptr; the vector member |
|   ; is returned. |
|   %pair = call { <16 x i8>, i32 } @llvm.s390.vstrsh(<8 x i16> %a, <8 x i16> %b, <16 x i8> %c) |
|   %vec = extractvalue { <16 x i8>, i32 } %pair, 0 |
|   %status = extractvalue { <16 x i8>, i32 } %pair, 1 |
|   store i32 %status, ptr %ccptr |
|   ret <16 x i8> %vec |
| } |
| |
| ; VSTRSF. |
| define <16 x i8> @test_vstrsf(<4 x i32> %a, <4 x i32> %b, <16 x i8> %c, ptr %ccptr) { |
| ; CHECK-LABEL: test_vstrsf: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: vstrsf %v24, %v24, %v26, %v28, 0 |
| ; CHECK-NEXT: ipm %r0 |
| ; CHECK-NEXT: srl %r0, 28 |
| ; CHECK-NEXT: st %r0, 0(%r2) |
| ; CHECK-NEXT: br %r14 |
|   ; Word-element variant: %a and %b are <4 x i32>, %c stays <16 x i8>. |
|   ; The i32 member of the result is stored through %ccptr; the vector member |
|   ; is returned. |
|   %pair = call { <16 x i8>, i32 } @llvm.s390.vstrsf(<4 x i32> %a, <4 x i32> %b, <16 x i8> %c) |
|   %vec = extractvalue { <16 x i8>, i32 } %pair, 0 |
|   %status = extractvalue { <16 x i8>, i32 } %pair, 1 |
|   store i32 %status, ptr %ccptr |
|   ret <16 x i8> %vec |
| } |
| |
| ; VSTRSZB. |
| define <16 x i8> @test_vstrszb(<16 x i8> %a, <16 x i8> %b, <16 x i8> %c, ptr %ccptr) { |
| ; CHECK-LABEL: test_vstrszb: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: vstrszb %v24, %v24, %v26, %v28 |
| ; CHECK-NEXT: ipm %r0 |
| ; CHECK-NEXT: srl %r0, 28 |
| ; CHECK-NEXT: st %r0, 0(%r2) |
| ; CHECK-NEXT: br %r14 |
|   ; Unlike the vstrsb test, the expected instruction carries no trailing |
|   ; immediate operand. The i32 member of the result is stored through %ccptr; |
|   ; the vector member is returned. |
|   %pair = call { <16 x i8>, i32 } @llvm.s390.vstrszb(<16 x i8> %a, <16 x i8> %b, <16 x i8> %c) |
|   %vec = extractvalue { <16 x i8>, i32 } %pair, 0 |
|   %status = extractvalue { <16 x i8>, i32 } %pair, 1 |
|   store i32 %status, ptr %ccptr |
|   ret <16 x i8> %vec |
| } |
| |
| ; VSTRSZH. |
| define <16 x i8> @test_vstrszh(<8 x i16> %a, <8 x i16> %b, <16 x i8> %c, ptr %ccptr) { |
| ; CHECK-LABEL: test_vstrszh: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: vstrszh %v24, %v24, %v26, %v28 |
| ; CHECK-NEXT: ipm %r0 |
| ; CHECK-NEXT: srl %r0, 28 |
| ; CHECK-NEXT: st %r0, 0(%r2) |
| ; CHECK-NEXT: br %r14 |
|   ; Halfword-element variant of the vstrsz tests: %a and %b are <8 x i16>. |
|   ; The i32 member of the result is stored through %ccptr; the vector member |
|   ; is returned. |
|   %pair = call { <16 x i8>, i32 } @llvm.s390.vstrszh(<8 x i16> %a, <8 x i16> %b, <16 x i8> %c) |
|   %vec = extractvalue { <16 x i8>, i32 } %pair, 0 |
|   %status = extractvalue { <16 x i8>, i32 } %pair, 1 |
|   store i32 %status, ptr %ccptr |
|   ret <16 x i8> %vec |
| } |
| |
| ; VSTRSZF. |
| define <16 x i8> @test_vstrszf(<4 x i32> %a, <4 x i32> %b, <16 x i8> %c, ptr %ccptr) { |
| ; CHECK-LABEL: test_vstrszf: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: vstrszf %v24, %v24, %v26, %v28 |
| ; CHECK-NEXT: ipm %r0 |
| ; CHECK-NEXT: srl %r0, 28 |
| ; CHECK-NEXT: st %r0, 0(%r2) |
| ; CHECK-NEXT: br %r14 |
|   ; Word-element variant of the vstrsz tests: %a and %b are <4 x i32>. |
|   ; The i32 member of the result is stored through %ccptr; the vector member |
|   ; is returned. |
|   %pair = call { <16 x i8>, i32 } @llvm.s390.vstrszf(<4 x i32> %a, <4 x i32> %b, <16 x i8> %c) |
|   %vec = extractvalue { <16 x i8>, i32 } %pair, 0 |
|   %status = extractvalue { <16 x i8>, i32 } %pair, 1 |
|   store i32 %status, ptr %ccptr |
|   ret <16 x i8> %vec |
| } |
| |