blob: 0ac46085d683f320f47c4a0730cc9cc8eec93c0d [file] [edit]
; NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 5
; RUN: llc -mtriple=aarch64-linux-gnu -mattr=+sve,+sme,+sme2p1 -stop-before=finalize-isel -verify-machineinstrs < %s | FileCheck %s --check-prefix=CHECK-BEFORE-ISEL
; RUN: llc -mtriple=aarch64-linux-gnu -mattr=+sve,+sme,+sme2p1 -stop-after=finalize-isel -verify-machineinstrs < %s | FileCheck %s --check-prefix=CHECK-AFTER-ISEL
target triple = "aarch64-unknown-linux-gnu"
declare void @bar_enabled(<vscale x 4 x i32>) #0
declare void @bar(<vscale x 4 x i32>)
declare <vscale x 4 x i32> @bar_retv_enabled() #0
declare <vscale x 4 x i32> @bar_retv()
; Non-streaming -> calls streaming callee
define void @foo_non_streaming_pass_arg(ptr %arg) {
; CHECK-BEFORE-ISEL-LABEL: name: foo_non_streaming_pass_arg
; CHECK-BEFORE-ISEL: bb.0.entry:
; CHECK-BEFORE-ISEL-NEXT: liveins: $x0
; CHECK-BEFORE-ISEL-NEXT: {{ $}}
; CHECK-BEFORE-ISEL-NEXT: [[COPY:%[0-9]+]]:gpr64common = COPY $x0
; CHECK-BEFORE-ISEL-NEXT: [[LDR_ZXI:%[0-9]+]]:zpr = LDR_ZXI [[COPY]], 0 :: (load (<vscale x 1 x s128>) from %ir.arg)
; CHECK-BEFORE-ISEL-NEXT: ADJCALLSTACKDOWN 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-BEFORE-ISEL-NEXT: CHECK_MATCHING_VL_PSEUDO
; CHECK-BEFORE-ISEL-NEXT: MSRpstatesvcrImm1 1, 1, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit-def $sp, implicit-def $z0, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-BEFORE-ISEL-NEXT: $z0 = COPY [[LDR_ZXI]]
; CHECK-BEFORE-ISEL-NEXT: BL @bar_enabled, csr_aarch64_sve_aapcs, implicit-def dead $lr, implicit $sp, implicit $z0, implicit-def $sp
; CHECK-BEFORE-ISEL-NEXT: ADJCALLSTACKUP 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-BEFORE-ISEL-NEXT: MSRpstatesvcrImm1 1, 0, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-BEFORE-ISEL-NEXT: RET_ReallyLR
;
; CHECK-AFTER-ISEL-LABEL: name: foo_non_streaming_pass_arg
; CHECK-AFTER-ISEL: bb.0.entry:
; CHECK-AFTER-ISEL-NEXT: successors: %bb.1(0x40000000), %bb.2(0x40000000)
; CHECK-AFTER-ISEL-NEXT: liveins: $x0
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: [[COPY:%[0-9]+]]:gpr64common = COPY $x0
; CHECK-AFTER-ISEL-NEXT: [[LDR_ZXI:%[0-9]+]]:zpr = LDR_ZXI [[COPY]], 0 :: (load (<vscale x 1 x s128>) from %ir.arg)
; CHECK-AFTER-ISEL-NEXT: ADJCALLSTACKDOWN 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-AFTER-ISEL-NEXT: [[RDVLI_XI:%[0-9]+]]:gpr64 = RDVLI_XI 1, implicit $vg
; CHECK-AFTER-ISEL-NEXT: [[COPY1:%[0-9]+]]:gpr64sp = COPY [[RDVLI_XI]]
; CHECK-AFTER-ISEL-NEXT: [[ADDSVL_XXI:%[0-9]+]]:gpr64sp = ADDSVL_XXI [[COPY1]], -1, implicit $vg
; CHECK-AFTER-ISEL-NEXT: [[COPY2:%[0-9]+]]:gpr64 = COPY [[ADDSVL_XXI]]
; CHECK-AFTER-ISEL-NEXT: CBZX [[COPY2]], %bb.2
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: bb.1.entry:
; CHECK-AFTER-ISEL-NEXT: successors:
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: BRK 1
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: bb.2.entry:
; CHECK-AFTER-ISEL-NEXT: MSRpstatesvcrImm1 1, 1, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit-def $sp, implicit-def $z0, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-AFTER-ISEL-NEXT: $z0 = COPY [[LDR_ZXI]]
; CHECK-AFTER-ISEL-NEXT: BL @bar_enabled, csr_aarch64_sve_aapcs, implicit-def dead $lr, implicit $sp, implicit $z0, implicit-def $sp
; CHECK-AFTER-ISEL-NEXT: ADJCALLSTACKUP 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-AFTER-ISEL-NEXT: MSRpstatesvcrImm1 1, 0, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-AFTER-ISEL-NEXT: RET_ReallyLR
entry:
%v = load <vscale x 4 x i32>, ptr %arg, align 16
tail call void @bar_enabled(<vscale x 4 x i32> %v) #0
ret void
}
; Streaming -> calls non-streaming callee
define void @foo_streaming_pass_arg(ptr %arg) #0 {
; CHECK-BEFORE-ISEL-LABEL: name: foo_streaming_pass_arg
; CHECK-BEFORE-ISEL: bb.0.entry:
; CHECK-BEFORE-ISEL-NEXT: liveins: $x0
; CHECK-BEFORE-ISEL-NEXT: {{ $}}
; CHECK-BEFORE-ISEL-NEXT: [[COPY:%[0-9]+]]:gpr64common = COPY $x0
; CHECK-BEFORE-ISEL-NEXT: [[LDR_ZXI:%[0-9]+]]:zpr = LDR_ZXI [[COPY]], 0 :: (load (<vscale x 1 x s128>) from %ir.arg)
; CHECK-BEFORE-ISEL-NEXT: ADJCALLSTACKDOWN 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-BEFORE-ISEL-NEXT: MSRpstatesvcrImm1 1, 0, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit-def $sp, implicit-def $z0, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-BEFORE-ISEL-NEXT: CHECK_MATCHING_VL_PSEUDO
; CHECK-BEFORE-ISEL-NEXT: $z0 = COPY [[LDR_ZXI]]
; CHECK-BEFORE-ISEL-NEXT: BL @bar, csr_aarch64_sve_aapcs, implicit-def dead $lr, implicit $sp, implicit $z0, implicit-def $sp
; CHECK-BEFORE-ISEL-NEXT: ADJCALLSTACKUP 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-BEFORE-ISEL-NEXT: MSRpstatesvcrImm1 1, 1, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-BEFORE-ISEL-NEXT: RET_ReallyLR
;
; CHECK-AFTER-ISEL-LABEL: name: foo_streaming_pass_arg
; CHECK-AFTER-ISEL: bb.0.entry:
; CHECK-AFTER-ISEL-NEXT: successors: %bb.1(0x40000000), %bb.2(0x40000000)
; CHECK-AFTER-ISEL-NEXT: liveins: $x0
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: [[COPY:%[0-9]+]]:gpr64common = COPY $x0
; CHECK-AFTER-ISEL-NEXT: [[LDR_ZXI:%[0-9]+]]:zpr = LDR_ZXI [[COPY]], 0 :: (load (<vscale x 1 x s128>) from %ir.arg)
; CHECK-AFTER-ISEL-NEXT: ADJCALLSTACKDOWN 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-AFTER-ISEL-NEXT: MSRpstatesvcrImm1 1, 0, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit-def $sp, implicit-def $z0, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-AFTER-ISEL-NEXT: [[RDVLI_XI:%[0-9]+]]:gpr64 = RDVLI_XI 1, implicit $vg
; CHECK-AFTER-ISEL-NEXT: [[COPY1:%[0-9]+]]:gpr64sp = COPY [[RDVLI_XI]]
; CHECK-AFTER-ISEL-NEXT: [[ADDSVL_XXI:%[0-9]+]]:gpr64sp = ADDSVL_XXI [[COPY1]], -1, implicit $vg
; CHECK-AFTER-ISEL-NEXT: [[COPY2:%[0-9]+]]:gpr64 = COPY [[ADDSVL_XXI]]
; CHECK-AFTER-ISEL-NEXT: CBZX [[COPY2]], %bb.2
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: bb.1.entry:
; CHECK-AFTER-ISEL-NEXT: successors:
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: BRK 1
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: bb.2.entry:
; CHECK-AFTER-ISEL-NEXT: $z0 = COPY [[LDR_ZXI]]
; CHECK-AFTER-ISEL-NEXT: BL @bar, csr_aarch64_sve_aapcs, implicit-def dead $lr, implicit $sp, implicit $z0, implicit-def $sp
; CHECK-AFTER-ISEL-NEXT: ADJCALLSTACKUP 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-AFTER-ISEL-NEXT: MSRpstatesvcrImm1 1, 1, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-AFTER-ISEL-NEXT: RET_ReallyLR
entry:
%v = load <vscale x 4 x i32>, ptr %arg, align 16
tail call void @bar(<vscale x 4 x i32> %v)
ret void
}
; Non-streaming -> returns SVE value from streaming callee
define void @foo_non_streaming_retval(ptr %ptr) {
; CHECK-BEFORE-ISEL-LABEL: name: foo_non_streaming_retval
; CHECK-BEFORE-ISEL: bb.0.entry:
; CHECK-BEFORE-ISEL-NEXT: liveins: $x0
; CHECK-BEFORE-ISEL-NEXT: {{ $}}
; CHECK-BEFORE-ISEL-NEXT: [[COPY:%[0-9]+]]:gpr64common = COPY $x0
; CHECK-BEFORE-ISEL-NEXT: ADJCALLSTACKDOWN 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-BEFORE-ISEL-NEXT: CHECK_MATCHING_VL_PSEUDO
; CHECK-BEFORE-ISEL-NEXT: MSRpstatesvcrImm1 1, 1, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit-def $sp, implicit-def $z0, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-BEFORE-ISEL-NEXT: BL @bar_retv_enabled, csr_aarch64_sve_aapcs, implicit-def dead $lr, implicit $sp, implicit-def $sp, implicit-def $z0
; CHECK-BEFORE-ISEL-NEXT: ADJCALLSTACKUP 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-BEFORE-ISEL-NEXT: [[COPY1:%[0-9]+]]:zpr = COPY $z0
; CHECK-BEFORE-ISEL-NEXT: MSRpstatesvcrImm1 1, 0, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-BEFORE-ISEL-NEXT: [[COPY2:%[0-9]+]]:zpr = COPY [[COPY1]]
; CHECK-BEFORE-ISEL-NEXT: STR_ZXI [[COPY2]], [[COPY]], 0 :: (store (<vscale x 1 x s128>) into %ir.ptr)
; CHECK-BEFORE-ISEL-NEXT: RET_ReallyLR
;
; CHECK-AFTER-ISEL-LABEL: name: foo_non_streaming_retval
; CHECK-AFTER-ISEL: bb.0.entry:
; CHECK-AFTER-ISEL-NEXT: successors: %bb.1(0x40000000), %bb.2(0x40000000)
; CHECK-AFTER-ISEL-NEXT: liveins: $x0
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: [[COPY:%[0-9]+]]:gpr64common = COPY $x0
; CHECK-AFTER-ISEL-NEXT: ADJCALLSTACKDOWN 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-AFTER-ISEL-NEXT: [[RDVLI_XI:%[0-9]+]]:gpr64 = RDVLI_XI 1, implicit $vg
; CHECK-AFTER-ISEL-NEXT: [[COPY1:%[0-9]+]]:gpr64sp = COPY [[RDVLI_XI]]
; CHECK-AFTER-ISEL-NEXT: [[ADDSVL_XXI:%[0-9]+]]:gpr64sp = ADDSVL_XXI [[COPY1]], -1, implicit $vg
; CHECK-AFTER-ISEL-NEXT: [[COPY2:%[0-9]+]]:gpr64 = COPY [[ADDSVL_XXI]]
; CHECK-AFTER-ISEL-NEXT: CBZX [[COPY2]], %bb.2
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: bb.1.entry:
; CHECK-AFTER-ISEL-NEXT: successors:
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: BRK 1
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: bb.2.entry:
; CHECK-AFTER-ISEL-NEXT: MSRpstatesvcrImm1 1, 1, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit-def $sp, implicit-def $z0, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-AFTER-ISEL-NEXT: BL @bar_retv_enabled, csr_aarch64_sve_aapcs, implicit-def dead $lr, implicit $sp, implicit-def $sp, implicit-def $z0
; CHECK-AFTER-ISEL-NEXT: ADJCALLSTACKUP 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-AFTER-ISEL-NEXT: [[COPY3:%[0-9]+]]:zpr = COPY $z0
; CHECK-AFTER-ISEL-NEXT: MSRpstatesvcrImm1 1, 0, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-AFTER-ISEL-NEXT: [[COPY4:%[0-9]+]]:zpr = COPY [[COPY3]]
; CHECK-AFTER-ISEL-NEXT: STR_ZXI [[COPY4]], [[COPY]], 0 :: (store (<vscale x 1 x s128>) into %ir.ptr)
; CHECK-AFTER-ISEL-NEXT: RET_ReallyLR
entry:
%v = tail call <vscale x 4 x i32> @bar_retv_enabled() #0
store <vscale x 4 x i32> %v, ptr %ptr, align 16
ret void
}
; Streaming -> returns SVE value from non-streaming callee
define void @foo_streaming_retval(ptr %ptr) #0 {
; CHECK-BEFORE-ISEL-LABEL: name: foo_streaming_retval
; CHECK-BEFORE-ISEL: bb.0.entry:
; CHECK-BEFORE-ISEL-NEXT: liveins: $x0
; CHECK-BEFORE-ISEL-NEXT: {{ $}}
; CHECK-BEFORE-ISEL-NEXT: [[COPY:%[0-9]+]]:gpr64common = COPY $x0
; CHECK-BEFORE-ISEL-NEXT: ADJCALLSTACKDOWN 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-BEFORE-ISEL-NEXT: MSRpstatesvcrImm1 1, 0, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit-def $sp, implicit-def $z0, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-BEFORE-ISEL-NEXT: CHECK_MATCHING_VL_PSEUDO
; CHECK-BEFORE-ISEL-NEXT: BL @bar_retv, csr_aarch64_sve_aapcs, implicit-def dead $lr, implicit $sp, implicit-def $sp, implicit-def $z0
; CHECK-BEFORE-ISEL-NEXT: ADJCALLSTACKUP 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-BEFORE-ISEL-NEXT: [[COPY1:%[0-9]+]]:zpr = COPY $z0
; CHECK-BEFORE-ISEL-NEXT: MSRpstatesvcrImm1 1, 1, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-BEFORE-ISEL-NEXT: [[COPY2:%[0-9]+]]:zpr = COPY [[COPY1]]
; CHECK-BEFORE-ISEL-NEXT: STR_ZXI [[COPY2]], [[COPY]], 0 :: (store (<vscale x 1 x s128>) into %ir.ptr)
; CHECK-BEFORE-ISEL-NEXT: RET_ReallyLR
;
; CHECK-AFTER-ISEL-LABEL: name: foo_streaming_retval
; CHECK-AFTER-ISEL: bb.0.entry:
; CHECK-AFTER-ISEL-NEXT: successors: %bb.1(0x40000000), %bb.2(0x40000000)
; CHECK-AFTER-ISEL-NEXT: liveins: $x0
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: [[COPY:%[0-9]+]]:gpr64common = COPY $x0
; CHECK-AFTER-ISEL-NEXT: ADJCALLSTACKDOWN 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-AFTER-ISEL-NEXT: MSRpstatesvcrImm1 1, 0, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit-def $sp, implicit-def $z0, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-AFTER-ISEL-NEXT: [[RDVLI_XI:%[0-9]+]]:gpr64 = RDVLI_XI 1, implicit $vg
; CHECK-AFTER-ISEL-NEXT: [[COPY1:%[0-9]+]]:gpr64sp = COPY [[RDVLI_XI]]
; CHECK-AFTER-ISEL-NEXT: [[ADDSVL_XXI:%[0-9]+]]:gpr64sp = ADDSVL_XXI [[COPY1]], -1, implicit $vg
; CHECK-AFTER-ISEL-NEXT: [[COPY2:%[0-9]+]]:gpr64 = COPY [[ADDSVL_XXI]]
; CHECK-AFTER-ISEL-NEXT: CBZX [[COPY2]], %bb.2
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: bb.1.entry:
; CHECK-AFTER-ISEL-NEXT: successors:
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: BRK 1
; CHECK-AFTER-ISEL-NEXT: {{ $}}
; CHECK-AFTER-ISEL-NEXT: bb.2.entry:
; CHECK-AFTER-ISEL-NEXT: BL @bar_retv, csr_aarch64_sve_aapcs, implicit-def dead $lr, implicit $sp, implicit-def $sp, implicit-def $z0
; CHECK-AFTER-ISEL-NEXT: ADJCALLSTACKUP 0, 0, implicit-def dead $sp, implicit $sp
; CHECK-AFTER-ISEL-NEXT: [[COPY3:%[0-9]+]]:zpr = COPY $z0
; CHECK-AFTER-ISEL-NEXT: MSRpstatesvcrImm1 1, 1, csr_aarch64_smstartstop, implicit-def dead $nzcv, implicit $vg, implicit-def $vg, implicit-def $fpmr
; CHECK-AFTER-ISEL-NEXT: [[COPY4:%[0-9]+]]:zpr = COPY [[COPY3]]
; CHECK-AFTER-ISEL-NEXT: STR_ZXI [[COPY4]], [[COPY]], 0 :: (store (<vscale x 1 x s128>) into %ir.ptr)
; CHECK-AFTER-ISEL-NEXT: RET_ReallyLR
entry:
%v = tail call <vscale x 4 x i32> @bar_retv()
store <vscale x 4 x i32> %v, ptr %ptr, align 16
ret void
}
attributes #0 = { "aarch64_pstate_sm_enabled" }
attributes #1 = { "aarch64_pstate_sm_compatible" }