blob: 6a10df68ddc716ef909b4217718654edb722221f [file] [edit]
# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
# RUN: llc -mtriple=aarch64 -run-pass=early-machinelicm -o - %s | FileCheck %s
# This test verifies that cross-bank copies (e.g., GPR to FPR, FPR to GPR)
# are hoisted out of loops by MachineLICM, as they are expensive on AArch64.
--- |
declare void @use_float(float)
declare void @use_int(i32)
define void @gpr_to_fpr_virtual_copy_hoisted() {
ret void
}
define void @gpr_to_fpr_physical_copy_hoisted() {
ret void
}
define void @fpr_to_gpr_virtual_copy_hoisted() {
ret void
}
...
---
name: gpr_to_fpr_virtual_copy_hoisted
tracksRegLiveness: true
body: |
; CHECK-LABEL: name: gpr_to_fpr_virtual_copy_hoisted
; CHECK: bb.0:
; CHECK-NEXT: successors: %bb.1(0x80000000)
; CHECK-NEXT: liveins: $w0, $w1
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: [[COPY:%[0-9]+]]:gpr32 = COPY $w0
; CHECK-NEXT: [[COPY1:%[0-9]+]]:gpr32 = COPY $w1
; CHECK-NEXT: [[COPY2:%[0-9]+]]:gpr32all = COPY $wzr
; CHECK-NEXT: [[COPY3:%[0-9]+]]:gpr32all = COPY [[COPY2]]
; CHECK-NEXT: [[COPY4:%[0-9]+]]:fpr32 = COPY [[COPY1]]
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: bb.1:
; CHECK-NEXT: successors: %bb.3(0x40000000), %bb.2(0x40000000)
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: [[PHI:%[0-9]+]]:gpr32common = PHI [[COPY3]], %bb.0, %5, %bb.2
; CHECK-NEXT: [[SUBSWrr:%[0-9]+]]:gpr32 = SUBSWrr [[PHI]], [[COPY]], implicit-def $nzcv
; CHECK-NEXT: Bcc 1, %bb.3, implicit $nzcv
; CHECK-NEXT: B %bb.2
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: bb.2:
; CHECK-NEXT: successors: %bb.1(0x80000000)
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: $s0 = COPY [[COPY4]]
; CHECK-NEXT: BL @use_float, implicit-def dead $lr, implicit $sp, implicit $s0, implicit-def $sp
; CHECK-NEXT: [[ADDWri:%[0-9]+]]:gpr32sp = ADDWri [[PHI]], 1, 0
; CHECK-NEXT: [[COPY5:%[0-9]+]]:gpr32all = COPY [[ADDWri]]
; CHECK-NEXT: B %bb.1
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: bb.3:
; CHECK-NEXT: RET_ReallyLR
bb.0:
liveins: $w0, $w1
%1:gpr32 = COPY $w0
%0:gpr32 = COPY $w1
%3:gpr32all = COPY $wzr
%2:gpr32all = COPY %3:gpr32all
bb.1:
%4:gpr32common = PHI %2:gpr32all, %bb.0, %5:gpr32all, %bb.2
%6:gpr32 = SUBSWrr %4:gpr32common, %1:gpr32, implicit-def $nzcv
Bcc 1, %bb.3, implicit $nzcv
B %bb.2
bb.2:
%7:fpr32 = COPY %0:gpr32
$s0 = COPY %7:fpr32
BL @use_float, implicit-def dead $lr, implicit $sp, implicit $s0, implicit-def $sp
%8:gpr32sp = ADDWri %4:gpr32common, 1, 0
%5:gpr32all = COPY %8:gpr32sp
B %bb.1
bb.3:
RET_ReallyLR
...
---
name: gpr_to_fpr_physical_copy_hoisted
tracksRegLiveness: true
body: |
; CHECK-LABEL: name: gpr_to_fpr_physical_copy_hoisted
; CHECK: bb.0:
; CHECK-NEXT: successors: %bb.1(0x80000000)
; CHECK-NEXT: liveins: $w0
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: [[COPY:%[0-9]+]]:gpr32 = COPY $w0
; CHECK-NEXT: [[COPY1:%[0-9]+]]:gpr32all = COPY $wzr
; CHECK-NEXT: [[COPY2:%[0-9]+]]:gpr32all = COPY [[COPY1]]
; CHECK-NEXT: [[COPY3:%[0-9]+]]:fpr32 = COPY $wzr
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: bb.1:
; CHECK-NEXT: successors: %bb.3(0x40000000), %bb.2(0x40000000)
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: [[PHI:%[0-9]+]]:gpr32common = PHI [[COPY2]], %bb.0, %4, %bb.2
; CHECK-NEXT: [[SUBSWrr:%[0-9]+]]:gpr32 = SUBSWrr [[PHI]], [[COPY]], implicit-def $nzcv
; CHECK-NEXT: Bcc 1, %bb.3, implicit $nzcv
; CHECK-NEXT: B %bb.2
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: bb.2:
; CHECK-NEXT: successors: %bb.1(0x80000000)
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: $s0 = COPY [[COPY3]]
; CHECK-NEXT: BL @use_float, implicit-def dead $lr, implicit $sp, implicit $s0, implicit-def $sp
; CHECK-NEXT: [[ADDWri:%[0-9]+]]:gpr32sp = ADDWri [[PHI]], 1, 0
; CHECK-NEXT: [[COPY4:%[0-9]+]]:gpr32all = COPY [[ADDWri]]
; CHECK-NEXT: B %bb.1
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: bb.3:
; CHECK-NEXT: RET_ReallyLR
bb.0:
liveins: $w0
%1:gpr32 = COPY $w0
%3:gpr32all = COPY $wzr
%2:gpr32all = COPY %3:gpr32all
bb.1:
%4:gpr32common = PHI %2:gpr32all, %bb.0, %5:gpr32all, %bb.2
%6:gpr32 = SUBSWrr %4:gpr32common, %1:gpr32, implicit-def $nzcv
Bcc 1, %bb.3, implicit $nzcv
B %bb.2
bb.2:
%7:fpr32 = COPY $wzr
$s0 = COPY %7:fpr32
BL @use_float, implicit-def dead $lr, implicit $sp, implicit $s0, implicit-def $sp
%8:gpr32sp = ADDWri %4:gpr32common, 1, 0
%5:gpr32all = COPY %8:gpr32sp
B %bb.1
bb.3:
RET_ReallyLR
...
---
name: fpr_to_gpr_virtual_copy_hoisted
tracksRegLiveness: true
body: |
; CHECK-LABEL: name: fpr_to_gpr_virtual_copy_hoisted
; CHECK: bb.0:
; CHECK-NEXT: successors: %bb.1(0x80000000)
; CHECK-NEXT: liveins: $w0, $s0
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: [[COPY:%[0-9]+]]:gpr32 = COPY $w0
; CHECK-NEXT: [[COPY1:%[0-9]+]]:fpr32 = COPY $s0
; CHECK-NEXT: [[COPY2:%[0-9]+]]:gpr32all = COPY $wzr
; CHECK-NEXT: [[COPY3:%[0-9]+]]:gpr32all = COPY [[COPY2]]
; CHECK-NEXT: [[COPY4:%[0-9]+]]:gpr32 = COPY [[COPY1]]
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: bb.1:
; CHECK-NEXT: successors: %bb.3(0x40000000), %bb.2(0x40000000)
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: [[PHI:%[0-9]+]]:gpr32common = PHI [[COPY3]], %bb.0, %5, %bb.2
; CHECK-NEXT: [[SUBSWrr:%[0-9]+]]:gpr32 = SUBSWrr [[PHI]], [[COPY]], implicit-def $nzcv
; CHECK-NEXT: Bcc 1, %bb.3, implicit $nzcv
; CHECK-NEXT: B %bb.2
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: bb.2:
; CHECK-NEXT: successors: %bb.1(0x80000000)
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: $w0 = COPY [[COPY4]]
; CHECK-NEXT: BL @use_int, implicit-def dead $lr, implicit $sp, implicit $w0, implicit-def $sp
; CHECK-NEXT: [[ADDWri:%[0-9]+]]:gpr32sp = ADDWri [[PHI]], 1, 0
; CHECK-NEXT: [[COPY5:%[0-9]+]]:gpr32all = COPY [[ADDWri]]
; CHECK-NEXT: B %bb.1
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: bb.3:
; CHECK-NEXT: RET_ReallyLR
bb.0:
liveins: $w0, $s0
%1:gpr32 = COPY $w0
%0:fpr32 = COPY $s0
%3:gpr32all = COPY $wzr
%2:gpr32all = COPY %3:gpr32all
bb.1:
%4:gpr32common = PHI %2:gpr32all, %bb.0, %5:gpr32all, %bb.2
%6:gpr32 = SUBSWrr %4:gpr32common, %1:gpr32, implicit-def $nzcv
Bcc 1, %bb.3, implicit $nzcv
B %bb.2
bb.2:
%7:gpr32 = COPY %0:fpr32
$w0 = COPY %7:gpr32
BL @use_int, implicit-def dead $lr, implicit $sp, implicit $w0, implicit-def $sp
%8:gpr32sp = ADDWri %4:gpr32common, 1, 0
%5:gpr32all = COPY %8:gpr32sp
B %bb.1
bb.3:
RET_ReallyLR
...