# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
# RUN: llc -mtriple=aarch64 -run-pass=aarch64-postlegalizer-lowering -verify-machineinstrs %s -o - | FileCheck %s --check-prefix=LOWER
# RUN: llc -mtriple=aarch64 -global-isel -start-before=aarch64-postlegalizer-lowering -stop-after=instruction-select -verify-machineinstrs %s -o - | FileCheck %s --check-prefix=SELECT
#
# Check that we swap the order of operands on comparisons when it is likely
# to introduce a folding opportunity.
#
# The condition code for the compare should be changed when appropriate.
#
# TODO: emitBinOp doesn't know about selectArithExtendedRegister, so some of
# these cases don't hit in selection yet.
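#
# For example, swap_sextinreg_lhs below turns
#   %cmp:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %cmp_rhs
# into
#   %cmp:_(s32) = G_ICMP intpred(sle), %cmp_rhs(s64), %cmp_lhs
# so that the G_SEXT_INREG feeding %cmp_lhs can fold into the SUBS emitted
# for the compare.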
...
---
name: swap_sextinreg_lhs
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; LOWER-LABEL: name: swap_sextinreg_lhs
; LOWER: liveins: $x0, $x1
; LOWER: %reg:_(s64) = COPY $x0
; LOWER: %cmp_lhs:_(s64) = G_SEXT_INREG %reg, 8
; LOWER: %cmp_rhs:_(s64) = COPY $x1
; LOWER: %cmp:_(s32) = G_ICMP intpred(sle), %cmp_rhs(s64), %cmp_lhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: swap_sextinreg_lhs
; SELECT: liveins: $x0, $x1
; SELECT: %reg:gpr64all = COPY $x0
; SELECT: [[COPY:%[0-9]+]]:gpr32all = COPY %reg.sub_32
; SELECT: [[COPY1:%[0-9]+]]:gpr32 = COPY [[COPY]]
; SELECT: %cmp_rhs:gpr64sp = COPY $x1
; SELECT: [[SUBSXrx:%[0-9]+]]:gpr64 = SUBSXrx %cmp_rhs, [[COPY1]], 32, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 12, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%reg:_(s64) = COPY $x0
%cmp_lhs:_(s64) = G_SEXT_INREG %reg, 8
%cmp_rhs:_(s64) = COPY $x1
%cmp:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: dont_swap_more_than_one_use
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; The LHS of the compare is used in an add, and a second compare. Don't
; swap, since we don't gain any folding opportunities here.
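; (The G_SEXT_INREG has several users, so it must be emitted regardless;
; folding it into this compare would not remove any instructions.)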
; LOWER-LABEL: name: dont_swap_more_than_one_use
; LOWER: liveins: $x0, $x1
; LOWER: %reg0:_(s64) = COPY $x0
; LOWER: %cmp_lhs:_(s64) = G_SEXT_INREG %reg0, 8
; LOWER: %add:_(s64) = G_ADD %cmp_lhs, %reg0
; LOWER: %cmp2:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %add
; LOWER: $w0 = COPY %cmp2(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: dont_swap_more_than_one_use
; SELECT: liveins: $x0, $x1
; SELECT: %reg0:gpr64 = COPY $x0
; SELECT: %cmp_lhs:gpr64 = SBFMXri %reg0, 0, 7
; SELECT: %add:gpr64 = ADDXrr %cmp_lhs, %reg0
; SELECT: [[SUBSXrr:%[0-9]+]]:gpr64 = SUBSXrr %cmp_lhs, %add, implicit-def $nzcv
; SELECT: %cmp2:gpr32 = CSINCWr $wzr, $wzr, 11, implicit $nzcv
; SELECT: $w0 = COPY %cmp2
; SELECT: RET_ReallyLR implicit $w0
%reg0:_(s64) = COPY $x0
%cmp_lhs:_(s64) = G_SEXT_INREG %reg0, 8
%reg1:_(s64) = COPY $x1
%cmp1:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %reg1
%add:_(s64) = G_ADD %cmp_lhs(s64), %reg0
%cmp2:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %add
$w0 = COPY %cmp2(s32)
RET_ReallyLR implicit $w0
...
---
name: dont_swap_legal_arith_immed_on_rhs
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; Arithmetic immediates can be folded into compares. If we have one, then
; don't bother changing anything.
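; (12 fits in the 12-bit arithmetic immediate field, so the compare selects
; straight to SUBSXri below.)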
; LOWER-LABEL: name: dont_swap_legal_arith_immed_on_rhs
; LOWER: liveins: $x0, $x1
; LOWER: %reg:_(s64) = COPY $x0
; LOWER: %cmp_lhs:_(s64) = G_SEXT_INREG %reg, 8
; LOWER: %cmp_rhs:_(s64) = G_CONSTANT i64 12
; LOWER: %cmp:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %cmp_rhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: dont_swap_legal_arith_immed_on_rhs
; SELECT: liveins: $x0, $x1
; SELECT: %reg:gpr64 = COPY $x0
; SELECT: %cmp_lhs:gpr64common = SBFMXri %reg, 0, 7
; SELECT: [[SUBSXri:%[0-9]+]]:gpr64 = SUBSXri %cmp_lhs, 12, 0, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 11, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%reg:_(s64) = COPY $x0
%cmp_lhs:_(s64) = G_SEXT_INREG %reg, 8
%cmp_rhs:_(s64) = G_CONSTANT i64 12
%cmp:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: swap_non_arith_immed_on_rhs
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; If we have a non-arithmetic immediate on the RHS, then we can swap to get
; a guaranteed folding opportunity.
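; (1234567 does not fit the 12-bit arithmetic immediate, so it must be
; materialized with a MOV either way; swapping lets the G_SEXT_INREG fold
; into the compare instead.)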
; LOWER-LABEL: name: swap_non_arith_immed_on_rhs
; LOWER: liveins: $x0, $x1
; LOWER: %reg:_(s64) = COPY $x0
; LOWER: %cmp_lhs:_(s64) = G_SEXT_INREG %reg, 8
; LOWER: %cmp_rhs:_(s64) = G_CONSTANT i64 1234567
; LOWER: %cmp:_(s32) = G_ICMP intpred(sle), %cmp_rhs(s64), %cmp_lhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: swap_non_arith_immed_on_rhs
; SELECT: liveins: $x0, $x1
; SELECT: %reg:gpr64all = COPY $x0
; SELECT: [[COPY:%[0-9]+]]:gpr32all = COPY %reg.sub_32
; SELECT: [[COPY1:%[0-9]+]]:gpr32 = COPY [[COPY]]
; SELECT: [[MOVi32imm:%[0-9]+]]:gpr32 = MOVi32imm 1234567
; SELECT: %cmp_rhs:gpr64sp = SUBREG_TO_REG 0, [[MOVi32imm]], %subreg.sub_32
; SELECT: [[SUBSXrx:%[0-9]+]]:gpr64 = SUBSXrx %cmp_rhs, [[COPY1]], 32, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 12, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%reg:_(s64) = COPY $x0
%cmp_lhs:_(s64) = G_SEXT_INREG %reg, 8
%cmp_rhs:_(s64) = G_CONSTANT i64 1234567
%cmp:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: swap_and_lhs_0xFF
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; LOWER-LABEL: name: swap_and_lhs_0xFF
; LOWER: liveins: $x0, $x1
; LOWER: %cmp_rhs:_(s64) = COPY $x1
; LOWER: %and_lhs:_(s64) = COPY $x0
; LOWER: %cst:_(s64) = G_CONSTANT i64 255
; LOWER: %cmp_lhs:_(s64) = G_AND %and_lhs, %cst
; LOWER: %cmp:_(s32) = G_ICMP intpred(sle), %cmp_rhs(s64), %cmp_lhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: swap_and_lhs_0xFF
; SELECT: liveins: $x0, $x1
; SELECT: %cmp_rhs:gpr64sp = COPY $x1
; SELECT: %and_lhs:gpr64all = COPY $x0
; SELECT: [[COPY:%[0-9]+]]:gpr32all = COPY %and_lhs.sub_32
; SELECT: [[COPY1:%[0-9]+]]:gpr32 = COPY [[COPY]]
; SELECT: [[SUBSXrx:%[0-9]+]]:gpr64 = SUBSXrx %cmp_rhs, [[COPY1]], 0, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 12, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%cmp_rhs:_(s64) = COPY $x1
%and_lhs:_(s64) = COPY $x0
%cst:_(s64) = G_CONSTANT i64 255
%cmp_lhs:_(s64) = G_AND %and_lhs, %cst(s64)
%cmp:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: swap_and_lhs_0xFFFF
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; LOWER-LABEL: name: swap_and_lhs_0xFFFF
; LOWER: liveins: $x0, $x1
; LOWER: %cmp_rhs:_(s64) = COPY $x1
; LOWER: %cst:_(s64) = G_CONSTANT i64 65535
; LOWER: %and_lhs:_(s64) = COPY $x0
; LOWER: %cmp_lhs:_(s64) = G_AND %and_lhs, %cst
; LOWER: %cmp:_(s32) = G_ICMP intpred(sle), %cmp_rhs(s64), %cmp_lhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: swap_and_lhs_0xFFFF
; SELECT: liveins: $x0, $x1
; SELECT: %cmp_rhs:gpr64sp = COPY $x1
; SELECT: %and_lhs:gpr64all = COPY $x0
; SELECT: [[COPY:%[0-9]+]]:gpr32all = COPY %and_lhs.sub_32
; SELECT: [[COPY1:%[0-9]+]]:gpr32 = COPY [[COPY]]
; SELECT: [[SUBSXrx:%[0-9]+]]:gpr64 = SUBSXrx %cmp_rhs, [[COPY1]], 8, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 12, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%cmp_rhs:_(s64) = COPY $x1
%cst:_(s64) = G_CONSTANT i64 65535
%and_lhs:_(s64) = COPY $x0
%cmp_lhs:_(s64) = G_AND %and_lhs, %cst(s64)
%cmp:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: swap_and_lhs_0xFFFFFFFF
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; LOWER-LABEL: name: swap_and_lhs_0xFFFFFFFF
; LOWER: liveins: $x0, $x1
; LOWER: %cmp_rhs:_(s64) = COPY $x1
; LOWER: %and_lhs:_(s64) = COPY $x0
; LOWER: %cst:_(s64) = G_CONSTANT i64 4294967295
; LOWER: %cmp_lhs:_(s64) = G_AND %and_lhs, %cst
; LOWER: %cmp:_(s32) = G_ICMP intpred(sle), %cmp_rhs(s64), %cmp_lhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: swap_and_lhs_0xFFFFFFFF
; SELECT: liveins: $x0, $x1
; SELECT: %cmp_rhs:gpr64sp = COPY $x1
; SELECT: %and_lhs:gpr64all = COPY $x0
; SELECT: [[COPY:%[0-9]+]]:gpr32all = COPY %and_lhs.sub_32
; SELECT: [[COPY1:%[0-9]+]]:gpr32 = COPY [[COPY]]
; SELECT: [[SUBSXrx:%[0-9]+]]:gpr64 = SUBSXrx %cmp_rhs, [[COPY1]], 16, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 12, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%cmp_rhs:_(s64) = COPY $x1
%and_lhs:_(s64) = COPY $x0
%cst:_(s64) = G_CONSTANT i64 4294967295
%cmp_lhs:_(s64) = G_AND %and_lhs, %cst(s64)
%cmp:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: dont_swap_and_lhs_wrong_mask
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; 7 isn't an extend mask for G_AND, so there are no folding opportunities
; here.
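; (Masks of 0xFF, 0xFFFF, and 0xFFFFFFFF act as zero-extends, as the tests
; above show; a mask of 7 still needs an explicit AND.)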
;
; LOWER-LABEL: name: dont_swap_and_lhs_wrong_mask
; LOWER: liveins: $x0, $x1
; LOWER: %cmp_rhs:_(s64) = COPY $x1
; LOWER: %and_lhs:_(s64) = COPY $x0
; LOWER: %not_an_extend_mask:_(s64) = G_CONSTANT i64 7
; LOWER: %cmp_lhs:_(s64) = G_AND %and_lhs, %not_an_extend_mask
; LOWER: %cmp:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %cmp_rhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: dont_swap_and_lhs_wrong_mask
; SELECT: liveins: $x0, $x1
; SELECT: %cmp_rhs:gpr64 = COPY $x1
; SELECT: %and_lhs:gpr64 = COPY $x0
; SELECT: %cmp_lhs:gpr64common = ANDXri %and_lhs, 4098
; SELECT: [[SUBSXrr:%[0-9]+]]:gpr64 = SUBSXrr %cmp_lhs, %cmp_rhs, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 11, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%cmp_rhs:_(s64) = COPY $x1
%and_lhs:_(s64) = COPY $x0
%not_an_extend_mask:_(s64) = G_CONSTANT i64 7
%cmp_lhs:_(s64) = G_AND %and_lhs, %not_an_extend_mask(s64)
%cmp:_(s32) = G_ICMP intpred(sge), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: swap_shl_lhs
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; LOWER-LABEL: name: swap_shl_lhs
; LOWER: liveins: $x0, $x1
; LOWER: %cmp_rhs:_(s64) = COPY $x1
; LOWER: %shl_lhs:_(s64) = COPY $x0
; LOWER: %cst:_(s64) = G_CONSTANT i64 1
; LOWER: %cmp_lhs:_(s64) = G_SHL %shl_lhs, %cst(s64)
; LOWER: %cmp:_(s32) = G_ICMP intpred(sgt), %cmp_rhs(s64), %cmp_lhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: swap_shl_lhs
; SELECT: liveins: $x0, $x1
; SELECT: %cmp_rhs:gpr64 = COPY $x1
; SELECT: %shl_lhs:gpr64 = COPY $x0
; SELECT: [[SUBSXrs:%[0-9]+]]:gpr64 = SUBSXrs %cmp_rhs, %shl_lhs, 1, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 13, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%cmp_rhs:_(s64) = COPY $x1
%shl_lhs:_(s64) = COPY $x0
%cst:_(s64) = G_CONSTANT i64 1
%cmp_lhs:_(s64) = G_SHL %shl_lhs, %cst(s64)
%cmp:_(s32) = G_ICMP intpred(slt), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: swap_ashr_lhs
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; LOWER-LABEL: name: swap_ashr_lhs
; LOWER: liveins: $x0, $x1
; LOWER: %cmp_rhs:_(s64) = COPY $x1
; LOWER: %ashr_lhs:_(s64) = COPY $x0
; LOWER: %cst:_(s64) = G_CONSTANT i64 1
; LOWER: %cmp_lhs:_(s64) = G_ASHR %ashr_lhs, %cst(s64)
; LOWER: %cmp:_(s32) = G_ICMP intpred(sgt), %cmp_rhs(s64), %cmp_lhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: swap_ashr_lhs
; SELECT: liveins: $x0, $x1
; SELECT: %cmp_rhs:gpr64 = COPY $x1
; SELECT: %ashr_lhs:gpr64 = COPY $x0
; SELECT: [[SUBSXrs:%[0-9]+]]:gpr64 = SUBSXrs %cmp_rhs, %ashr_lhs, 129, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 13, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%cmp_rhs:_(s64) = COPY $x1
%ashr_lhs:_(s64) = COPY $x0
%cst:_(s64) = G_CONSTANT i64 1
%cmp_lhs:_(s64) = G_ASHR %ashr_lhs, %cst(s64)
%cmp:_(s32) = G_ICMP intpred(slt), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: swap_lshr_lhs
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; LOWER-LABEL: name: swap_lshr_lhs
; LOWER: liveins: $x0, $x1
; LOWER: %cmp_rhs:_(s64) = COPY $x1
; LOWER: %lshr_lhs:_(s64) = COPY $x0
; LOWER: %cst:_(s64) = G_CONSTANT i64 1
; LOWER: %cmp_lhs:_(s64) = G_LSHR %lshr_lhs, %cst(s64)
; LOWER: %cmp:_(s32) = G_ICMP intpred(sgt), %cmp_rhs(s64), %cmp_lhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: swap_lshr_lhs
; SELECT: liveins: $x0, $x1
; SELECT: %cmp_rhs:gpr64 = COPY $x1
; SELECT: %lshr_lhs:gpr64 = COPY $x0
; SELECT: [[SUBSXrs:%[0-9]+]]:gpr64 = SUBSXrs %cmp_rhs, %lshr_lhs, 65, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 13, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%cmp_rhs:_(s64) = COPY $x1
%lshr_lhs:_(s64) = COPY $x0
%cst:_(s64) = G_CONSTANT i64 1
%cmp_lhs:_(s64) = G_LSHR %lshr_lhs, %cst(s64)
%cmp:_(s32) = G_ICMP intpred(slt), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: dont_swap_shift_s64_cst_too_large
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; Constant for the shift must be <= 63.
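; (A 64-bit shifted-register SUBS can only encode shift amounts 0-63.)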
; LOWER-LABEL: name: dont_swap_shift_s64_cst_too_large
; LOWER: liveins: $x0, $x1
; LOWER: %cmp_rhs:_(s64) = COPY $x1
; LOWER: %shl_lhs:_(s64) = COPY $x0
; LOWER: %too_large:_(s64) = G_CONSTANT i64 64
; LOWER: %cmp_lhs:_(s64) = G_SHL %shl_lhs, %too_large(s64)
; LOWER: %cmp:_(s32) = G_ICMP intpred(slt), %cmp_lhs(s64), %cmp_rhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: dont_swap_shift_s64_cst_too_large
; SELECT: liveins: $x0, $x1
; SELECT: %cmp_rhs:gpr64 = COPY $x1
; SELECT: %shl_lhs:gpr64 = COPY $x0
; SELECT: [[MOVi32imm:%[0-9]+]]:gpr32 = MOVi32imm 64
; SELECT: %too_large:gpr64 = SUBREG_TO_REG 0, [[MOVi32imm]], %subreg.sub_32
; SELECT: %cmp_lhs:gpr64 = LSLVXr %shl_lhs, %too_large
; SELECT: [[SUBSXrr:%[0-9]+]]:gpr64 = SUBSXrr %cmp_lhs, %cmp_rhs, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 10, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%cmp_rhs:_(s64) = COPY $x1
%shl_lhs:_(s64) = COPY $x0
%too_large:_(s64) = G_CONSTANT i64 64
%cmp_lhs:_(s64) = G_SHL %shl_lhs, %too_large(s64)
%cmp:_(s32) = G_ICMP intpred(slt), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: dont_swap_shift_s32_cst_too_large
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $w0, $w1
; Constant for the shift must be <= 31.
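; (The 32-bit shifted-register form only encodes shift amounts 0-31.)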
; LOWER-LABEL: name: dont_swap_shift_s32_cst_too_large
; LOWER: liveins: $w0, $w1
; LOWER: %cmp_rhs:_(s32) = COPY $w1
; LOWER: %shl_lhs:_(s32) = COPY $w0
; LOWER: %cst:_(s32) = G_CONSTANT i32 32
; LOWER: %cmp_lhs:_(s32) = G_SHL %shl_lhs, %cst(s32)
; LOWER: %cmp:_(s32) = G_ICMP intpred(slt), %cmp_lhs(s32), %cmp_rhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: dont_swap_shift_s32_cst_too_large
; SELECT: liveins: $w0, $w1
; SELECT: %cmp_rhs:gpr32 = COPY $w1
; SELECT: %shl_lhs:gpr32 = COPY $w0
; SELECT: %cst:gpr32 = MOVi32imm 32
; SELECT: %cmp_lhs:gpr32 = LSLVWr %shl_lhs, %cst
; SELECT: [[SUBSWrr:%[0-9]+]]:gpr32 = SUBSWrr %cmp_lhs, %cmp_rhs, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 10, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%cmp_rhs:_(s32) = COPY $w1
%shl_lhs:_(s32) = COPY $w0
%cst:_(s32) = G_CONSTANT i32 32
%cmp_lhs:_(s32) = G_SHL %shl_lhs, %cst(s32)
%cmp:_(s32) = G_ICMP intpred(slt), %cmp_lhs(s32), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: dont_swap_cmn_lhs_no_folding_opportunities
legalized: true
tracksRegLiveness: true
body: |
bb.0.entry:
liveins: $x0, $x1
; No reason to swap a CMN on the LHS when it won't introduce a constant
; folding opportunity. We can recognise CMNs on the LHS and RHS, so there's
; nothing to gain here.
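; (The G_SUB 0, x is selected as an ADDS/CMN whether it sits on the LHS or
; the RHS, as the ADDSXrr below shows.)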
; LOWER-LABEL: name: dont_swap_cmn_lhs_no_folding_opportunities
; LOWER: liveins: $x0, $x1
; LOWER: %cmp_rhs:_(s64) = COPY $x1
; LOWER: %sub_rhs:_(s64) = COPY $x0
; LOWER: %zero:_(s64) = G_CONSTANT i64 0
; LOWER: %cmp_lhs:_(s64) = G_SUB %zero, %sub_rhs
; LOWER: %cmp:_(s32) = G_ICMP intpred(ne), %cmp_lhs(s64), %cmp_rhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: dont_swap_cmn_lhs_no_folding_opportunities
; SELECT: liveins: $x0, $x1
; SELECT: %cmp_rhs:gpr64 = COPY $x1
; SELECT: %sub_rhs:gpr64 = COPY $x0
; SELECT: [[ADDSXrr:%[0-9]+]]:gpr64 = ADDSXrr %sub_rhs, %cmp_rhs, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 0, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%cmp_rhs:_(s64) = COPY $x1
%sub_rhs:_(s64) = COPY $x0
%zero:_(s64) = G_CONSTANT i64 0
%cmp_lhs:_(s64) = G_SUB %zero, %sub_rhs
%cmp:_(s32) = G_ICMP intpred(ne), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: swap_cmn_lhs
legalized: true
tracksRegLiveness: true
body: |
bb.0.entry:
liveins: $x0, $x1
; Swap when we can see a constant folding opportunity through the sub on
; the LHS.
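; (Here the swap lets the shift-by-63 fold into the ADDSXrs in the SELECT
; output below.)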
; LOWER-LABEL: name: swap_cmn_lhs
; LOWER: liveins: $x0, $x1
; LOWER: %cmp_rhs:_(s64) = COPY $x1
; LOWER: %shl_lhs:_(s64) = COPY $x0
; LOWER: %zero:_(s64) = G_CONSTANT i64 0
; LOWER: %cst:_(s64) = G_CONSTANT i64 63
; LOWER: %sub_rhs:_(s64) = G_SHL %shl_lhs, %cst(s64)
; LOWER: %cmp_lhs:_(s64) = G_SUB %zero, %sub_rhs
; LOWER: %cmp:_(s32) = G_ICMP intpred(ne), %cmp_rhs(s64), %cmp_lhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: swap_cmn_lhs
; SELECT: liveins: $x0, $x1
; SELECT: %cmp_rhs:gpr64 = COPY $x1
; SELECT: %shl_lhs:gpr64 = COPY $x0
; SELECT: [[ADDSXrs:%[0-9]+]]:gpr64 = ADDSXrs %cmp_rhs, %shl_lhs, 63, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 0, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%cmp_rhs:_(s64) = COPY $x1
%shl_lhs:_(s64) = COPY $x0
%zero:_(s64) = G_CONSTANT i64 0
%cst:_(s64) = G_CONSTANT i64 63
%sub_rhs:_(s64) = G_SHL %shl_lhs, %cst(s64)
%cmp_lhs:_(s64) = G_SUB %zero, %sub_rhs
%cmp:_(s32) = G_ICMP intpred(ne), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: dont_swap_cmn_lhs_when_rhs_more_profitable
legalized: true
tracksRegLiveness: true
body: |
bb.0.entry:
liveins: $x0, $x1
; Don't swap when the RHS's subtract offers a better constant folding
; opportunity than the LHS's subtract.
;
; In this case, the RHS has a supported extend, plus a shift with a constant
; <= 4.
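; (An arithmetic extended-register operand only allows a left shift of 0-4
; on the extended value, hence the 4 threshold.)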
; LOWER-LABEL: name: dont_swap_cmn_lhs_when_rhs_more_profitable
; LOWER: liveins: $x0, $x1
; LOWER: %zero:_(s64) = G_CONSTANT i64 0
; LOWER: %reg0:_(s64) = COPY $x0
; LOWER: %shl_cst:_(s64) = G_CONSTANT i64 63
; LOWER: %shl:_(s64) = G_SHL %reg0, %shl_cst(s64)
; LOWER: %cmp_lhs:_(s64) = G_SUB %zero, %shl
; LOWER: %reg1:_(s64) = COPY $x1
; LOWER: %sext_in_reg:_(s64) = G_SEXT_INREG %reg1, 1
; LOWER: %ashr_cst:_(s64) = G_CONSTANT i64 3
; LOWER: %ashr:_(s64) = G_ASHR %sext_in_reg, %ashr_cst(s64)
; LOWER: %cmp_rhs:_(s64) = G_SUB %zero, %ashr
; LOWER: %cmp:_(s32) = G_ICMP intpred(eq), %cmp_lhs(s64), %cmp_rhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: dont_swap_cmn_lhs_when_rhs_more_profitable
; SELECT: liveins: $x0, $x1
; SELECT: %reg0:gpr64 = COPY $x0
; SELECT: %shl:gpr64 = UBFMXri %reg0, 1, 0
; SELECT: %zero:gpr64 = COPY $xzr
; SELECT: %reg1:gpr64 = COPY $x1
; SELECT: %sext_in_reg:gpr64 = SBFMXri %reg1, 0, 0
; SELECT: %cmp_rhs:gpr64 = SUBSXrs %zero, %sext_in_reg, 131, implicit-def $nzcv
; SELECT: [[ADDSXrr:%[0-9]+]]:gpr64 = ADDSXrr %shl, %cmp_rhs, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 1, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%zero:_(s64) = G_CONSTANT i64 0
%reg0:_(s64) = COPY $x0
%shl_cst:_(s64) = G_CONSTANT i64 63
%shl:_(s64) = G_SHL %reg0, %shl_cst(s64)
%cmp_lhs:_(s64) = G_SUB %zero, %shl
%reg1:_(s64) = COPY $x1
%sext_in_reg:_(s64) = G_SEXT_INREG %reg1, 1
%ashr_cst:_(s64) = G_CONSTANT i64 3
%ashr:_(s64) = G_ASHR %sext_in_reg, %ashr_cst(s64)
%cmp_rhs:_(s64) = G_SUB %zero, %ashr
%cmp:_(s32) = G_ICMP intpred(eq), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: dont_swap_rhs_with_supported_extend
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; The RHS offers more constant folding opportunities than the LHS.
; LOWER-LABEL: name: dont_swap_rhs_with_supported_extend
; LOWER: liveins: $x0, $x1
; LOWER: %reg0:_(s64) = COPY $x0
; LOWER: %lhs_cst:_(s64) = G_CONSTANT i64 1
; LOWER: %cmp_lhs:_(s64) = G_SHL %reg0, %lhs_cst(s64)
; LOWER: %reg1:_(s64) = COPY $x1
; LOWER: %and_mask:_(s64) = G_CONSTANT i64 255
; LOWER: %and:_(s64) = G_AND %reg1, %and_mask
; LOWER: %rhs_cst:_(s64) = G_CONSTANT i64 1
; LOWER: %cmp_rhs:_(s64) = G_ASHR %and, %rhs_cst(s64)
; LOWER: %cmp:_(s32) = G_ICMP intpred(slt), %cmp_lhs(s64), %cmp_rhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: dont_swap_rhs_with_supported_extend
; SELECT: liveins: $x0, $x1
; SELECT: %reg0:gpr64 = COPY $x0
; SELECT: %cmp_lhs:gpr64 = UBFMXri %reg0, 63, 62
; SELECT: %reg1:gpr64 = COPY $x1
; SELECT: %and:gpr64common = ANDXri %reg1, 4103
; SELECT: [[SUBSXrs:%[0-9]+]]:gpr64 = SUBSXrs %cmp_lhs, %and, 129, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 10, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%reg0:_(s64) = COPY $x0
%lhs_cst:_(s64) = G_CONSTANT i64 1
%cmp_lhs:_(s64) = G_SHL %reg0, %lhs_cst(s64)
%reg1:_(s64) = COPY $x1
%and_mask:_(s64) = G_CONSTANT i64 255
%and:_(s64) = G_AND %reg1, %and_mask(s64)
%rhs_cst:_(s64) = G_CONSTANT i64 1
%cmp_rhs:_(s64) = G_ASHR %and, %rhs_cst(s64)
%cmp:_(s32) = G_ICMP intpred(slt), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0
...
---
name: swap_rhs_with_supported_extend
legalized: true
tracksRegLiveness: true
body: |
bb.0:
liveins: $x0, $x1
; In this case, both the LHS and RHS are fed by a supported extend. However,
; the LHS's shift has a constant <= 4. This makes the LHS the more profitable
; operand to fold, so we should swap the operands.
; LOWER-LABEL: name: swap_rhs_with_supported_extend
; LOWER: liveins: $x0, $x1
; LOWER: %reg0:_(s64) = COPY $x0
; LOWER: %and_mask:_(s64) = G_CONSTANT i64 255
; LOWER: %and:_(s64) = G_AND %reg0, %and_mask
; LOWER: %lhs_cst:_(s64) = G_CONSTANT i64 1
; LOWER: %cmp_lhs:_(s64) = G_SHL %and, %lhs_cst(s64)
; LOWER: %rhs_cst:_(s64) = G_CONSTANT i64 5
; LOWER: %cmp_rhs:_(s64) = G_ASHR %and, %rhs_cst(s64)
; LOWER: %cmp:_(s32) = G_ICMP intpred(slt), %cmp_rhs(s64), %cmp_lhs
; LOWER: $w0 = COPY %cmp(s32)
; LOWER: RET_ReallyLR implicit $w0
; SELECT-LABEL: name: swap_rhs_with_supported_extend
; SELECT: liveins: $x0, $x1
; SELECT: %reg0:gpr64 = COPY $x0
; SELECT: %and:gpr64common = ANDXri %reg0, 4103
; SELECT: [[COPY:%[0-9]+]]:gpr32all = COPY %reg0.sub_32
; SELECT: [[COPY1:%[0-9]+]]:gpr32 = COPY [[COPY]]
; SELECT: %cmp_rhs:gpr64common = SBFMXri %and, 5, 63
; SELECT: [[SUBSXrx:%[0-9]+]]:gpr64 = SUBSXrx %cmp_rhs, [[COPY1]], 1, implicit-def $nzcv
; SELECT: %cmp:gpr32 = CSINCWr $wzr, $wzr, 10, implicit $nzcv
; SELECT: $w0 = COPY %cmp
; SELECT: RET_ReallyLR implicit $w0
%reg0:_(s64) = COPY $x0
%and_mask:_(s64) = G_CONSTANT i64 255
%and:_(s64) = G_AND %reg0, %and_mask(s64)
%lhs_cst:_(s64) = G_CONSTANT i64 1
%cmp_lhs:_(s64) = G_SHL %and, %lhs_cst(s64)
%rhs_cst:_(s64) = G_CONSTANT i64 5
%cmp_rhs:_(s64) = G_ASHR %and, %rhs_cst(s64)
%cmp:_(s32) = G_ICMP intpred(sgt), %cmp_lhs(s64), %cmp_rhs
$w0 = COPY %cmp(s32)
RET_ReallyLR implicit $w0