; blob: 0e1e15f9b6b912eaa527ad154f10ba36429b2d4e [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=arm64-eabi -aarch64-neon-syntax=apple | FileCheck %s --check-prefixes=CHECK,CHECK-SD
; RUN: llc < %s -mtriple=arm64-eabi -aarch64-neon-syntax=apple -global-isel | FileCheck %s --check-prefixes=CHECK,CHECK-GI
; Splat mask 0x07 keeps the low 3 bits of every %src1 lane, exactly the bits
; that shifting %src2 left by 3 vacates. SelectionDAG folds the and/shl/or
; into a single sli #3; GlobalISel emits the unfused movi/shl/and/orr.
define void @testLeftGood8x8(<8 x i8> %src1, <8 x i8> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftGood8x8:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sli.8b v0, v1, #3
; CHECK-SD-NEXT: str d0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftGood8x8:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: movi.8b v2, #7
; CHECK-GI-NEXT: shl.8b v1, v1, #3
; CHECK-GI-NEXT: and.8b v0, v0, v2
; CHECK-GI-NEXT: orr.8b v0, v0, v1
; CHECK-GI-NEXT: str d0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <8 x i8> %src1, <i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7>
  %shl = shl <8 x i8> %src2, <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>
  %merged = or <8 x i8> %masked, %shl
  store <8 x i8> %merged, ptr %dest, align 8
  ret void
}
; Negative case: splat mask 0xA5 is not the 0x01 mask that a left shift by 1
; would require, so no sli appears. SelectionDAG expresses the shift by one as
; add v1, v1, v1; GlobalISel keeps shl #1.
define void @testLeftBad8x8(<8 x i8> %src1, <8 x i8> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftBad8x8:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: movi.8b v2, #165
; CHECK-SD-NEXT: add.8b v1, v1, v1
; CHECK-SD-NEXT: and.8b v0, v0, v2
; CHECK-SD-NEXT: orr.8b v0, v0, v1
; CHECK-SD-NEXT: str d0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftBad8x8:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: movi.8b v2, #165
; CHECK-GI-NEXT: shl.8b v1, v1, #1
; CHECK-GI-NEXT: and.8b v0, v0, v2
; CHECK-GI-NEXT: orr.8b v0, v0, v1
; CHECK-GI-NEXT: str d0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <8 x i8> %src1, <i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165>
  %shl = shl <8 x i8> %src2, <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>
  %merged = or <8 x i8> %masked, %shl
  store <8 x i8> %merged, ptr %dest, align 8
  ret void
}
; Splat mask 0xE0 keeps the top 3 bits of every %src1 lane, exactly the bits
; that a logical right shift of %src2 by 3 clears. SelectionDAG folds the
; pattern into sri #3; GlobalISel emits movi/ushr/and/orr.
define void @testRightGood8x8(<8 x i8> %src1, <8 x i8> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightGood8x8:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sri.8b v0, v1, #3
; CHECK-SD-NEXT: str d0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightGood8x8:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: movi.8b v2, #224
; CHECK-GI-NEXT: ushr.8b v1, v1, #3
; CHECK-GI-NEXT: and.8b v0, v0, v2
; CHECK-GI-NEXT: orr.8b v0, v0, v1
; CHECK-GI-NEXT: str d0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <8 x i8> %src1, <i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224>
  %shr = lshr <8 x i8> %src2, <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>
  %merged = or <8 x i8> %masked, %shr
  store <8 x i8> %merged, ptr %dest, align 8
  ret void
}
; Negative case: splat mask 0xA5 is not the 0x80 mask that a right shift by 1
; would require, so no sri appears. Both instruction selectors are expected to
; produce the same movi/ushr/and/orr sequence.
define void @testRightBad8x8(<8 x i8> %src1, <8 x i8> %src2, ptr %dest) nounwind {
; CHECK-LABEL: testRightBad8x8:
; CHECK: // %bb.0:
; CHECK-NEXT: movi.8b v2, #165
; CHECK-NEXT: ushr.8b v1, v1, #1
; CHECK-NEXT: and.8b v0, v0, v2
; CHECK-NEXT: orr.8b v0, v0, v1
; CHECK-NEXT: str d0, [x0]
; CHECK-NEXT: ret
  %masked = and <8 x i8> %src1, <i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165>
  %shr = lshr <8 x i8> %src2, <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>
  %merged = or <8 x i8> %masked, %shr
  store <8 x i8> %merged, ptr %dest, align 8
  ret void
}
; 128-bit variant of the 8 x i8 left-shift case: mask 0x07 with shl 3.
; SelectionDAG selects sli.16b #3; GlobalISel emits movi/shl/and/orr.
define void @testLeftGood16x8(<16 x i8> %src1, <16 x i8> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftGood16x8:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sli.16b v0, v1, #3
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftGood16x8:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: movi.16b v2, #7
; CHECK-GI-NEXT: shl.16b v1, v1, #3
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <16 x i8> %src1, <i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7, i8 7>
  %shl = shl <16 x i8> %src2, <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>
  %merged = or <16 x i8> %masked, %shl
  store <16 x i8> %merged, ptr %dest, align 16
  ret void
}
; Negative 128-bit case: mask 0xA5 does not match a left shift by 1 (which
; would need 0x01), so no sli appears. SelectionDAG uses add v1, v1, v1 for
; the shift; GlobalISel keeps shl #1.
define void @testLeftBad16x8(<16 x i8> %src1, <16 x i8> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftBad16x8:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: movi.16b v2, #165
; CHECK-SD-NEXT: add.16b v1, v1, v1
; CHECK-SD-NEXT: and.16b v0, v0, v2
; CHECK-SD-NEXT: orr.16b v0, v0, v1
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftBad16x8:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: movi.16b v2, #165
; CHECK-GI-NEXT: shl.16b v1, v1, #1
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <16 x i8> %src1, <i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165>
  %shl = shl <16 x i8> %src2, <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>
  %merged = or <16 x i8> %masked, %shl
  store <16 x i8> %merged, ptr %dest, align 16
  ret void
}
; 128-bit variant of the 8 x i8 right-shift case: mask 0xE0 with lshr 3.
; SelectionDAG selects sri.16b #3; GlobalISel emits movi/ushr/and/orr.
define void @testRightGood16x8(<16 x i8> %src1, <16 x i8> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightGood16x8:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sri.16b v0, v1, #3
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightGood16x8:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: movi.16b v2, #224
; CHECK-GI-NEXT: ushr.16b v1, v1, #3
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <16 x i8> %src1, <i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224, i8 224>
  %shr = lshr <16 x i8> %src2, <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>
  %merged = or <16 x i8> %masked, %shr
  store <16 x i8> %merged, ptr %dest, align 16
  ret void
}
; Negative 128-bit case: mask 0xA5 does not match a right shift by 1 (which
; would need 0x80), so no sri appears. Both instruction selectors are expected
; to produce the same movi/ushr/and/orr sequence.
define void @testRightBad16x8(<16 x i8> %src1, <16 x i8> %src2, ptr %dest) nounwind {
; CHECK-LABEL: testRightBad16x8:
; CHECK: // %bb.0:
; CHECK-NEXT: movi.16b v2, #165
; CHECK-NEXT: ushr.16b v1, v1, #1
; CHECK-NEXT: and.16b v0, v0, v2
; CHECK-NEXT: orr.16b v0, v0, v1
; CHECK-NEXT: str q0, [x0]
; CHECK-NEXT: ret
  %masked = and <16 x i8> %src1, <i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165, i8 165>
  %shr = lshr <16 x i8> %src2, <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>
  %merged = or <16 x i8> %masked, %shr
  store <16 x i8> %merged, ptr %dest, align 16
  ret void
}
; Splat mask 0x3FFF (16383) keeps the low 14 bits of each 16-bit lane, which
; matches a left shift by 14. SelectionDAG selects sli.4h #14; GlobalISel
; builds the mask with mvni and emits shl/and/orr.
define void @testLeftGood4x16(<4 x i16> %src1, <4 x i16> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftGood4x16:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sli.4h v0, v1, #14
; CHECK-SD-NEXT: str d0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftGood4x16:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: mvni.4h v2, #192, lsl #8
; CHECK-GI-NEXT: shl.4h v1, v1, #14
; CHECK-GI-NEXT: and.8b v0, v0, v2
; CHECK-GI-NEXT: orr.8b v0, v0, v1
; CHECK-GI-NEXT: str d0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <4 x i16> %src1, <i16 16383, i16 16383, i16 16383, i16 16383>
  %shl = shl <4 x i16> %src2, <i16 14, i16 14, i16 14, i16 14>
  %merged = or <4 x i16> %masked, %shl
  store <4 x i16> %merged, ptr %dest, align 8
  ret void
}
; Negative case: splat mask 0x4074 (16500) is not the 0x3FFF mask a left
; shift by 14 would require, so no sli appears. SelectionDAG materializes the
; mask with mov + dup; GlobalISel loads it from the constant pool.
define void @testLeftBad4x16(<4 x i16> %src1, <4 x i16> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftBad4x16:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: mov w8, #16500 // =0x4074
; CHECK-SD-NEXT: shl.4h v1, v1, #14
; CHECK-SD-NEXT: dup.4h v2, w8
; CHECK-SD-NEXT: and.8b v0, v0, v2
; CHECK-SD-NEXT: orr.8b v0, v0, v1
; CHECK-SD-NEXT: str d0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftBad4x16:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: adrp x8, .LCPI9_0
; CHECK-GI-NEXT: shl.4h v1, v1, #14
; CHECK-GI-NEXT: ldr d2, [x8, :lo12:.LCPI9_0]
; CHECK-GI-NEXT: and.8b v0, v0, v2
; CHECK-GI-NEXT: orr.8b v0, v0, v1
; CHECK-GI-NEXT: str d0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <4 x i16> %src1, <i16 16500, i16 16500, i16 16500, i16 16500>
  %shl = shl <4 x i16> %src2, <i16 14, i16 14, i16 14, i16 14>
  %merged = or <4 x i16> %masked, %shl
  store <4 x i16> %merged, ptr %dest, align 8
  ret void
}
; Splat mask 0xFFFC (65532) keeps the top 14 bits of each 16-bit lane, which
; matches a logical right shift by 14. SelectionDAG selects sri.4h #14;
; GlobalISel builds the mask with mvni and emits ushr/and/orr.
define void @testRightGood4x16(<4 x i16> %src1, <4 x i16> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightGood4x16:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sri.4h v0, v1, #14
; CHECK-SD-NEXT: str d0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightGood4x16:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: mvni.4h v2, #3
; CHECK-GI-NEXT: ushr.4h v1, v1, #14
; CHECK-GI-NEXT: and.8b v0, v0, v2
; CHECK-GI-NEXT: orr.8b v0, v0, v1
; CHECK-GI-NEXT: str d0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <4 x i16> %src1, <i16 65532, i16 65532, i16 65532, i16 65532>
  %shr = lshr <4 x i16> %src2, <i16 14, i16 14, i16 14, i16 14>
  %merged = or <4 x i16> %masked, %shr
  store <4 x i16> %merged, ptr %dest, align 8
  ret void
}
; Negative case: splat mask 0x4074 (16500) is not the 0xFFFC mask a right
; shift by 14 would require, so no sri appears. SelectionDAG is expected to
; emit and + usra here; presumably the or can become an accumulate because
; 0x4074 has its low two bits clear, so the operands share no set bits.
; GlobalISel loads the mask from the constant pool and emits ushr/and/orr.
define void @testRightBad4x16(<4 x i16> %src1, <4 x i16> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightBad4x16:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: mov w8, #16500 // =0x4074
; CHECK-SD-NEXT: dup.4h v2, w8
; CHECK-SD-NEXT: and.8b v0, v0, v2
; CHECK-SD-NEXT: usra.4h v0, v1, #14
; CHECK-SD-NEXT: str d0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightBad4x16:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: adrp x8, .LCPI11_0
; CHECK-GI-NEXT: ushr.4h v1, v1, #14
; CHECK-GI-NEXT: ldr d2, [x8, :lo12:.LCPI11_0]
; CHECK-GI-NEXT: and.8b v0, v0, v2
; CHECK-GI-NEXT: orr.8b v0, v0, v1
; CHECK-GI-NEXT: str d0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <4 x i16> %src1, <i16 16500, i16 16500, i16 16500, i16 16500>
  %shr = lshr <4 x i16> %src2, <i16 14, i16 14, i16 14, i16 14>
  %merged = or <4 x i16> %masked, %shr
  store <4 x i16> %merged, ptr %dest, align 8
  ret void
}
; 128-bit variant of the 4 x i16 left-shift case: mask 0x3FFF with shl 14.
; SelectionDAG selects sli.8h #14; GlobalISel emits mvni/shl/and/orr.
define void @testLeftGood8x16(<8 x i16> %src1, <8 x i16> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftGood8x16:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sli.8h v0, v1, #14
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftGood8x16:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: mvni.8h v2, #192, lsl #8
; CHECK-GI-NEXT: shl.8h v1, v1, #14
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <8 x i16> %src1, <i16 16383, i16 16383, i16 16383, i16 16383, i16 16383, i16 16383, i16 16383, i16 16383>
  %shl = shl <8 x i16> %src2, <i16 14, i16 14, i16 14, i16 14, i16 14, i16 14, i16 14, i16 14>
  %merged = or <8 x i16> %masked, %shl
  store <8 x i16> %merged, ptr %dest, align 16
  ret void
}
; Negative 128-bit case: mask 0x4074 does not match a left shift by 14 (which
; would need 0x3FFF), so no sli appears. SelectionDAG materializes the mask
; with mov + dup; GlobalISel loads it from the constant pool.
define void @testLeftBad8x16(<8 x i16> %src1, <8 x i16> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftBad8x16:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: mov w8, #16500 // =0x4074
; CHECK-SD-NEXT: shl.8h v1, v1, #14
; CHECK-SD-NEXT: dup.8h v2, w8
; CHECK-SD-NEXT: and.16b v0, v0, v2
; CHECK-SD-NEXT: orr.16b v0, v0, v1
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftBad8x16:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: adrp x8, .LCPI13_0
; CHECK-GI-NEXT: shl.8h v1, v1, #14
; CHECK-GI-NEXT: ldr q2, [x8, :lo12:.LCPI13_0]
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <8 x i16> %src1, <i16 16500, i16 16500, i16 16500, i16 16500, i16 16500, i16 16500, i16 16500, i16 16500>
  %shl = shl <8 x i16> %src2, <i16 14, i16 14, i16 14, i16 14, i16 14, i16 14, i16 14, i16 14>
  %merged = or <8 x i16> %masked, %shl
  store <8 x i16> %merged, ptr %dest, align 16
  ret void
}
; 128-bit variant of the 4 x i16 right-shift case: mask 0xFFFC with lshr 14.
; SelectionDAG selects sri.8h #14; GlobalISel emits mvni/ushr/and/orr.
define void @testRightGood8x16(<8 x i16> %src1, <8 x i16> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightGood8x16:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sri.8h v0, v1, #14
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightGood8x16:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: mvni.8h v2, #3
; CHECK-GI-NEXT: ushr.8h v1, v1, #14
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <8 x i16> %src1, <i16 65532, i16 65532, i16 65532, i16 65532, i16 65532, i16 65532, i16 65532, i16 65532>
  %shr = lshr <8 x i16> %src2, <i16 14, i16 14, i16 14, i16 14, i16 14, i16 14, i16 14, i16 14>
  %merged = or <8 x i16> %masked, %shr
  store <8 x i16> %merged, ptr %dest, align 16
  ret void
}
; Negative 128-bit case: mask 0x4074 does not match a right shift by 14 (which
; would need 0xFFFC), so no sri appears. SelectionDAG is expected to emit
; and + usra; presumably the or can become an accumulate because 0x4074 has
; its low two bits clear, so the operands share no set bits. GlobalISel loads
; the mask from the constant pool and emits ushr/and/orr.
define void @testRightBad8x16(<8 x i16> %src1, <8 x i16> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightBad8x16:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: mov w8, #16500 // =0x4074
; CHECK-SD-NEXT: dup.8h v2, w8
; CHECK-SD-NEXT: and.16b v0, v0, v2
; CHECK-SD-NEXT: usra.8h v0, v1, #14
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightBad8x16:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: adrp x8, .LCPI15_0
; CHECK-GI-NEXT: ushr.8h v1, v1, #14
; CHECK-GI-NEXT: ldr q2, [x8, :lo12:.LCPI15_0]
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <8 x i16> %src1, <i16 16500, i16 16500, i16 16500, i16 16500, i16 16500, i16 16500, i16 16500, i16 16500>
  %shr = lshr <8 x i16> %src2, <i16 14, i16 14, i16 14, i16 14, i16 14, i16 14, i16 14, i16 14>
  %merged = or <8 x i16> %masked, %shr
  store <8 x i16> %merged, ptr %dest, align 16
  ret void
}
; Splat mask 0x003FFFFF (4194303) keeps the low 22 bits of each 32-bit lane,
; which matches a left shift by 22. SelectionDAG selects sli.2s #22;
; GlobalISel builds the mask with movi ... msl and emits shl/and/orr.
define void @testLeftGood2x32(<2 x i32> %src1, <2 x i32> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftGood2x32:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sli.2s v0, v1, #22
; CHECK-SD-NEXT: str d0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftGood2x32:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: movi.2s v2, #63, msl #16
; CHECK-GI-NEXT: shl.2s v1, v1, #22
; CHECK-GI-NEXT: and.8b v0, v0, v2
; CHECK-GI-NEXT: orr.8b v0, v0, v1
; CHECK-GI-NEXT: str d0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <2 x i32> %src1, <i32 4194303, i32 4194303>
  %shl = shl <2 x i32> %src2, <i32 22, i32 22>
  %merged = or <2 x i32> %masked, %shl
  store <2 x i32> %merged, ptr %dest, align 8
  ret void
}
; Negative case: splat mask 0x003FFFFC (4194300) is not the 0x003FFFFF mask a
; left shift by 22 would require, so no sli appears. SelectionDAG materializes
; the mask with mov + dup; GlobalISel loads it from the constant pool.
define void @testLeftBad2x32(<2 x i32> %src1, <2 x i32> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftBad2x32:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: mov w8, #4194300 // =0x3ffffc
; CHECK-SD-NEXT: shl.2s v1, v1, #22
; CHECK-SD-NEXT: dup.2s v2, w8
; CHECK-SD-NEXT: and.8b v0, v0, v2
; CHECK-SD-NEXT: orr.8b v0, v0, v1
; CHECK-SD-NEXT: str d0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftBad2x32:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: adrp x8, .LCPI17_0
; CHECK-GI-NEXT: shl.2s v1, v1, #22
; CHECK-GI-NEXT: ldr d2, [x8, :lo12:.LCPI17_0]
; CHECK-GI-NEXT: and.8b v0, v0, v2
; CHECK-GI-NEXT: orr.8b v0, v0, v1
; CHECK-GI-NEXT: str d0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <2 x i32> %src1, <i32 4194300, i32 4194300>
  %shl = shl <2 x i32> %src2, <i32 22, i32 22>
  %merged = or <2 x i32> %masked, %shl
  store <2 x i32> %merged, ptr %dest, align 8
  ret void
}
; Splat mask 0xFFFFFC00 (4294966272) keeps the top 22 bits of each 32-bit
; lane, which matches a logical right shift by 22. SelectionDAG selects
; sri.2s #22; GlobalISel builds the mask with mvni ... msl and emits
; ushr/and/orr.
define void @testRightGood2x32(<2 x i32> %src1, <2 x i32> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightGood2x32:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sri.2s v0, v1, #22
; CHECK-SD-NEXT: str d0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightGood2x32:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: mvni.2s v2, #3, msl #8
; CHECK-GI-NEXT: ushr.2s v1, v1, #22
; CHECK-GI-NEXT: and.8b v0, v0, v2
; CHECK-GI-NEXT: orr.8b v0, v0, v1
; CHECK-GI-NEXT: str d0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <2 x i32> %src1, <i32 4294966272, i32 4294966272>
  %shr = lshr <2 x i32> %src2, <i32 22, i32 22>
  %merged = or <2 x i32> %masked, %shr
  store <2 x i32> %merged, ptr %dest, align 8
  ret void
}
; Negative case: splat mask 0x003FFFFC (4194300) is not the 0xFFFFFC00 mask a
; right shift by 22 would require, so no sri appears. SelectionDAG
; materializes the mask with mov + dup; GlobalISel loads it from the constant
; pool. Both finish with and/orr.
define void @testRightBad2x32(<2 x i32> %src1, <2 x i32> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightBad2x32:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: mov w8, #4194300 // =0x3ffffc
; CHECK-SD-NEXT: ushr.2s v1, v1, #22
; CHECK-SD-NEXT: dup.2s v2, w8
; CHECK-SD-NEXT: and.8b v0, v0, v2
; CHECK-SD-NEXT: orr.8b v0, v0, v1
; CHECK-SD-NEXT: str d0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightBad2x32:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: adrp x8, .LCPI19_0
; CHECK-GI-NEXT: ushr.2s v1, v1, #22
; CHECK-GI-NEXT: ldr d2, [x8, :lo12:.LCPI19_0]
; CHECK-GI-NEXT: and.8b v0, v0, v2
; CHECK-GI-NEXT: orr.8b v0, v0, v1
; CHECK-GI-NEXT: str d0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <2 x i32> %src1, <i32 4194300, i32 4194300>
  %shr = lshr <2 x i32> %src2, <i32 22, i32 22>
  %merged = or <2 x i32> %masked, %shr
  store <2 x i32> %merged, ptr %dest, align 8
  ret void
}
; 128-bit variant of the 2 x i32 left-shift case: mask 0x003FFFFF with shl 22.
; SelectionDAG selects sli.4s #22; GlobalISel emits movi/shl/and/orr.
define void @testLeftGood4x32(<4 x i32> %src1, <4 x i32> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftGood4x32:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sli.4s v0, v1, #22
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftGood4x32:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: movi.4s v2, #63, msl #16
; CHECK-GI-NEXT: shl.4s v1, v1, #22
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <4 x i32> %src1, <i32 4194303, i32 4194303, i32 4194303, i32 4194303>
  %shl = shl <4 x i32> %src2, <i32 22, i32 22, i32 22, i32 22>
  %merged = or <4 x i32> %masked, %shl
  store <4 x i32> %merged, ptr %dest, align 16
  ret void
}
; Negative 128-bit case: mask 0x003FFFFC does not match a left shift by 22
; (which would need 0x003FFFFF), so no sli appears. SelectionDAG materializes
; the mask with mov + dup; GlobalISel loads it from the constant pool.
define void @testLeftBad4x32(<4 x i32> %src1, <4 x i32> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftBad4x32:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: mov w8, #4194300 // =0x3ffffc
; CHECK-SD-NEXT: shl.4s v1, v1, #22
; CHECK-SD-NEXT: dup.4s v2, w8
; CHECK-SD-NEXT: and.16b v0, v0, v2
; CHECK-SD-NEXT: orr.16b v0, v0, v1
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftBad4x32:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: adrp x8, .LCPI21_0
; CHECK-GI-NEXT: shl.4s v1, v1, #22
; CHECK-GI-NEXT: ldr q2, [x8, :lo12:.LCPI21_0]
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <4 x i32> %src1, <i32 4194300, i32 4194300, i32 4194300, i32 4194300>
  %shl = shl <4 x i32> %src2, <i32 22, i32 22, i32 22, i32 22>
  %merged = or <4 x i32> %masked, %shl
  store <4 x i32> %merged, ptr %dest, align 16
  ret void
}
; 128-bit variant of the 2 x i32 right-shift case: mask 0xFFFFFC00 with
; lshr 22. SelectionDAG selects sri.4s #22; GlobalISel emits
; mvni/ushr/and/orr.
define void @testRightGood4x32(<4 x i32> %src1, <4 x i32> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightGood4x32:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sri.4s v0, v1, #22
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightGood4x32:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: mvni.4s v2, #3, msl #8
; CHECK-GI-NEXT: ushr.4s v1, v1, #22
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <4 x i32> %src1, <i32 4294966272, i32 4294966272, i32 4294966272, i32 4294966272>
  %shr = lshr <4 x i32> %src2, <i32 22, i32 22, i32 22, i32 22>
  %merged = or <4 x i32> %masked, %shr
  store <4 x i32> %merged, ptr %dest, align 16
  ret void
}
; Negative 128-bit case: mask 0x003FFFFC does not match a right shift by 22
; (which would need 0xFFFFFC00), so no sri appears. SelectionDAG materializes
; the mask with mov + dup; GlobalISel loads it from the constant pool.
define void @testRightBad4x32(<4 x i32> %src1, <4 x i32> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightBad4x32:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: mov w8, #4194300 // =0x3ffffc
; CHECK-SD-NEXT: ushr.4s v1, v1, #22
; CHECK-SD-NEXT: dup.4s v2, w8
; CHECK-SD-NEXT: and.16b v0, v0, v2
; CHECK-SD-NEXT: orr.16b v0, v0, v1
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightBad4x32:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: adrp x8, .LCPI23_0
; CHECK-GI-NEXT: ushr.4s v1, v1, #22
; CHECK-GI-NEXT: ldr q2, [x8, :lo12:.LCPI23_0]
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <4 x i32> %src1, <i32 4194300, i32 4194300, i32 4194300, i32 4194300>
  %shr = lshr <4 x i32> %src2, <i32 22, i32 22, i32 22, i32 22>
  %merged = or <4 x i32> %masked, %shr
  store <4 x i32> %merged, ptr %dest, align 16
  ret void
}
; Splat mask 0x0000FFFFFFFFFFFF (281474976710655) keeps the low 48 bits of
; each 64-bit lane, which matches a left shift by 48. SelectionDAG selects
; sli.2d #48; GlobalISel builds the mask with movi.2d and emits shl/and/orr.
define void @testLeftGood2x64(<2 x i64> %src1, <2 x i64> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftGood2x64:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sli.2d v0, v1, #48
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftGood2x64:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: movi.2d v2, #0x00ffffffffffff
; CHECK-GI-NEXT: shl.2d v1, v1, #48
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <2 x i64> %src1, <i64 281474976710655, i64 281474976710655>
  %shl = shl <2 x i64> %src2, <i64 48, i64 48>
  %merged = or <2 x i64> %masked, %shl
  store <2 x i64> %merged, ptr %dest, align 16
  ret void
}
; Negative case: splat mask 0x000100000000000A (281474976710666) is not the
; 0x0000FFFFFFFFFFFF mask a left shift by 48 would require, so no sli appears.
; SelectionDAG materializes the mask with mov/movk + dup; GlobalISel loads it
; from the constant pool.
define void @testLeftBad2x64(<2 x i64> %src1, <2 x i64> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftBad2x64:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: mov x8, #10 // =0xa
; CHECK-SD-NEXT: shl.2d v1, v1, #48
; CHECK-SD-NEXT: movk x8, #1, lsl #48
; CHECK-SD-NEXT: dup.2d v2, x8
; CHECK-SD-NEXT: and.16b v0, v0, v2
; CHECK-SD-NEXT: orr.16b v0, v0, v1
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftBad2x64:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: adrp x8, .LCPI25_0
; CHECK-GI-NEXT: shl.2d v1, v1, #48
; CHECK-GI-NEXT: ldr q2, [x8, :lo12:.LCPI25_0]
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <2 x i64> %src1, <i64 281474976710666, i64 281474976710666>
  %shl = shl <2 x i64> %src2, <i64 48, i64 48>
  %merged = or <2 x i64> %masked, %shl
  store <2 x i64> %merged, ptr %dest, align 16
  ret void
}
; Splat mask 0xFFFFFFFFFFFF0000 (18446744073709486080) keeps the top 48 bits
; of each 64-bit lane, which matches a logical right shift by 48. SelectionDAG
; selects sri.2d #48; GlobalISel builds the mask with movi.2d and emits
; ushr/and/orr.
define void @testRightGood2x64(<2 x i64> %src1, <2 x i64> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightGood2x64:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: sri.2d v0, v1, #48
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightGood2x64:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: movi.2d v2, #0xffffffffffff0000
; CHECK-GI-NEXT: ushr.2d v1, v1, #48
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <2 x i64> %src1, <i64 18446744073709486080, i64 18446744073709486080>
  %shr = lshr <2 x i64> %src2, <i64 48, i64 48>
  %merged = or <2 x i64> %masked, %shr
  store <2 x i64> %merged, ptr %dest, align 16
  ret void
}
; Negative case: splat mask 0x000100000000000A (281474976710666) is not the
; 0xFFFFFFFFFFFF0000 mask a right shift by 48 would require, so no sri
; appears. SelectionDAG materializes the mask with mov/movk + dup; GlobalISel
; loads it from the constant pool.
define void @testRightBad2x64(<2 x i64> %src1, <2 x i64> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testRightBad2x64:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: mov x8, #10 // =0xa
; CHECK-SD-NEXT: ushr.2d v1, v1, #48
; CHECK-SD-NEXT: movk x8, #1, lsl #48
; CHECK-SD-NEXT: dup.2d v2, x8
; CHECK-SD-NEXT: and.16b v0, v0, v2
; CHECK-SD-NEXT: orr.16b v0, v0, v1
; CHECK-SD-NEXT: str q0, [x0]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testRightBad2x64:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: adrp x8, .LCPI27_0
; CHECK-GI-NEXT: ushr.2d v1, v1, #48
; CHECK-GI-NEXT: ldr q2, [x8, :lo12:.LCPI27_0]
; CHECK-GI-NEXT: and.16b v0, v0, v2
; CHECK-GI-NEXT: orr.16b v0, v0, v1
; CHECK-GI-NEXT: str q0, [x0]
; CHECK-GI-NEXT: ret
  %masked = and <2 x i64> %src1, <i64 281474976710666, i64 281474976710666>
  %shr = lshr <2 x i64> %src2, <i64 48, i64 48>
  %merged = or <2 x i64> %masked, %shr
  store <2 x i64> %merged, ptr %dest, align 16
  ret void
}
; Same and/shl/or shape on a single i128 lane: the mask is 2^70 - 1 and the
; shift is 70, so the mask matches the shift, but the expected output contains
; no sli. Both selectors use a scalar bfi on the high 64-bit half (insert at
; bit 6 = 70 - 64); SelectionDAG stores the two halves with stp, while
; GlobalISel rebuilds a q register with lane moves before storing.
define void @testLeftShouldNotCreateSLI1x128(<1 x i128> %src1, <1 x i128> %src2, ptr %dest) nounwind {
; CHECK-SD-LABEL: testLeftShouldNotCreateSLI1x128:
; CHECK-SD: // %bb.0:
; CHECK-SD-NEXT: bfi x1, x2, #6, #58
; CHECK-SD-NEXT: stp x0, x1, [x4]
; CHECK-SD-NEXT: ret
;
; CHECK-GI-LABEL: testLeftShouldNotCreateSLI1x128:
; CHECK-GI: // %bb.0:
; CHECK-GI-NEXT: mov.d v0[0], x0
; CHECK-GI-NEXT: bfi x1, x2, #6, #58
; CHECK-GI-NEXT: mov.d v0[1], x1
; CHECK-GI-NEXT: str q0, [x4]
; CHECK-GI-NEXT: ret
  %masked = and <1 x i128> %src1, <i128 1180591620717411303423>
  %shl = shl <1 x i128> %src2, <i128 70>
  %merged = or <1 x i128> %masked, %shl
  store <1 x i128> %merged, ptr %dest, align 16
  ret void
}
; The mask vector is not uniform: lanes 2 and 6 are 0xFF while the rest are
; 0x07, so only some lanes match a left shift by 3. No sli is expected; both
; selectors load the mask from the constant pool and emit shl/and/orr.
define void @testLeftNotAllConstantBuildVec8x8(<8 x i8> %src1, <8 x i8> %src2, ptr %dest) nounwind {
; CHECK-LABEL: testLeftNotAllConstantBuildVec8x8:
; CHECK: // %bb.0:
; CHECK-NEXT: adrp x8, .LCPI29_0
; CHECK-NEXT: shl.8b v1, v1, #3
; CHECK-NEXT: ldr d2, [x8, :lo12:.LCPI29_0]
; CHECK-NEXT: and.8b v0, v0, v2
; CHECK-NEXT: orr.8b v0, v0, v1
; CHECK-NEXT: str d0, [x0]
; CHECK-NEXT: ret
  %masked = and <8 x i8> %src1, <i8 7, i8 7, i8 255, i8 7, i8 7, i8 7, i8 255, i8 7>
  %shl = shl <8 x i8> %src2, <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>
  %merged = or <8 x i8> %masked, %shl
  store <8 x i8> %merged, ptr %dest, align 8
  ret void
}