| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 6 |
| ; RUN: llc -mtriple=powerpc64le < %s | FileCheck %s |
| |
| ; Legal |
| ; Masked signed remainder of <4 x i32> %x by %y under the <4 x i1> mask %m. |
| ; Shape of the expected powerpc64le code below: |
| ;  - the mask register is shifted left and then arithmetically right by an |
| ;    all-ones shift vector (xxleqv + vslw/vsraw); |
| ;  - xxsel chooses, under that mask, between a splat of 1 (vspltisw 5, 1) and |
| ;    another vector input to form the divisor; |
| ;  - each of the four lanes is computed in GPRs with divw/mullw/sub, and the |
| ;    result is rebuilt with rldimi/mtfprd/xxmrghd. |
| ; NOTE(review): presumably v2/v3/v4 carry %x/%y/%m and the splat of 1 is the |
| ; divisor for masked-off lanes -- confirm against the intrinsic's lowering. |
| define <4 x i32> @srem_v4i32(<4 x i32> %x, <4 x i32> %y, <4 x i1> %m) { |
| ; CHECK-LABEL: srem_v4i32: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: xxleqv 32, 32, 32 |
| ; CHECK-NEXT: vspltisw 5, 1 |
| ; CHECK-NEXT: xxsldwi 1, 34, 34, 1 |
| ; CHECK-NEXT: vslw 4, 4, 0 |
| ; CHECK-NEXT: xxswapd 4, 34 |
| ; CHECK-NEXT: xxsldwi 6, 34, 34, 3 |
| ; CHECK-NEXT: mffprwz 4, 1 |
| ; CHECK-NEXT: vsraw 4, 4, 0 |
| ; CHECK-NEXT: xxsel 0, 37, 35, 36 |
| ; CHECK-NEXT: xxsldwi 2, 0, 0, 1 |
| ; CHECK-NEXT: xxswapd 3, 0 |
| ; CHECK-NEXT: xxsldwi 5, 0, 0, 3 |
| ; CHECK-NEXT: mffprwz 3, 2 |
| ; CHECK-NEXT: mffprwz 5, 3 |
| ; CHECK-NEXT: divw 6, 4, 3 |
| ; CHECK-NEXT: mullw 3, 6, 3 |
| ; CHECK-NEXT: mffprwz 6, 4 |
| ; CHECK-NEXT: sub 3, 4, 3 |
| ; CHECK-NEXT: divw 4, 6, 5 |
| ; CHECK-NEXT: mullw 4, 4, 5 |
| ; CHECK-NEXT: sub 4, 6, 4 |
| ; CHECK-NEXT: rldimi 4, 3, 32, 0 |
| ; CHECK-NEXT: mffprwz 3, 5 |
| ; CHECK-NEXT: mtfprd 1, 4 |
| ; CHECK-NEXT: mffprwz 4, 6 |
| ; CHECK-NEXT: divw 5, 4, 3 |
| ; CHECK-NEXT: mullw 3, 5, 3 |
| ; CHECK-NEXT: mfvsrwz 5, 34 |
| ; CHECK-NEXT: sub 3, 4, 3 |
| ; CHECK-NEXT: mffprwz 4, 0 |
| ; CHECK-NEXT: divw 6, 5, 4 |
| ; CHECK-NEXT: mullw 4, 6, 4 |
| ; CHECK-NEXT: sub 4, 5, 4 |
| ; CHECK-NEXT: rldimi 4, 3, 32, 0 |
| ; CHECK-NEXT: mtfprd 0, 4 |
| ; CHECK-NEXT: xxmrghd 34, 0, 1 |
| ; CHECK-NEXT: blr |
| %res = call <4 x i32> @llvm.masked.srem(<4 x i32> %x, <4 x i32> %y, <4 x i1> %m) |
| ret <4 x i32> %res |
| } |
| |
| ; Masked signed remainder of <2 x i64> %x by %y under the <2 x i1> mask %m. |
| ; The expected code mirrors the <4 x i32> case at doubleword width: the mask |
| ; is shifted with vsld/vsrad by an all-ones vector, the splat of 1 is unpacked |
| ; to doublewords (vupklsw), xxsel forms the divisor, and the two lanes are |
| ; each computed with divd/mulld/sub before xxmrghd rebuilds the result. |
| ; NOTE(review): presumably masked-off lanes divide by the splat of 1 -- confirm. |
| define <2 x i64> @srem_v2i64(<2 x i64> %x, <2 x i64> %y, <2 x i1> %m) { |
| ; CHECK-LABEL: srem_v2i64: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: xxleqv 32, 32, 32 |
| ; CHECK-NEXT: vspltisw 5, 1 |
| ; CHECK-NEXT: mfvsrd 4, 34 |
| ; CHECK-NEXT: xxswapd 2, 34 |
| ; CHECK-NEXT: vsld 4, 4, 0 |
| ; CHECK-NEXT: vsrad 4, 4, 0 |
| ; CHECK-NEXT: vupklsw 5, 5 |
| ; CHECK-NEXT: xxsel 0, 37, 35, 36 |
| ; CHECK-NEXT: mffprd 3, 0 |
| ; CHECK-NEXT: divd 5, 4, 3 |
| ; CHECK-NEXT: mulld 3, 5, 3 |
| ; CHECK-NEXT: sub 3, 4, 3 |
| ; CHECK-NEXT: mffprd 4, 2 |
| ; CHECK-NEXT: xxswapd 1, 0 |
| ; CHECK-NEXT: mtfprd 0, 3 |
| ; CHECK-NEXT: mffprd 3, 1 |
| ; CHECK-NEXT: divd 5, 4, 3 |
| ; CHECK-NEXT: mulld 3, 5, 3 |
| ; CHECK-NEXT: sub 3, 4, 3 |
| ; CHECK-NEXT: mtfprd 1, 3 |
| ; CHECK-NEXT: xxmrghd 34, 0, 1 |
| ; CHECK-NEXT: blr |
| %res = call <2 x i64> @llvm.masked.srem(<2 x i64> %x, <2 x i64> %y, <2 x i1> %m) |
| ret <2 x i64> %res |
| } |
| |
| ; Splitting |
| ; Masked signed remainder of <4 x i64> %x by %y under the <4 x i1> mask %m. |
| ; In the expected code the single mask register (vs38) is expanded into two |
| ; registers with xxmrglw/xxmrghw, each half is shifted with vsld/vsrad by an |
| ; all-ones vector, and two xxsel instructions form two divisor vectors against |
| ; a doubleword splat of 1 (vspltisw + vupklsw). Four divd/mulld/sub sequences |
| ; follow, and the result is produced in two vector registers (vs34 and vs35). |
| ; NOTE(review): the two-register result presumably reflects the type being |
| ; split into two <2 x i64> halves -- confirm. |
| define <4 x i64> @srem_v4i64(<4 x i64> %x, <4 x i64> %y, <4 x i1> %m) { |
| ; CHECK-LABEL: srem_v4i64: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: xxmrglw 32, 38, 38 |
| ; CHECK-NEXT: xxleqv 39, 39, 39 |
| ; CHECK-NEXT: xxmrghw 33, 38, 38 |
| ; CHECK-NEXT: mfvsrd 3, 34 |
| ; CHECK-NEXT: vspltisw 6, 1 |
| ; CHECK-NEXT: mfvsrd 4, 35 |
| ; CHECK-NEXT: xxswapd 2, 34 |
| ; CHECK-NEXT: xxswapd 4, 35 |
| ; CHECK-NEXT: vsld 0, 0, 7 |
| ; CHECK-NEXT: mffprd 5, 2 |
| ; CHECK-NEXT: vsrad 0, 0, 7 |
| ; CHECK-NEXT: vupklsw 6, 6 |
| ; CHECK-NEXT: xxsel 0, 38, 36, 32 |
| ; CHECK-NEXT: vsld 4, 1, 7 |
| ; CHECK-NEXT: mffprd 6, 0 |
| ; CHECK-NEXT: vsrad 4, 4, 7 |
| ; CHECK-NEXT: divd 9, 3, 6 |
| ; CHECK-NEXT: mulld 6, 9, 6 |
| ; CHECK-NEXT: sub 3, 3, 6 |
| ; CHECK-NEXT: xxswapd 3, 0 |
| ; CHECK-NEXT: mffprd 8, 3 |
| ; CHECK-NEXT: mtfprd 0, 3 |
| ; CHECK-NEXT: xxsel 1, 38, 37, 36 |
| ; CHECK-NEXT: mffprd 7, 1 |
| ; CHECK-NEXT: divd 9, 4, 7 |
| ; CHECK-NEXT: mulld 7, 9, 7 |
| ; CHECK-NEXT: divd 9, 5, 8 |
| ; CHECK-NEXT: sub 4, 4, 7 |
| ; CHECK-NEXT: mulld 8, 9, 8 |
| ; CHECK-NEXT: sub 3, 5, 8 |
| ; CHECK-NEXT: xxswapd 5, 1 |
| ; CHECK-NEXT: mffprd 5, 4 |
| ; CHECK-NEXT: mtfprd 1, 4 |
| ; CHECK-NEXT: mffprd 4, 5 |
| ; CHECK-NEXT: mtfprd 2, 3 |
| ; CHECK-NEXT: divd 3, 5, 4 |
| ; CHECK-NEXT: mulld 3, 3, 4 |
| ; CHECK-NEXT: sub 3, 5, 3 |
| ; CHECK-NEXT: xxmrghd 34, 0, 2 |
| ; CHECK-NEXT: mtfprd 0, 3 |
| ; CHECK-NEXT: xxmrghd 35, 1, 0 |
| ; CHECK-NEXT: blr |
| %res = call <4 x i64> @llvm.masked.srem(<4 x i64> %x, <4 x i64> %y, <4 x i1> %m) |
| ret <4 x i64> %res |
| } |
| |
| ; Widening |
| ; Masked signed remainder of <2 x i32> %x by %y under the <2 x i1> mask %m. |
| ; The expected code first loads a constant-pool vector (.LCPI3_0) and uses it |
| ; as the control of a vperm that combines the mask register with a zeroed |
| ; register (xxlxor 32, 32, 32). From there it matches the <4 x i32> sequence: |
| ; vslw/vsraw on the mask, xxsel against a splat of 1, and four |
| ; divw/mullw/sub sequences, i.e. four 32-bit lanes are processed. |
| ; NOTE(review): presumably the vperm with zero clears the mask for the lanes |
| ; added by widening to <4 x i32> -- confirm. |
| define <2 x i32> @srem_v2i32(<2 x i32> %x, <2 x i32> %y, <2 x i1> %m) { |
| ; CHECK-LABEL: srem_v2i32: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: addis 3, 2, .LCPI3_0@toc@ha |
| ; CHECK-NEXT: xxlxor 32, 32, 32 |
| ; CHECK-NEXT: xxsldwi 1, 34, 34, 1 |
| ; CHECK-NEXT: addi 3, 3, .LCPI3_0@toc@l |
| ; CHECK-NEXT: mffprwz 4, 1 |
| ; CHECK-NEXT: xxswapd 4, 34 |
| ; CHECK-NEXT: xxsldwi 6, 34, 34, 3 |
| ; CHECK-NEXT: lxvd2x 0, 0, 3 |
| ; CHECK-NEXT: xxswapd 37, 0 |
| ; CHECK-NEXT: vperm 4, 0, 4, 5 |
| ; CHECK-NEXT: xxleqv 32, 32, 32 |
| ; CHECK-NEXT: vspltisw 5, 1 |
| ; CHECK-NEXT: vslw 4, 4, 0 |
| ; CHECK-NEXT: vsraw 4, 4, 0 |
| ; CHECK-NEXT: xxsel 0, 37, 35, 36 |
| ; CHECK-NEXT: xxsldwi 2, 0, 0, 1 |
| ; CHECK-NEXT: xxswapd 3, 0 |
| ; CHECK-NEXT: xxsldwi 5, 0, 0, 3 |
| ; CHECK-NEXT: mffprwz 3, 2 |
| ; CHECK-NEXT: mffprwz 5, 3 |
| ; CHECK-NEXT: divw 6, 4, 3 |
| ; CHECK-NEXT: mullw 3, 6, 3 |
| ; CHECK-NEXT: sub 3, 4, 3 |
| ; CHECK-NEXT: mffprwz 4, 4 |
| ; CHECK-NEXT: divw 6, 4, 5 |
| ; CHECK-NEXT: mullw 5, 6, 5 |
| ; CHECK-NEXT: sub 4, 4, 5 |
| ; CHECK-NEXT: rldimi 4, 3, 32, 0 |
| ; CHECK-NEXT: mffprwz 3, 5 |
| ; CHECK-NEXT: mtfprd 1, 4 |
| ; CHECK-NEXT: mffprwz 4, 6 |
| ; CHECK-NEXT: divw 5, 4, 3 |
| ; CHECK-NEXT: mullw 3, 5, 3 |
| ; CHECK-NEXT: mfvsrwz 5, 34 |
| ; CHECK-NEXT: sub 3, 4, 3 |
| ; CHECK-NEXT: mffprwz 4, 0 |
| ; CHECK-NEXT: divw 6, 5, 4 |
| ; CHECK-NEXT: mullw 4, 6, 4 |
| ; CHECK-NEXT: sub 4, 5, 4 |
| ; CHECK-NEXT: rldimi 4, 3, 32, 0 |
| ; CHECK-NEXT: mtfprd 0, 4 |
| ; CHECK-NEXT: xxmrghd 34, 0, 1 |
| ; CHECK-NEXT: blr |
| %res = call <2 x i32> @llvm.masked.srem(<2 x i32> %x, <2 x i32> %y, <2 x i1> %m) |
| ret <2 x i32> %res |
| } |
| |
| ; Promotion |
| ; Masked signed remainder of <4 x i16> %x by %y under the <4 x i1> mask %m. |
| ; Shape of the expected code below: |
| ;  - the mask words are repacked into halfwords (vmrghh/xxmrglw/xxmrgld) and |
| ;    shifted left then arithmetically right by 15 (vspltish 4, 15 with |
| ;    vslh/vsrah) before xxsel forms the divisor against a halfword splat of 1; |
| ;  - halfwords are pulled out of GPRs with rldicl/clrldi and sign-extended |
| ;    with extsh; |
| ;  - eight divw/mullw/sub sequences are emitted, and the results are merged |
| ;    back with vmrghh/xxmrglw/xxmrgld; |
| ;  - r25-r30 are stored at negative offsets from r1 and reloaded before blr. |
| ; NOTE(review): eight divisions for a four-element input suggests the operation |
| ; is carried out on a <8 x i16> vector -- confirm against the legalizer. |
| define <4 x i16> @srem_v4i16(<4 x i16> %x, <4 x i16> %y, <4 x i1> %m) { |
| ; CHECK-LABEL: srem_v4i16: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: xxswapd 0, 36 |
| ; CHECK-NEXT: xxsldwi 1, 36, 36, 1 |
| ; CHECK-NEXT: mfvsrwz 3, 36 |
| ; CHECK-NEXT: li 7, 0 |
| ; CHECK-NEXT: xxsldwi 2, 36, 36, 3 |
| ; CHECK-NEXT: std 25, -56(1) # 8-byte Folded Spill |
| ; CHECK-NEXT: std 30, -16(1) # 8-byte Folded Spill |
| ; CHECK-NEXT: std 29, -24(1) # 8-byte Folded Spill |
| ; CHECK-NEXT: mffprwz 4, 0 |
| ; CHECK-NEXT: mffprwz 5, 1 |
| ; CHECK-NEXT: std 28, -32(1) # 8-byte Folded Spill |
| ; CHECK-NEXT: std 27, -40(1) # 8-byte Folded Spill |
| ; CHECK-NEXT: mffprwz 6, 2 |
| ; CHECK-NEXT: std 26, -48(1) # 8-byte Folded Spill |
| ; CHECK-NEXT: mtvsrd 36, 3 |
| ; CHECK-NEXT: mfvsrd 3, 34 |
| ; CHECK-NEXT: mtvsrd 37, 4 |
| ; CHECK-NEXT: mtvsrd 32, 5 |
| ; CHECK-NEXT: rldicl 8, 3, 48, 48 |
| ; CHECK-NEXT: rldicl 9, 3, 32, 48 |
| ; CHECK-NEXT: extsh 8, 8 |
| ; CHECK-NEXT: extsh 9, 9 |
| ; CHECK-NEXT: vmrghh 5, 0, 5 |
| ; CHECK-NEXT: mtvsrd 32, 6 |
| ; CHECK-NEXT: vmrghh 4, 0, 4 |
| ; CHECK-NEXT: mtvsrd 32, 7 |
| ; CHECK-NEXT: clrldi 7, 3, 48 |
| ; CHECK-NEXT: rldicl 3, 3, 16, 48 |
| ; CHECK-NEXT: extsh 7, 7 |
| ; CHECK-NEXT: extsh 3, 3 |
| ; CHECK-NEXT: xxmrglw 1, 36, 37 |
| ; CHECK-NEXT: vspltish 4, 15 |
| ; CHECK-NEXT: vsplth 0, 0, 3 |
| ; CHECK-NEXT: xxspltw 0, 32, 3 |
| ; CHECK-NEXT: vspltish 0, 1 |
| ; CHECK-NEXT: xxmrgld 37, 0, 1 |
| ; CHECK-NEXT: xxswapd 1, 34 |
| ; CHECK-NEXT: vslh 5, 5, 4 |
| ; CHECK-NEXT: mffprd 4, 1 |
| ; CHECK-NEXT: vsrah 4, 5, 4 |
| ; CHECK-NEXT: clrldi 10, 4, 48 |
| ; CHECK-NEXT: rldicl 11, 4, 48, 48 |
| ; CHECK-NEXT: rldicl 12, 4, 32, 48 |
| ; CHECK-NEXT: rldicl 4, 4, 16, 48 |
| ; CHECK-NEXT: extsh 10, 10 |
| ; CHECK-NEXT: extsh 11, 11 |
| ; CHECK-NEXT: extsh 12, 12 |
| ; CHECK-NEXT: extsh 4, 4 |
| ; CHECK-NEXT: xxsel 0, 32, 35, 36 |
| ; CHECK-NEXT: mffprd 5, 0 |
| ; CHECK-NEXT: clrldi 0, 5, 48 |
| ; CHECK-NEXT: rldicl 30, 5, 48, 48 |
| ; CHECK-NEXT: rldicl 29, 5, 32, 48 |
| ; CHECK-NEXT: rldicl 5, 5, 16, 48 |
| ; CHECK-NEXT: extsh 0, 0 |
| ; CHECK-NEXT: extsh 30, 30 |
| ; CHECK-NEXT: extsh 29, 29 |
| ; CHECK-NEXT: extsh 5, 5 |
| ; CHECK-NEXT: xxswapd 2, 0 |
| ; CHECK-NEXT: mffprd 6, 2 |
| ; CHECK-NEXT: clrldi 28, 6, 48 |
| ; CHECK-NEXT: rldicl 27, 6, 48, 48 |
| ; CHECK-NEXT: rldicl 26, 6, 32, 48 |
| ; CHECK-NEXT: rldicl 6, 6, 16, 48 |
| ; CHECK-NEXT: divw 25, 7, 0 |
| ; CHECK-NEXT: extsh 28, 28 |
| ; CHECK-NEXT: extsh 27, 27 |
| ; CHECK-NEXT: extsh 26, 26 |
| ; CHECK-NEXT: extsh 6, 6 |
| ; CHECK-NEXT: mullw 0, 25, 0 |
| ; CHECK-NEXT: divw 25, 8, 30 |
| ; CHECK-NEXT: sub 7, 7, 0 |
| ; CHECK-NEXT: mtvsrd 34, 7 |
| ; CHECK-NEXT: mullw 30, 25, 30 |
| ; CHECK-NEXT: divw 25, 9, 29 |
| ; CHECK-NEXT: sub 8, 8, 30 |
| ; CHECK-NEXT: ld 30, -16(1) # 8-byte Folded Reload |
| ; CHECK-NEXT: mtvsrd 35, 8 |
| ; CHECK-NEXT: mullw 29, 25, 29 |
| ; CHECK-NEXT: divw 25, 3, 5 |
| ; CHECK-NEXT: sub 9, 9, 29 |
| ; CHECK-NEXT: ld 29, -24(1) # 8-byte Folded Reload |
| ; CHECK-NEXT: mtvsrd 36, 9 |
| ; CHECK-NEXT: mullw 5, 25, 5 |
| ; CHECK-NEXT: divw 25, 10, 28 |
| ; CHECK-NEXT: sub 3, 3, 5 |
| ; CHECK-NEXT: mtvsrd 37, 3 |
| ; CHECK-NEXT: mullw 28, 25, 28 |
| ; CHECK-NEXT: divw 25, 11, 27 |
| ; CHECK-NEXT: sub 3, 10, 28 |
| ; CHECK-NEXT: ld 28, -32(1) # 8-byte Folded Reload |
| ; CHECK-NEXT: mullw 27, 25, 27 |
| ; CHECK-NEXT: divw 25, 12, 26 |
| ; CHECK-NEXT: sub 5, 11, 27 |
| ; CHECK-NEXT: ld 27, -40(1) # 8-byte Folded Reload |
| ; CHECK-NEXT: mullw 26, 25, 26 |
| ; CHECK-NEXT: divw 25, 4, 6 |
| ; CHECK-NEXT: sub 7, 12, 26 |
| ; CHECK-NEXT: ld 26, -48(1) # 8-byte Folded Reload |
| ; CHECK-NEXT: mullw 6, 25, 6 |
| ; CHECK-NEXT: ld 25, -56(1) # 8-byte Folded Reload |
| ; CHECK-NEXT: vmrghh 2, 3, 2 |
| ; CHECK-NEXT: vmrghh 3, 5, 4 |
| ; CHECK-NEXT: mtvsrd 36, 3 |
| ; CHECK-NEXT: mtvsrd 37, 5 |
| ; CHECK-NEXT: sub 3, 4, 6 |
| ; CHECK-NEXT: mtvsrd 32, 3 |
| ; CHECK-NEXT: xxmrglw 0, 35, 34 |
| ; CHECK-NEXT: vmrghh 4, 5, 4 |
| ; CHECK-NEXT: mtvsrd 37, 7 |
| ; CHECK-NEXT: vmrghh 5, 0, 5 |
| ; CHECK-NEXT: xxmrglw 1, 37, 36 |
| ; CHECK-NEXT: xxmrgld 34, 0, 1 |
| ; CHECK-NEXT: blr |
| %res = call <4 x i16> @llvm.masked.srem(<4 x i16> %x, <4 x i16> %y, <4 x i1> %m) |
| ret <4 x i16> %res |
| } |
| |
| ; Scalarization |
| ; Masked signed remainder of <1 x i64> %x by %y under the <1 x i1> mask %m. |
| ; The expected code is fully scalar: andi. tests bit 0 of the mask in r5, |
| ; iselgt keeps r4 when that bit is set and otherwise substitutes the constant |
| ; 1 (li 5, 1), and the remainder is then formed with divd/mulld/sub in r3. |
| ; NOTE(review): the function name "srem_v1i164" looks like a typo for |
| ; "srem_v1i64". The label assertion uses the same spelling, so the test is |
| ; self-consistent; rename both together if this is cleaned up. |
| define <1 x i64> @srem_v1i164(<1 x i64> %x, <1 x i64> %y, <1 x i1> %m) { |
| ; CHECK-LABEL: srem_v1i164: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: andi. 5, 5, 1 |
| ; CHECK-NEXT: li 5, 1 |
| ; CHECK-NEXT: iselgt 4, 4, 5 |
| ; CHECK-NEXT: divd 5, 3, 4 |
| ; CHECK-NEXT: mulld 4, 5, 4 |
| ; CHECK-NEXT: sub 3, 3, 4 |
| ; CHECK-NEXT: blr |
| %res = call <1 x i64> @llvm.masked.srem(<1 x i64> %x, <1 x i64> %y, <1 x i1> %m) |
| ret <1 x i64> %res |
| } |
| |
| ; Expansion |
| ; Masked signed remainder of <2 x i128> %x by %y under the <2 x i1> mask %m. |
| ; The function is marked nounwind. The expected code has no inline divide: |
| ; it makes two calls to __modti3, one per element. |
| ; Around those calls it: |
| ;  - saves and restores CR (mfocrf/mtocrf), LR, r29, r30 and vs61-vs63 in a |
| ;    128-byte stack frame (stdu 1, -128(1)); |
| ;  - tests bit 0 of each mask element with andi. and keeps one result in CR |
| ;    bit 8 (crmove 8, 1) for use after the first call; |
| ;  - uses iselgt/isel to choose the values passed in r5/r6 between data moved |
| ;    out of the vector registers and the constants in r30 (1) and r29 (0). |
| ; NOTE(review): r30:r29 presumably encode the 128-bit constant 1 used as the |
| ; divisor for masked-off elements -- confirm. |
| define <2 x i128> @srem_v2i128(<2 x i128> %x, <2 x i128> %y, <2 x i1> %m) nounwind { |
| ; CHECK-LABEL: srem_v2i128: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: mfocrf 12, 32 |
| ; CHECK-NEXT: stw 12, 8(1) |
| ; CHECK-NEXT: mflr 0 |
| ; CHECK-NEXT: stdu 1, -128(1) |
| ; CHECK-NEXT: li 3, 48 |
| ; CHECK-NEXT: std 0, 144(1) |
| ; CHECK-NEXT: xxswapd 0, 38 |
| ; CHECK-NEXT: xxswapd 1, 37 |
| ; CHECK-NEXT: std 30, 112(1) # 8-byte Folded Spill |
| ; CHECK-NEXT: li 30, 1 |
| ; CHECK-NEXT: std 29, 104(1) # 8-byte Folded Spill |
| ; CHECK-NEXT: li 29, 0 |
| ; CHECK-NEXT: stxvd2x 61, 1, 3 # 16-byte Folded Spill |
| ; CHECK-NEXT: li 3, 64 |
| ; CHECK-NEXT: mfvsrd 4, 35 |
| ; CHECK-NEXT: stxvd2x 62, 1, 3 # 16-byte Folded Spill |
| ; CHECK-NEXT: li 3, 80 |
| ; CHECK-NEXT: vmr 30, 2 |
| ; CHECK-NEXT: stxvd2x 63, 1, 3 # 16-byte Folded Spill |
| ; CHECK-NEXT: mffprd 3, 0 |
| ; CHECK-NEXT: vmr 31, 4 |
| ; CHECK-NEXT: andi. 3, 3, 1 |
| ; CHECK-NEXT: mfvsrd 3, 38 |
| ; CHECK-NEXT: crmove 8, 1 |
| ; CHECK-NEXT: andi. 3, 3, 1 |
| ; CHECK-NEXT: mffprd 3, 1 |
| ; CHECK-NEXT: iselgt 5, 3, 30 |
| ; CHECK-NEXT: mfvsrd 3, 37 |
| ; CHECK-NEXT: xxswapd 0, 35 |
| ; CHECK-NEXT: iselgt 6, 3, 29 |
| ; CHECK-NEXT: mffprd 3, 0 |
| ; CHECK-NEXT: bl __modti3 |
| ; CHECK-NEXT: nop |
| ; CHECK-NEXT: xxswapd 0, 63 |
| ; CHECK-NEXT: mtfprd 1, 3 |
| ; CHECK-NEXT: mtfprd 2, 4 |
| ; CHECK-NEXT: mfvsrd 4, 62 |
| ; CHECK-NEXT: mffprd 3, 0 |
| ; CHECK-NEXT: isel 5, 3, 30, 8 |
| ; CHECK-NEXT: mfvsrd 3, 63 |
| ; CHECK-NEXT: isel 6, 3, 29, 8 |
| ; CHECK-NEXT: xxswapd 0, 62 |
| ; CHECK-NEXT: mffprd 3, 0 |
| ; CHECK-NEXT: xxmrghd 61, 2, 1 |
| ; CHECK-NEXT: bl __modti3 |
| ; CHECK-NEXT: nop |
| ; CHECK-NEXT: mtfprd 0, 3 |
| ; CHECK-NEXT: li 3, 80 |
| ; CHECK-NEXT: mtfprd 1, 4 |
| ; CHECK-NEXT: ld 30, 112(1) # 8-byte Folded Reload |
| ; CHECK-NEXT: vmr 3, 29 |
| ; CHECK-NEXT: ld 29, 104(1) # 8-byte Folded Reload |
| ; CHECK-NEXT: lxvd2x 63, 1, 3 # 16-byte Folded Reload |
| ; CHECK-NEXT: li 3, 64 |
| ; CHECK-NEXT: lxvd2x 62, 1, 3 # 16-byte Folded Reload |
| ; CHECK-NEXT: li 3, 48 |
| ; CHECK-NEXT: lxvd2x 61, 1, 3 # 16-byte Folded Reload |
| ; CHECK-NEXT: xxmrghd 34, 1, 0 |
| ; CHECK-NEXT: addi 1, 1, 128 |
| ; CHECK-NEXT: ld 0, 16(1) |
| ; CHECK-NEXT: lwz 12, 8(1) |
| ; CHECK-NEXT: mtlr 0 |
| ; CHECK-NEXT: mtocrf 32, 12 |
| ; CHECK-NEXT: blr |
| %res = call <2 x i128> @llvm.masked.srem(<2 x i128> %x, <2 x i128> %y, <2 x i1> %m) |
| ret <2 x i128> %res |
| } |
| |
| ; Promotion and widening |
| ; Masked signed remainder of <3 x i10> %x by %y under the <3 x i1> mask %m. |
| ; Shape of the expected code below: |
| ;  - operands arrive in GPRs, with one further byte loaded from the stack |
| ;    (lbz 12, 96(1)), and are packed into vector registers using a |
| ;    constant-pool permute control (.LCPI7_0) with vperm; |
| ;  - a per-word shift amount of 22 is built as 11 + 11 (vspltisw 4, 11 then |
| ;    vadduwm 4, 4, 4) and applied with vslw/vsraw, which sign-extends the low |
| ;    10 bits of each 32-bit lane (22 = 32 - 10); |
| ;  - the mask is shifted with vslw/vsraw by an all-ones vector and xxsel forms |
| ;    the divisor against a splat of 1; |
| ;  - three divw/mullw/sub sequences compute the lanes, and the three results |
| ;    are moved back out to r3, r4 and r5. |
| ; NOTE(review): presumably the stack byte is the third mask element and the |
| ; splat of 1 is the divisor for masked-off lanes -- confirm. |
| define <3 x i10> @srem_v3i10(<3 x i10> %x, <3 x i10> %y, <3 x i1> %m) { |
| ; CHECK-LABEL: srem_v3i10: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: lbz 12, 96(1) |
| ; CHECK-NEXT: li 11, 0 |
| ; CHECK-NEXT: mtfprwz 2, 7 |
| ; CHECK-NEXT: rldimi 9, 10, 32, 0 |
| ; CHECK-NEXT: mtvsrwz 33, 8 |
| ; CHECK-NEXT: vspltisw 4, 11 |
| ; CHECK-NEXT: xxleqv 38, 38, 38 |
| ; CHECK-NEXT: vadduwm 4, 4, 4 |
| ; CHECK-NEXT: rldimi 12, 11, 32, 0 |
| ; CHECK-NEXT: addis 11, 2, .LCPI7_0@toc@ha |
| ; CHECK-NEXT: addi 11, 11, .LCPI7_0@toc@l |
| ; CHECK-NEXT: mtfprd 1, 12 |
| ; CHECK-NEXT: lxvd2x 0, 0, 11 |
| ; CHECK-NEXT: xxswapd 34, 0 |
| ; CHECK-NEXT: mtfprwz 0, 6 |
| ; CHECK-NEXT: xxmrghw 35, 2, 0 |
| ; CHECK-NEXT: mtfprd 0, 9 |
| ; CHECK-NEXT: vperm 3, 1, 3, 2 |
| ; CHECK-NEXT: mtvsrwz 33, 5 |
| ; CHECK-NEXT: vslw 3, 3, 4 |
| ; CHECK-NEXT: vsraw 3, 3, 4 |
| ; CHECK-NEXT: xxmrghd 37, 1, 0 |
| ; CHECK-NEXT: mtfprwz 0, 3 |
| ; CHECK-NEXT: mtfprwz 1, 4 |
| ; CHECK-NEXT: vslw 5, 5, 6 |
| ; CHECK-NEXT: vsraw 5, 5, 6 |
| ; CHECK-NEXT: xxmrghw 32, 1, 0 |
| ; CHECK-NEXT: vperm 0, 1, 0, 2 |
| ; CHECK-NEXT: vspltisw 1, 1 |
| ; CHECK-NEXT: xxsel 0, 33, 35, 37 |
| ; CHECK-NEXT: vslw 3, 0, 4 |
| ; CHECK-NEXT: vsraw 3, 3, 4 |
| ; CHECK-NEXT: xxswapd 1, 0 |
| ; CHECK-NEXT: xxsldwi 3, 0, 0, 1 |
| ; CHECK-NEXT: mffprwz 3, 1 |
| ; CHECK-NEXT: xxswapd 2, 35 |
| ; CHECK-NEXT: xxsldwi 4, 35, 35, 1 |
| ; CHECK-NEXT: mffprwz 4, 2 |
| ; CHECK-NEXT: divw 5, 4, 3 |
| ; CHECK-NEXT: mullw 3, 5, 3 |
| ; CHECK-NEXT: sub 3, 4, 3 |
| ; CHECK-NEXT: mffprwz 4, 4 |
| ; CHECK-NEXT: mtfprwz 1, 3 |
| ; CHECK-NEXT: mffprwz 3, 3 |
| ; CHECK-NEXT: divw 5, 4, 3 |
| ; CHECK-NEXT: mullw 3, 5, 3 |
| ; CHECK-NEXT: sub 3, 4, 3 |
| ; CHECK-NEXT: mfvsrwz 4, 35 |
| ; CHECK-NEXT: mtfprwz 2, 3 |
| ; CHECK-NEXT: mffprwz 3, 0 |
| ; CHECK-NEXT: divw 5, 4, 3 |
| ; CHECK-NEXT: mullw 3, 5, 3 |
| ; CHECK-NEXT: sub 3, 4, 3 |
| ; CHECK-NEXT: mtvsrwz 35, 3 |
| ; CHECK-NEXT: xxmrghw 36, 2, 1 |
| ; CHECK-NEXT: vperm 2, 3, 4, 2 |
| ; CHECK-NEXT: mfvsrwz 5, 34 |
| ; CHECK-NEXT: xxswapd 0, 34 |
| ; CHECK-NEXT: xxsldwi 1, 34, 34, 1 |
| ; CHECK-NEXT: mffprwz 3, 0 |
| ; CHECK-NEXT: mffprwz 4, 1 |
| ; CHECK-NEXT: blr |
| %res = call <3 x i10> @llvm.masked.srem(<3 x i10> %x, <3 x i10> %y, <3 x i1> %m) |
| ret <3 x i10> %res |
| } |