blob: aebec8c7dba04985e7b8c3490bbf6119286dae82 [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=armv5-unknown-linux-gnu < %s | FileCheck %s --check-prefixes=ARM5
; RUN: llc -mtriple=armv6-unknown-linux-gnu < %s | FileCheck %s --check-prefixes=ARM6
; RUN: llc -mtriple=armv7-unknown-linux-gnu < %s | FileCheck %s --check-prefixes=ARM7
; RUN: llc -mtriple=armv8-unknown-linux-gnu < %s | FileCheck %s --check-prefixes=ARM8
; RUN: llc -mtriple=armv7-unknown-linux-gnu -mattr=+neon < %s | FileCheck %s --check-prefixes=NEON7
; RUN: llc -mtriple=armv8-unknown-linux-gnu -mattr=+neon < %s | FileCheck %s --check-prefixes=NEON8
define i1 @test_srem_odd(i29 %X) nounwind {
; ARM5-LABEL: test_srem_odd:
; ARM5: @ %bb.0:
; ARM5-NEXT: ldr r2, .LCPI0_1
; ARM5-NEXT: ldr r1, .LCPI0_0
; ARM5-NEXT: mla r3, r0, r2, r1
; ARM5-NEXT: ldr r2, .LCPI0_2
; ARM5-NEXT: mov r0, #0
; ARM5-NEXT: bic r1, r3, #-536870912
; ARM5-NEXT: cmp r1, r2
; ARM5-NEXT: movlo r0, #1
; ARM5-NEXT: bx lr
; ARM5-NEXT: .p2align 2
; ARM5-NEXT: @ %bb.1:
; ARM5-NEXT: .LCPI0_0:
; ARM5-NEXT: .long 2711469 @ 0x295fad
; ARM5-NEXT: .LCPI0_1:
; ARM5-NEXT: .long 526025035 @ 0x1f5a814b
; ARM5-NEXT: .LCPI0_2:
; ARM5-NEXT: .long 5422939 @ 0x52bf5b
;
; ARM6-LABEL: test_srem_odd:
; ARM6: @ %bb.0:
; ARM6-NEXT: ldr r2, .LCPI0_1
; ARM6-NEXT: ldr r1, .LCPI0_0
; ARM6-NEXT: mla r0, r0, r2, r1
; ARM6-NEXT: ldr r2, .LCPI0_2
; ARM6-NEXT: bic r1, r0, #-536870912
; ARM6-NEXT: mov r0, #0
; ARM6-NEXT: cmp r1, r2
; ARM6-NEXT: movlo r0, #1
; ARM6-NEXT: bx lr
; ARM6-NEXT: .p2align 2
; ARM6-NEXT: @ %bb.1:
; ARM6-NEXT: .LCPI0_0:
; ARM6-NEXT: .long 2711469 @ 0x295fad
; ARM6-NEXT: .LCPI0_1:
; ARM6-NEXT: .long 526025035 @ 0x1f5a814b
; ARM6-NEXT: .LCPI0_2:
; ARM6-NEXT: .long 5422939 @ 0x52bf5b
;
; ARM7-LABEL: test_srem_odd:
; ARM7: @ %bb.0:
; ARM7-NEXT: movw r1, #24493
; ARM7-NEXT: movw r2, #33099
; ARM7-NEXT: movt r1, #41
; ARM7-NEXT: movt r2, #8026
; ARM7-NEXT: mla r0, r0, r2, r1
; ARM7-NEXT: movw r2, #48987
; ARM7-NEXT: movt r2, #82
; ARM7-NEXT: bic r1, r0, #-536870912
; ARM7-NEXT: mov r0, #0
; ARM7-NEXT: cmp r1, r2
; ARM7-NEXT: movwlo r0, #1
; ARM7-NEXT: bx lr
;
; ARM8-LABEL: test_srem_odd:
; ARM8: @ %bb.0:
; ARM8-NEXT: movw r1, #24493
; ARM8-NEXT: movw r2, #33099
; ARM8-NEXT: movt r1, #41
; ARM8-NEXT: movt r2, #8026
; ARM8-NEXT: mla r0, r0, r2, r1
; ARM8-NEXT: movw r2, #48987
; ARM8-NEXT: movt r2, #82
; ARM8-NEXT: bic r1, r0, #-536870912
; ARM8-NEXT: mov r0, #0
; ARM8-NEXT: cmp r1, r2
; ARM8-NEXT: movwlo r0, #1
; ARM8-NEXT: bx lr
;
; NEON7-LABEL: test_srem_odd:
; NEON7: @ %bb.0:
; NEON7-NEXT: movw r1, #24493
; NEON7-NEXT: movw r2, #33099
; NEON7-NEXT: movt r1, #41
; NEON7-NEXT: movt r2, #8026
; NEON7-NEXT: mla r0, r0, r2, r1
; NEON7-NEXT: movw r2, #48987
; NEON7-NEXT: movt r2, #82
; NEON7-NEXT: bic r1, r0, #-536870912
; NEON7-NEXT: mov r0, #0
; NEON7-NEXT: cmp r1, r2
; NEON7-NEXT: movwlo r0, #1
; NEON7-NEXT: bx lr
;
; NEON8-LABEL: test_srem_odd:
; NEON8: @ %bb.0:
; NEON8-NEXT: movw r1, #24493
; NEON8-NEXT: movw r2, #33099
; NEON8-NEXT: movt r1, #41
; NEON8-NEXT: movt r2, #8026
; NEON8-NEXT: mla r0, r0, r2, r1
; NEON8-NEXT: movw r2, #48987
; NEON8-NEXT: movt r2, #82
; NEON8-NEXT: bic r1, r0, #-536870912
; NEON8-NEXT: mov r0, #0
; NEON8-NEXT: cmp r1, r2
; NEON8-NEXT: movwlo r0, #1
; NEON8-NEXT: bx lr
%srem = srem i29 %X, 99
%cmp = icmp eq i29 %srem, 0
ret i1 %cmp
}
define i1 @test_srem_even(i4 %X) nounwind {
; ARM5-LABEL: test_srem_even:
; ARM5: @ %bb.0:
; ARM5-NEXT: ldr r2, .LCPI1_0
; ARM5-NEXT: lsl r0, r0, #28
; ARM5-NEXT: asr r12, r0, #28
; ARM5-NEXT: smull r3, r1, r12, r2
; ARM5-NEXT: add r1, r1, r1, lsr #31
; ARM5-NEXT: add r1, r1, r1, lsl #1
; ARM5-NEXT: mvn r1, r1, lsl #1
; ARM5-NEXT: add r0, r1, r0, asr #28
; ARM5-NEXT: clz r0, r0
; ARM5-NEXT: lsr r0, r0, #5
; ARM5-NEXT: bx lr
; ARM5-NEXT: .p2align 2
; ARM5-NEXT: @ %bb.1:
; ARM5-NEXT: .LCPI1_0:
; ARM5-NEXT: .long 715827883 @ 0x2aaaaaab
;
; ARM6-LABEL: test_srem_even:
; ARM6: @ %bb.0:
; ARM6-NEXT: ldr r2, .LCPI1_0
; ARM6-NEXT: lsl r0, r0, #28
; ARM6-NEXT: asr r1, r0, #28
; ARM6-NEXT: smmul r1, r1, r2
; ARM6-NEXT: add r1, r1, r1, lsr #31
; ARM6-NEXT: add r1, r1, r1, lsl #1
; ARM6-NEXT: mvn r1, r1, lsl #1
; ARM6-NEXT: add r0, r1, r0, asr #28
; ARM6-NEXT: clz r0, r0
; ARM6-NEXT: lsr r0, r0, #5
; ARM6-NEXT: bx lr
; ARM6-NEXT: .p2align 2
; ARM6-NEXT: @ %bb.1:
; ARM6-NEXT: .LCPI1_0:
; ARM6-NEXT: .long 715827883 @ 0x2aaaaaab
;
; ARM7-LABEL: test_srem_even:
; ARM7: @ %bb.0:
; ARM7-NEXT: movw r2, #43691
; ARM7-NEXT: sbfx r1, r0, #0, #4
; ARM7-NEXT: movt r2, #10922
; ARM7-NEXT: lsl r0, r0, #28
; ARM7-NEXT: smmul r1, r1, r2
; ARM7-NEXT: add r1, r1, r1, lsr #31
; ARM7-NEXT: add r1, r1, r1, lsl #1
; ARM7-NEXT: mvn r1, r1, lsl #1
; ARM7-NEXT: add r0, r1, r0, asr #28
; ARM7-NEXT: clz r0, r0
; ARM7-NEXT: lsr r0, r0, #5
; ARM7-NEXT: bx lr
;
; ARM8-LABEL: test_srem_even:
; ARM8: @ %bb.0:
; ARM8-NEXT: movw r2, #43691
; ARM8-NEXT: sbfx r1, r0, #0, #4
; ARM8-NEXT: movt r2, #10922
; ARM8-NEXT: lsl r0, r0, #28
; ARM8-NEXT: smmul r1, r1, r2
; ARM8-NEXT: add r1, r1, r1, lsr #31
; ARM8-NEXT: add r1, r1, r1, lsl #1
; ARM8-NEXT: mvn r1, r1, lsl #1
; ARM8-NEXT: add r0, r1, r0, asr #28
; ARM8-NEXT: clz r0, r0
; ARM8-NEXT: lsr r0, r0, #5
; ARM8-NEXT: bx lr
;
; NEON7-LABEL: test_srem_even:
; NEON7: @ %bb.0:
; NEON7-NEXT: movw r2, #43691
; NEON7-NEXT: sbfx r1, r0, #0, #4
; NEON7-NEXT: movt r2, #10922
; NEON7-NEXT: lsl r0, r0, #28
; NEON7-NEXT: smmul r1, r1, r2
; NEON7-NEXT: add r1, r1, r1, lsr #31
; NEON7-NEXT: add r1, r1, r1, lsl #1
; NEON7-NEXT: mvn r1, r1, lsl #1
; NEON7-NEXT: add r0, r1, r0, asr #28
; NEON7-NEXT: clz r0, r0
; NEON7-NEXT: lsr r0, r0, #5
; NEON7-NEXT: bx lr
;
; NEON8-LABEL: test_srem_even:
; NEON8: @ %bb.0:
; NEON8-NEXT: movw r2, #43691
; NEON8-NEXT: sbfx r1, r0, #0, #4
; NEON8-NEXT: movt r2, #10922
; NEON8-NEXT: lsl r0, r0, #28
; NEON8-NEXT: smmul r1, r1, r2
; NEON8-NEXT: add r1, r1, r1, lsr #31
; NEON8-NEXT: add r1, r1, r1, lsl #1
; NEON8-NEXT: mvn r1, r1, lsl #1
; NEON8-NEXT: add r0, r1, r0, asr #28
; NEON8-NEXT: clz r0, r0
; NEON8-NEXT: lsr r0, r0, #5
; NEON8-NEXT: bx lr
%srem = srem i4 %X, 6
%cmp = icmp eq i4 %srem, 1
ret i1 %cmp
}
define i1 @test_srem_pow2_setne(i6 %X) nounwind {
; ARM5-LABEL: test_srem_pow2_setne:
; ARM5: @ %bb.0:
; ARM5-NEXT: lsl r1, r0, #26
; ARM5-NEXT: mov r2, #3
; ARM5-NEXT: asr r1, r1, #26
; ARM5-NEXT: and r1, r2, r1, lsr #9
; ARM5-NEXT: add r1, r0, r1
; ARM5-NEXT: and r1, r1, #60
; ARM5-NEXT: sub r0, r0, r1
; ARM5-NEXT: ands r0, r0, #63
; ARM5-NEXT: movne r0, #1
; ARM5-NEXT: bx lr
;
; ARM6-LABEL: test_srem_pow2_setne:
; ARM6: @ %bb.0:
; ARM6-NEXT: lsl r1, r0, #26
; ARM6-NEXT: mov r2, #3
; ARM6-NEXT: asr r1, r1, #26
; ARM6-NEXT: and r1, r2, r1, lsr #9
; ARM6-NEXT: add r1, r0, r1
; ARM6-NEXT: and r1, r1, #60
; ARM6-NEXT: sub r0, r0, r1
; ARM6-NEXT: ands r0, r0, #63
; ARM6-NEXT: movne r0, #1
; ARM6-NEXT: bx lr
;
; ARM7-LABEL: test_srem_pow2_setne:
; ARM7: @ %bb.0:
; ARM7-NEXT: sbfx r1, r0, #0, #6
; ARM7-NEXT: ubfx r1, r1, #9, #2
; ARM7-NEXT: add r1, r0, r1
; ARM7-NEXT: and r1, r1, #60
; ARM7-NEXT: sub r0, r0, r1
; ARM7-NEXT: ands r0, r0, #63
; ARM7-NEXT: movwne r0, #1
; ARM7-NEXT: bx lr
;
; ARM8-LABEL: test_srem_pow2_setne:
; ARM8: @ %bb.0:
; ARM8-NEXT: sbfx r1, r0, #0, #6
; ARM8-NEXT: ubfx r1, r1, #9, #2
; ARM8-NEXT: add r1, r0, r1
; ARM8-NEXT: and r1, r1, #60
; ARM8-NEXT: sub r0, r0, r1
; ARM8-NEXT: ands r0, r0, #63
; ARM8-NEXT: movwne r0, #1
; ARM8-NEXT: bx lr
;
; NEON7-LABEL: test_srem_pow2_setne:
; NEON7: @ %bb.0:
; NEON7-NEXT: sbfx r1, r0, #0, #6
; NEON7-NEXT: ubfx r1, r1, #9, #2
; NEON7-NEXT: add r1, r0, r1
; NEON7-NEXT: and r1, r1, #60
; NEON7-NEXT: sub r0, r0, r1
; NEON7-NEXT: ands r0, r0, #63
; NEON7-NEXT: movwne r0, #1
; NEON7-NEXT: bx lr
;
; NEON8-LABEL: test_srem_pow2_setne:
; NEON8: @ %bb.0:
; NEON8-NEXT: sbfx r1, r0, #0, #6
; NEON8-NEXT: ubfx r1, r1, #9, #2
; NEON8-NEXT: add r1, r0, r1
; NEON8-NEXT: and r1, r1, #60
; NEON8-NEXT: sub r0, r0, r1
; NEON8-NEXT: ands r0, r0, #63
; NEON8-NEXT: movwne r0, #1
; NEON8-NEXT: bx lr
%srem = srem i6 %X, 4
%cmp = icmp ne i6 %srem, 0
ret i1 %cmp
}
define <3 x i1> @test_srem_vec(<3 x i33> %X) nounwind {
; ARM5-LABEL: test_srem_vec:
; ARM5: @ %bb.0:
; ARM5-NEXT: push {r4, r5, r6, lr}
; ARM5-NEXT: and r1, r1, #1
; ARM5-NEXT: mov r5, r3
; ARM5-NEXT: rsb r1, r1, #0
; ARM5-NEXT: mov r6, r2
; ARM5-NEXT: mov r2, #9
; ARM5-NEXT: mov r3, #0
; ARM5-NEXT: bl __moddi3
; ARM5-NEXT: eor r0, r0, #3
; ARM5-NEXT: mov r2, #9
; ARM5-NEXT: orrs r4, r0, r1
; ARM5-NEXT: and r0, r5, #1
; ARM5-NEXT: rsb r1, r0, #0
; ARM5-NEXT: mov r0, r6
; ARM5-NEXT: mov r3, #0
; ARM5-NEXT: movne r4, #1
; ARM5-NEXT: bl __moddi3
; ARM5-NEXT: mov r2, #1
; ARM5-NEXT: bic r1, r2, r1
; ARM5-NEXT: mvn r2, #2
; ARM5-NEXT: eor r0, r0, r2
; ARM5-NEXT: orrs r5, r0, r1
; ARM5-NEXT: ldr r0, [sp, #20]
; ARM5-NEXT: mvn r2, #8
; ARM5-NEXT: mvn r3, #0
; ARM5-NEXT: and r0, r0, #1
; ARM5-NEXT: movne r5, #1
; ARM5-NEXT: rsb r1, r0, #0
; ARM5-NEXT: ldr r0, [sp, #16]
; ARM5-NEXT: bl __moddi3
; ARM5-NEXT: eor r0, r0, #3
; ARM5-NEXT: orrs r2, r0, r1
; ARM5-NEXT: mov r0, r4
; ARM5-NEXT: movne r2, #1
; ARM5-NEXT: mov r1, r5
; ARM5-NEXT: pop {r4, r5, r6, pc}
;
; ARM6-LABEL: test_srem_vec:
; ARM6: @ %bb.0:
; ARM6-NEXT: push {r4, r5, r6, lr}
; ARM6-NEXT: and r1, r1, #1
; ARM6-NEXT: mov r5, r3
; ARM6-NEXT: rsb r1, r1, #0
; ARM6-NEXT: mov r6, r2
; ARM6-NEXT: mov r2, #9
; ARM6-NEXT: mov r3, #0
; ARM6-NEXT: bl __moddi3
; ARM6-NEXT: eor r0, r0, #3
; ARM6-NEXT: mov r2, #9
; ARM6-NEXT: orrs r4, r0, r1
; ARM6-NEXT: and r0, r5, #1
; ARM6-NEXT: rsb r1, r0, #0
; ARM6-NEXT: mov r0, r6
; ARM6-NEXT: mov r3, #0
; ARM6-NEXT: movne r4, #1
; ARM6-NEXT: bl __moddi3
; ARM6-NEXT: mov r2, #1
; ARM6-NEXT: bic r1, r2, r1
; ARM6-NEXT: mvn r2, #2
; ARM6-NEXT: eor r0, r0, r2
; ARM6-NEXT: orrs r5, r0, r1
; ARM6-NEXT: ldr r0, [sp, #20]
; ARM6-NEXT: mvn r2, #8
; ARM6-NEXT: mvn r3, #0
; ARM6-NEXT: and r0, r0, #1
; ARM6-NEXT: movne r5, #1
; ARM6-NEXT: rsb r1, r0, #0
; ARM6-NEXT: ldr r0, [sp, #16]
; ARM6-NEXT: bl __moddi3
; ARM6-NEXT: eor r0, r0, #3
; ARM6-NEXT: orrs r2, r0, r1
; ARM6-NEXT: mov r0, r4
; ARM6-NEXT: movne r2, #1
; ARM6-NEXT: mov r1, r5
; ARM6-NEXT: pop {r4, r5, r6, pc}
;
; ARM7-LABEL: test_srem_vec:
; ARM7: @ %bb.0:
; ARM7-NEXT: push {r4, r5, r6, r7, r11, lr}
; ARM7-NEXT: vpush {d8, d9}
; ARM7-NEXT: mov r6, r0
; ARM7-NEXT: and r0, r3, #1
; ARM7-NEXT: mov r5, r1
; ARM7-NEXT: rsb r1, r0, #0
; ARM7-NEXT: mov r0, r2
; ARM7-NEXT: mov r2, #9
; ARM7-NEXT: mov r3, #0
; ARM7-NEXT: bl __moddi3
; ARM7-NEXT: mov r7, r0
; ARM7-NEXT: and r0, r5, #1
; ARM7-NEXT: mov r4, r1
; ARM7-NEXT: rsb r1, r0, #0
; ARM7-NEXT: mov r0, r6
; ARM7-NEXT: mov r2, #9
; ARM7-NEXT: mov r3, #0
; ARM7-NEXT: bl __moddi3
; ARM7-NEXT: vmov.32 d8[0], r0
; ARM7-NEXT: ldr r0, [sp, #44]
; ARM7-NEXT: ldr r2, [sp, #40]
; ARM7-NEXT: mov r5, r1
; ARM7-NEXT: and r0, r0, #1
; ARM7-NEXT: mvn r3, #0
; ARM7-NEXT: rsb r1, r0, #0
; ARM7-NEXT: vmov.32 d9[0], r7
; ARM7-NEXT: mov r0, r2
; ARM7-NEXT: mvn r2, #8
; ARM7-NEXT: bl __moddi3
; ARM7-NEXT: vmov.32 d16[0], r0
; ARM7-NEXT: adr r0, .LCPI3_0
; ARM7-NEXT: vmov.32 d9[1], r4
; ARM7-NEXT: vld1.64 {d18, d19}, [r0:128]
; ARM7-NEXT: adr r0, .LCPI3_1
; ARM7-NEXT: vmov.32 d16[1], r1
; ARM7-NEXT: vmov.32 d8[1], r5
; ARM7-NEXT: vand q8, q8, q9
; ARM7-NEXT: vld1.64 {d20, d21}, [r0:128]
; ARM7-NEXT: adr r0, .LCPI3_2
; ARM7-NEXT: vand q11, q4, q9
; ARM7-NEXT: vld1.64 {d18, d19}, [r0:128]
; ARM7-NEXT: vceq.i32 q10, q11, q10
; ARM7-NEXT: vceq.i32 q8, q8, q9
; ARM7-NEXT: vrev64.32 q9, q10
; ARM7-NEXT: vrev64.32 q11, q8
; ARM7-NEXT: vand q9, q10, q9
; ARM7-NEXT: vand q8, q8, q11
; ARM7-NEXT: vmvn q9, q9
; ARM7-NEXT: vmvn q8, q8
; ARM7-NEXT: vmovn.i64 d18, q9
; ARM7-NEXT: vmovn.i64 d16, q8
; ARM7-NEXT: vmov.32 r0, d18[0]
; ARM7-NEXT: vmov.32 r1, d18[1]
; ARM7-NEXT: vmov.32 r2, d16[0]
; ARM7-NEXT: vpop {d8, d9}
; ARM7-NEXT: pop {r4, r5, r6, r7, r11, pc}
; ARM7-NEXT: .p2align 4
; ARM7-NEXT: @ %bb.1:
; ARM7-NEXT: .LCPI3_0:
; ARM7-NEXT: .long 4294967295 @ 0xffffffff
; ARM7-NEXT: .long 1 @ 0x1
; ARM7-NEXT: .long 4294967295 @ 0xffffffff
; ARM7-NEXT: .long 1 @ 0x1
; ARM7-NEXT: .LCPI3_1:
; ARM7-NEXT: .long 3 @ 0x3
; ARM7-NEXT: .long 0 @ 0x0
; ARM7-NEXT: .long 4294967293 @ 0xfffffffd
; ARM7-NEXT: .long 1 @ 0x1
; ARM7-NEXT: .LCPI3_2:
; ARM7-NEXT: .long 3 @ 0x3
; ARM7-NEXT: .long 0 @ 0x0
; ARM7-NEXT: .zero 4
; ARM7-NEXT: .long 0 @ 0x0
;
; ARM8-LABEL: test_srem_vec:
; ARM8: @ %bb.0:
; ARM8-NEXT: push {r4, r5, r6, r7, r11, lr}
; ARM8-NEXT: vpush {d8, d9}
; ARM8-NEXT: mov r6, r0
; ARM8-NEXT: and r0, r3, #1
; ARM8-NEXT: mov r5, r1
; ARM8-NEXT: rsb r1, r0, #0
; ARM8-NEXT: mov r0, r2
; ARM8-NEXT: mov r2, #9
; ARM8-NEXT: mov r3, #0
; ARM8-NEXT: bl __moddi3
; ARM8-NEXT: mov r7, r0
; ARM8-NEXT: and r0, r5, #1
; ARM8-NEXT: mov r4, r1
; ARM8-NEXT: rsb r1, r0, #0
; ARM8-NEXT: mov r0, r6
; ARM8-NEXT: mov r2, #9
; ARM8-NEXT: mov r3, #0
; ARM8-NEXT: bl __moddi3
; ARM8-NEXT: vmov.32 d8[0], r0
; ARM8-NEXT: ldr r0, [sp, #44]
; ARM8-NEXT: ldr r2, [sp, #40]
; ARM8-NEXT: mov r5, r1
; ARM8-NEXT: and r0, r0, #1
; ARM8-NEXT: mvn r3, #0
; ARM8-NEXT: rsb r1, r0, #0
; ARM8-NEXT: vmov.32 d9[0], r7
; ARM8-NEXT: mov r0, r2
; ARM8-NEXT: mvn r2, #8
; ARM8-NEXT: bl __moddi3
; ARM8-NEXT: vmov.32 d16[0], r0
; ARM8-NEXT: adr r0, .LCPI3_0
; ARM8-NEXT: vmov.32 d9[1], r4
; ARM8-NEXT: vld1.64 {d18, d19}, [r0:128]
; ARM8-NEXT: adr r0, .LCPI3_1
; ARM8-NEXT: vmov.32 d16[1], r1
; ARM8-NEXT: vmov.32 d8[1], r5
; ARM8-NEXT: vand q8, q8, q9
; ARM8-NEXT: vld1.64 {d20, d21}, [r0:128]
; ARM8-NEXT: adr r0, .LCPI3_2
; ARM8-NEXT: vand q11, q4, q9
; ARM8-NEXT: vld1.64 {d18, d19}, [r0:128]
; ARM8-NEXT: vceq.i32 q10, q11, q10
; ARM8-NEXT: vceq.i32 q8, q8, q9
; ARM8-NEXT: vrev64.32 q9, q10
; ARM8-NEXT: vrev64.32 q11, q8
; ARM8-NEXT: vand q9, q10, q9
; ARM8-NEXT: vand q8, q8, q11
; ARM8-NEXT: vmvn q9, q9
; ARM8-NEXT: vmvn q8, q8
; ARM8-NEXT: vmovn.i64 d18, q9
; ARM8-NEXT: vmovn.i64 d16, q8
; ARM8-NEXT: vmov.32 r0, d18[0]
; ARM8-NEXT: vmov.32 r1, d18[1]
; ARM8-NEXT: vmov.32 r2, d16[0]
; ARM8-NEXT: vpop {d8, d9}
; ARM8-NEXT: pop {r4, r5, r6, r7, r11, pc}
; ARM8-NEXT: .p2align 4
; ARM8-NEXT: @ %bb.1:
; ARM8-NEXT: .LCPI3_0:
; ARM8-NEXT: .long 4294967295 @ 0xffffffff
; ARM8-NEXT: .long 1 @ 0x1
; ARM8-NEXT: .long 4294967295 @ 0xffffffff
; ARM8-NEXT: .long 1 @ 0x1
; ARM8-NEXT: .LCPI3_1:
; ARM8-NEXT: .long 3 @ 0x3
; ARM8-NEXT: .long 0 @ 0x0
; ARM8-NEXT: .long 4294967293 @ 0xfffffffd
; ARM8-NEXT: .long 1 @ 0x1
; ARM8-NEXT: .LCPI3_2:
; ARM8-NEXT: .long 3 @ 0x3
; ARM8-NEXT: .long 0 @ 0x0
; ARM8-NEXT: .zero 4
; ARM8-NEXT: .long 0 @ 0x0
;
; NEON7-LABEL: test_srem_vec:
; NEON7: @ %bb.0:
; NEON7-NEXT: push {r4, r5, r6, r7, r11, lr}
; NEON7-NEXT: vpush {d8, d9}
; NEON7-NEXT: mov r6, r0
; NEON7-NEXT: and r0, r3, #1
; NEON7-NEXT: mov r5, r1
; NEON7-NEXT: rsb r1, r0, #0
; NEON7-NEXT: mov r0, r2
; NEON7-NEXT: mov r2, #9
; NEON7-NEXT: mov r3, #0
; NEON7-NEXT: bl __moddi3
; NEON7-NEXT: mov r7, r0
; NEON7-NEXT: and r0, r5, #1
; NEON7-NEXT: mov r4, r1
; NEON7-NEXT: rsb r1, r0, #0
; NEON7-NEXT: mov r0, r6
; NEON7-NEXT: mov r2, #9
; NEON7-NEXT: mov r3, #0
; NEON7-NEXT: bl __moddi3
; NEON7-NEXT: vmov.32 d8[0], r0
; NEON7-NEXT: ldr r0, [sp, #44]
; NEON7-NEXT: ldr r2, [sp, #40]
; NEON7-NEXT: mov r5, r1
; NEON7-NEXT: and r0, r0, #1
; NEON7-NEXT: mvn r3, #0
; NEON7-NEXT: rsb r1, r0, #0
; NEON7-NEXT: vmov.32 d9[0], r7
; NEON7-NEXT: mov r0, r2
; NEON7-NEXT: mvn r2, #8
; NEON7-NEXT: bl __moddi3
; NEON7-NEXT: vmov.32 d16[0], r0
; NEON7-NEXT: adr r0, .LCPI3_0
; NEON7-NEXT: vmov.32 d9[1], r4
; NEON7-NEXT: vld1.64 {d18, d19}, [r0:128]
; NEON7-NEXT: adr r0, .LCPI3_1
; NEON7-NEXT: vmov.32 d16[1], r1
; NEON7-NEXT: vmov.32 d8[1], r5
; NEON7-NEXT: vand q8, q8, q9
; NEON7-NEXT: vld1.64 {d20, d21}, [r0:128]
; NEON7-NEXT: adr r0, .LCPI3_2
; NEON7-NEXT: vand q11, q4, q9
; NEON7-NEXT: vld1.64 {d18, d19}, [r0:128]
; NEON7-NEXT: vceq.i32 q10, q11, q10
; NEON7-NEXT: vceq.i32 q8, q8, q9
; NEON7-NEXT: vrev64.32 q9, q10
; NEON7-NEXT: vrev64.32 q11, q8
; NEON7-NEXT: vand q9, q10, q9
; NEON7-NEXT: vand q8, q8, q11
; NEON7-NEXT: vmvn q9, q9
; NEON7-NEXT: vmvn q8, q8
; NEON7-NEXT: vmovn.i64 d18, q9
; NEON7-NEXT: vmovn.i64 d16, q8
; NEON7-NEXT: vmov.32 r0, d18[0]
; NEON7-NEXT: vmov.32 r1, d18[1]
; NEON7-NEXT: vmov.32 r2, d16[0]
; NEON7-NEXT: vpop {d8, d9}
; NEON7-NEXT: pop {r4, r5, r6, r7, r11, pc}
; NEON7-NEXT: .p2align 4
; NEON7-NEXT: @ %bb.1:
; NEON7-NEXT: .LCPI3_0:
; NEON7-NEXT: .long 4294967295 @ 0xffffffff
; NEON7-NEXT: .long 1 @ 0x1
; NEON7-NEXT: .long 4294967295 @ 0xffffffff
; NEON7-NEXT: .long 1 @ 0x1
; NEON7-NEXT: .LCPI3_1:
; NEON7-NEXT: .long 3 @ 0x3
; NEON7-NEXT: .long 0 @ 0x0
; NEON7-NEXT: .long 4294967293 @ 0xfffffffd
; NEON7-NEXT: .long 1 @ 0x1
; NEON7-NEXT: .LCPI3_2:
; NEON7-NEXT: .long 3 @ 0x3
; NEON7-NEXT: .long 0 @ 0x0
; NEON7-NEXT: .zero 4
; NEON7-NEXT: .long 0 @ 0x0
;
; NEON8-LABEL: test_srem_vec:
; NEON8: @ %bb.0:
; NEON8-NEXT: push {r4, r5, r6, r7, r11, lr}
; NEON8-NEXT: vpush {d8, d9}
; NEON8-NEXT: mov r6, r0
; NEON8-NEXT: and r0, r3, #1
; NEON8-NEXT: mov r5, r1
; NEON8-NEXT: rsb r1, r0, #0
; NEON8-NEXT: mov r0, r2
; NEON8-NEXT: mov r2, #9
; NEON8-NEXT: mov r3, #0
; NEON8-NEXT: bl __moddi3
; NEON8-NEXT: mov r7, r0
; NEON8-NEXT: and r0, r5, #1
; NEON8-NEXT: mov r4, r1
; NEON8-NEXT: rsb r1, r0, #0
; NEON8-NEXT: mov r0, r6
; NEON8-NEXT: mov r2, #9
; NEON8-NEXT: mov r3, #0
; NEON8-NEXT: bl __moddi3
; NEON8-NEXT: vmov.32 d8[0], r0
; NEON8-NEXT: ldr r0, [sp, #44]
; NEON8-NEXT: ldr r2, [sp, #40]
; NEON8-NEXT: mov r5, r1
; NEON8-NEXT: and r0, r0, #1
; NEON8-NEXT: mvn r3, #0
; NEON8-NEXT: rsb r1, r0, #0
; NEON8-NEXT: vmov.32 d9[0], r7
; NEON8-NEXT: mov r0, r2
; NEON8-NEXT: mvn r2, #8
; NEON8-NEXT: bl __moddi3
; NEON8-NEXT: vmov.32 d16[0], r0
; NEON8-NEXT: adr r0, .LCPI3_0
; NEON8-NEXT: vmov.32 d9[1], r4
; NEON8-NEXT: vld1.64 {d18, d19}, [r0:128]
; NEON8-NEXT: adr r0, .LCPI3_1
; NEON8-NEXT: vmov.32 d16[1], r1
; NEON8-NEXT: vmov.32 d8[1], r5
; NEON8-NEXT: vand q8, q8, q9
; NEON8-NEXT: vld1.64 {d20, d21}, [r0:128]
; NEON8-NEXT: adr r0, .LCPI3_2
; NEON8-NEXT: vand q11, q4, q9
; NEON8-NEXT: vld1.64 {d18, d19}, [r0:128]
; NEON8-NEXT: vceq.i32 q10, q11, q10
; NEON8-NEXT: vceq.i32 q8, q8, q9
; NEON8-NEXT: vrev64.32 q9, q10
; NEON8-NEXT: vrev64.32 q11, q8
; NEON8-NEXT: vand q9, q10, q9
; NEON8-NEXT: vand q8, q8, q11
; NEON8-NEXT: vmvn q9, q9
; NEON8-NEXT: vmvn q8, q8
; NEON8-NEXT: vmovn.i64 d18, q9
; NEON8-NEXT: vmovn.i64 d16, q8
; NEON8-NEXT: vmov.32 r0, d18[0]
; NEON8-NEXT: vmov.32 r1, d18[1]
; NEON8-NEXT: vmov.32 r2, d16[0]
; NEON8-NEXT: vpop {d8, d9}
; NEON8-NEXT: pop {r4, r5, r6, r7, r11, pc}
; NEON8-NEXT: .p2align 4
; NEON8-NEXT: @ %bb.1:
; NEON8-NEXT: .LCPI3_0:
; NEON8-NEXT: .long 4294967295 @ 0xffffffff
; NEON8-NEXT: .long 1 @ 0x1
; NEON8-NEXT: .long 4294967295 @ 0xffffffff
; NEON8-NEXT: .long 1 @ 0x1
; NEON8-NEXT: .LCPI3_1:
; NEON8-NEXT: .long 3 @ 0x3
; NEON8-NEXT: .long 0 @ 0x0
; NEON8-NEXT: .long 4294967293 @ 0xfffffffd
; NEON8-NEXT: .long 1 @ 0x1
; NEON8-NEXT: .LCPI3_2:
; NEON8-NEXT: .long 3 @ 0x3
; NEON8-NEXT: .long 0 @ 0x0
; NEON8-NEXT: .zero 4
; NEON8-NEXT: .long 0 @ 0x0
%srem = srem <3 x i33> %X, <i33 9, i33 9, i33 -9>
%cmp = icmp ne <3 x i33> %srem, <i33 3, i33 -3, i33 3>
ret <3 x i1> %cmp
}