|  | ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py | 
|  | ; RUN: llc -mtriple=arm-eabi -mattr=+neon,+fullfp16 %s -o - | FileCheck --check-prefixes=CHECK,CHECK-LE %s | 
|  | ; RUN: llc -mtriple=armeb-eabi -mattr=+neon,+fullfp16 %s -o - | FileCheck --check-prefixes=CHECK,CHECK-BE %s | 
|  |  | 
|  | define arm_aapcs_vfpcc <8 x i8> @v_movi8() nounwind { | 
|  | ; CHECK-LABEL: v_movi8: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 d0, #0x8 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <8 x i8> < i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i16> @v_movi16a() nounwind { | 
|  | ; CHECK-LABEL: v_movi16a: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 d0, #0x10 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <4 x i16> < i16 16, i16 16, i16 16, i16 16 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i16> @v_movi16b() nounwind { | 
|  | ; CHECK-LABEL: v_movi16b: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 d0, #0x1000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <4 x i16> < i16 4096, i16 4096, i16 4096, i16 4096 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i16> @v_mvni16a() nounwind { | 
|  | ; CHECK-LABEL: v_mvni16a: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 d0, #0x10 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <4 x i16> < i16 65519, i16 65519, i16 65519, i16 65519 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i16> @v_mvni16b() nounwind { | 
|  | ; CHECK-LABEL: v_mvni16b: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 d0, #0x1000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <4 x i16> < i16 61439, i16 61439, i16 61439, i16 61439 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_movi32a() nounwind { | 
|  | ; CHECK-LABEL: v_movi32a: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 d0, #0x20 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 32, i32 32 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_movi32b() nounwind { | 
|  | ; CHECK-LABEL: v_movi32b: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 d0, #0x2000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 8192, i32 8192 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_movi32c() nounwind { | 
|  | ; CHECK-LABEL: v_movi32c: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 d0, #0x200000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 2097152, i32 2097152 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_movi32d() nounwind { | 
|  | ; CHECK-LABEL: v_movi32d: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 d0, #0x20000000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 536870912, i32 536870912 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_movi32e() nounwind { | 
|  | ; CHECK-LABEL: v_movi32e: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 d0, #0x20ff | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 8447, i32 8447 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_movi32f() nounwind { | 
|  | ; CHECK-LABEL: v_movi32f: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 d0, #0x20ffff | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 2162687, i32 2162687 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_mvni32a() nounwind { | 
|  | ; CHECK-LABEL: v_mvni32a: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 d0, #0x20 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 4294967263, i32 4294967263 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_mvni32b() nounwind { | 
|  | ; CHECK-LABEL: v_mvni32b: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 d0, #0x2000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 4294959103, i32 4294959103 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_mvni32c() nounwind { | 
|  | ; CHECK-LABEL: v_mvni32c: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 d0, #0x200000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 4292870143, i32 4292870143 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_mvni32d() nounwind { | 
|  | ; CHECK-LABEL: v_mvni32d: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 d0, #0x20000000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 3758096383, i32 3758096383 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_mvni32e() nounwind { | 
|  | ; CHECK-LABEL: v_mvni32e: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 d0, #0x20ff | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 4294958848, i32 4294958848 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @v_mvni32f() nounwind { | 
|  | ; CHECK-LABEL: v_mvni32f: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 d0, #0x20ffff | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i32> < i32 4292804608, i32 4292804608 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <1 x i64> @v_movi64() nounwind { | 
|  | ; CHECK-LABEL: v_movi64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i64 d0, #0xff0000ff0000ffff | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <1 x i64> < i64 18374687574888349695 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <16 x i8> @v_movQi8() nounwind { | 
|  | ; CHECK-LABEL: v_movQi8: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 q0, #0x8 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <16 x i8> < i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <8 x i16> @v_movQi16a() nounwind { | 
|  | ; CHECK-LABEL: v_movQi16a: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 q0, #0x10 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <8 x i16> < i16 16, i16 16, i16 16, i16 16, i16 16, i16 16, i16 16, i16 16 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <8 x i16> @v_movQi16b() nounwind { | 
|  | ; CHECK-LABEL: v_movQi16b: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 q0, #0x1000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <8 x i16> < i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i32> @v_movQi32a() nounwind { | 
|  | ; CHECK-LABEL: v_movQi32a: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 q0, #0x20 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <4 x i32> < i32 32, i32 32, i32 32, i32 32 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i32> @v_movQi32b() nounwind { | 
|  | ; CHECK-LABEL: v_movQi32b: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 q0, #0x2000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <4 x i32> < i32 8192, i32 8192, i32 8192, i32 8192 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i32> @v_movQi32c() nounwind { | 
|  | ; CHECK-LABEL: v_movQi32c: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 q0, #0x200000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <4 x i32> < i32 2097152, i32 2097152, i32 2097152, i32 2097152 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i32> @v_movQi32d() nounwind { | 
|  | ; CHECK-LABEL: v_movQi32d: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 q0, #0x20000000 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <4 x i32> < i32 536870912, i32 536870912, i32 536870912, i32 536870912 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i32> @v_movQi32e() nounwind { | 
|  | ; CHECK-LABEL: v_movQi32e: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 q0, #0x20ff | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <4 x i32> < i32 8447, i32 8447, i32 8447, i32 8447 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i32> @v_movQi32f() nounwind { | 
|  | ; CHECK-LABEL: v_movQi32f: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 q0, #0x20ffff | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <4 x i32> < i32 2162687, i32 2162687, i32 2162687, i32 2162687 > | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i64> @v_movQi64() nounwind { | 
|  | ; CHECK-LABEL: v_movQi64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i64 q0, #0xff0000ff0000ffff | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | ret <2 x i64> < i64 18374687574888349695, i64 18374687574888349695 > | 
|  | } | 
|  |  | 
|  | ; Check for correct assembler printing for immediate values. | 
|  | %struct.int8x8_t = type { <8 x i8> } | 
|  | define arm_aapcs_vfpcc void @vdupn128(ptr noalias nocapture sret(%struct.int8x8_t) %agg.result) nounwind { | 
|  | ; CHECK-LABEL: vdupn128: | 
|  | ; CHECK:       @ %bb.0: @ %entry | 
|  | ; CHECK-NEXT:    vmov.i8 d16, #0x80 | 
|  | ; CHECK-NEXT:    vstr d16, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | entry: | 
|  | %0 = getelementptr inbounds %struct.int8x8_t, ptr %agg.result, i32 0, i32 0 ; <ptr> [#uses=1] | 
|  | store <8 x i8> <i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128>, ptr %0, align 8 | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @vdupnneg75(ptr noalias nocapture sret(%struct.int8x8_t) %agg.result) nounwind { | 
|  | ; CHECK-LABEL: vdupnneg75: | 
|  | ; CHECK:       @ %bb.0: @ %entry | 
|  | ; CHECK-NEXT:    vmov.i8 d16, #0xb5 | 
|  | ; CHECK-NEXT:    vstr d16, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | entry: | 
|  | %0 = getelementptr inbounds %struct.int8x8_t, ptr %agg.result, i32 0, i32 0 ; <ptr> [#uses=1] | 
|  | store <8 x i8> <i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75>, ptr %0, align 8 | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <8 x i16> @vmovls8(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vmovls8: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.8 {d16}, [r0:64] | 
|  | ; CHECK-LE-NEXT:    vmovl.s8 q0, d16 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vmovls8: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.8 {d16}, [r0:64] | 
|  | ; CHECK-BE-NEXT:    vmovl.s8 q8, d16 | 
|  | ; CHECK-BE-NEXT:    vrev64.16 q0, q8 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <8 x i8>, ptr %A | 
|  | %tmp2 = sext <8 x i8> %tmp1 to <8 x i16> | 
|  | ret <8 x i16> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i32> @vmovls16(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vmovls16: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.16 {d16}, [r0:64] | 
|  | ; CHECK-LE-NEXT:    vmovl.s16 q0, d16 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vmovls16: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.16 {d16}, [r0:64] | 
|  | ; CHECK-BE-NEXT:    vmovl.s16 q8, d16 | 
|  | ; CHECK-BE-NEXT:    vrev64.32 q0, q8 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <4 x i16>, ptr %A | 
|  | %tmp2 = sext <4 x i16> %tmp1 to <4 x i32> | 
|  | ret <4 x i32> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i64> @vmovls32(ptr %A) nounwind { | 
|  | ; CHECK-LABEL: vmovls32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vld1.32 {d16}, [r0:64] | 
|  | ; CHECK-NEXT:    vmovl.s32 q0, d16 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %tmp1 = load <2 x i32>, ptr %A | 
|  | %tmp2 = sext <2 x i32> %tmp1 to <2 x i64> | 
|  | ret <2 x i64> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <8 x i16> @vmovlu8(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vmovlu8: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.8 {d16}, [r0:64] | 
|  | ; CHECK-LE-NEXT:    vmovl.u8 q0, d16 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vmovlu8: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.8 {d16}, [r0:64] | 
|  | ; CHECK-BE-NEXT:    vmovl.u8 q8, d16 | 
|  | ; CHECK-BE-NEXT:    vrev64.16 q0, q8 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <8 x i8>, ptr %A | 
|  | %tmp2 = zext <8 x i8> %tmp1 to <8 x i16> | 
|  | ret <8 x i16> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i32> @vmovlu16(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vmovlu16: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.16 {d16}, [r0:64] | 
|  | ; CHECK-LE-NEXT:    vmovl.u16 q0, d16 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vmovlu16: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.16 {d16}, [r0:64] | 
|  | ; CHECK-BE-NEXT:    vmovl.u16 q8, d16 | 
|  | ; CHECK-BE-NEXT:    vrev64.32 q0, q8 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <4 x i16>, ptr %A | 
|  | %tmp2 = zext <4 x i16> %tmp1 to <4 x i32> | 
|  | ret <4 x i32> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i64> @vmovlu32(ptr %A) nounwind { | 
|  | ; CHECK-LABEL: vmovlu32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vld1.32 {d16}, [r0:64] | 
|  | ; CHECK-NEXT:    vmovl.u32 q0, d16 | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %tmp1 = load <2 x i32>, ptr %A | 
|  | %tmp2 = zext <2 x i32> %tmp1 to <2 x i64> | 
|  | ret <2 x i64> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <8 x i8> @vmovni16(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vmovni16: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vmovn.i16 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vmovni16: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vrev64.16 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vmovn.i16 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.8 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <8 x i16>, ptr %A | 
|  | %tmp2 = trunc <8 x i16> %tmp1 to <8 x i8> | 
|  | ret <8 x i8> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i16> @vmovni32(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vmovni32: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vmovn.i32 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vmovni32: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vrev64.32 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vmovn.i32 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.16 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <4 x i32>, ptr %A | 
|  | %tmp2 = trunc <4 x i32> %tmp1 to <4 x i16> | 
|  | ret <4 x i16> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @vmovni64(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vmovni64: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vmovn.i64 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vmovni64: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vmovn.i64 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.32 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <2 x i64>, ptr %A | 
|  | %tmp2 = trunc <2 x i64> %tmp1 to <2 x i32> | 
|  | ret <2 x i32> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <8 x i8> @vqmovns16(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vqmovns16: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vqmovn.s16 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vqmovns16: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vrev64.16 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vqmovn.s16 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.8 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <8 x i16>, ptr %A | 
|  | %tmp2 = call <8 x i8> @llvm.arm.neon.vqmovns.v8i8(<8 x i16> %tmp1) | 
|  | ret <8 x i8> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i16> @vqmovns32(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vqmovns32: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vqmovn.s32 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vqmovns32: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vrev64.32 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vqmovn.s32 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.16 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <4 x i32>, ptr %A | 
|  | %tmp2 = call <4 x i16> @llvm.arm.neon.vqmovns.v4i16(<4 x i32> %tmp1) | 
|  | ret <4 x i16> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @vqmovns64(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vqmovns64: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vqmovn.s64 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vqmovns64: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vqmovn.s64 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.32 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <2 x i64>, ptr %A | 
|  | %tmp2 = call <2 x i32> @llvm.arm.neon.vqmovns.v2i32(<2 x i64> %tmp1) | 
|  | ret <2 x i32> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <8 x i8> @vqmovnu16(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vqmovnu16: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vqmovn.u16 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vqmovnu16: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vrev64.16 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vqmovn.u16 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.8 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <8 x i16>, ptr %A | 
|  | %tmp2 = call <8 x i8> @llvm.arm.neon.vqmovnu.v8i8(<8 x i16> %tmp1) | 
|  | ret <8 x i8> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i16> @vqmovnu32(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vqmovnu32: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vqmovn.u32 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vqmovnu32: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vrev64.32 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vqmovn.u32 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.16 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <4 x i32>, ptr %A | 
|  | %tmp2 = call <4 x i16> @llvm.arm.neon.vqmovnu.v4i16(<4 x i32> %tmp1) | 
|  | ret <4 x i16> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @vqmovnu64(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vqmovnu64: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vqmovn.u64 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vqmovnu64: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vqmovn.u64 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.32 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <2 x i64>, ptr %A | 
|  | %tmp2 = call <2 x i32> @llvm.arm.neon.vqmovnu.v2i32(<2 x i64> %tmp1) | 
|  | ret <2 x i32> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <8 x i8> @vqmovuns16(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vqmovuns16: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vqmovun.s16 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vqmovuns16: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vrev64.16 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vqmovun.s16 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.8 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <8 x i16>, ptr %A | 
|  | %tmp2 = call <8 x i8> @llvm.arm.neon.vqmovnsu.v8i8(<8 x i16> %tmp1) | 
|  | ret <8 x i8> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <4 x i16> @vqmovuns32(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vqmovuns32: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vqmovun.s32 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vqmovuns32: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vrev64.32 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vqmovun.s32 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.16 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <4 x i32>, ptr %A | 
|  | %tmp2 = call <4 x i16> @llvm.arm.neon.vqmovnsu.v4i16(<4 x i32> %tmp1) | 
|  | ret <4 x i16> %tmp2 | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc <2 x i32> @vqmovuns64(ptr %A) nounwind { | 
|  | ; CHECK-LE-LABEL: vqmovuns64: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    vqmovun.s64 d0, q8 | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: vqmovuns64: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vqmovun.s64 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.32 d0, d16 | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <2 x i64>, ptr %A | 
|  | %tmp2 = call <2 x i32> @llvm.arm.neon.vqmovnsu.v2i32(<2 x i64> %tmp1) | 
|  | ret <2 x i32> %tmp2 | 
|  | } | 
|  |  | 
|  | declare <8 x i8>  @llvm.arm.neon.vqmovns.v8i8(<8 x i16>) nounwind readnone | 
|  | declare <4 x i16> @llvm.arm.neon.vqmovns.v4i16(<4 x i32>) nounwind readnone | 
|  | declare <2 x i32> @llvm.arm.neon.vqmovns.v2i32(<2 x i64>) nounwind readnone | 
|  |  | 
|  | declare <8 x i8>  @llvm.arm.neon.vqmovnu.v8i8(<8 x i16>) nounwind readnone | 
|  | declare <4 x i16> @llvm.arm.neon.vqmovnu.v4i16(<4 x i32>) nounwind readnone | 
|  | declare <2 x i32> @llvm.arm.neon.vqmovnu.v2i32(<2 x i64>) nounwind readnone | 
|  |  | 
|  | declare <8 x i8>  @llvm.arm.neon.vqmovnsu.v8i8(<8 x i16>) nounwind readnone | 
|  | declare <4 x i16> @llvm.arm.neon.vqmovnsu.v4i16(<4 x i32>) nounwind readnone | 
|  | declare <2 x i32> @llvm.arm.neon.vqmovnsu.v2i32(<2 x i64>) nounwind readnone | 
|  |  | 
|  | ; Truncating vector stores are not supported.  The following should not crash. | 
|  | ; Radar 8598391. | 
|  | define arm_aapcs_vfpcc void @noTruncStore(ptr %a, ptr %b) nounwind { | 
|  | ; CHECK-LE-LABEL: noTruncStore: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0:128] | 
|  | ; CHECK-LE-NEXT:    vmovn.i32 d16, q8 | 
|  | ; CHECK-LE-NEXT:    vstr d16, [r1] | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: noTruncStore: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0:128] | 
|  | ; CHECK-BE-NEXT:    vrev64.32 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vmovn.i32 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vrev64.16 d16, d16 | 
|  | ; CHECK-BE-NEXT:    vstr d16, [r1] | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %tmp1 = load <4 x i32>, ptr %a, align 16 | 
|  | %tmp2 = trunc <4 x i32> %tmp1 to <4 x i16> | 
|  | store <4 x i16> %tmp2, ptr %b, align 8 | 
|  | ret void | 
|  | } | 
|  |  | 
|  | ; Use vmov.f32 to materialize f32 immediate splats | 
|  | ; rdar://10437054 | 
|  | define arm_aapcs_vfpcc void @v_mov_v2f32(ptr nocapture %p) nounwind { | 
|  | ; CHECK-LABEL: v_mov_v2f32: | 
|  | ; CHECK:       @ %bb.0: @ %entry | 
|  | ; CHECK-NEXT:    vmov.f32 d16, #-1.600000e+01 | 
|  | ; CHECK-NEXT:    vstr d16, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | entry: | 
|  | store <2 x float> <float -1.600000e+01, float -1.600000e+01>, ptr %p, align 4 | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mov_v4f32(ptr nocapture %p) nounwind { | 
|  | ; CHECK-LE-LABEL: v_mov_v4f32: | 
|  | ; CHECK-LE:       @ %bb.0: @ %entry | 
|  | ; CHECK-LE-NEXT:    vmov.f32 q8, #3.100000e+01 | 
|  | ; CHECK-LE-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: v_mov_v4f32: | 
|  | ; CHECK-BE:       @ %bb.0: @ %entry | 
|  | ; CHECK-BE-NEXT:    vmov.f32 q8, #3.100000e+01 | 
|  | ; CHECK-BE-NEXT:    vstmia r0, {d16, d17} | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | entry: | 
|  | store <4 x float> <float 3.100000e+01, float 3.100000e+01, float 3.100000e+01, float 3.100000e+01>, ptr %p, align 4 | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mov_v4f32_undef(ptr nocapture %p) nounwind { | 
|  | ; CHECK-LE-LABEL: v_mov_v4f32_undef: | 
|  | ; CHECK-LE:       @ %bb.0: @ %entry | 
|  | ; CHECK-LE-NEXT:    vmov.f32 q8, #1.000000e+00 | 
|  | ; CHECK-LE-NEXT:    vld1.64 {d18, d19}, [r0] | 
|  | ; CHECK-LE-NEXT:    vadd.f32 q8, q9, q8 | 
|  | ; CHECK-LE-NEXT:    vst1.64 {d16, d17}, [r0] | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; CHECK-BE-LABEL: v_mov_v4f32_undef: | 
|  | ; CHECK-BE:       @ %bb.0: @ %entry | 
|  | ; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    vmov.f32 q9, #1.000000e+00 | 
|  | ; CHECK-BE-NEXT:    vrev64.32 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vadd.f32 q8, q8, q9 | 
|  | ; CHECK-BE-NEXT:    vrev64.32 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vst1.64 {d16, d17}, [r0] | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | entry: | 
|  | %a = load <4 x float> , ptr %p | 
|  | %b = fadd <4 x float> %a, <float undef, float 1.0, float 1.0, float 1.0> | 
|  | store <4 x float> %b, ptr %p | 
|  | ret void | 
|  | } | 
|  |  | 
|  | ; Vector any_extends must be selected as either vmovl.u or vmovl.s. | 
|  | ; rdar://10723651 | 
|  | define arm_aapcs_vfpcc void @any_extend(<4 x i1> %x, <4 x i32> %y) nounwind ssp { | 
|  | ; CHECK-LE-LABEL: any_extend: | 
|  | ; CHECK-LE:       @ %bb.0: @ %entry | 
|  | ; CHECK-LE-NEXT:    vmov.i16 d16, #0x1 | 
|  | ; CHECK-LE-NEXT:    vand d16, d0, d16 | 
|  | ; CHECK-LE-NEXT:    vmovl.u16 q8, d16 | 
|  | ; CHECK-LE-NEXT:    vsub.i32 q8, q8, q1 | 
|  | ; CHECK-LE-NEXT:    vmovn.i32 d16, q8 | 
|  | ; CHECK-LE-NEXT:    vst1.16 {d16}, [r0] | 
|  | ; | 
|  | ; CHECK-BE-LABEL: any_extend: | 
|  | ; CHECK-BE:       @ %bb.0: @ %entry | 
|  | ; CHECK-BE-NEXT:    vmov.i16 d16, #0x1 | 
|  | ; CHECK-BE-NEXT:    vrev64.16 d17, d0 | 
|  | ; CHECK-BE-NEXT:    vrev64.32 q9, q1 | 
|  | ; CHECK-BE-NEXT:    vand d16, d17, d16 | 
|  | ; CHECK-BE-NEXT:    vmovl.u16 q8, d16 | 
|  | ; CHECK-BE-NEXT:    vsub.i32 q8, q8, q9 | 
|  | ; CHECK-BE-NEXT:    vmovn.i32 d16, q8 | 
|  | ; CHECK-BE-NEXT:    vst1.16 {d16}, [r0] | 
|  | entry: | 
|  | %and.i186 = zext <4 x i1> %x to <4 x i32> | 
|  | %add.i185 = sub <4 x i32> %and.i186, %y | 
|  | %sub.i = sub <4 x i32> %add.i185, zeroinitializer | 
|  | %add.i = add <4 x i32> %sub.i, zeroinitializer | 
|  | %vmovn.i = trunc <4 x i32> %add.i to <4 x i16> | 
|  | tail call void @llvm.arm.neon.vst1.p0.v4i16(ptr undef, <4 x i16> %vmovn.i, i32 2) | 
|  | unreachable | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi8_sti8(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi8_sti8: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.8 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v8i8(ptr %p, <8 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>, i32 1) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi8_sti16(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi8_sti16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.16 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1> to <4 x i16> | 
|  | call void @llvm.arm.neon.vst1.p0.v4i16(ptr %p, <4 x i16> %val, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi8_stf16(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi8_stf16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.16 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1> to <4 x half> | 
|  | call void @llvm.arm.neon.vst1.p0.v4f16(ptr %p, <4 x half> %val, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi8_sti32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi8_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1> to <2 x i32> | 
|  | call void @llvm.arm.neon.vst1.p0.v2i32(ptr %p, <2 x i32> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi8_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi8_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1> to <2 x float> | 
|  | call void @llvm.arm.neon.vst1.p0.v2f32(ptr %p, <2 x float> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi8_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi8_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.64 {d16}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1> to <1 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v1i64(ptr %p, <1 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi16_sti16(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi16_sti16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.16 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v4i16(ptr %p, <4 x i16> <i16 1, i16 1, i16 1, i16 1>, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi16_stf16(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi16_stf16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.16 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i16> <i16 1, i16 1, i16 1, i16 1> to <4 x half> | 
|  | call void @llvm.arm.neon.vst1.p0.v4f16(ptr %p, <4 x half> %val, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi16_sti32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi16_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i16> <i16 1, i16 1, i16 1, i16 1> to <2 x i32> | 
|  | call void @llvm.arm.neon.vst1.p0.v2i32(ptr %p, <2 x i32> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi16_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi16_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i16> <i16 1, i16 1, i16 1, i16 1> to <2 x float> | 
|  | call void @llvm.arm.neon.vst1.p0.v2f32(ptr %p, <2 x float> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi16_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi16_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.64 {d16}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i16> <i16 1, i16 1, i16 1, i16 1> to <1 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v1i64(ptr %p, <1 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi32_sti32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi32_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v2i32(ptr %p, <2 x i32> <i32 1, i32 1>, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi32_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi32_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <2 x i32> <i32 1, i32 1> to <2 x float> | 
|  | call void @llvm.arm.neon.vst1.p0.v2f32(ptr %p, <2 x float> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi32_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi32_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 d16, #0x1 | 
|  | ; CHECK-NEXT:    vst1.64 {d16}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <2 x i32> <i32 1, i32 1> to <1 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v1i64(ptr %p, <1 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movf32_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movf32_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.f32 d16, #1.000000e+00 | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v2f32(ptr %p, <2 x float> <float 1.0, float 1.0>, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void@v_movf32_sti32(ptr %p) { | 
|  | ; FIXME: We should use vmov.f32 instead of mov then vdup | 
|  | ; CHECK-LABEL: v_movf32_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    mov r1, #1065353216 | 
|  | ; CHECK-NEXT:    vdup.32 d16, r1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <2 x float> <float 1.0, float 1.0> to <2 x i32> | 
|  | call void @llvm.arm.neon.vst1.p0.v2i32(ptr %p, <2 x i32> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movf32_sti64(ptr %p) { | 
|  | ; CHECK-LE-LABEL: v_movf32_sti64: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    mov r1, #1065353216 | 
|  | ; CHECK-LE-NEXT:    vdup.32 d16, r1 | 
|  | ; CHECK-LE-NEXT:    vst1.64 {d16}, [r0:64] | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; FIXME: vrev is not needed here | 
|  | ; CHECK-BE-LABEL: v_movf32_sti64: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    mov r1, #1065353216 | 
|  | ; CHECK-BE-NEXT:    vdup.32 d16, r1 | 
|  | ; CHECK-BE-NEXT:    vrev64.32 d16, d16 | 
|  | ; CHECK-BE-NEXT:    vst1.64 {d16}, [r0:64] | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %val = bitcast <2 x float> <float 1.0, float 1.0> to <1 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v1i64(ptr %p, <1 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movi64_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_movi64_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i64 d16, #0xff | 
|  | ; CHECK-NEXT:    vst1.64 {d16}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v1i64(ptr %p, <1 x i64> <i64 255>, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi8_sti8(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi8_sti8: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.8 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v16i8(ptr %p, <16 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>, i32 1) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi8_sti16(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi8_sti16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.16 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <16 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1> to <8 x i16> | 
|  | call void @llvm.arm.neon.vst1.p0.v8i16(ptr %p, <8 x i16> %val, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi8_stf16(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi8_stf16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.16 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <16 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1> to <8 x half> | 
|  | call void @llvm.arm.neon.vst1.p0.v8f16(ptr %p, <8 x half> %val, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi8_sti32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi8_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <16 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1> to <4 x i32> | 
|  | call void @llvm.arm.neon.vst1.p0.v4i32(ptr %p, <4 x i32> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi8_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi8_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <16 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1> to <4 x float> | 
|  | call void @llvm.arm.neon.vst1.p0.v4f32(ptr %p, <4 x float> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi8_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi8_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i8 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.64 {d16, d17}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <16 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1> to <2 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v2i64(ptr %p, <2 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi16_sti16(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi16_sti16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.16 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v8i16(ptr %p, <8 x i16> <i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1>, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi16_stf16(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi16_stf16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.16 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i16> <i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1> to <8 x half> | 
|  | call void @llvm.arm.neon.vst1.p0.v8f16(ptr %p, <8 x half> %val, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi16_sti32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi16_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i16> <i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1> to <4 x i32> | 
|  | call void @llvm.arm.neon.vst1.p0.v4i32(ptr %p, <4 x i32> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi16_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi16_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i16> <i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1> to <4 x float> | 
|  | call void @llvm.arm.neon.vst1.p0.v4f32(ptr %p, <4 x float> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi16_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi16_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i16 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.64 {d16, d17}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i16> <i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1> to <2 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v2i64(ptr %p, <2 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi32_sti32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi32_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v4i32(ptr %p, <4 x i32> <i32 1, i32 1, i32 1, i32 1>, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi32_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi32_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i32> <i32 1, i32 1, i32 1, i32 1> to <4 x float> | 
|  | call void @llvm.arm.neon.vst1.p0.v4f32(ptr %p, <4 x float> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi32_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi32_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i32 q8, #0x1 | 
|  | ; CHECK-NEXT:    vst1.64 {d16, d17}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i32> <i32 1, i32 1, i32 1, i32 1> to <2 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v2i64(ptr %p, <2 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQf32_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQf32_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.f32 q8, #1.000000e+00 | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v4f32(ptr %p, <4 x float> <float 1.0, float 1.0, float 1.0, float 1.0>, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQf32_sti32(ptr %p) { | 
|  | ; FIXME: We should use vmov.f32 instead of mov then vdup | 
|  | ; CHECK-LABEL: v_movQf32_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    mov r1, #1065353216 | 
|  | ; CHECK-NEXT:    vdup.32 q8, r1 | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x float> <float 1.0, float 1.0, float 1.0, float 1.0> to <4 x i32> | 
|  | call void @llvm.arm.neon.vst1.p0.v4i32(ptr %p, <4 x i32> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQf32_sti64(ptr %p) { | 
|  | ; CHECK-LE-LABEL: v_movQf32_sti64: | 
|  | ; CHECK-LE:       @ %bb.0: | 
|  | ; CHECK-LE-NEXT:    mov r1, #1065353216 | 
|  | ; CHECK-LE-NEXT:    vdup.32 q8, r1 | 
|  | ; CHECK-LE-NEXT:    vst1.64 {d16, d17}, [r0:64] | 
|  | ; CHECK-LE-NEXT:    mov pc, lr | 
|  | ; | 
|  | ; FIXME: vrev is not needed here | 
|  | ; CHECK-BE-LABEL: v_movQf32_sti64: | 
|  | ; CHECK-BE:       @ %bb.0: | 
|  | ; CHECK-BE-NEXT:    mov r1, #1065353216 | 
|  | ; CHECK-BE-NEXT:    vdup.32 q8, r1 | 
|  | ; CHECK-BE-NEXT:    vrev64.32 q8, q8 | 
|  | ; CHECK-BE-NEXT:    vst1.64 {d16, d17}, [r0:64] | 
|  | ; CHECK-BE-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x float> <float 1.0, float 1.0, float 1.0, float 1.0> to <2 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v2i64(ptr %p, <2 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_movQi64_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_movQi64_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmov.i64 q8, #0xff | 
|  | ; CHECK-NEXT:    vst1.64 {d16, d17}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v2i64(ptr %p, <2 x i64> <i64 255, i64 255>, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvni16_sti16(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvni16_sti16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 d16, #0xfe | 
|  | ; CHECK-NEXT:    vst1.16 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v4i16(ptr %p, <4 x i16> <i16 65281, i16 65281, i16 65281, i16 65281>, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvni16_stf16(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvni16_stf16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 d16, #0xfe | 
|  | ; CHECK-NEXT:    vst1.16 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i16> <i16 65281, i16 65281, i16 65281, i16 65281> to <4 x half> | 
|  | call void @llvm.arm.neon.vst1.p0.v4f16(ptr %p, <4 x half> %val, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvni16_sti32(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvni16_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 d16, #0xfe | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i16> <i16 65281, i16 65281, i16 65281, i16 65281> to <2 x i32> | 
|  | call void @llvm.arm.neon.vst1.p0.v2i32(ptr %p, <2 x i32> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvni16_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvni16_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 d16, #0xfe | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i16> <i16 65281, i16 65281, i16 65281, i16 65281> to <2 x float> | 
|  | call void @llvm.arm.neon.vst1.p0.v2f32(ptr %p, <2 x float> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvni16_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvni16_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 d16, #0xfe | 
|  | ; CHECK-NEXT:    vst1.64 {d16}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i16> <i16 65281, i16 65281, i16 65281, i16 65281> to <1 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v1i64(ptr %p, <1 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvni32_sti32(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvni32_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 d16, #0xfe | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v2i32(ptr %p, <2 x i32> <i32 4294967041, i32 4294967041>, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvni32_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvni32_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 d16, #0xfe | 
|  | ; CHECK-NEXT:    vst1.32 {d16}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <2 x i32> <i32 4294967041, i32 4294967041> to <2 x float> | 
|  | call void @llvm.arm.neon.vst1.p0.v2f32(ptr %p, <2 x float> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvni32_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvni32_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 d16, #0xfe | 
|  | ; CHECK-NEXT:    vst1.64 {d16}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <2 x i32> <i32 4294967041, i32 4294967041> to <1 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v1i64(ptr %p, <1 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvnQi16_sti16(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvnQi16_sti16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 q8, #0xfe | 
|  | ; CHECK-NEXT:    vst1.16 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v8i16(ptr %p, <8 x i16> <i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281>, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvnQi16_stf16(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvnQi16_stf16: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 q8, #0xfe | 
|  | ; CHECK-NEXT:    vst1.16 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i16> <i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281> to <8 x half> | 
|  | call void @llvm.arm.neon.vst1.p0.v8f16(ptr %p, <8 x half> %val, i32 2) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvnQi16_sti32(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvnQi16_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 q8, #0xfe | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i16> <i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281> to <4 x i32> | 
|  | call void @llvm.arm.neon.vst1.p0.v4i32(ptr %p, <4 x i32> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvnQi16_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvnQi16_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 q8, #0xfe | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i16> <i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281> to <4 x float> | 
|  | call void @llvm.arm.neon.vst1.p0.v4f32(ptr %p, <4 x float> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvnQi16_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvnQi16_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i16 q8, #0xfe | 
|  | ; CHECK-NEXT:    vst1.64 {d16, d17}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <8 x i16> <i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281, i16 65281> to <2 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v2i64(ptr %p, <2 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvnQi32_sti32(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvnQi32_sti32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 q8, #0xfe | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | call void @llvm.arm.neon.vst1.p0.v4i32(ptr %p, <4 x i32> <i32 4294967041, i32 4294967041, i32 4294967041, i32 4294967041>, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvnQi32_stf32(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvnQi32_stf32: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 q8, #0xfe | 
|  | ; CHECK-NEXT:    vst1.32 {d16, d17}, [r0] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i32> <i32 4294967041, i32 4294967041, i32 4294967041, i32 4294967041> to <4 x float> | 
|  | call void @llvm.arm.neon.vst1.p0.v4f32(ptr %p, <4 x float> %val, i32 4) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | define arm_aapcs_vfpcc void @v_mvnQi32_sti64(ptr %p) { | 
|  | ; CHECK-LABEL: v_mvnQi32_sti64: | 
|  | ; CHECK:       @ %bb.0: | 
|  | ; CHECK-NEXT:    vmvn.i32 q8, #0xfe | 
|  | ; CHECK-NEXT:    vst1.64 {d16, d17}, [r0:64] | 
|  | ; CHECK-NEXT:    mov pc, lr | 
|  | %val = bitcast <4 x i32> <i32 4294967041, i32 4294967041, i32 4294967041, i32 4294967041> to <2 x i64> | 
|  | call void @llvm.arm.neon.vst1.p0.v2i64(ptr %p, <2 x i64> %val, i32 8) | 
|  | ret void | 
|  | } | 
|  |  | 
|  | declare void @llvm.arm.neon.vst1.p0.v8i8(ptr, <8 x i8>, i32) nounwind | 
|  | declare void @llvm.arm.neon.vst1.p0.v4i16(ptr, <4 x i16>, i32) nounwind | 
|  | declare void @llvm.arm.neon.vst1.p0.v4f16(ptr, <4 x half>, i32) nounwind | 
|  | declare void @llvm.arm.neon.vst1.p0.v2i32(ptr, <2 x i32>, i32) nounwind | 
|  | declare void @llvm.arm.neon.vst1.p0.v2f32(ptr, <2 x float>, i32) nounwind | 
|  | declare void @llvm.arm.neon.vst1.p0.v1i64(ptr, <1 x i64>, i32) nounwind | 
|  |  | 
|  | declare void @llvm.arm.neon.vst1.p0.v16i8(ptr, <16 x i8>, i32) nounwind | 
|  | declare void @llvm.arm.neon.vst1.p0.v8i16(ptr, <8 x i16>, i32) nounwind | 
|  | declare void @llvm.arm.neon.vst1.p0.v8f16(ptr, <8 x half>, i32) nounwind | 
|  | declare void @llvm.arm.neon.vst1.p0.v4i32(ptr, <4 x i32>, i32) nounwind | 
|  | declare void @llvm.arm.neon.vst1.p0.v4f32(ptr, <4 x float>, i32) nounwind | 
|  | declare void @llvm.arm.neon.vst1.p0.v2i64(ptr, <2 x i64>, i32) nounwind |