| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
| ; RUN: llc -march=mips -mcpu=mips32r5 -mattr=+msa,+fp64 -O0 < %s | FileCheck %s --check-prefix=MIPS32R5-EB |
| ; RUN: llc -march=mipsel -mcpu=mips32r5 -mattr=+msa,+fp64 -O0 < %s | FileCheck %s --check-prefix=MIPS32R5-EL |
| ; RUN: llc -march=mips -mcpu=mips32r6 -mattr=+msa,+fp64 -O0 < %s | FileCheck %s --check-prefix=MIPS32R6-EB |
| ; RUN: llc -march=mipsel -mcpu=mips32r6 -mattr=+msa,+fp64 -O0 < %s | FileCheck %s --check-prefix=MIPS32R6-EL |
| ; RUN: llc -march=mips64 -mcpu=mips64r6 -mattr=+msa,+fp64 -O0 < %s | FileCheck %s --check-prefix=MIPS64R6 |
| ; RUN: llc -march=mips64el -mcpu=mips64r6 -mattr=+msa,+fp64 -O0 < %s | FileCheck %s --check-prefix=MIPS64R6 |
| |
| ; Test the intrinsics for 4-byte and 8-byte MSA loads and stores. |
| |
| ; llvm.mips.ldr.d: call the intrinsic on %ptr with a constant i32 of 16 and |
| ; store the returned <2 x i64> to %val. |
| ; Expected code per configuration, as pinned by the check lines below: |
| ;   - mips32r5: each 32-bit half is read with an lwr/lwl pair, the halves are |
| ;     combined with fill.w + insert.w, and the byte offsets are mirrored |
| ;     between the big-endian and little-endian runs. |
| ;   - mips32r6: each 32-bit half is read with a single lw; big-endian reads |
| ;     offset 20 first, little-endian reads offset 16 first. |
| ;   - mips64r6: a single ld followed by fill.d (same checks for both |
| ;     endiannesses, which share one check prefix). |
| define void @llvm_mips_ldr_d_test(<2 x i64>* %val, i8* %ptr) nounwind { |
| ; MIPS32R5-EB-LABEL: llvm_mips_ldr_d_test: |
| ; MIPS32R5-EB: # %bb.0: # %entry |
| ; MIPS32R5-EB-NEXT: # implicit-def: $v0 |
| ; MIPS32R5-EB-NEXT: lwr $2, 23($5) |
| ; MIPS32R5-EB-NEXT: lwl $2, 20($5) |
| ; MIPS32R5-EB-NEXT: # implicit-def: $at |
| ; MIPS32R5-EB-NEXT: lwr $1, 19($5) |
| ; MIPS32R5-EB-NEXT: lwl $1, 16($5) |
| ; MIPS32R5-EB-NEXT: fill.w $w0, $2 |
| ; MIPS32R5-EB-NEXT: insert.w $w0[1], $1 |
| ; MIPS32R5-EB-NEXT: st.d $w0, 0($4) |
| ; MIPS32R5-EB-NEXT: jr $ra |
| ; MIPS32R5-EB-NEXT: nop |
| ; |
| ; MIPS32R5-EL-LABEL: llvm_mips_ldr_d_test: |
| ; MIPS32R5-EL: # %bb.0: # %entry |
| ; MIPS32R5-EL-NEXT: # implicit-def: $v0 |
| ; MIPS32R5-EL-NEXT: lwr $2, 16($5) |
| ; MIPS32R5-EL-NEXT: lwl $2, 19($5) |
| ; MIPS32R5-EL-NEXT: # implicit-def: $at |
| ; MIPS32R5-EL-NEXT: lwr $1, 20($5) |
| ; MIPS32R5-EL-NEXT: lwl $1, 23($5) |
| ; MIPS32R5-EL-NEXT: fill.w $w0, $2 |
| ; MIPS32R5-EL-NEXT: insert.w $w0[1], $1 |
| ; MIPS32R5-EL-NEXT: st.d $w0, 0($4) |
| ; MIPS32R5-EL-NEXT: jr $ra |
| ; MIPS32R5-EL-NEXT: nop |
| ; |
| ; MIPS32R6-EB-LABEL: llvm_mips_ldr_d_test: |
| ; MIPS32R6-EB: # %bb.0: # %entry |
| ; MIPS32R6-EB-NEXT: lw $2, 20($5) |
| ; MIPS32R6-EB-NEXT: lw $1, 16($5) |
| ; MIPS32R6-EB-NEXT: fill.w $w0, $2 |
| ; MIPS32R6-EB-NEXT: insert.w $w0[1], $1 |
| ; MIPS32R6-EB-NEXT: st.d $w0, 0($4) |
| ; MIPS32R6-EB-NEXT: jrc $ra |
| ; |
| ; MIPS32R6-EL-LABEL: llvm_mips_ldr_d_test: |
| ; MIPS32R6-EL: # %bb.0: # %entry |
| ; MIPS32R6-EL-NEXT: lw $2, 16($5) |
| ; MIPS32R6-EL-NEXT: lw $1, 20($5) |
| ; MIPS32R6-EL-NEXT: fill.w $w0, $2 |
| ; MIPS32R6-EL-NEXT: insert.w $w0[1], $1 |
| ; MIPS32R6-EL-NEXT: st.d $w0, 0($4) |
| ; MIPS32R6-EL-NEXT: jrc $ra |
| ; |
| ; MIPS64R6-LABEL: llvm_mips_ldr_d_test: |
| ; MIPS64R6: # %bb.0: # %entry |
| ; MIPS64R6-NEXT: ld $1, 16($5) |
| ; MIPS64R6-NEXT: fill.d $w0, $1 |
| ; MIPS64R6-NEXT: st.d $w0, 0($4) |
| ; MIPS64R6-NEXT: jrc $ra |
| entry: |
| %0 = tail call <2 x i64> @llvm.mips.ldr.d(i8* %ptr, i32 16) |
| store <2 x i64> %0, <2 x i64>* %val |
| ret void |
| } |
| |
| ; Intrinsic under test. In the expected assembly above, the i32 argument |
| ; appears as the displacement of the memory operand (16, or 16 + n for the |
| ; split accesses). |
| declare <2 x i64> @llvm.mips.ldr.d(i8*, i32) nounwind |
| |
| ; llvm.mips.ldr.w: call the intrinsic on %ptr with a constant i32 of 16 and |
| ; store the returned <4 x i32> to %val. |
| ; Expected code per configuration, as pinned by the check lines below: |
| ;   - mips32r5: one lwr/lwl pair (offsets 19/16 big-endian, 16/19 |
| ;     little-endian) followed by fill.w. |
| ;   - mips32r6 and mips64r6: a single lw at offset 16 followed by fill.w; the |
| ;     sequence is the same for every R6 run line. |
| define void @llvm_mips_ldr_w_test(<4 x i32>* %val, i8* %ptr) nounwind { |
| ; MIPS32R5-EB-LABEL: llvm_mips_ldr_w_test: |
| ; MIPS32R5-EB: # %bb.0: # %entry |
| ; MIPS32R5-EB-NEXT: # implicit-def: $at |
| ; MIPS32R5-EB-NEXT: lwr $1, 19($5) |
| ; MIPS32R5-EB-NEXT: lwl $1, 16($5) |
| ; MIPS32R5-EB-NEXT: fill.w $w0, $1 |
| ; MIPS32R5-EB-NEXT: st.w $w0, 0($4) |
| ; MIPS32R5-EB-NEXT: jr $ra |
| ; MIPS32R5-EB-NEXT: nop |
| ; |
| ; MIPS32R5-EL-LABEL: llvm_mips_ldr_w_test: |
| ; MIPS32R5-EL: # %bb.0: # %entry |
| ; MIPS32R5-EL-NEXT: # implicit-def: $at |
| ; MIPS32R5-EL-NEXT: lwr $1, 16($5) |
| ; MIPS32R5-EL-NEXT: lwl $1, 19($5) |
| ; MIPS32R5-EL-NEXT: fill.w $w0, $1 |
| ; MIPS32R5-EL-NEXT: st.w $w0, 0($4) |
| ; MIPS32R5-EL-NEXT: jr $ra |
| ; MIPS32R5-EL-NEXT: nop |
| ; |
| ; MIPS32R6-EB-LABEL: llvm_mips_ldr_w_test: |
| ; MIPS32R6-EB: # %bb.0: # %entry |
| ; MIPS32R6-EB-NEXT: lw $1, 16($5) |
| ; MIPS32R6-EB-NEXT: fill.w $w0, $1 |
| ; MIPS32R6-EB-NEXT: st.w $w0, 0($4) |
| ; MIPS32R6-EB-NEXT: jrc $ra |
| ; |
| ; MIPS32R6-EL-LABEL: llvm_mips_ldr_w_test: |
| ; MIPS32R6-EL: # %bb.0: # %entry |
| ; MIPS32R6-EL-NEXT: lw $1, 16($5) |
| ; MIPS32R6-EL-NEXT: fill.w $w0, $1 |
| ; MIPS32R6-EL-NEXT: st.w $w0, 0($4) |
| ; MIPS32R6-EL-NEXT: jrc $ra |
| ; |
| ; MIPS64R6-LABEL: llvm_mips_ldr_w_test: |
| ; MIPS64R6: # %bb.0: # %entry |
| ; MIPS64R6-NEXT: lw $1, 16($5) |
| ; MIPS64R6-NEXT: fill.w $w0, $1 |
| ; MIPS64R6-NEXT: st.w $w0, 0($4) |
| ; MIPS64R6-NEXT: jrc $ra |
| entry: |
| %0 = tail call <4 x i32> @llvm.mips.ldr.w(i8* %ptr, i32 16) |
| store <4 x i32> %0, <4 x i32>* %val |
| ret void |
| } |
| |
| ; Intrinsic under test. In the expected assembly above, the i32 argument |
| ; appears as the displacement of the memory operand. |
| declare <4 x i32> @llvm.mips.ldr.w(i8*, i32) nounwind |
| |
| ; llvm.mips.str.d: load a <2 x i64> from %val and pass it to the intrinsic |
| ; together with %ptr and a constant i32 of 16. |
| ; Expected code per configuration, as pinned by the check lines below: |
| ;   - mips32r5: the two 32-bit words of element 0 are extracted with copy_s.w |
| ;     and each is written with an swr/swl pair. |
| ;   - mips32r6: the same two words are written with one sw each. |
| ;   - mips64r6: element 0 is extracted with copy_s.d and written with one sd. |
| ; On big-endian 32-bit targets word 0 ($2) must land at offset 20 and word 1 |
| ; ($1) at offset 16. The mips32r5 big-endian swr/swl offsets therefore have to |
| ; agree with the mips32r6 big-endian sw offsets below and mirror the lwr/lwl |
| ; offsets expected in llvm_mips_ldr_d_test. |
| define void @llvm_mips_str_d_test(<2 x i64>* %val, i8* %ptr) nounwind { |
| ; MIPS32R5-EB-LABEL: llvm_mips_str_d_test: |
| ; MIPS32R5-EB: # %bb.0: # %entry |
| ; MIPS32R5-EB-NEXT: ld.d $w0, 0($4) |
| ; MIPS32R5-EB-NEXT: copy_s.w $2, $w0[0] |
| ; MIPS32R5-EB-NEXT: copy_s.w $1, $w0[1] |
| ; MIPS32R5-EB-NEXT: swr $2, 23($5) |
| ; MIPS32R5-EB-NEXT: swl $2, 20($5) |
| ; MIPS32R5-EB-NEXT: swr $1, 19($5) |
| ; MIPS32R5-EB-NEXT: swl $1, 16($5) |
| ; MIPS32R5-EB-NEXT: jr $ra |
| ; MIPS32R5-EB-NEXT: nop |
| ; |
| ; MIPS32R5-EL-LABEL: llvm_mips_str_d_test: |
| ; MIPS32R5-EL: # %bb.0: # %entry |
| ; MIPS32R5-EL-NEXT: ld.d $w0, 0($4) |
| ; MIPS32R5-EL-NEXT: copy_s.w $2, $w0[0] |
| ; MIPS32R5-EL-NEXT: copy_s.w $1, $w0[1] |
| ; MIPS32R5-EL-NEXT: swr $2, 16($5) |
| ; MIPS32R5-EL-NEXT: swl $2, 19($5) |
| ; MIPS32R5-EL-NEXT: swr $1, 20($5) |
| ; MIPS32R5-EL-NEXT: swl $1, 23($5) |
| ; MIPS32R5-EL-NEXT: jr $ra |
| ; MIPS32R5-EL-NEXT: nop |
| ; |
| ; MIPS32R6-EB-LABEL: llvm_mips_str_d_test: |
| ; MIPS32R6-EB: # %bb.0: # %entry |
| ; MIPS32R6-EB-NEXT: ld.d $w0, 0($4) |
| ; MIPS32R6-EB-NEXT: copy_s.w $2, $w0[0] |
| ; MIPS32R6-EB-NEXT: copy_s.w $1, $w0[1] |
| ; MIPS32R6-EB-NEXT: sw $2, 20($5) |
| ; MIPS32R6-EB-NEXT: sw $1, 16($5) |
| ; MIPS32R6-EB-NEXT: jrc $ra |
| ; |
| ; MIPS32R6-EL-LABEL: llvm_mips_str_d_test: |
| ; MIPS32R6-EL: # %bb.0: # %entry |
| ; MIPS32R6-EL-NEXT: ld.d $w0, 0($4) |
| ; MIPS32R6-EL-NEXT: copy_s.w $2, $w0[0] |
| ; MIPS32R6-EL-NEXT: copy_s.w $1, $w0[1] |
| ; MIPS32R6-EL-NEXT: sw $2, 16($5) |
| ; MIPS32R6-EL-NEXT: sw $1, 20($5) |
| ; MIPS32R6-EL-NEXT: jrc $ra |
| ; |
| ; MIPS64R6-LABEL: llvm_mips_str_d_test: |
| ; MIPS64R6: # %bb.0: # %entry |
| ; MIPS64R6-NEXT: ld.d $w0, 0($4) |
| ; MIPS64R6-NEXT: copy_s.d $1, $w0[0] |
| ; MIPS64R6-NEXT: sd $1, 16($5) |
| ; MIPS64R6-NEXT: jrc $ra |
| entry: |
| %0 = load <2 x i64>, <2 x i64>* %val |
| tail call void @llvm.mips.str.d(<2 x i64> %0, i8* %ptr, i32 16) |
| ret void |
| } |
| |
| ; Intrinsic under test. In the expected assembly above, the i32 argument |
| ; appears as the displacement of the memory operand (16, or 16 + n for the |
| ; split accesses). |
| declare void @llvm.mips.str.d(<2 x i64>, i8*, i32) nounwind |
| |
| ; llvm.mips.str.w: load a <4 x i32> from %val and pass it to the intrinsic |
| ; together with %ptr and a constant i32 of 16. |
| ; Expected code per configuration, as pinned by the check lines below: |
| ;   - mips32r5: element 0 is extracted with copy_s.w and written with one |
| ;     swr/swl pair (offsets 19/16 big-endian, 16/19 little-endian). |
| ;   - mips32r6 and mips64r6: element 0 is extracted with copy_s.w and written |
| ;     with a single sw at offset 16; the sequence is the same for every R6 |
| ;     run line. |
| define void @llvm_mips_str_w_test(<4 x i32>* %val, i8* %ptr) nounwind { |
| ; MIPS32R5-EB-LABEL: llvm_mips_str_w_test: |
| ; MIPS32R5-EB: # %bb.0: # %entry |
| ; MIPS32R5-EB-NEXT: ld.w $w0, 0($4) |
| ; MIPS32R5-EB-NEXT: copy_s.w $1, $w0[0] |
| ; MIPS32R5-EB-NEXT: swr $1, 19($5) |
| ; MIPS32R5-EB-NEXT: swl $1, 16($5) |
| ; MIPS32R5-EB-NEXT: jr $ra |
| ; MIPS32R5-EB-NEXT: nop |
| ; |
| ; MIPS32R5-EL-LABEL: llvm_mips_str_w_test: |
| ; MIPS32R5-EL: # %bb.0: # %entry |
| ; MIPS32R5-EL-NEXT: ld.w $w0, 0($4) |
| ; MIPS32R5-EL-NEXT: copy_s.w $1, $w0[0] |
| ; MIPS32R5-EL-NEXT: swr $1, 16($5) |
| ; MIPS32R5-EL-NEXT: swl $1, 19($5) |
| ; MIPS32R5-EL-NEXT: jr $ra |
| ; MIPS32R5-EL-NEXT: nop |
| ; |
| ; MIPS32R6-EB-LABEL: llvm_mips_str_w_test: |
| ; MIPS32R6-EB: # %bb.0: # %entry |
| ; MIPS32R6-EB-NEXT: ld.w $w0, 0($4) |
| ; MIPS32R6-EB-NEXT: copy_s.w $1, $w0[0] |
| ; MIPS32R6-EB-NEXT: sw $1, 16($5) |
| ; MIPS32R6-EB-NEXT: jrc $ra |
| ; |
| ; MIPS32R6-EL-LABEL: llvm_mips_str_w_test: |
| ; MIPS32R6-EL: # %bb.0: # %entry |
| ; MIPS32R6-EL-NEXT: ld.w $w0, 0($4) |
| ; MIPS32R6-EL-NEXT: copy_s.w $1, $w0[0] |
| ; MIPS32R6-EL-NEXT: sw $1, 16($5) |
| ; MIPS32R6-EL-NEXT: jrc $ra |
| ; |
| ; MIPS64R6-LABEL: llvm_mips_str_w_test: |
| ; MIPS64R6: # %bb.0: # %entry |
| ; MIPS64R6-NEXT: ld.w $w0, 0($4) |
| ; MIPS64R6-NEXT: copy_s.w $1, $w0[0] |
| ; MIPS64R6-NEXT: sw $1, 16($5) |
| ; MIPS64R6-NEXT: jrc $ra |
| entry: |
| %0 = load <4 x i32>, <4 x i32>* %val |
| tail call void @llvm.mips.str.w(<4 x i32> %0, i8* %ptr, i32 16) |
| ret void |
| } |
| |
| ; Intrinsic under test. In the expected assembly above, the i32 argument |
| ; appears as the displacement of the memory operand. |
| declare void @llvm.mips.str.w(<4 x i32>, i8*, i32) nounwind |
| |