; blob: 66731ac0f04c36b966778a15db18d7f366176b22 [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=aarch64-unknown-linux-gnu -mattr=-neon | FileCheck %s --check-prefixes=ALL,GPR
; RUN: llc < %s -mtriple=aarch64-unknown-linux-gnu -mattr=neon | FileCheck %s --check-prefixes=ALL,NEON
declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i1) nounwind
declare void @llvm.memset.inline.p0i8.i64(i8* nocapture, i8, i64, i1) nounwind
; /////////////////////////////////////////////////////////////////////////////
; Fill 1 byte at %dst with the run-time value %byte through the non-volatile
; llvm.memset.inline intrinsic. Both llc configurations share the assertions
; below, which expect a single byte store of w1.
define void @memset_1(i8* %dst, i8 %byte) nounwind {
; ALL-LABEL: memset_1:
; ALL: // %bb.0:
; ALL-NEXT: strb w1, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 %byte, i64 1, i1 false)
  ret void
}
; Fill 2 bytes at %dst with the run-time value %byte (non-volatile
; llvm.memset.inline). Both llc configurations expect a bit-field insert that
; replicates the byte upward inside w1, followed by one halfword store.
define void @memset_2(i8* %dst, i8 %byte) nounwind {
; ALL-LABEL: memset_2:
; ALL: // %bb.0:
; ALL-NEXT: bfi w1, w1, #8, #24
; ALL-NEXT: strh w1, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 %byte, i64 2, i1 false)
  ret void
}
; Fill 4 bytes at %dst with the run-time value %byte (non-volatile
; llvm.memset.inline). Both llc configurations expect the byte to be masked to
; 8 bits, multiplied by 16843009 (0x01010101) to splat it across a word, and
; written with a single 32-bit store.
define void @memset_4(i8* %dst, i8 %byte) nounwind {
; ALL-LABEL: memset_4:
; ALL: // %bb.0:
; ALL-NEXT: mov w8, #16843009
; ALL-NEXT: and w9, w1, #0xff
; ALL-NEXT: mul w8, w9, w8
; ALL-NEXT: str w8, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 %byte, i64 4, i1 false)
  ret void
}
; Fill 8 bytes at %dst with the run-time value %byte (non-volatile
; llvm.memset.inline). Both llc configurations expect the byte to be masked to
; 8 bits, multiplied by 72340172838076673 (0x0101010101010101) to splat it
; across a doubleword, and written with a single 64-bit store.
define void @memset_8(i8* %dst, i8 %byte) nounwind {
; ALL-LABEL: memset_8:
; ALL: // %bb.0:
; ALL-NEXT: // kill: def $w1 killed $w1 def $x1
; ALL-NEXT: mov x8, #72340172838076673
; ALL-NEXT: and x9, x1, #0xff
; ALL-NEXT: mul x8, x9, x8
; ALL-NEXT: str x8, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 %byte, i64 8, i1 false)
  ret void
}
; Fill 16 bytes at %dst with the run-time value %byte (non-volatile
; llvm.memset.inline). Both llc configurations expect the 64-bit multiply
; splat in x8 followed by one store-pair that writes x8 twice.
define void @memset_16(i8* %dst, i8 %byte) nounwind {
; ALL-LABEL: memset_16:
; ALL: // %bb.0:
; ALL-NEXT: // kill: def $w1 killed $w1 def $x1
; ALL-NEXT: mov x8, #72340172838076673
; ALL-NEXT: and x9, x1, #0xff
; ALL-NEXT: mul x8, x9, x8
; ALL-NEXT: stp x8, x8, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 %byte, i64 16, i1 false)
  ret void
}
; Fill 32 bytes at %dst with the run-time value %byte (non-volatile
; llvm.memset.inline). The two llc configurations are asserted separately:
; without neon the expected code splats the byte in x8 and issues two 16-byte
; store-pairs; with neon it expects a dup into v0 and one store-pair of q0.
define void @memset_32(i8* %dst, i8 %byte) nounwind {
; GPR-LABEL: memset_32:
; GPR: // %bb.0:
; GPR-NEXT: // kill: def $w1 killed $w1 def $x1
; GPR-NEXT: mov x8, #72340172838076673
; GPR-NEXT: and x9, x1, #0xff
; GPR-NEXT: mul x8, x9, x8
; GPR-NEXT: stp x8, x8, [x0, #16]
; GPR-NEXT: stp x8, x8, [x0]
; GPR-NEXT: ret
;
; NEON-LABEL: memset_32:
; NEON: // %bb.0:
; NEON-NEXT: dup v0.16b, w1
; NEON-NEXT: stp q0, q0, [x0]
; NEON-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 %byte, i64 32, i1 false)
  ret void
}
; Fill 64 bytes at %dst with the run-time value %byte (non-volatile
; llvm.memset.inline). The two llc configurations are asserted separately:
; without neon the expected code splats the byte in x8 and issues four 16-byte
; store-pairs; with neon it expects a dup into v0 and two store-pairs of q0.
define void @memset_64(i8* %dst, i8 %byte) nounwind {
; GPR-LABEL: memset_64:
; GPR: // %bb.0:
; GPR-NEXT: // kill: def $w1 killed $w1 def $x1
; GPR-NEXT: mov x8, #72340172838076673
; GPR-NEXT: and x9, x1, #0xff
; GPR-NEXT: mul x8, x9, x8
; GPR-NEXT: stp x8, x8, [x0, #48]
; GPR-NEXT: stp x8, x8, [x0, #32]
; GPR-NEXT: stp x8, x8, [x0, #16]
; GPR-NEXT: stp x8, x8, [x0]
; GPR-NEXT: ret
;
; NEON-LABEL: memset_64:
; NEON: // %bb.0:
; NEON-NEXT: dup v0.16b, w1
; NEON-NEXT: stp q0, q0, [x0]
; NEON-NEXT: stp q0, q0, [x0, #32]
; NEON-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 %byte, i64 64, i1 false)
  ret void
}
; /////////////////////////////////////////////////////////////////////////////
; Fill 16 bytes at %dst with the run-time value %byte (non-volatile
; llvm.memset.inline), where the pointer is marked align 16 on both the
; parameter and the call-site argument. Both llc configurations expect the
; 64-bit multiply splat in x8 followed by one store-pair of x8.
define void @aligned_memset_16(i8* align 16 %dst, i8 %byte) nounwind {
; ALL-LABEL: aligned_memset_16:
; ALL: // %bb.0:
; ALL-NEXT: // kill: def $w1 killed $w1 def $x1
; ALL-NEXT: mov x8, #72340172838076673
; ALL-NEXT: and x9, x1, #0xff
; ALL-NEXT: mul x8, x9, x8
; ALL-NEXT: stp x8, x8, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* align 16 %dst, i8 %byte, i64 16, i1 false)
  ret void
}
; Fill 32 bytes at %dst with the run-time value %byte (non-volatile
; llvm.memset.inline), where the pointer is marked align 32 on both the
; parameter and the call-site argument. Without neon the expected code splats
; the byte in x8 and issues two 16-byte store-pairs; with neon it expects a dup
; into v0 and one store-pair of q0.
define void @aligned_memset_32(i8* align 32 %dst, i8 %byte) nounwind {
; GPR-LABEL: aligned_memset_32:
; GPR: // %bb.0:
; GPR-NEXT: // kill: def $w1 killed $w1 def $x1
; GPR-NEXT: mov x8, #72340172838076673
; GPR-NEXT: and x9, x1, #0xff
; GPR-NEXT: mul x8, x9, x8
; GPR-NEXT: stp x8, x8, [x0, #16]
; GPR-NEXT: stp x8, x8, [x0]
; GPR-NEXT: ret
;
; NEON-LABEL: aligned_memset_32:
; NEON: // %bb.0:
; NEON-NEXT: dup v0.16b, w1
; NEON-NEXT: stp q0, q0, [x0]
; NEON-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* align 32 %dst, i8 %byte, i64 32, i1 false)
  ret void
}
; Fill 64 bytes at %dst with the run-time value %byte (non-volatile
; llvm.memset.inline), where the pointer is marked align 64 on both the
; parameter and the call-site argument. Without neon the expected code splats
; the byte in x8 and issues four 16-byte store-pairs; with neon it expects a
; dup into v0 and two store-pairs of q0.
define void @aligned_memset_64(i8* align 64 %dst, i8 %byte) nounwind {
; GPR-LABEL: aligned_memset_64:
; GPR: // %bb.0:
; GPR-NEXT: // kill: def $w1 killed $w1 def $x1
; GPR-NEXT: mov x8, #72340172838076673
; GPR-NEXT: and x9, x1, #0xff
; GPR-NEXT: mul x8, x9, x8
; GPR-NEXT: stp x8, x8, [x0, #48]
; GPR-NEXT: stp x8, x8, [x0, #32]
; GPR-NEXT: stp x8, x8, [x0, #16]
; GPR-NEXT: stp x8, x8, [x0]
; GPR-NEXT: ret
;
; NEON-LABEL: aligned_memset_64:
; NEON: // %bb.0:
; NEON-NEXT: dup v0.16b, w1
; NEON-NEXT: stp q0, q0, [x0]
; NEON-NEXT: stp q0, q0, [x0, #32]
; NEON-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* align 64 %dst, i8 %byte, i64 64, i1 false)
  ret void
}
; /////////////////////////////////////////////////////////////////////////////
; Zero 1 byte at %dst: non-volatile llvm.memset.inline with a constant 0 fill
; value. Both llc configurations expect a single byte store of the zero
; register.
define void @bzero_1(i8* %dst) nounwind {
; ALL-LABEL: bzero_1:
; ALL: // %bb.0:
; ALL-NEXT: strb wzr, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 0, i64 1, i1 false)
  ret void
}
; Zero 2 bytes at %dst: non-volatile llvm.memset.inline with a constant 0 fill
; value. Both llc configurations expect a single halfword store of the zero
; register.
define void @bzero_2(i8* %dst) nounwind {
; ALL-LABEL: bzero_2:
; ALL: // %bb.0:
; ALL-NEXT: strh wzr, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 0, i64 2, i1 false)
  ret void
}
; Zero 4 bytes at %dst: non-volatile llvm.memset.inline with a constant 0 fill
; value. Both llc configurations expect a single 32-bit store of the zero
; register.
define void @bzero_4(i8* %dst) nounwind {
; ALL-LABEL: bzero_4:
; ALL: // %bb.0:
; ALL-NEXT: str wzr, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 0, i64 4, i1 false)
  ret void
}
; Zero 8 bytes at %dst: non-volatile llvm.memset.inline with a constant 0 fill
; value. Both llc configurations expect a single 64-bit store of the zero
; register.
define void @bzero_8(i8* %dst) nounwind {
; ALL-LABEL: bzero_8:
; ALL: // %bb.0:
; ALL-NEXT: str xzr, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 0, i64 8, i1 false)
  ret void
}
; Zero 16 bytes at %dst: non-volatile llvm.memset.inline with a constant 0 fill
; value. Both llc configurations expect one store-pair that writes the 64-bit
; zero register twice.
define void @bzero_16(i8* %dst) nounwind {
; ALL-LABEL: bzero_16:
; ALL: // %bb.0:
; ALL-NEXT: stp xzr, xzr, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 0, i64 16, i1 false)
  ret void
}
; Zero 32 bytes at %dst: non-volatile llvm.memset.inline with a constant 0 fill
; value. The two llc configurations differ only in how q0 is produced: without
; neon the assertions expect a load from a constant-pool label, with neon a
; movi of zero. Either way one store-pair of q0 follows.
define void @bzero_32(i8* %dst) nounwind {
; GPR-LABEL: bzero_32:
; GPR: // %bb.0:
; GPR-NEXT: adrp x8, .LCPI15_0
; GPR-NEXT: ldr q0, [x8, :lo12:.LCPI15_0]
; GPR-NEXT: stp q0, q0, [x0]
; GPR-NEXT: ret
;
; NEON-LABEL: bzero_32:
; NEON: // %bb.0:
; NEON-NEXT: movi v0.2d, #0000000000000000
; NEON-NEXT: stp q0, q0, [x0]
; NEON-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 0, i64 32, i1 false)
  ret void
}
; Zero 64 bytes at %dst: non-volatile llvm.memset.inline with a constant 0 fill
; value. The two llc configurations differ only in how q0 is produced: without
; neon the assertions expect a load from a constant-pool label, with neon a
; movi of zero. Either way two store-pairs of q0 follow.
define void @bzero_64(i8* %dst) nounwind {
; GPR-LABEL: bzero_64:
; GPR: // %bb.0:
; GPR-NEXT: adrp x8, .LCPI16_0
; GPR-NEXT: ldr q0, [x8, :lo12:.LCPI16_0]
; GPR-NEXT: stp q0, q0, [x0]
; GPR-NEXT: stp q0, q0, [x0, #32]
; GPR-NEXT: ret
;
; NEON-LABEL: bzero_64:
; NEON: // %bb.0:
; NEON-NEXT: movi v0.2d, #0000000000000000
; NEON-NEXT: stp q0, q0, [x0]
; NEON-NEXT: stp q0, q0, [x0, #32]
; NEON-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* %dst, i8 0, i64 64, i1 false)
  ret void
}
; /////////////////////////////////////////////////////////////////////////////
; Zero 16 bytes at a 16-byte-aligned %a: non-volatile llvm.memset.inline with a
; constant 0 fill value. The parameter carries the same align 16 attribute as
; the call-site argument, matching the signature style of aligned_memset_16.
; Both llc configurations expect one store-pair of the 64-bit zero register.
define void @aligned_bzero_16(i8* align 16 %a) nounwind {
; ALL-LABEL: aligned_bzero_16:
; ALL: // %bb.0:
; ALL-NEXT: stp xzr, xzr, [x0]
; ALL-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* align 16 %a, i8 0, i64 16, i1 0)
  ret void
}
; Zero 32 bytes at a 32-byte-aligned %a: non-volatile llvm.memset.inline with a
; constant 0 fill value. The parameter carries the same align 32 attribute as
; the call-site argument, matching the signature style of aligned_memset_32.
; Without neon the assertions expect q0 to be loaded from a constant-pool
; label; with neon they expect a movi of zero. One store-pair of q0 follows in
; both cases.
define void @aligned_bzero_32(i8* align 32 %a) nounwind {
; GPR-LABEL: aligned_bzero_32:
; GPR: // %bb.0:
; GPR-NEXT: adrp x8, .LCPI18_0
; GPR-NEXT: ldr q0, [x8, :lo12:.LCPI18_0]
; GPR-NEXT: stp q0, q0, [x0]
; GPR-NEXT: ret
;
; NEON-LABEL: aligned_bzero_32:
; NEON: // %bb.0:
; NEON-NEXT: movi v0.2d, #0000000000000000
; NEON-NEXT: stp q0, q0, [x0]
; NEON-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* align 32 %a, i8 0, i64 32, i1 0)
  ret void
}
; Zero 64 bytes at a 64-byte-aligned %a: non-volatile llvm.memset.inline with a
; constant 0 fill value. The parameter carries the same align 64 attribute as
; the call-site argument, matching the signature style of aligned_memset_64.
; Without neon the assertions expect q0 to be loaded from a constant-pool
; label; with neon they expect a movi of zero. Two store-pairs of q0 follow in
; both cases.
define void @aligned_bzero_64(i8* align 64 %a) nounwind {
; GPR-LABEL: aligned_bzero_64:
; GPR: // %bb.0:
; GPR-NEXT: adrp x8, .LCPI19_0
; GPR-NEXT: ldr q0, [x8, :lo12:.LCPI19_0]
; GPR-NEXT: stp q0, q0, [x0]
; GPR-NEXT: stp q0, q0, [x0, #32]
; GPR-NEXT: ret
;
; NEON-LABEL: aligned_bzero_64:
; NEON: // %bb.0:
; NEON-NEXT: movi v0.2d, #0000000000000000
; NEON-NEXT: stp q0, q0, [x0]
; NEON-NEXT: stp q0, q0, [x0, #32]
; NEON-NEXT: ret
  tail call void @llvm.memset.inline.p0i8.i64(i8* align 64 %a, i8 0, i64 64, i1 0)
  ret void
}