blob: b7308b77669e71dd0a08001020eb35ed904a04b0 [file] [log] [blame] [edit]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 6
; RUN: llc < %s -mtriple=i686-unknown-unknown -mattr=avx10.2 | FileCheck %s --check-prefix=X86
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=avx10.2 | FileCheck %s --check-prefix=X64
; Function Attrs: nocallback nofree nosync nounwind willreturn memory(argmem: write)
declare void @llvm.masked.store.v8i8.p1(<8 x i8>, ptr addrspace(1) captures(none), <8 x i1>) #0
define void @foo(<8 x i16> %arg, ptr addrspace(1) %add.ptr) {
; X86-LABEL: foo:
; X86: # %bb.0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: vmovw %xmm0, %ecx
; X86-NEXT: movb %ch, (%eax)
; X86-NEXT: retl
;
; X64-LABEL: foo:
; X64: # %bb.0: # %entry
; X64-NEXT: vmovw %xmm0, %eax
; X64-NEXT: movb %ah, (%rdi)
; X64-NEXT: retq
entry:
%i3 = shufflevector <8 x i16> %arg, <8 x i16> <i16 poison, i16 257, i16 257, i16 257, i16 257, i16 257, i16 257, i16 257>, <8 x i32> <i32 0, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
%i4 = lshr <8 x i16> %i3, splat (i16 8)
%i5 = trunc <8 x i16> %i4 to <8 x i8>
call void @llvm.masked.store.v8i8.p1(<8 x i8> %i5, ptr addrspace(1) %add.ptr, <8 x i1> <i1 true, i1 false, i1 false, i1 false, i1 false, i1 false, i1 false, i1 false>)
ret void
}
define void @bar(<8 x i64> %arg, ptr addrspace(1) %add.ptr) {
; X86-LABEL: bar:
; X86: # %bb.0: # %entry
; X86-NEXT: vpbroadcastq {{.*#+}} zmm1 = [257,0,257,0,257,0,257,0,257,0,257,0,257,0,257,0]
; X86-NEXT: movb $2, %al
; X86-NEXT: kmovd %eax, %k1
; X86-NEXT: vmovdqa64 %zmm0, %zmm1 {%k1}
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: vpsrlq $16, %zmm1, %zmm0
; X86-NEXT: vpmovqb %zmm0, (%eax) {%k1}
; X86-NEXT: vzeroupper
; X86-NEXT: retl
;
; X64-LABEL: bar:
; X64: # %bb.0: # %entry
; X64-NEXT: vpextrq $1, %xmm0, %rax
; X64-NEXT: shrl $16, %eax
; X64-NEXT: movb %al, 1(%rdi)
; X64-NEXT: vzeroupper
; X64-NEXT: retq
entry:
%i3 = shufflevector <8 x i64> %arg, <8 x i64> <i64 257, i64 poison, i64 257, i64 257, i64 257, i64 257, i64 257, i64 257>, <8 x i32> <i32 8, i32 1, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
%i4 = lshr <8 x i64> %i3, splat (i64 16)
%i5 = trunc <8 x i64> %i4 to <8 x i8>
call void @llvm.masked.store.v8i8.p1(<8 x i8> %i5, ptr addrspace(1) %add.ptr, <8 x i1> <i1 false, i1 true, i1 false, i1 false, i1 false, i1 false, i1 false, i1 false>)
ret void
}
attributes #0 = { nocallback nofree nosync nounwind willreturn memory(argmem: write) }