| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
| ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse2,-avx | FileCheck %s --check-prefixes=CHECK,SSE2 |
| ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1,-avx | FileCheck %s --check-prefixes=CHECK,SSE41 |
| ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx,-avx2 | FileCheck %s --check-prefixes=CHECK,AVX,AVX1 |
| ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx512vl,+avx512dq,+avx512bw | FileCheck %s --check-prefixes=CHECK,AVX,AVX512 |
| |
| define i32 @veccond128(<4 x i32> %input) { |
| ; SSE2-LABEL: veccond128: |
| ; SSE2: # %bb.0: # %entry |
| ; SSE2-NEXT: pxor %xmm1, %xmm1 |
| ; SSE2-NEXT: pcmpeqd %xmm0, %xmm1 |
| ; SSE2-NEXT: movmskps %xmm1, %eax |
| ; SSE2-NEXT: xorl $15, %eax |
| ; SSE2-NEXT: je .LBB0_2 |
| ; SSE2-NEXT: # %bb.1: # %if-true-block |
| ; SSE2-NEXT: xorl %eax, %eax |
| ; SSE2-NEXT: retq |
| ; SSE2-NEXT: .LBB0_2: # %endif-block |
| ; SSE2-NEXT: movl $1, %eax |
| ; SSE2-NEXT: retq |
| ; |
| ; SSE41-LABEL: veccond128: |
| ; SSE41: # %bb.0: # %entry |
| ; SSE41-NEXT: ptest %xmm0, %xmm0 |
| ; SSE41-NEXT: je .LBB0_2 |
| ; SSE41-NEXT: # %bb.1: # %if-true-block |
| ; SSE41-NEXT: xorl %eax, %eax |
| ; SSE41-NEXT: retq |
| ; SSE41-NEXT: .LBB0_2: # %endif-block |
| ; SSE41-NEXT: movl $1, %eax |
| ; SSE41-NEXT: retq |
| ; |
| ; AVX-LABEL: veccond128: |
| ; AVX: # %bb.0: # %entry |
| ; AVX-NEXT: vptest %xmm0, %xmm0 |
| ; AVX-NEXT: je .LBB0_2 |
| ; AVX-NEXT: # %bb.1: # %if-true-block |
| ; AVX-NEXT: xorl %eax, %eax |
| ; AVX-NEXT: retq |
| ; AVX-NEXT: .LBB0_2: # %endif-block |
| ; AVX-NEXT: movl $1, %eax |
| ; AVX-NEXT: retq |
| entry: |
| %0 = bitcast <4 x i32> %input to i128 |
| %1 = icmp ne i128 %0, 0 |
| br i1 %1, label %if-true-block, label %endif-block |
| if-true-block: |
| ret i32 0 |
| endif-block: |
| ret i32 1 |
| } |
| |
| define i32 @veccond256(<8 x i32> %input) { |
| ; SSE2-LABEL: veccond256: |
| ; SSE2: # %bb.0: # %entry |
| ; SSE2-NEXT: por %xmm1, %xmm0 |
| ; SSE2-NEXT: pxor %xmm1, %xmm1 |
| ; SSE2-NEXT: pcmpeqd %xmm0, %xmm1 |
| ; SSE2-NEXT: movmskps %xmm1, %eax |
| ; SSE2-NEXT: xorl $15, %eax |
| ; SSE2-NEXT: je .LBB1_2 |
| ; SSE2-NEXT: # %bb.1: # %if-true-block |
| ; SSE2-NEXT: xorl %eax, %eax |
| ; SSE2-NEXT: retq |
| ; SSE2-NEXT: .LBB1_2: # %endif-block |
| ; SSE2-NEXT: movl $1, %eax |
| ; SSE2-NEXT: retq |
| ; |
| ; SSE41-LABEL: veccond256: |
| ; SSE41: # %bb.0: # %entry |
| ; SSE41-NEXT: por %xmm1, %xmm0 |
| ; SSE41-NEXT: ptest %xmm0, %xmm0 |
| ; SSE41-NEXT: je .LBB1_2 |
| ; SSE41-NEXT: # %bb.1: # %if-true-block |
| ; SSE41-NEXT: xorl %eax, %eax |
| ; SSE41-NEXT: retq |
| ; SSE41-NEXT: .LBB1_2: # %endif-block |
| ; SSE41-NEXT: movl $1, %eax |
| ; SSE41-NEXT: retq |
| ; |
| ; AVX-LABEL: veccond256: |
| ; AVX: # %bb.0: # %entry |
| ; AVX-NEXT: vptest %ymm0, %ymm0 |
| ; AVX-NEXT: je .LBB1_2 |
| ; AVX-NEXT: # %bb.1: # %if-true-block |
| ; AVX-NEXT: xorl %eax, %eax |
| ; AVX-NEXT: vzeroupper |
| ; AVX-NEXT: retq |
| ; AVX-NEXT: .LBB1_2: # %endif-block |
| ; AVX-NEXT: movl $1, %eax |
| ; AVX-NEXT: vzeroupper |
| ; AVX-NEXT: retq |
| entry: |
| %0 = bitcast <8 x i32> %input to i256 |
| %1 = icmp ne i256 %0, 0 |
| br i1 %1, label %if-true-block, label %endif-block |
| if-true-block: |
| ret i32 0 |
| endif-block: |
| ret i32 1 |
| } |
| |
| define i32 @veccond512(<16 x i32> %input) { |
| ; SSE2-LABEL: veccond512: |
| ; SSE2: # %bb.0: # %entry |
| ; SSE2-NEXT: por %xmm3, %xmm1 |
| ; SSE2-NEXT: por %xmm2, %xmm0 |
| ; SSE2-NEXT: por %xmm1, %xmm0 |
| ; SSE2-NEXT: pxor %xmm1, %xmm1 |
| ; SSE2-NEXT: pcmpeqd %xmm0, %xmm1 |
| ; SSE2-NEXT: movmskps %xmm1, %eax |
| ; SSE2-NEXT: xorl $15, %eax |
| ; SSE2-NEXT: je .LBB2_2 |
| ; SSE2-NEXT: # %bb.1: # %if-true-block |
| ; SSE2-NEXT: xorl %eax, %eax |
| ; SSE2-NEXT: retq |
| ; SSE2-NEXT: .LBB2_2: # %endif-block |
| ; SSE2-NEXT: movl $1, %eax |
| ; SSE2-NEXT: retq |
| ; |
| ; SSE41-LABEL: veccond512: |
| ; SSE41: # %bb.0: # %entry |
| ; SSE41-NEXT: por %xmm3, %xmm1 |
| ; SSE41-NEXT: por %xmm2, %xmm0 |
| ; SSE41-NEXT: por %xmm1, %xmm0 |
| ; SSE41-NEXT: ptest %xmm0, %xmm0 |
| ; SSE41-NEXT: je .LBB2_2 |
| ; SSE41-NEXT: # %bb.1: # %if-true-block |
| ; SSE41-NEXT: xorl %eax, %eax |
| ; SSE41-NEXT: retq |
| ; SSE41-NEXT: .LBB2_2: # %endif-block |
| ; SSE41-NEXT: movl $1, %eax |
| ; SSE41-NEXT: retq |
| ; |
| ; AVX1-LABEL: veccond512: |
| ; AVX1: # %bb.0: # %entry |
| ; AVX1-NEXT: vorps %ymm1, %ymm0, %ymm0 |
| ; AVX1-NEXT: vptest %ymm0, %ymm0 |
| ; AVX1-NEXT: je .LBB2_2 |
| ; AVX1-NEXT: # %bb.1: # %if-true-block |
| ; AVX1-NEXT: xorl %eax, %eax |
| ; AVX1-NEXT: vzeroupper |
| ; AVX1-NEXT: retq |
| ; AVX1-NEXT: .LBB2_2: # %endif-block |
| ; AVX1-NEXT: movl $1, %eax |
| ; AVX1-NEXT: vzeroupper |
| ; AVX1-NEXT: retq |
| ; |
| ; AVX512-LABEL: veccond512: |
| ; AVX512: # %bb.0: # %entry |
| ; AVX512-NEXT: vptestmd %zmm0, %zmm0, %k0 |
| ; AVX512-NEXT: kortestw %k0, %k0 |
| ; AVX512-NEXT: je .LBB2_2 |
| ; AVX512-NEXT: # %bb.1: # %if-true-block |
| ; AVX512-NEXT: xorl %eax, %eax |
| ; AVX512-NEXT: vzeroupper |
| ; AVX512-NEXT: retq |
| ; AVX512-NEXT: .LBB2_2: # %endif-block |
| ; AVX512-NEXT: movl $1, %eax |
| ; AVX512-NEXT: vzeroupper |
| ; AVX512-NEXT: retq |
| entry: |
| %0 = bitcast <16 x i32> %input to i512 |
| %1 = icmp ne i512 %0, 0 |
| br i1 %1, label %if-true-block, label %endif-block |
| if-true-block: |
| ret i32 0 |
| endif-block: |
| ret i32 1 |
| } |
| |
| define i32 @vectest128(<4 x i32> %input) { |
| ; SSE2-LABEL: vectest128: |
| ; SSE2: # %bb.0: |
| ; SSE2-NEXT: pxor %xmm1, %xmm1 |
| ; SSE2-NEXT: pcmpeqd %xmm0, %xmm1 |
| ; SSE2-NEXT: movmskps %xmm1, %ecx |
| ; SSE2-NEXT: xorl %eax, %eax |
| ; SSE2-NEXT: xorl $15, %ecx |
| ; SSE2-NEXT: setne %al |
| ; SSE2-NEXT: retq |
| ; |
| ; SSE41-LABEL: vectest128: |
| ; SSE41: # %bb.0: |
| ; SSE41-NEXT: xorl %eax, %eax |
| ; SSE41-NEXT: ptest %xmm0, %xmm0 |
| ; SSE41-NEXT: setne %al |
| ; SSE41-NEXT: retq |
| ; |
| ; AVX-LABEL: vectest128: |
| ; AVX: # %bb.0: |
| ; AVX-NEXT: xorl %eax, %eax |
| ; AVX-NEXT: vptest %xmm0, %xmm0 |
| ; AVX-NEXT: setne %al |
| ; AVX-NEXT: retq |
| %t0 = bitcast <4 x i32> %input to i128 |
| %t1 = icmp ne i128 %t0, 0 |
| %t2 = zext i1 %t1 to i32 |
| ret i32 %t2 |
| } |
| |
| define i32 @vectest256(<8 x i32> %input) { |
| ; SSE2-LABEL: vectest256: |
| ; SSE2: # %bb.0: |
| ; SSE2-NEXT: por %xmm1, %xmm0 |
| ; SSE2-NEXT: pxor %xmm1, %xmm1 |
| ; SSE2-NEXT: pcmpeqd %xmm0, %xmm1 |
| ; SSE2-NEXT: movmskps %xmm1, %ecx |
| ; SSE2-NEXT: xorl %eax, %eax |
| ; SSE2-NEXT: xorl $15, %ecx |
| ; SSE2-NEXT: setne %al |
| ; SSE2-NEXT: retq |
| ; |
| ; SSE41-LABEL: vectest256: |
| ; SSE41: # %bb.0: |
| ; SSE41-NEXT: por %xmm1, %xmm0 |
| ; SSE41-NEXT: xorl %eax, %eax |
| ; SSE41-NEXT: ptest %xmm0, %xmm0 |
| ; SSE41-NEXT: setne %al |
| ; SSE41-NEXT: retq |
| ; |
| ; AVX-LABEL: vectest256: |
| ; AVX: # %bb.0: |
| ; AVX-NEXT: xorl %eax, %eax |
| ; AVX-NEXT: vptest %ymm0, %ymm0 |
| ; AVX-NEXT: setne %al |
| ; AVX-NEXT: vzeroupper |
| ; AVX-NEXT: retq |
| %t0 = bitcast <8 x i32> %input to i256 |
| %t1 = icmp ne i256 %t0, 0 |
| %t2 = zext i1 %t1 to i32 |
| ret i32 %t2 |
| } |
| |
| define i32 @vectest512(<16 x i32> %input) { |
| ; SSE2-LABEL: vectest512: |
| ; SSE2: # %bb.0: |
| ; SSE2-NEXT: por %xmm3, %xmm1 |
| ; SSE2-NEXT: por %xmm2, %xmm0 |
| ; SSE2-NEXT: por %xmm1, %xmm0 |
| ; SSE2-NEXT: pxor %xmm1, %xmm1 |
| ; SSE2-NEXT: pcmpeqd %xmm0, %xmm1 |
| ; SSE2-NEXT: movmskps %xmm1, %ecx |
| ; SSE2-NEXT: xorl %eax, %eax |
| ; SSE2-NEXT: xorl $15, %ecx |
| ; SSE2-NEXT: setne %al |
| ; SSE2-NEXT: retq |
| ; |
| ; SSE41-LABEL: vectest512: |
| ; SSE41: # %bb.0: |
| ; SSE41-NEXT: por %xmm3, %xmm1 |
| ; SSE41-NEXT: por %xmm2, %xmm0 |
| ; SSE41-NEXT: por %xmm1, %xmm0 |
| ; SSE41-NEXT: xorl %eax, %eax |
| ; SSE41-NEXT: ptest %xmm0, %xmm0 |
| ; SSE41-NEXT: setne %al |
| ; SSE41-NEXT: retq |
| ; |
| ; AVX1-LABEL: vectest512: |
| ; AVX1: # %bb.0: |
| ; AVX1-NEXT: vorps %ymm1, %ymm0, %ymm0 |
| ; AVX1-NEXT: xorl %eax, %eax |
| ; AVX1-NEXT: vptest %ymm0, %ymm0 |
| ; AVX1-NEXT: setne %al |
| ; AVX1-NEXT: vzeroupper |
| ; AVX1-NEXT: retq |
| ; |
| ; AVX512-LABEL: vectest512: |
| ; AVX512: # %bb.0: |
| ; AVX512-NEXT: vptestmd %zmm0, %zmm0, %k0 |
| ; AVX512-NEXT: xorl %eax, %eax |
| ; AVX512-NEXT: kortestw %k0, %k0 |
| ; AVX512-NEXT: setne %al |
| ; AVX512-NEXT: vzeroupper |
| ; AVX512-NEXT: retq |
| %t0 = bitcast <16 x i32> %input to i512 |
| %t1 = icmp ne i512 %t0, 0 |
| %t2 = zext i1 %t1 to i32 |
| ret i32 %t2 |
| } |
| |
| define i32 @vecsel128(<4 x i32> %input, i32 %a, i32 %b) { |
| ; SSE2-LABEL: vecsel128: |
| ; SSE2: # %bb.0: |
| ; SSE2-NEXT: movl %edi, %eax |
| ; SSE2-NEXT: pxor %xmm1, %xmm1 |
| ; SSE2-NEXT: pcmpeqd %xmm0, %xmm1 |
| ; SSE2-NEXT: movmskps %xmm1, %ecx |
| ; SSE2-NEXT: xorl $15, %ecx |
| ; SSE2-NEXT: cmovel %esi, %eax |
| ; SSE2-NEXT: retq |
| ; |
| ; SSE41-LABEL: vecsel128: |
| ; SSE41: # %bb.0: |
| ; SSE41-NEXT: movl %edi, %eax |
| ; SSE41-NEXT: ptest %xmm0, %xmm0 |
| ; SSE41-NEXT: cmovel %esi, %eax |
| ; SSE41-NEXT: retq |
| ; |
| ; AVX-LABEL: vecsel128: |
| ; AVX: # %bb.0: |
| ; AVX-NEXT: movl %edi, %eax |
| ; AVX-NEXT: vptest %xmm0, %xmm0 |
| ; AVX-NEXT: cmovel %esi, %eax |
| ; AVX-NEXT: retq |
| %t0 = bitcast <4 x i32> %input to i128 |
| %t1 = icmp ne i128 %t0, 0 |
| %t2 = select i1 %t1, i32 %a, i32 %b |
| ret i32 %t2 |
| } |
| |
| define i32 @vecsel256(<8 x i32> %input, i32 %a, i32 %b) { |
| ; SSE2-LABEL: vecsel256: |
| ; SSE2: # %bb.0: |
| ; SSE2-NEXT: movl %edi, %eax |
| ; SSE2-NEXT: por %xmm1, %xmm0 |
| ; SSE2-NEXT: pxor %xmm1, %xmm1 |
| ; SSE2-NEXT: pcmpeqd %xmm0, %xmm1 |
| ; SSE2-NEXT: movmskps %xmm1, %ecx |
| ; SSE2-NEXT: xorl $15, %ecx |
| ; SSE2-NEXT: cmovel %esi, %eax |
| ; SSE2-NEXT: retq |
| ; |
| ; SSE41-LABEL: vecsel256: |
| ; SSE41: # %bb.0: |
| ; SSE41-NEXT: movl %edi, %eax |
| ; SSE41-NEXT: por %xmm1, %xmm0 |
| ; SSE41-NEXT: ptest %xmm0, %xmm0 |
| ; SSE41-NEXT: cmovel %esi, %eax |
| ; SSE41-NEXT: retq |
| ; |
| ; AVX-LABEL: vecsel256: |
| ; AVX: # %bb.0: |
| ; AVX-NEXT: movl %edi, %eax |
| ; AVX-NEXT: vptest %ymm0, %ymm0 |
| ; AVX-NEXT: cmovel %esi, %eax |
| ; AVX-NEXT: vzeroupper |
| ; AVX-NEXT: retq |
| %t0 = bitcast <8 x i32> %input to i256 |
| %t1 = icmp ne i256 %t0, 0 |
| %t2 = select i1 %t1, i32 %a, i32 %b |
| ret i32 %t2 |
| } |
| |
| define i32 @vecsel512(<16 x i32> %input, i32 %a, i32 %b) { |
| ; SSE2-LABEL: vecsel512: |
| ; SSE2: # %bb.0: |
| ; SSE2-NEXT: movl %edi, %eax |
| ; SSE2-NEXT: por %xmm3, %xmm1 |
| ; SSE2-NEXT: por %xmm2, %xmm0 |
| ; SSE2-NEXT: por %xmm1, %xmm0 |
| ; SSE2-NEXT: pxor %xmm1, %xmm1 |
| ; SSE2-NEXT: pcmpeqd %xmm0, %xmm1 |
| ; SSE2-NEXT: movmskps %xmm1, %ecx |
| ; SSE2-NEXT: xorl $15, %ecx |
| ; SSE2-NEXT: cmovel %esi, %eax |
| ; SSE2-NEXT: retq |
| ; |
| ; SSE41-LABEL: vecsel512: |
| ; SSE41: # %bb.0: |
| ; SSE41-NEXT: movl %edi, %eax |
| ; SSE41-NEXT: por %xmm3, %xmm1 |
| ; SSE41-NEXT: por %xmm2, %xmm0 |
| ; SSE41-NEXT: por %xmm1, %xmm0 |
| ; SSE41-NEXT: ptest %xmm0, %xmm0 |
| ; SSE41-NEXT: cmovel %esi, %eax |
| ; SSE41-NEXT: retq |
| ; |
| ; AVX1-LABEL: vecsel512: |
| ; AVX1: # %bb.0: |
| ; AVX1-NEXT: movl %edi, %eax |
| ; AVX1-NEXT: vorps %ymm1, %ymm0, %ymm0 |
| ; AVX1-NEXT: vptest %ymm0, %ymm0 |
| ; AVX1-NEXT: cmovel %esi, %eax |
| ; AVX1-NEXT: vzeroupper |
| ; AVX1-NEXT: retq |
| ; |
| ; AVX512-LABEL: vecsel512: |
| ; AVX512: # %bb.0: |
| ; AVX512-NEXT: movl %edi, %eax |
| ; AVX512-NEXT: vptestmd %zmm0, %zmm0, %k0 |
| ; AVX512-NEXT: kortestw %k0, %k0 |
| ; AVX512-NEXT: cmovel %esi, %eax |
| ; AVX512-NEXT: vzeroupper |
| ; AVX512-NEXT: retq |
| %t0 = bitcast <16 x i32> %input to i512 |
| %t1 = icmp ne i512 %t0, 0 |
| %t2 = select i1 %t1, i32 %a, i32 %b |
| ret i32 %t2 |
| } |
| |
| define i1 @vecmp_load64x2(ptr %p0) { |
| ; CHECK-LABEL: vecmp_load64x2: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: movq (%rdi), %rax |
| ; CHECK-NEXT: orq 8(%rdi), %rax |
| ; CHECK-NEXT: sete %al |
| ; CHECK-NEXT: retq |
| %p1 = getelementptr i8, ptr %p0, i64 8 |
| %i0 = load i64, ptr %p0, align 1 |
| %i1 = load i64, ptr %p1, align 1 |
| %or = or i64 %i0, %i1 |
| %ne = icmp ne i64 %or, 0 |
| %zx = zext i1 %ne to i32 |
| %eq = icmp eq i32 %zx, 0 |
| ret i1 %eq |
| } |
| |
| define i1 @vecmp_load64x4(ptr %p0) { |
| ; CHECK-LABEL: vecmp_load64x4: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: movq (%rdi), %rax |
| ; CHECK-NEXT: movq 8(%rdi), %rcx |
| ; CHECK-NEXT: orq 16(%rdi), %rax |
| ; CHECK-NEXT: orq 24(%rdi), %rcx |
| ; CHECK-NEXT: orq %rax, %rcx |
| ; CHECK-NEXT: sete %al |
| ; CHECK-NEXT: retq |
| %p1 = getelementptr i8, ptr %p0, i64 8 |
| %p2 = getelementptr i8, ptr %p0, i64 16 |
| %p3 = getelementptr i8, ptr %p0, i64 24 |
| %i0 = load i64, ptr %p0, align 1 |
| %i1 = load i64, ptr %p1, align 1 |
| %i2 = load i64, ptr %p2, align 1 |
| %i3 = load i64, ptr %p3, align 1 |
| %or02 = or i64 %i0, %i2 |
| %or13 = or i64 %i1, %i3 |
| %or = or i64 %or02, %or13 |
| %ne = icmp ne i64 %or, 0 |
| %zx = zext i1 %ne to i32 |
| %eq = icmp eq i32 %zx, 0 |
| ret i1 %eq |
| } |
| |
| define i1 @vecmp_load128x2(ptr %p0) { |
| ; CHECK-LABEL: vecmp_load128x2: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: movq (%rdi), %rax |
| ; CHECK-NEXT: movq 8(%rdi), %rcx |
| ; CHECK-NEXT: orq 24(%rdi), %rcx |
| ; CHECK-NEXT: orq 16(%rdi), %rax |
| ; CHECK-NEXT: orq %rcx, %rax |
| ; CHECK-NEXT: sete %al |
| ; CHECK-NEXT: retq |
| %p1 = getelementptr i8, ptr %p0, i64 16 |
| %i0 = load i128, ptr %p0, align 1 |
| %i1 = load i128, ptr %p1, align 1 |
| %or = or i128 %i0, %i1 |
| %ne = icmp ne i128 %or, 0 |
| %zx = zext i1 %ne to i32 |
| %eq = icmp eq i32 %zx, 0 |
| ret i1 %eq |
| } |
| |
| define i1 @vecmp_load128x4(ptr %p0) { |
| ; CHECK-LABEL: vecmp_load128x4: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: movq (%rdi), %rax |
| ; CHECK-NEXT: movq 8(%rdi), %rcx |
| ; CHECK-NEXT: movq 24(%rdi), %rdx |
| ; CHECK-NEXT: movq 16(%rdi), %rsi |
| ; CHECK-NEXT: orq 32(%rdi), %rax |
| ; CHECK-NEXT: orq 40(%rdi), %rcx |
| ; CHECK-NEXT: orq 48(%rdi), %rsi |
| ; CHECK-NEXT: orq %rax, %rsi |
| ; CHECK-NEXT: orq 56(%rdi), %rdx |
| ; CHECK-NEXT: orq %rcx, %rdx |
| ; CHECK-NEXT: orq %rsi, %rdx |
| ; CHECK-NEXT: sete %al |
| ; CHECK-NEXT: retq |
| %p1 = getelementptr i8, ptr %p0, i64 16 |
| %p2 = getelementptr i8, ptr %p0, i64 32 |
| %p3 = getelementptr i8, ptr %p0, i64 48 |
| %i0 = load i128, ptr %p0, align 1 |
| %i1 = load i128, ptr %p1, align 1 |
| %i2 = load i128, ptr %p2, align 1 |
| %i3 = load i128, ptr %p3, align 1 |
| %or02 = or i128 %i0, %i2 |
| %or13 = or i128 %i1, %i3 |
| %or = or i128 %or02, %or13 |
| %ne = icmp ne i128 %or, 0 |
| %zx = zext i1 %ne to i32 |
| %eq = icmp eq i32 %zx, 0 |
| ret i1 %eq |
| } |
| |
| ; PR144861 |
| define i1 @vecmp_load256x2(ptr %p0) { |
| ; CHECK-LABEL: vecmp_load256x2: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: movq 24(%rdi), %rax |
| ; CHECK-NEXT: movq (%rdi), %rcx |
| ; CHECK-NEXT: movq 8(%rdi), %rdx |
| ; CHECK-NEXT: movq 16(%rdi), %rsi |
| ; CHECK-NEXT: orq 48(%rdi), %rsi |
| ; CHECK-NEXT: orq 32(%rdi), %rcx |
| ; CHECK-NEXT: orq %rsi, %rcx |
| ; CHECK-NEXT: orq 56(%rdi), %rax |
| ; CHECK-NEXT: orq 40(%rdi), %rdx |
| ; CHECK-NEXT: orq %rax, %rdx |
| ; CHECK-NEXT: orq %rcx, %rdx |
| ; CHECK-NEXT: sete %al |
| ; CHECK-NEXT: retq |
| %p1 = getelementptr i8, ptr %p0, i64 32 |
| %i0 = load i256, ptr %p0, align 1 |
| %i1 = load i256, ptr %p1, align 1 |
| %or = or i256 %i0, %i1 |
| %ne = icmp ne i256 %or, 0 |
| %zx = zext i1 %ne to i32 |
| %eq = icmp eq i32 %zx, 0 |
| ret i1 %eq |
| } |
| |
| define i1 @vecmp_load512x2(ptr %p0) { |
| ; CHECK-LABEL: vecmp_load512x2: |
| ; CHECK: # %bb.0: |
| ; CHECK-NEXT: movq 24(%rdi), %rax |
| ; CHECK-NEXT: movq 56(%rdi), %rdx |
| ; CHECK-NEXT: movq 40(%rdi), %rsi |
| ; CHECK-NEXT: movq 16(%rdi), %rcx |
| ; CHECK-NEXT: movq 48(%rdi), %r8 |
| ; CHECK-NEXT: movq (%rdi), %r9 |
| ; CHECK-NEXT: movq 8(%rdi), %r10 |
| ; CHECK-NEXT: movq 32(%rdi), %r11 |
| ; CHECK-NEXT: orq 96(%rdi), %r11 |
| ; CHECK-NEXT: orq 64(%rdi), %r9 |
| ; CHECK-NEXT: orq %r11, %r9 |
| ; CHECK-NEXT: orq 112(%rdi), %r8 |
| ; CHECK-NEXT: orq 80(%rdi), %rcx |
| ; CHECK-NEXT: orq %r8, %rcx |
| ; CHECK-NEXT: orq %r9, %rcx |
| ; CHECK-NEXT: orq 104(%rdi), %rsi |
| ; CHECK-NEXT: orq 72(%rdi), %r10 |
| ; CHECK-NEXT: orq %rsi, %r10 |
| ; CHECK-NEXT: orq 120(%rdi), %rdx |
| ; CHECK-NEXT: orq 88(%rdi), %rax |
| ; CHECK-NEXT: orq %rdx, %rax |
| ; CHECK-NEXT: orq %r10, %rax |
| ; CHECK-NEXT: orq %rcx, %rax |
| ; CHECK-NEXT: sete %al |
| ; CHECK-NEXT: retq |
| %p1 = getelementptr i8, ptr %p0, i64 64 |
| %i0 = load i512, ptr %p0, align 1 |
| %i1 = load i512, ptr %p1, align 1 |
| %or = or i512 %i0, %i1 |
| %ne = icmp ne i512 %or, 0 |
| %zx = zext i1 %ne to i32 |
| %eq = icmp eq i32 %zx, 0 |
| ret i1 %eq |
| } |