blob: 3e23a5f348bde4ada1acbc544c628f06f0cb1ae7 [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=i686-unknown-unknown -mattr=+cmov,+bmi | FileCheck %s --check-prefix=X86
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+cmov,+bmi | FileCheck %s --check-prefix=X64
define i32 @blsmsk_used2(i32 %a) nounwind {
; X86-LABEL: blsmsk_used2:
; X86: # %bb.0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: leal -1(%eax), %ecx
; X86-NEXT: xorl %ecx, %eax
; X86-NEXT: imull %ecx, %eax
; X86-NEXT: retl
;
; X64-LABEL: blsmsk_used2:
; X64: # %bb.0: # %entry
; X64-NEXT: # kill: def $edi killed $edi def $rdi
; X64-NEXT: leal -1(%rdi), %eax
; X64-NEXT: xorl %eax, %edi
; X64-NEXT: imull %edi, %eax
; X64-NEXT: retq
entry:
%sub = add i32 %a, -1
%xor = xor i32 %sub, %a
%mul = mul i32 %xor, %sub
ret i32 %mul
}
define i64 @blsmask_through1(i64 %a, i64 %b) nounwind {
; X86-LABEL: blsmask_through1:
; X86: # %bb.0: # %entry
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: addl $-1, %eax
; X86-NEXT: movl %esi, %edx
; X86-NEXT: adcl $-1, %edx
; X86-NEXT: xorl {{[0-9]+}}(%esp), %edx
; X86-NEXT: xorl {{[0-9]+}}(%esp), %eax
; X86-NEXT: xorl %ecx, %eax
; X86-NEXT: xorl %esi, %edx
; X86-NEXT: popl %esi
; X86-NEXT: retl
;
; X64-LABEL: blsmask_through1:
; X64: # %bb.0: # %entry
; X64-NEXT: blsmskq %rsi, %rax
; X64-NEXT: xorq %rdi, %rax
; X64-NEXT: retq
entry:
%sub = add i64 %b, -1
%0 = xor i64 %sub, %a
%xor1 = xor i64 %0, %b
ret i64 %xor1
}
define i32 @blsmask_through2(i32 %a, i32 %b, i32 %c) nounwind {
; X86-LABEL: blsmask_through2:
; X86: # %bb.0: # %entry
; X86-NEXT: blsmskl {{[0-9]+}}(%esp), %eax
; X86-NEXT: xorl {{[0-9]+}}(%esp), %eax
; X86-NEXT: xorl {{[0-9]+}}(%esp), %eax
; X86-NEXT: retl
;
; X64-LABEL: blsmask_through2:
; X64: # %bb.0: # %entry
; X64-NEXT: blsmskl %esi, %eax
; X64-NEXT: xorl %edx, %edi
; X64-NEXT: xorl %edi, %eax
; X64-NEXT: retq
entry:
%sub = add nsw i32 %b, -1
%0 = xor i32 %sub, %a
%1 = xor i32 %0, %c
%xor2 = xor i32 %1, %b
ret i32 %xor2
}
define i64 @blsmask_through3(i64 %a, i64 %b, i64 %c, i64 %d) nounwind {
; X86-LABEL: blsmask_through3:
; X86: # %bb.0: # %entry
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %esi, %eax
; X86-NEXT: addl $-1, %eax
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: adcl $-1, %edx
; X86-NEXT: xorl {{[0-9]+}}(%esp), %edx
; X86-NEXT: xorl {{[0-9]+}}(%esp), %eax
; X86-NEXT: xorl {{[0-9]+}}(%esp), %edx
; X86-NEXT: xorl {{[0-9]+}}(%esp), %eax
; X86-NEXT: xorl {{[0-9]+}}(%esp), %edx
; X86-NEXT: xorl {{[0-9]+}}(%esp), %eax
; X86-NEXT: xorl %esi, %eax
; X86-NEXT: xorl %ecx, %edx
; X86-NEXT: popl %esi
; X86-NEXT: retl
;
; X64-LABEL: blsmask_through3:
; X64: # %bb.0: # %entry
; X64-NEXT: leaq -1(%rsi), %rax
; X64-NEXT: xorq %rdx, %rdi
; X64-NEXT: xorq %rdi, %rax
; X64-NEXT: xorq %rsi, %rcx
; X64-NEXT: xorq %rcx, %rax
; X64-NEXT: retq
entry:
%sub = add nsw i64 %b, -1
%0 = xor i64 %sub, %a
%1 = xor i64 %0, %c
%2 = xor i64 %1, %d
%xor3 = xor i64 %2, %b
ret i64 %xor3
}
define i32 @blsmask_through1_used1(i32 %a, i32 %b) nounwind {
; X86-LABEL: blsmask_through1_used1:
; X86: # %bb.0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: leal -1(%ecx), %eax
; X86-NEXT: xorl {{[0-9]+}}(%esp), %eax
; X86-NEXT: xorl %eax, %ecx
; X86-NEXT: incl %eax
; X86-NEXT: orl %ecx, %eax
; X86-NEXT: retl
;
; X64-LABEL: blsmask_through1_used1:
; X64: # %bb.0: # %entry
; X64-NEXT: # kill: def $esi killed $esi def $rsi
; X64-NEXT: leal -1(%rsi), %eax
; X64-NEXT: xorl %edi, %eax
; X64-NEXT: xorl %eax, %esi
; X64-NEXT: incl %eax
; X64-NEXT: orl %esi, %eax
; X64-NEXT: retq
entry:
%sub = add i32 %b, -1
%xor = xor i32 %sub, %a
%xor1 = xor i32 %xor, %b
%add = add i32 %xor, 1
%or = or i32 %add, %xor1
ret i32 %or
}
define i64 @blsmask_through1_used2(i64 %a, i64 %b) nounwind {
; X86-LABEL: blsmask_through1_used2:
; X86: # %bb.0: # %entry
; X86-NEXT: pushl %ebp
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl %ecx, %edi
; X86-NEXT: addl $-1, %edi
; X86-NEXT: movl %esi, %ebp
; X86-NEXT: adcl $-1, %ebp
; X86-NEXT: movl {{[0-9]+}}(%esp), %ebx
; X86-NEXT: xorl %ebp, %ebx
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: xorl %edi, %eax
; X86-NEXT: xorl %ebx, %esi
; X86-NEXT: xorl %eax, %ecx
; X86-NEXT: imull %eax, %ebp
; X86-NEXT: mull %edi
; X86-NEXT: addl %ebp, %edx
; X86-NEXT: imull %edi, %ebx
; X86-NEXT: addl %ebx, %edx
; X86-NEXT: orl %esi, %edx
; X86-NEXT: orl %ecx, %eax
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: popl %ebp
; X86-NEXT: retl
;
; X64-LABEL: blsmask_through1_used2:
; X64: # %bb.0: # %entry
; X64-NEXT: leaq -1(%rsi), %rax
; X64-NEXT: xorq %rax, %rdi
; X64-NEXT: xorq %rdi, %rsi
; X64-NEXT: imulq %rdi, %rax
; X64-NEXT: orq %rsi, %rax
; X64-NEXT: retq
entry:
%sub = add i64 %b, -1
%xor = xor i64 %sub, %a
%xor1 = xor i64 %xor, %b
%mul = mul i64 %xor, %sub
%or = or i64 %mul, %xor1
ret i64 %or
}
define i32 @blsi_used2(i32 %a) nounwind {
; X86-LABEL: blsi_used2:
; X86: # %bb.0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: movl %eax, %ecx
; X86-NEXT: negl %ecx
; X86-NEXT: andl %ecx, %eax
; X86-NEXT: imull %ecx, %eax
; X86-NEXT: retl
;
; X64-LABEL: blsi_used2:
; X64: # %bb.0: # %entry
; X64-NEXT: movl %edi, %eax
; X64-NEXT: negl %eax
; X64-NEXT: andl %eax, %edi
; X64-NEXT: imull %edi, %eax
; X64-NEXT: retq
entry:
%sub = sub nsw i32 0, %a
%and = and i32 %sub, %a
%mul = mul nsw i32 %and, %sub
ret i32 %mul
}
define i64 @blsi_through1(i64 %a, i64 %b) nounwind {
; X86-LABEL: blsi_through1:
; X86: # %bb.0: # %entry
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: xorl %edx, %edx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: negl %eax
; X86-NEXT: sbbl %esi, %edx
; X86-NEXT: andl {{[0-9]+}}(%esp), %edx
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl %esi, %edx
; X86-NEXT: andl %ecx, %eax
; X86-NEXT: popl %esi
; X86-NEXT: retl
;
; X64-LABEL: blsi_through1:
; X64: # %bb.0: # %entry
; X64-NEXT: blsiq %rsi, %rax
; X64-NEXT: andq %rdi, %rax
; X64-NEXT: retq
entry:
%sub = sub nsw i64 0, %b
%and = and i64 %sub, %a
%and1 = and i64 %and, %b
ret i64 %and1
}
define i32 @blsi_through2(i32 %a, i32 %b, i32 %c) nounwind {
; X86-LABEL: blsi_through2:
; X86: # %bb.0: # %entry
; X86-NEXT: blsil {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: retl
;
; X64-LABEL: blsi_through2:
; X64: # %bb.0: # %entry
; X64-NEXT: blsil %esi, %eax
; X64-NEXT: andl %edx, %edi
; X64-NEXT: andl %edi, %eax
; X64-NEXT: retq
entry:
%sub = sub i32 0, %b
%and = and i32 %sub, %a
%0 = and i32 %and, %c
%and2 = and i32 %0, %b
ret i32 %and2
}
define i64 @blsi_through3(i64 %a, i64 %b, i64 %c) nounwind {
; X86-LABEL: blsi_through3:
; X86: # %bb.0: # %entry
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: xorl %edx, %edx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: negl %eax
; X86-NEXT: sbbl %esi, %edx
; X86-NEXT: andl {{[0-9]+}}(%esp), %edx
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl {{[0-9]+}}(%esp), %edx
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl %esi, %edx
; X86-NEXT: andl %ecx, %eax
; X86-NEXT: popl %esi
; X86-NEXT: retl
;
; X64-LABEL: blsi_through3:
; X64: # %bb.0: # %entry
; X64-NEXT: blsiq %rsi, %rax
; X64-NEXT: andq %rdx, %rdi
; X64-NEXT: andq %rdi, %rax
; X64-NEXT: retq
entry:
%sub = sub i64 0, %b
%and = and i64 %sub, %a
%0 = and i64 %and, %c
%and3 = and i64 %0, %b
ret i64 %and3
}
define i32 @blsi_through1_used1(i32 %a, i32 %b) nounwind {
; X86-LABEL: blsi_through1_used1:
; X86: # %bb.0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: negl %eax
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl %eax, %ecx
; X86-NEXT: incl %eax
; X86-NEXT: orl %ecx, %eax
; X86-NEXT: retl
;
; X64-LABEL: blsi_through1_used1:
; X64: # %bb.0: # %entry
; X64-NEXT: movl %esi, %eax
; X64-NEXT: negl %eax
; X64-NEXT: andl %edi, %eax
; X64-NEXT: andl %eax, %esi
; X64-NEXT: incl %eax
; X64-NEXT: orl %esi, %eax
; X64-NEXT: retq
entry:
%sub = sub nsw i32 0, %b
%and = and i32 %sub, %a
%and1 = and i32 %and, %b
%add = add nsw i32 %and, 1
%or = or i32 %add, %and1
ret i32 %or
}
define i64 @blsi_through1_used2(i64 %a, i64 %b) nounwind {
; X86-LABEL: blsi_through1_used2:
; X86: # %bb.0: # %entry
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: xorl %edi, %edi
; X86-NEXT: movl %ecx, %edx
; X86-NEXT: negl %edx
; X86-NEXT: sbbl %esi, %edi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ebx
; X86-NEXT: andl %edi, %ebx
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl %edx, %eax
; X86-NEXT: andl %ebx, %esi
; X86-NEXT: andl %eax, %ecx
; X86-NEXT: imull %edx, %ebx
; X86-NEXT: imull %eax, %edi
; X86-NEXT: mull %edx
; X86-NEXT: addl %edi, %edx
; X86-NEXT: addl %ebx, %edx
; X86-NEXT: orl %esi, %edx
; X86-NEXT: orl %ecx, %eax
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: retl
;
; X64-LABEL: blsi_through1_used2:
; X64: # %bb.0: # %entry
; X64-NEXT: movq %rsi, %rax
; X64-NEXT: negq %rax
; X64-NEXT: andq %rax, %rdi
; X64-NEXT: andq %rdi, %rsi
; X64-NEXT: imulq %rdi, %rax
; X64-NEXT: orq %rsi, %rax
; X64-NEXT: retq
entry:
%sub = sub nsw i64 0, %b
%and = and i64 %sub, %a
%and1 = and i64 %and, %b
%mul = mul nsw i64 %and, %sub
%or = or i64 %mul, %and1
ret i64 %or
}
define i32 @blsr_used2(i32 %a) nounwind {
; X86-LABEL: blsr_used2:
; X86: # %bb.0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: leal -1(%eax), %ecx
; X86-NEXT: andl %ecx, %eax
; X86-NEXT: imull %ecx, %eax
; X86-NEXT: retl
;
; X64-LABEL: blsr_used2:
; X64: # %bb.0: # %entry
; X64-NEXT: # kill: def $edi killed $edi def $rdi
; X64-NEXT: leal -1(%rdi), %eax
; X64-NEXT: andl %eax, %edi
; X64-NEXT: imull %edi, %eax
; X64-NEXT: retq
entry:
%sub = add i32 %a, -1
%and = and i32 %sub, %a
%mul = mul i32 %and, %sub
ret i32 %mul
}
define i64 @blsr_through1(i64 %a, i64 %b) nounwind {
; X86-LABEL: blsr_through1:
; X86: # %bb.0: # %entry
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: addl $-1, %eax
; X86-NEXT: movl %esi, %edx
; X86-NEXT: adcl $-1, %edx
; X86-NEXT: andl {{[0-9]+}}(%esp), %edx
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl %ecx, %eax
; X86-NEXT: andl %esi, %edx
; X86-NEXT: popl %esi
; X86-NEXT: retl
;
; X64-LABEL: blsr_through1:
; X64: # %bb.0: # %entry
; X64-NEXT: blsrq %rsi, %rax
; X64-NEXT: andq %rdi, %rax
; X64-NEXT: retq
entry:
%sub = add i64 %b, -1
%0 = and i64 %sub, %a
%and1 = and i64 %0, %b
ret i64 %and1
}
define i32 @blsr_through2(i32 %a, i32 %b, i32 %c) nounwind {
; X86-LABEL: blsr_through2:
; X86: # %bb.0: # %entry
; X86-NEXT: blsrl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: retl
;
; X64-LABEL: blsr_through2:
; X64: # %bb.0: # %entry
; X64-NEXT: blsrl %esi, %eax
; X64-NEXT: andl %edx, %edi
; X64-NEXT: andl %edi, %eax
; X64-NEXT: retq
entry:
%sub = add nsw i32 %b, -1
%0 = and i32 %sub, %a
%1 = and i32 %0, %c
%and2 = and i32 %1, %b
ret i32 %and2
}
define i64 @blsr_through3(i64 %a, i64 %b, i64 %c, i64 %d) nounwind {
; X86-LABEL: blsr_through3:
; X86: # %bb.0: # %entry
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: xorl %edx, %edx
; X86-NEXT: movl %ecx, %eax
; X86-NEXT: negl %eax
; X86-NEXT: sbbl %esi, %edx
; X86-NEXT: andl {{[0-9]+}}(%esp), %edx
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl {{[0-9]+}}(%esp), %edx
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl {{[0-9]+}}(%esp), %edx
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl %esi, %edx
; X86-NEXT: andl %ecx, %eax
; X86-NEXT: popl %esi
; X86-NEXT: retl
;
; X64-LABEL: blsr_through3:
; X64: # %bb.0: # %entry
; X64-NEXT: movq %rdi, %rax
; X64-NEXT: andq %rsi, %rcx
; X64-NEXT: negq %rsi
; X64-NEXT: andq %rdx, %rax
; X64-NEXT: andq %rsi, %rax
; X64-NEXT: andq %rcx, %rax
; X64-NEXT: retq
entry:
%sub = sub nsw i64 0, %b
%and = and i64 %sub, %a
%0 = and i64 %and, %c
%1 = and i64 %0, %d
%and4 = and i64 %1, %b
ret i64 %and4
}
define i32 @blsr_through1_used1(i32 %a, i32 %b) nounwind {
; X86-LABEL: blsr_through1_used1:
; X86: # %bb.0: # %entry
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: leal -1(%ecx), %eax
; X86-NEXT: andl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl %eax, %ecx
; X86-NEXT: incl %eax
; X86-NEXT: orl %ecx, %eax
; X86-NEXT: retl
;
; X64-LABEL: blsr_through1_used1:
; X64: # %bb.0: # %entry
; X64-NEXT: # kill: def $esi killed $esi def $rsi
; X64-NEXT: leal -1(%rsi), %eax
; X64-NEXT: andl %edi, %eax
; X64-NEXT: andl %eax, %esi
; X64-NEXT: incl %eax
; X64-NEXT: orl %esi, %eax
; X64-NEXT: retq
entry:
%sub = add i32 %b, -1
%and = and i32 %sub, %a
%and1 = and i32 %and, %b
%add = add i32 %and, 1
%or = or i32 %add, %and1
ret i32 %or
}
define i64 @blsr_through1_used2(i64 %a, i64 %b) nounwind {
; X86-LABEL: blsr_through1_used2:
; X86: # %bb.0: # %entry
; X86-NEXT: pushl %ebp
; X86-NEXT: pushl %ebx
; X86-NEXT: pushl %edi
; X86-NEXT: pushl %esi
; X86-NEXT: movl {{[0-9]+}}(%esp), %ecx
; X86-NEXT: movl {{[0-9]+}}(%esp), %esi
; X86-NEXT: movl %ecx, %edi
; X86-NEXT: addl $-1, %edi
; X86-NEXT: movl %esi, %ebp
; X86-NEXT: adcl $-1, %ebp
; X86-NEXT: movl {{[0-9]+}}(%esp), %ebx
; X86-NEXT: andl %ebp, %ebx
; X86-NEXT: movl {{[0-9]+}}(%esp), %eax
; X86-NEXT: andl %edi, %eax
; X86-NEXT: andl %ebx, %esi
; X86-NEXT: andl %eax, %ecx
; X86-NEXT: imull %eax, %ebp
; X86-NEXT: mull %edi
; X86-NEXT: addl %ebp, %edx
; X86-NEXT: imull %edi, %ebx
; X86-NEXT: addl %ebx, %edx
; X86-NEXT: orl %esi, %edx
; X86-NEXT: orl %ecx, %eax
; X86-NEXT: popl %esi
; X86-NEXT: popl %edi
; X86-NEXT: popl %ebx
; X86-NEXT: popl %ebp
; X86-NEXT: retl
;
; X64-LABEL: blsr_through1_used2:
; X64: # %bb.0: # %entry
; X64-NEXT: leaq -1(%rsi), %rax
; X64-NEXT: andq %rax, %rdi
; X64-NEXT: andq %rdi, %rsi
; X64-NEXT: imulq %rdi, %rax
; X64-NEXT: orq %rsi, %rax
; X64-NEXT: retq
entry:
%sub = add i64 %b, -1
%and = and i64 %sub, %a
%and1 = and i64 %and, %b
%mul = mul i64 %and, %sub
%or = or i64 %mul, %and1
ret i64 %or
}