; blob: 4641c114238f8f96fcfa0bd526916915112577bb [file] [log] [blame]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=-bmi2,-lzcnt | FileCheck %s --check-prefix=NOBMI
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+bmi2,+lzcnt | FileCheck %s --check-prefix=BMI
; Check the assembly sequence generated for std::bit_ceil.
; std::bit_ceil<uint32_t>(x)
;
; IR shape under test: result = (x >u 1) ? (1 << (32 - ctlz(x - 1))) : 1.
; The expected output below is checked for two subtarget configurations,
; one without LZCNT/BMI2 (bsrl plus a branch) and one with them
; (lzcntl + shlxl, branch-free).
define i32 @bit_ceil_i32(i32 %x) {
; NOBMI-LABEL: bit_ceil_i32:
; NOBMI: # %bb.0:
; NOBMI-NEXT: movl %edi, %eax
; NOBMI-NEXT: decl %eax
; NOBMI-NEXT: je .LBB0_1
; NOBMI-NEXT: # %bb.2: # %cond.false
; NOBMI-NEXT: bsrl %eax, %ecx
; NOBMI-NEXT: xorl $31, %ecx
; NOBMI-NEXT: jmp .LBB0_3
; NOBMI-NEXT: .LBB0_1:
; NOBMI-NEXT: movl $32, %ecx
; NOBMI-NEXT: .LBB0_3: # %cond.end
; NOBMI-NEXT: negb %cl
; NOBMI-NEXT: movl $1, %edx
; NOBMI-NEXT: movl $1, %eax
; NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
; NOBMI-NEXT: shll %cl, %eax
; NOBMI-NEXT: cmpl $2, %edi
; NOBMI-NEXT: cmovbl %edx, %eax
; NOBMI-NEXT: retq
;
; BMI-LABEL: bit_ceil_i32:
; BMI: # %bb.0:
; BMI-NEXT: # kill: def $edi killed $edi def $rdi
; BMI-NEXT: leal -1(%rdi), %eax
; BMI-NEXT: lzcntl %eax, %eax
; BMI-NEXT: negb %al
; BMI-NEXT: movl $1, %ecx
; BMI-NEXT: shlxl %eax, %ecx, %eax
; BMI-NEXT: cmpl $2, %edi
; BMI-NEXT: cmovbl %ecx, %eax
; BMI-NEXT: retq
; %dec is x - 1. ctlz is called with its flag operand set to false, and the
; expected output without LZCNT accordingly materializes 32 on a separate
; path when %dec is zero instead of executing bsrl.
%dec = add i32 %x, -1
%lz = tail call i32 @llvm.ctlz.i32(i32 %dec, i1 false)
; Shift amount is 32 - lz. Both expected sequences negate the count (negb)
; rather than subtracting from 32 -- presumably relying on the x86 shift
; using only the low bits of the count; confirm against the backend.
; NOTE(review): when %dec has its top bit set, %cnt is 32 and the shl result
; is poison per the LangRef; presumably acceptable because bit_ceil is
; undefined for such inputs -- confirm.
%cnt = sub i32 32, %lz
%res = shl i32 1, %cnt
; Inputs 0 and 1 bypass the shifted value and yield 1 (cmovb after cmp $2).
%ugt = icmp ugt i32 %x, 1
%sel = select i1 %ugt, i32 %res, i32 1
ret i32 %sel
}
; std::bit_ceil<uint32_t>(x + 1)
;
; IR shape under test: result = ((x - 1) <u -2) ? (1 << (32 - ctlz(x))) : 1.
; Here the "+ 1" and the "- 1" inside bit_ceil have cancelled, so ctlz is
; applied to x directly; the guard (x - 1) <u -2 is true exactly for x in
; [1, 0xFFFFFFFE], i.e. whenever x + 1 is unsigned-greater than 1.
; The argument is marked noundef.
define i32 @bit_ceil_i32_plus1(i32 noundef %x) {
; NOBMI-LABEL: bit_ceil_i32_plus1:
; NOBMI: # %bb.0: # %entry
; NOBMI-NEXT: testl %edi, %edi
; NOBMI-NEXT: je .LBB1_1
; NOBMI-NEXT: # %bb.2: # %cond.false
; NOBMI-NEXT: bsrl %edi, %ecx
; NOBMI-NEXT: xorl $31, %ecx
; NOBMI-NEXT: jmp .LBB1_3
; NOBMI-NEXT: .LBB1_1:
; NOBMI-NEXT: movl $32, %ecx
; NOBMI-NEXT: .LBB1_3: # %cond.end
; NOBMI-NEXT: negb %cl
; NOBMI-NEXT: movl $1, %edx
; NOBMI-NEXT: movl $1, %eax
; NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
; NOBMI-NEXT: shll %cl, %eax
; NOBMI-NEXT: decl %edi
; NOBMI-NEXT: cmpl $-2, %edi
; NOBMI-NEXT: cmovael %edx, %eax
; NOBMI-NEXT: retq
;
; BMI-LABEL: bit_ceil_i32_plus1:
; BMI: # %bb.0: # %entry
; BMI-NEXT: lzcntl %edi, %eax
; BMI-NEXT: negb %al
; BMI-NEXT: movl $1, %ecx
; BMI-NEXT: shlxl %eax, %ecx, %eax
; BMI-NEXT: decl %edi
; BMI-NEXT: cmpl $-2, %edi
; BMI-NEXT: cmovael %ecx, %eax
; BMI-NEXT: retq
entry:
; ctlz is called with its flag operand set to false; the expected output
; without LZCNT tests x for zero and materializes 32 on that path instead
; of executing bsrl.
%ctlz = tail call i32 @llvm.ctlz.i32(i32 %x, i1 false)
; Shift amount is 32 - ctlz; the expected output negates the count (negb)
; instead of subtracting from 32.
; NOTE(review): when x has its top bit set, %cnt is 32 and the shl result is
; poison per the LangRef; presumably acceptable because bit_ceil is
; undefined for such inputs -- confirm.
%cnt = sub i32 32, %ctlz
%shl = shl i32 1, %cnt
; x == 0 and x == 0xFFFFFFFF (where x + 1 wraps to 0) fail the unsigned
; compare and select the constant 1.
%dec = add i32 %x, -1
%ult = icmp ult i32 %dec, -2
%sel = select i1 %ult, i32 %shl, i32 1
ret i32 %sel
}
; std::bit_ceil<uint64_t>(x)
;
; 64-bit variant of the IR shape under test:
; result = (x >u 1) ? (1 << (64 - ctlz(x - 1))) : 1.
; The expected output is checked without LZCNT/BMI2 (bsrq plus a branch)
; and with them (lzcntq + shlxq, branch-free).
define i64 @bit_ceil_i64(i64 %x) {
; NOBMI-LABEL: bit_ceil_i64:
; NOBMI: # %bb.0:
; NOBMI-NEXT: movq %rdi, %rax
; NOBMI-NEXT: decq %rax
; NOBMI-NEXT: je .LBB2_1
; NOBMI-NEXT: # %bb.2: # %cond.false
; NOBMI-NEXT: bsrq %rax, %rcx
; NOBMI-NEXT: xorq $63, %rcx
; NOBMI-NEXT: jmp .LBB2_3
; NOBMI-NEXT: .LBB2_1:
; NOBMI-NEXT: movl $64, %ecx
; NOBMI-NEXT: .LBB2_3: # %cond.end
; NOBMI-NEXT: negb %cl
; NOBMI-NEXT: movl $1, %edx
; NOBMI-NEXT: movl $1, %eax
; NOBMI-NEXT: # kill: def $cl killed $cl killed $rcx
; NOBMI-NEXT: shlq %cl, %rax
; NOBMI-NEXT: cmpq $2, %rdi
; NOBMI-NEXT: cmovbq %rdx, %rax
; NOBMI-NEXT: retq
;
; BMI-LABEL: bit_ceil_i64:
; BMI: # %bb.0:
; BMI-NEXT: leaq -1(%rdi), %rax
; BMI-NEXT: lzcntq %rax, %rax
; BMI-NEXT: negb %al
; BMI-NEXT: movl $1, %ecx
; BMI-NEXT: shlxq %rax, %rcx, %rax
; BMI-NEXT: cmpq $2, %rdi
; BMI-NEXT: cmovbq %rcx, %rax
; BMI-NEXT: retq
; %dec is x - 1. ctlz is called with its flag operand set to false, and the
; expected output without LZCNT accordingly materializes 64 on a separate
; path when %dec is zero instead of executing bsrq.
%dec = add i64 %x, -1
%lz = tail call i64 @llvm.ctlz.i64(i64 %dec, i1 false)
; Shift amount is 64 - lz; both expected sequences negate the count (negb)
; instead of subtracting from 64.
; NOTE(review): when %dec has its top bit set, %cnt is 64 and the shl result
; is poison per the LangRef; presumably acceptable because bit_ceil is
; undefined for such inputs -- confirm.
%cnt = sub i64 64, %lz
%res = shl i64 1, %cnt
; Inputs 0 and 1 bypass the shifted value and yield 1 (cmovb after cmp $2).
%ugt = icmp ugt i64 %x, 1
%sel = select i1 %ugt, i64 %res, i64 1
ret i64 %sel
}
; std::bit_ceil<uint64_t>(x + 1)
;
; 64-bit variant of the IR shape under test:
; result = ((x - 1) <u -2) ? (1 << (64 - ctlz(x))) : 1.
; ctlz is applied to x directly; the guard (x - 1) <u -2 is true for every
; x except 0 and all-ones, i.e. whenever x + 1 is unsigned-greater than 1.
; The argument is marked noundef.
define i64 @bit_ceil_i64_plus1(i64 noundef %x) {
; NOBMI-LABEL: bit_ceil_i64_plus1:
; NOBMI: # %bb.0: # %entry
; NOBMI-NEXT: testq %rdi, %rdi
; NOBMI-NEXT: je .LBB3_1
; NOBMI-NEXT: # %bb.2: # %cond.false
; NOBMI-NEXT: bsrq %rdi, %rcx
; NOBMI-NEXT: xorq $63, %rcx
; NOBMI-NEXT: jmp .LBB3_3
; NOBMI-NEXT: .LBB3_1:
; NOBMI-NEXT: movl $64, %ecx
; NOBMI-NEXT: .LBB3_3: # %cond.end
; NOBMI-NEXT: negb %cl
; NOBMI-NEXT: movl $1, %edx
; NOBMI-NEXT: movl $1, %eax
; NOBMI-NEXT: # kill: def $cl killed $cl killed $rcx
; NOBMI-NEXT: shlq %cl, %rax
; NOBMI-NEXT: decq %rdi
; NOBMI-NEXT: cmpq $-2, %rdi
; NOBMI-NEXT: cmovaeq %rdx, %rax
; NOBMI-NEXT: retq
;
; BMI-LABEL: bit_ceil_i64_plus1:
; BMI: # %bb.0: # %entry
; BMI-NEXT: lzcntq %rdi, %rax
; BMI-NEXT: negb %al
; BMI-NEXT: movl $1, %ecx
; BMI-NEXT: shlxq %rax, %rcx, %rax
; BMI-NEXT: decq %rdi
; BMI-NEXT: cmpq $-2, %rdi
; BMI-NEXT: cmovaeq %rcx, %rax
; BMI-NEXT: retq
entry:
; ctlz is called with its flag operand set to false; the expected output
; without LZCNT tests x for zero and materializes 64 on that path instead
; of executing bsrq.
%ctlz = tail call i64 @llvm.ctlz.i64(i64 %x, i1 false)
; Shift amount is 64 - ctlz; the expected output negates the count (negb)
; instead of subtracting from 64.
; NOTE(review): when x has its top bit set, %cnt is 64 and the shl result is
; poison per the LangRef; presumably acceptable because bit_ceil is
; undefined for such inputs -- confirm.
%cnt = sub i64 64, %ctlz
%shl = shl i64 1, %cnt
; x == 0 and x == all-ones (where x + 1 wraps to 0) fail the unsigned
; compare and select the constant 1.
%dec = add i64 %x, -1
%ult = icmp ult i64 %dec, -2
%sel = select i1 %ult, i64 %shl, i64 1
ret i64 %sel
}
; Count-leading-zeros intrinsics called by the functions in this file. The i1
; operand must be an immediate (immarg); every call in this file passes false.
declare i32 @llvm.ctlz.i32(i32, i1 immarg)
declare i64 @llvm.ctlz.i64(i64, i1 immarg)