blob: bad23c3ae67fa82448c6b320288d7c8f0704f13e [file] [edit]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 6
; RUN: llc -mtriple=riscv64 -mattr=+m -O2 < %s | FileCheck %s -check-prefix=RV64
; RUN: llc -mtriple=riscv32 -mattr=+m -O2 < %s | FileCheck %s -check-prefix=RV32
; Test that very large outgoing call frames in functions with variable-sized
; objects get proper stack probing. The outgoing args are large enough to force
; the PROBED_STACKALLOC path, which must be expanded in a non-entry block.
define void @f(i64 %n) #0 {
; RV64-LABEL: f:
; RV64: # %bb.0: # %entry
; RV64-NEXT: addi sp, sp, -16
; RV64-NEXT: .cfi_def_cfa_offset 16
; RV64-NEXT: sd zero, 0(sp)
; RV64-NEXT: sd ra, 8(sp) # 8-byte Folded Spill
; RV64-NEXT: sd s0, 0(sp) # 8-byte Folded Spill
; RV64-NEXT: .cfi_offset ra, -8
; RV64-NEXT: .cfi_offset s0, -16
; RV64-NEXT: addi s0, sp, 16
; RV64-NEXT: .cfi_def_cfa s0, 0
; RV64-NEXT: slli a0, a0, 2
; RV64-NEXT: addi a0, a0, 15
; RV64-NEXT: andi a0, a0, -16
; RV64-NEXT: sub a0, sp, a0
; RV64-NEXT: lui a1, 1
; RV64-NEXT: .LBB0_1: # %entry
; RV64-NEXT: # =>This Inner Loop Header: Depth=1
; RV64-NEXT: sub sp, sp, a1
; RV64-NEXT: sd zero, 0(sp)
; RV64-NEXT: bltu a0, sp, .LBB0_1
; RV64-NEXT: # %bb.2: # %entry
; RV64-NEXT: mv sp, a0
; RV64-NEXT: lui a1, 5
; RV64-NEXT: sub t1, sp, a1
; RV64-NEXT: lui t2, 1
; RV64-NEXT: .LBB0_3: # %entry
; RV64-NEXT: # =>This Inner Loop Header: Depth=1
; RV64-NEXT: sub sp, sp, t2
; RV64-NEXT: sd zero, 0(sp)
; RV64-NEXT: bne sp, t1, .LBB0_3
; RV64-NEXT: # %bb.4: # %entry
; RV64-NEXT: addi sp, sp, -2048
; RV64-NEXT: addi sp, sp, -1424
; RV64-NEXT: sd zero, 0(sp)
; RV64-NEXT: call g
; RV64-NEXT: lui a0, 6
; RV64-NEXT: addi a0, a0, -624
; RV64-NEXT: add sp, sp, a0
; RV64-NEXT: addi sp, s0, -16
; RV64-NEXT: .cfi_def_cfa sp, 16
; RV64-NEXT: ld ra, 8(sp) # 8-byte Folded Reload
; RV64-NEXT: ld s0, 0(sp) # 8-byte Folded Reload
; RV64-NEXT: .cfi_restore ra
; RV64-NEXT: .cfi_restore s0
; RV64-NEXT: addi sp, sp, 16
; RV64-NEXT: .cfi_def_cfa_offset 0
; RV64-NEXT: ret
;
; RV32-LABEL: f:
; RV32: # %bb.0: # %entry
; RV32-NEXT: addi sp, sp, -16
; RV32-NEXT: .cfi_def_cfa_offset 16
; RV32-NEXT: sw zero, 0(sp)
; RV32-NEXT: sw ra, 12(sp) # 4-byte Folded Spill
; RV32-NEXT: sw s0, 8(sp) # 4-byte Folded Spill
; RV32-NEXT: .cfi_offset ra, -4
; RV32-NEXT: .cfi_offset s0, -8
; RV32-NEXT: addi s0, sp, 16
; RV32-NEXT: .cfi_def_cfa s0, 0
; RV32-NEXT: slli a0, a0, 2
; RV32-NEXT: addi a0, a0, 15
; RV32-NEXT: andi a0, a0, -16
; RV32-NEXT: sub a0, sp, a0
; RV32-NEXT: lui a1, 1
; RV32-NEXT: .LBB0_1: # %entry
; RV32-NEXT: # =>This Inner Loop Header: Depth=1
; RV32-NEXT: sub sp, sp, a1
; RV32-NEXT: sw zero, 0(sp)
; RV32-NEXT: bltu a0, sp, .LBB0_1
; RV32-NEXT: # %bb.2: # %entry
; RV32-NEXT: mv sp, a0
; RV32-NEXT: lui a1, 5
; RV32-NEXT: sub t1, sp, a1
; RV32-NEXT: lui t2, 1
; RV32-NEXT: .LBB0_3: # %entry
; RV32-NEXT: # =>This Inner Loop Header: Depth=1
; RV32-NEXT: sub sp, sp, t2
; RV32-NEXT: sw zero, 0(sp)
; RV32-NEXT: bne sp, t1, .LBB0_3
; RV32-NEXT: # %bb.4: # %entry
; RV32-NEXT: addi sp, sp, -2048
; RV32-NEXT: addi sp, sp, -1456
; RV32-NEXT: sw zero, 0(sp)
; RV32-NEXT: call g
; RV32-NEXT: lui a0, 6
; RV32-NEXT: addi a0, a0, -592
; RV32-NEXT: add sp, sp, a0
; RV32-NEXT: addi sp, s0, -16
; RV32-NEXT: .cfi_def_cfa sp, 16
; RV32-NEXT: lw ra, 12(sp) # 4-byte Folded Reload
; RV32-NEXT: lw s0, 8(sp) # 4-byte Folded Reload
; RV32-NEXT: .cfi_restore ra
; RV32-NEXT: .cfi_restore s0
; RV32-NEXT: addi sp, sp, 16
; RV32-NEXT: .cfi_def_cfa_offset 0
; RV32-NEXT: ret
entry:
%v = alloca i32, i64 %n
call void @g(ptr %v, [3000 x i64] poison)
ret void
}
declare void @g(ptr, [3000 x i64])
attributes #0 = { "probe-stack"="inline-asm" }