blob: 8d6cee48b416c46e627e473e62188dca61aaf11d [file] [edit]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 6
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-promote-alloca %s | FileCheck %s
define amdgpu_kernel void @kernel(ptr %p) {
; CHECK-LABEL: define amdgpu_kernel void @kernel(
; CHECK-SAME: ptr [[P:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: [[ASCAST:%.*]] = addrspacecast ptr [[P]] to ptr addrspace(1)
; CHECK-NEXT: [[ALLOCA:%.*]] = freeze <14 x i32> poison
; CHECK-NEXT: [[LOAD:%.*]] = load i32, ptr addrspace(1) [[ASCAST]], align 4
; CHECK-NEXT: [[CMP:%.*]] = icmp eq i32 [[LOAD]], 0
; CHECK-NEXT: br i1 [[CMP]], label %[[BB_1:.*]], label %[[BB_2:.*]]
; CHECK: [[BB_2]]:
; CHECK-NEXT: br label %[[BB_1]]
; CHECK: [[BB_1]]:
; CHECK-NEXT: [[PROMOTEALLOCA:%.*]] = phi <14 x i32> [ [[ALLOCA]], %[[BB_2]] ], [ [[ALLOCA]], %[[ENTRY]] ]
; CHECK-NEXT: [[TMP0:%.*]] = insertelement <14 x i32> [[PROMOTEALLOCA]], i32 0, i32 0
; CHECK-NEXT: ret void
;
entry:
%ascast = addrspacecast ptr %p to ptr addrspace(1)
%alloca = alloca [14 x i32], addrspace(5)
%load = load i32, ptr addrspace(1) %ascast
%cmp = icmp eq i32 %load, 0
br i1 %cmp, label %bb.1, label %bb.2
bb.2:
store i32 poison, ptr addrspace(5) %alloca
br label %bb.1
bb.1:
store i32 0, ptr addrspace(5) %alloca
ret void
uselistorder ptr addrspace(5) %alloca, { 1, 0 }
}