| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5 |
| ; RUN: opt -S -passes=amdgpu-unify-divergent-exit-nodes -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a %s -o - | FileCheck %s |
| |
| ; External functions used as musttail call targets by the functions in this |
| ; file: @foo returns void, @bar returns i1. Both take a single ptr argument. |
| declare void @foo(ptr) |
| declare i1 @bar(ptr) |
| |
| ; Input: a void function that branches on an i1 loaded from %p to two returning |
| ; blocks. %bb.0 (taken when %load is true) returns right after a musttail call |
| ; to @foo; %bb.1 returns directly. |
| ; The assertions below expect both blocks to keep their own `ret void`, with the |
| ; musttail call still immediately followed by its return. |
| ; NOTE(review): presumably this guards against the pass merging the two returns |
| ; into one exit block, which would separate the musttail call from its ret -- |
| ; confirm against the pass implementation. |
| define void @musttail_call_without_return_value(ptr %p) { |
| ; CHECK-LABEL: define void @musttail_call_without_return_value( |
| ; CHECK-SAME: ptr [[P:%.*]]) #[[ATTR0:[0-9]+]] { |
| ; CHECK-NEXT: [[ENTRY:.*:]] |
| ; CHECK-NEXT: [[LOAD:%.*]] = load i1, ptr [[P]], align 1 |
| ; CHECK-NEXT: br i1 [[LOAD]], label %[[BB_0:.*]], label %[[BB_1:.*]] |
| ; CHECK: [[BB_0]]: |
| ; CHECK-NEXT: musttail call void @foo(ptr [[P]]) |
| ; CHECK-NEXT: ret void |
| ; CHECK: [[BB_1]]: |
| ; CHECK-NEXT: ret void |
| ; |
| entry: |
| %load = load i1, ptr %p, align 1 |
| br i1 %load, label %bb.0, label %bb.1 |
| |
| bb.0: |
| musttail call void @foo(ptr %p) |
| ret void |
| |
| bb.1: |
| ret void |
| } |
| |
| ; Input: an i1 function that branches on an i1 loaded from %p to two returning |
| ; blocks. %bb.0 (taken when %load is true) returns the result of a musttail call |
| ; to @bar; %bb.1 (taken when %load is false) returns %load itself. |
| ; The assertions below expect the two returns to stay separate: the musttail |
| ; call result is returned by the instruction right after the call, and %bb.1 |
| ; still returns the loaded value. |
| ; NOTE(review): presumably this guards against the pass funnelling both return |
| ; values through a single exit block, which would put other instructions between |
| ; the musttail call and its ret -- confirm against the pass implementation. |
| define i1 @musttail_call_with_return_value(ptr %p) { |
| ; CHECK-LABEL: define i1 @musttail_call_with_return_value( |
| ; CHECK-SAME: ptr [[P:%.*]]) #[[ATTR0]] { |
| ; CHECK-NEXT: [[ENTRY:.*:]] |
| ; CHECK-NEXT: [[LOAD:%.*]] = load i1, ptr [[P]], align 1 |
| ; CHECK-NEXT: br i1 [[LOAD]], label %[[BB_0:.*]], label %[[BB_1:.*]] |
| ; CHECK: [[BB_0]]: |
| ; CHECK-NEXT: [[RET:%.*]] = musttail call i1 @bar(ptr [[P]]) |
| ; CHECK-NEXT: ret i1 [[RET]] |
| ; CHECK: [[BB_1]]: |
| ; CHECK-NEXT: ret i1 [[LOAD]] |
| ; |
| entry: |
| %load = load i1, ptr %p, align 1 |
| br i1 %load, label %bb.0, label %bb.1 |
| |
| bb.0: |
| %ret = musttail call i1 @bar(ptr %p) |
| ret i1 %ret |
| |
| bb.1: |
| ret i1 %load |
| } |