blob: f0b09482256fe140d3c98ddae3715f84e7ce5eac [file] [edit]
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-attributes --check-globals all --version 5
; Test the generation of the attribute amdgpu-no-wwm
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1200 -passes=amdgpu-attributor < %s | FileCheck -check-prefixes=CHECK %s
define amdgpu_kernel void @test_no_wwm(i32 %input, ptr addrspace(1) %out) {
; CHECK-LABEL: define amdgpu_kernel void @test_no_wwm(
; CHECK-SAME: i32 [[INPUT:%.*]], ptr addrspace(1) [[OUT:%.*]]) #[[ATTR0:[0-9]+]] {
; CHECK-NEXT: store i32 [[INPUT]], ptr addrspace(1) [[OUT]], align 4
; CHECK-NEXT: ret void
;
store i32 %input, ptr addrspace(1) %out
ret void
}
define amdgpu_kernel void @test_old_wwm(i32 %input, ptr addrspace(1) %out) {
; CHECK-LABEL: define amdgpu_kernel void @test_old_wwm(
; CHECK-SAME: i32 [[INPUT:%.*]], ptr addrspace(1) [[OUT:%.*]]) #[[ATTR1:[0-9]+]] {
; CHECK-NEXT: [[WWM:%.*]] = call i32 @llvm.amdgcn.wwm.i32(i32 [[INPUT]])
; CHECK-NEXT: store i32 [[WWM]], ptr addrspace(1) [[OUT]], align 4
; CHECK-NEXT: ret void
;
%wwm = call i32 @llvm.amdgcn.wwm.i32(i32 %input)
store i32 %wwm, ptr addrspace(1) %out
ret void
}
define amdgpu_kernel void @test_strict_wwm(i32 %input, ptr addrspace(1) %out) {
; CHECK-LABEL: define amdgpu_kernel void @test_strict_wwm(
; CHECK-SAME: i32 [[INPUT:%.*]], ptr addrspace(1) [[OUT:%.*]]) #[[ATTR1]] {
; CHECK-NEXT: [[WWM:%.*]] = call i32 @llvm.amdgcn.strict.wwm.i32(i32 [[INPUT]])
; CHECK-NEXT: store i32 [[WWM]], ptr addrspace(1) [[OUT]], align 4
; CHECK-NEXT: ret void
;
%wwm = call i32 @llvm.amdgcn.strict.wwm.i32(i32 %input)
store i32 %wwm, ptr addrspace(1) %out
ret void
}
define i32 @test_calls_wwm(i32 %input) {
; CHECK-LABEL: define i32 @test_calls_wwm(
; CHECK-SAME: i32 [[INPUT:%.*]]) #[[ATTR1]] {
; CHECK-NEXT: [[WWM:%.*]] = call i32 @llvm.amdgcn.wwm.i32(i32 [[INPUT]])
; CHECK-NEXT: ret i32 [[WWM]]
;
%wwm = call i32 @llvm.amdgcn.wwm.i32(i32 %input)
ret i32 %wwm
}
define amdgpu_kernel void @test_nested(i32 %input, ptr addrspace(1) %out) {
; CHECK-LABEL: define amdgpu_kernel void @test_nested(
; CHECK-SAME: i32 [[INPUT:%.*]], ptr addrspace(1) [[OUT:%.*]]) #[[ATTR1]] {
; CHECK-NEXT: [[RES:%.*]] = call i32 @test_calls_wwm(i32 [[INPUT]])
; CHECK-NEXT: store i32 [[RES]], ptr addrspace(1) [[OUT]], align 4
; CHECK-NEXT: ret void
;
%res = call i32 @test_calls_wwm(i32 %input)
store i32 %res, ptr addrspace(1) %out
ret void
}
;.
; CHECK: attributes #[[ATTR0]] = { "amdgpu-no-cluster-id-x" "amdgpu-no-cluster-id-y" "amdgpu-no-cluster-id-z" "amdgpu-no-completion-action" "amdgpu-no-default-queue" "amdgpu-no-dispatch-id" "amdgpu-no-dispatch-ptr" "amdgpu-no-flat-scratch-init" "amdgpu-no-heap-ptr" "amdgpu-no-hostcall-ptr" "amdgpu-no-implicitarg-ptr" "amdgpu-no-lds-kernel-id" "amdgpu-no-multigrid-sync-arg" "amdgpu-no-queue-ptr" "amdgpu-no-workgroup-id-x" "amdgpu-no-workgroup-id-y" "amdgpu-no-workgroup-id-z" "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "amdgpu-no-wwm" "target-cpu"="gfx1200" }
; CHECK: attributes #[[ATTR1]] = { "amdgpu-no-cluster-id-x" "amdgpu-no-cluster-id-y" "amdgpu-no-cluster-id-z" "amdgpu-no-completion-action" "amdgpu-no-default-queue" "amdgpu-no-dispatch-id" "amdgpu-no-dispatch-ptr" "amdgpu-no-flat-scratch-init" "amdgpu-no-heap-ptr" "amdgpu-no-hostcall-ptr" "amdgpu-no-implicitarg-ptr" "amdgpu-no-lds-kernel-id" "amdgpu-no-multigrid-sync-arg" "amdgpu-no-queue-ptr" "amdgpu-no-workgroup-id-x" "amdgpu-no-workgroup-id-y" "amdgpu-no-workgroup-id-z" "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "target-cpu"="gfx1200" }
; CHECK: attributes #[[ATTR2:[0-9]+]] = { convergent nocallback nofree nounwind speculatable willreturn memory(none) "target-cpu"="gfx1200" }
;.