| ; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -O1 < %s | FileCheck -check-prefix=OPT %s |
| ; RUN: llc -march=amdgcn -mcpu=gfx1010 -verify-machineinstrs < %s | FileCheck -check-prefix=LLC %s |
| |
| ; OPT: declare void @foo4() local_unnamed_addr #0 |
| ; OPT: define internal fastcc void @foo3.2() unnamed_addr #1 |
| ; OPT: define void @foo2() local_unnamed_addr #1 |
| ; OPT: define internal fastcc void @foo1.1() unnamed_addr #1 |
| ; OPT: define amdgpu_kernel void @kernel1() local_unnamed_addr #2 |
| ; OPT: define amdgpu_kernel void @kernel2() local_unnamed_addr #3 |
| ; OPT: define amdgpu_kernel void @kernel3() local_unnamed_addr #3 |
| ; OPT: define void @foo1() local_unnamed_addr #4 |
| ; OPT: define void @foo3() local_unnamed_addr #4 |
| ; OPT: attributes #0 = { {{.*}} "target-features"="+wavefrontsize64" } |
| ; OPT: attributes #1 = { {{.*}} "target-features"="{{.*}},-wavefrontsize16,-wavefrontsize32,+wavefrontsize64{{.*}}" } |
| ; OPT: attributes #2 = { {{.*}} "target-features"="+wavefrontsize32" } |
| ; OPT: attributes #3 = { {{.*}} "target-features"="+wavefrontsize64" } |
| ; OPT: attributes #4 = { {{.*}} "target-features"="{{.*}},-wavefrontsize16,+wavefrontsize32,-wavefrontsize64{{.*}}" } |
| |
| ; LLC: foo3: |
| ; LLC: sample asm |
| ; LLC: foo2: |
| ; LLC: sample asm |
| ; LLC: foo1: |
| ; LLC: foo4@gotpcrel32@lo+4 |
| ; LLC: foo4@gotpcrel32@hi+4 |
| ; LLC: foo3@gotpcrel32@lo+4 |
| ; LLC: foo3@gotpcrel32@hi+4 |
| ; LLC: foo2@gotpcrel32@lo+4 |
| ; LLC: foo2@gotpcrel32@hi+4 |
| ; LLC: foo1@gotpcrel32@lo+4 |
| ; LLC: foo1@gotpcrel32@hi+4 |
| ; LLC: kernel1: |
| ; LLC: foo1@gotpcrel32@lo+4 |
| ; LLC: foo1@gotpcrel32@hi+4 |
| ; LLC: kernel2: |
| ; LLC: foo2@gotpcrel32@lo+4 |
| ; LLC: foo2@gotpcrel32@hi+4 |
| ; LLC: kernel3: |
| ; LLC: foo1@gotpcrel32@lo+4 |
| ; LLC: foo1@gotpcrel32@hi+4 |
| |
| declare void @foo4() #1 |
| |
| define void @foo3() #1 { |
| entry: |
| call void asm sideeffect "; sample asm", ""() |
| ret void |
| } |
| |
| define void @foo2() #1 { |
| entry: |
| call void asm sideeffect "; sample asm", ""() |
| ret void |
| } |
| |
| define void @foo1() #1 { |
| entry: |
| tail call void @foo4() |
| tail call void @foo3() |
| tail call void @foo2() |
| tail call void @foo2() |
| tail call void @foo1() |
| ret void |
| } |
| |
| define amdgpu_kernel void @kernel1() #0 { |
| entry: |
| tail call void @foo1() |
| ret void |
| } |
| |
| define amdgpu_kernel void @kernel2() #2 { |
| entry: |
| tail call void @foo2() |
| ret void |
| } |
| |
| define amdgpu_kernel void @kernel3() #3 { |
| entry: |
| tail call void @foo1() |
| ret void |
| } |
| |
| attributes #0 = { nounwind "target-features"="+wavefrontsize32" } |
| attributes #1 = { noinline nounwind "target-features"="+wavefrontsize64" } |
| attributes #2 = { nounwind "target-features"="+wavefrontsize64" } |
| attributes #3 = { nounwind "target-features"="+wavefrontsize64" } |