# RUN: llc -mtriple=amdgcn -verify-machineinstrs -run-pass si-insert-waitcnts -o - %s | FileCheck %s

# Test for the si-insert-waitcnts pass: the MIR function below issues an
# EXP_DONE that reads $vgpr0-$vgpr3 and then immediately redefines those same
# registers with V_MOV_B32. The FileCheck directives further down require an
# S_WAITCNT directly after the EXP_DONE, ahead of the four V_MOV_B32 writes.
--- |
  ; IR counterpart of the MIR function. The memory operands in the MIR body
  ; refer to `ptr addrspace(1) undef`, and the entry block is %ir-block.2
  ; because the first two arguments are unnamed (%0 and %1).
  define amdgpu_ps <4 x float> @exp_done_waitcnt(<4 x i32> inreg, <4 x
  i32> inreg, i32 inreg %w, float %v) #0 {
    %a = load volatile float, ptr addrspace(1) undef
    %b = load volatile float, ptr addrspace(1) undef
    %c = load volatile float, ptr addrspace(1) undef
    %d = load volatile float, ptr addrspace(1) undef
    call void @llvm.amdgcn.exp.f32(i32 15, i32 1, float %a, float %b, float %c, float %d, i1 true, i1 false)
    ret <4 x float> <float 5.000000e-01, float 1.000000e+00, float 2.000000e+00, float 4.000000e+00>
  }

  declare void @llvm.amdgcn.exp.f32(i32, i32, float, float, float, float, i1, i1) #0

  attributes #0 = { nounwind }

...
---

# Expected output: the wait must be the very next instruction after EXP_DONE
# (hence the -NEXT form), and all four VGPR redefinitions must follow it.
# NOTE(review): 3855 is 0xF0F; presumably this encodes expcnt(0) with the
# other counters left at their maximum - confirm against the target encoding.
# CHECK-LABEL: name: exp_done_waitcnt{{$}}
# CHECK: EXP_DONE
# CHECK-NEXT: S_WAITCNT 3855
# CHECK: $vgpr0 = V_MOV_B32
# CHECK: $vgpr1 = V_MOV_B32
# CHECK: $vgpr2 = V_MOV_B32
# CHECK: $vgpr3 = V_MOV_B32
name:            exp_done_waitcnt
alignment:       1
exposesReturnsTwice: false
legalized:       false
regBankSelected: false
selected:        false
tracksRegLiveness: true
frameInfo:
  isFrameAddressTaken: false
  isReturnAddressTaken: false
  hasStackMap:     false
  hasPatchPoint:   false
  stackSize:       0
  offsetAdjustment: 0
  maxAlignment:    0
  adjustsStack:    false
  hasCalls:        false
  maxCallFrameSize: 0
  hasOpaqueSPAdjustment: false
  hasVAStart:      false
  hasMustTailInVarArgFunc: false
body:             |
  bb.0 (%ir-block.2):
    ; Fill in the upper two dwords of the buffer resource descriptor.
    $sgpr3 = S_MOV_B32 61440
    $sgpr2 = S_MOV_B32 -1
    ; Four volatile loads produce the values that are exported below.
    $vgpr0 = BUFFER_LOAD_DWORD_OFFSET $sgpr0_sgpr1_sgpr2_sgpr3, 0, 0, 0, 0, implicit $exec :: (volatile load (s32) from `ptr addrspace(1) undef`)
    $vgpr1 = BUFFER_LOAD_DWORD_OFFSET $sgpr0_sgpr1_sgpr2_sgpr3, 0, 0, 0, 0, implicit $exec :: (volatile load (s32) from `ptr addrspace(1) undef`)
    $vgpr2 = BUFFER_LOAD_DWORD_OFFSET $sgpr0_sgpr1_sgpr2_sgpr3, 0, 0, 0, 0, implicit $exec :: (volatile load (s32) from `ptr addrspace(1) undef`)
    $vgpr3 = BUFFER_LOAD_DWORD_OFFSET killed $sgpr0_sgpr1_sgpr2_sgpr3, 0, 0, 0, 0, implicit $exec :: (volatile load (s32) from `ptr addrspace(1) undef`)
    ; The export reads $vgpr0-$vgpr3; the pass under test is expected to place
    ; its wait between this instruction and the redefinitions that follow.
    EXP_DONE 0, killed $vgpr0, killed $vgpr1, killed $vgpr2, killed $vgpr3, -1, -1, 15, implicit $exec
    ; Return value <0.5, 1.0, 2.0, 4.0>, materialized as f32 bit patterns into
    ; the same registers the export has just read.
    $vgpr0 = V_MOV_B32_e32 1056964608, implicit $exec
    $vgpr1 = V_MOV_B32_e32 1065353216, implicit $exec
    $vgpr2 = V_MOV_B32_e32 1073741824, implicit $exec
    $vgpr3 = V_MOV_B32_e32 1082130432, implicit $exec
    SI_RETURN_TO_EPILOG killed $vgpr0, killed $vgpr1, killed $vgpr2, killed $vgpr3

...