| # RUN: llc -mtriple=amdgcn-amd-amdhsa -run-pass=none -verify-machineinstrs %s -o - | FileCheck -check-prefixes=FULL,ALL %s |
| # RUN: llc -mtriple=amdgcn-amd-amdhsa -run-pass=none -simplify-mir -verify-machineinstrs %s -o - | FileCheck -check-prefixes=SIMPLE,ALL %s |
| |
| |
| --- |
| # kernel0 sets most machineFunctionInfo fields explicitly, including an |
| # argumentInfo list. The checks for the full output expect those values back |
| # plus the mode and highBitsOf32BitAddress entries, which the input does not |
| # mention. The checks for the -simplify-mir output expect the same list without |
| # noSignedZerosFPMath, mode and highBitsOf32BitAddress. |
| # ALL-LABEL: name: kernel0 |
| # FULL: machineFunctionInfo: |
| # FULL-NEXT: explicitKernArgSize: 128 |
| # FULL-NEXT: maxKernArgAlign: 64 |
| # FULL-NEXT: ldsSize: 2048 |
| # FULL-NEXT: isEntryFunction: true |
| # FULL-NEXT: noSignedZerosFPMath: false |
| # FULL-NEXT: memoryBound: true |
| # FULL-NEXT: waveLimiter: true |
| # FULL-NEXT: scratchRSrcReg: '$sgpr8_sgpr9_sgpr10_sgpr11' |
| # FULL-NEXT: scratchWaveOffsetReg: '$sgpr12' |
| # FULL-NEXT: frameOffsetReg: '$sgpr12' |
| # FULL-NEXT: stackPtrOffsetReg: '$sgpr13' |
| # FULL-NEXT: argumentInfo: |
| # FULL-NEXT: privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
| # FULL-NEXT: kernargSegmentPtr: { reg: '$sgpr4_sgpr5' } |
| # FULL-NEXT: workGroupIDX: { reg: '$sgpr6' } |
| # FULL-NEXT: privateSegmentWaveByteOffset: { reg: '$sgpr7' } |
| # FULL-NEXT: workItemIDX: { reg: '$vgpr0' } |
| # FULL-NEXT: mode: |
| # FULL-NEXT: ieee: true |
| # FULL-NEXT: dx10-clamp: true |
| # FULL-NEXT: highBitsOf32BitAddress: 0 |
| # FULL-NEXT: body: |
| |
| # SIMPLE: machineFunctionInfo: |
| # SIMPLE-NEXT: explicitKernArgSize: 128 |
| # SIMPLE-NEXT: maxKernArgAlign: 64 |
| # SIMPLE-NEXT: ldsSize: 2048 |
| # SIMPLE-NEXT: isEntryFunction: true |
| # SIMPLE-NEXT: memoryBound: true |
| # SIMPLE-NEXT: waveLimiter: true |
| # SIMPLE-NEXT: scratchRSrcReg: '$sgpr8_sgpr9_sgpr10_sgpr11' |
| # SIMPLE-NEXT: scratchWaveOffsetReg: '$sgpr12' |
| # SIMPLE-NEXT: frameOffsetReg: '$sgpr12' |
| # SIMPLE-NEXT: stackPtrOffsetReg: '$sgpr13' |
| # SIMPLE-NEXT: argumentInfo: |
| # SIMPLE-NEXT: privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
| # SIMPLE-NEXT: kernargSegmentPtr: { reg: '$sgpr4_sgpr5' } |
| # SIMPLE-NEXT: workGroupIDX: { reg: '$sgpr6' } |
| # SIMPLE-NEXT: privateSegmentWaveByteOffset: { reg: '$sgpr7' } |
| # SIMPLE-NEXT: workItemIDX: { reg: '$vgpr0' } |
| # SIMPLE-NEXT: body: |
| name: kernel0 |
| machineFunctionInfo: |
| explicitKernArgSize: 128 |
| maxKernArgAlign: 64 |
| ldsSize: 2048 |
| isEntryFunction: true |
| noSignedZerosFPMath: false |
| memoryBound: true |
| waveLimiter: true |
| scratchRSrcReg: '$sgpr8_sgpr9_sgpr10_sgpr11' |
| scratchWaveOffsetReg: '$sgpr12' |
| frameOffsetReg: '$sgpr12' |
| stackPtrOffsetReg: '$sgpr13' |
| argumentInfo: |
| privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
| kernargSegmentPtr: { reg: '$sgpr4_sgpr5' } |
| workGroupIDX: { reg: '$sgpr6' } |
| privateSegmentWaveByteOffset: { reg: '$sgpr7' } |
| workItemIDX: { reg: '$vgpr0' } |
| body: | |
| bb.0: |
| S_ENDPGM 0 |
| |
| ... |
| |
| # FIXME: With -simplify-mir, the machineFunctionInfo section should not be printed at all when the input does not specify one. |
| --- |
| # no_mfi: the input has no machineFunctionInfo key at all. The checks below pin |
| # the values that are expected to be printed in that case, both without and |
| # with -simplify-mir. |
| # ALL-LABEL: name: no_mfi |
| # FULL: machineFunctionInfo: |
| # FULL-NEXT: explicitKernArgSize: 0 |
| # FULL-NEXT: maxKernArgAlign: 1 |
| # FULL-NEXT: ldsSize: 0 |
| # FULL-NEXT: isEntryFunction: false |
| # FULL-NEXT: noSignedZerosFPMath: false |
| # FULL-NEXT: memoryBound: false |
| # FULL-NEXT: waveLimiter: false |
| # FULL-NEXT: scratchRSrcReg: '$private_rsrc_reg' |
| # FULL-NEXT: scratchWaveOffsetReg: '$scratch_wave_offset_reg' |
| # FULL-NEXT: frameOffsetReg: '$fp_reg' |
| # FULL-NEXT: stackPtrOffsetReg: '$sp_reg' |
| # FULL-NEXT: argumentInfo: |
| # FULL-NEXT: privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
| # FULL-NEXT: privateSegmentWaveByteOffset: { reg: '$sgpr33' } |
| # FULL-NEXT: mode: |
| # FULL-NEXT: ieee: true |
| # FULL-NEXT: dx10-clamp: true |
| # FULL-NEXT: highBitsOf32BitAddress: 0 |
| # FULL-NEXT: body: |
| |
| # SIMPLE: machineFunctionInfo: |
| # SIMPLE-NEXT: maxKernArgAlign: 1 |
| # SIMPLE-NEXT: argumentInfo: |
| # SIMPLE-NEXT: privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
| # SIMPLE-NEXT: privateSegmentWaveByteOffset: { reg: '$sgpr33' } |
| # SIMPLE-NEXT: body: |
| |
| name: no_mfi |
| body: | |
| bb.0: |
| S_ENDPGM 0 |
| |
| ... |
| |
| --- |
| # empty_mfi: the input has a machineFunctionInfo key with nothing under it. |
| # The expected output is the same as for the no_mfi function in this file. |
| # ALL-LABEL: name: empty_mfi |
| # FULL: machineFunctionInfo: |
| # FULL-NEXT: explicitKernArgSize: 0 |
| # FULL-NEXT: maxKernArgAlign: 1 |
| # FULL-NEXT: ldsSize: 0 |
| # FULL-NEXT: isEntryFunction: false |
| # FULL-NEXT: noSignedZerosFPMath: false |
| # FULL-NEXT: memoryBound: false |
| # FULL-NEXT: waveLimiter: false |
| # FULL-NEXT: scratchRSrcReg: '$private_rsrc_reg' |
| # FULL-NEXT: scratchWaveOffsetReg: '$scratch_wave_offset_reg' |
| # FULL-NEXT: frameOffsetReg: '$fp_reg' |
| # FULL-NEXT: stackPtrOffsetReg: '$sp_reg' |
| # FULL-NEXT: argumentInfo: |
| # FULL-NEXT: privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
| # FULL-NEXT: privateSegmentWaveByteOffset: { reg: '$sgpr33' } |
| # FULL-NEXT: mode: |
| # FULL-NEXT: ieee: true |
| # FULL-NEXT: dx10-clamp: true |
| # FULL-NEXT: highBitsOf32BitAddress: 0 |
| # FULL-NEXT: body: |
| |
| # SIMPLE: machineFunctionInfo: |
| # SIMPLE-NEXT: maxKernArgAlign: 1 |
| # SIMPLE-NEXT: argumentInfo: |
| # SIMPLE-NEXT: privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
| # SIMPLE-NEXT: privateSegmentWaveByteOffset: { reg: '$sgpr33' } |
| # SIMPLE-NEXT: body: |
| |
| name: empty_mfi |
| machineFunctionInfo: |
| body: | |
| bb.0: |
| S_ENDPGM 0 |
| |
| ... |
| |
| --- |
| # empty_mfi_entry_func: the only field given is isEntryFunction: true. The |
| # expected output matches the empty_mfi function in this file except that |
| # isEntryFunction is true, and the -simplify-mir output is expected to print it. |
| # ALL-LABEL: name: empty_mfi_entry_func |
| # FULL: machineFunctionInfo: |
| # FULL-NEXT: explicitKernArgSize: 0 |
| # FULL-NEXT: maxKernArgAlign: 1 |
| # FULL-NEXT: ldsSize: 0 |
| # FULL-NEXT: isEntryFunction: true |
| # FULL-NEXT: noSignedZerosFPMath: false |
| # FULL-NEXT: memoryBound: false |
| # FULL-NEXT: waveLimiter: false |
| # FULL-NEXT: scratchRSrcReg: '$private_rsrc_reg' |
| # FULL-NEXT: scratchWaveOffsetReg: '$scratch_wave_offset_reg' |
| # FULL-NEXT: frameOffsetReg: '$fp_reg' |
| # FULL-NEXT: stackPtrOffsetReg: '$sp_reg' |
| # FULL-NEXT: argumentInfo: |
| # FULL-NEXT: privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
| # FULL-NEXT: privateSegmentWaveByteOffset: { reg: '$sgpr33' } |
| # FULL-NEXT: mode: |
| # FULL-NEXT: ieee: true |
| # FULL-NEXT: dx10-clamp: true |
| # FULL-NEXT: highBitsOf32BitAddress: 0 |
| # FULL-NEXT: body: |
| |
| # SIMPLE: machineFunctionInfo: |
| # SIMPLE-NEXT: maxKernArgAlign: 1 |
| # SIMPLE-NEXT: isEntryFunction: true |
| # SIMPLE-NEXT: argumentInfo: |
| # SIMPLE-NEXT: privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
| # SIMPLE-NEXT: privateSegmentWaveByteOffset: { reg: '$sgpr33' } |
| # SIMPLE-NEXT: body: |
| |
| name: empty_mfi_entry_func |
| machineFunctionInfo: |
| isEntryFunction: true |
| body: | |
| bb.0: |
| S_ENDPGM 0 |
| |
| ... |
| |
| --- |
| # default_regs_mfi: the input names only scratchRSrcReg and gives it the value |
| # '$private_rsrc_reg'. The full output is expected to list all four special |
| # registers with the values checked below; the -simplify-mir output is expected |
| # to print none of the four. |
| # ALL-LABEL: name: default_regs_mfi |
| |
| # FULL: scratchRSrcReg: '$private_rsrc_reg' |
| # FULL-NEXT: scratchWaveOffsetReg: '$scratch_wave_offset_reg' |
| # FULL-NEXT: frameOffsetReg: '$fp_reg' |
| # FULL-NEXT: stackPtrOffsetReg: '$sp_reg' |
| |
| # SIMPLE-NOT: scratchRSrcReg |
| # SIMPLE-NOT: scratchWaveOffsetReg |
| # SIMPLE-NOT: frameOffsetReg |
| # SIMPLE-NOT: stackPtrOffsetReg |
| name: default_regs_mfi |
| machineFunctionInfo: |
| scratchRSrcReg: '$private_rsrc_reg' |
| |
| body: | |
| bb.0: |
| S_ENDPGM 0 |
| |
| ... |
| |
| --- |
| # fake_stack_arginfo: argumentInfo gives flatScratchInit as a stack offset and |
| # workItemIDY as a register with a hexadecimal mask. The output is expected to |
| # print the mask in decimal (0xff00 == 65280) and to also list |
| # privateSegmentBuffer and privateSegmentWaveByteOffset, which the input does |
| # not mention. |
| # ALL-LABEL: name: fake_stack_arginfo |
| |
| # FULL: argumentInfo: |
| # FULL-NEXT: privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
| # FULL-NEXT: flatScratchInit: { offset: 4 } |
| # FULL-NEXT: privateSegmentWaveByteOffset: { reg: '$sgpr33' } |
| # FULL-NEXT: workItemIDY: { reg: '$vgpr0', mask: 65280 } |
| |
| # SIMPLE: argumentInfo: |
| # SIMPLE-NEXT: privateSegmentBuffer: { reg: '$sgpr0_sgpr1_sgpr2_sgpr3' } |
| # SIMPLE-NEXT: flatScratchInit: { offset: 4 } |
| # SIMPLE-NEXT: privateSegmentWaveByteOffset: { reg: '$sgpr33' } |
| # SIMPLE-NEXT: workItemIDY: { reg: '$vgpr0', mask: 65280 } |
| name: fake_stack_arginfo |
| machineFunctionInfo: |
| argumentInfo: |
| flatScratchInit: { offset: 4 } |
| workItemIDY: { reg: '$vgpr0' , mask: 0xff00 } |
| |
| body: | |
| bb.0: |
| S_ENDPGM 0 |
| |
| ... |
| |
| --- |
| # parse_mode: the mode section sets ieee and dx10-clamp to false. Both RUN |
| # lines share the checks below, so both outputs are expected to print the |
| # two false values. |
| # ALL-LABEL: name: parse_mode |
| # ALL: mode: |
| # ALL-NEXT: ieee: false |
| # ALL-NEXT: dx10-clamp: false |
| name: parse_mode |
| machineFunctionInfo: |
| mode: |
| ieee: false |
| dx10-clamp: false |
| |
| body: | |
| bb.0: |
| S_ENDPGM 0 |
| |
| ... |