blob: f41739ac6c169ecd6b70a8ebbc3f57abb4edcfb8 [file] [log] [blame] [edit]
//==- AMDGPUArgumentrUsageInfo.h - Function Arg Usage Info -------*- C++ -*-==//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUARGUMENTUSAGEINFO_H
#define LLVM_LIB_TARGET_AMDGPU_AMDGPUARGUMENTUSAGEINFO_H
#include "MCTargetDesc/AMDGPUMCTargetDesc.h"
#include "llvm/ADT/DenseMap.h"
#include "llvm/CodeGen/Register.h"
#include "llvm/IR/PassManager.h"
#include "llvm/Pass.h"
#include "llvm/PassRegistry.h"
#include <variant>
namespace llvm {
void initializeAMDGPUArgumentUsageInfoWrapperLegacyPass(PassRegistry &);
class Function;
class LLT;
class raw_ostream;
class TargetRegisterClass;
class TargetRegisterInfo;
struct ArgDescriptor {
private:
friend struct AMDGPUFunctionArgInfo;
friend class AMDGPUArgumentUsageInfo;
std::variant<std::monostate, MCRegister, unsigned> Val;
// Bitmask to locate argument within the register.
unsigned Mask;
public:
ArgDescriptor(unsigned Mask = ~0u) : Mask(Mask) {}
static ArgDescriptor createRegister(Register Reg, unsigned Mask = ~0u) {
ArgDescriptor Ret(Mask);
Ret.Val = Reg.asMCReg();
return Ret;
}
static ArgDescriptor createStack(unsigned Offset, unsigned Mask = ~0u) {
ArgDescriptor Ret(Mask);
Ret.Val = Offset;
return Ret;
}
static ArgDescriptor createArg(const ArgDescriptor &Arg, unsigned Mask) {
// Copy the descriptor, then change the mask.
ArgDescriptor Ret(Arg);
Ret.Mask = Mask;
return Ret;
}
bool isSet() const { return !std::holds_alternative<std::monostate>(Val); }
explicit operator bool() const {
return isSet();
}
bool isRegister() const { return std::holds_alternative<MCRegister>(Val); }
MCRegister getRegister() const { return std::get<MCRegister>(Val); }
unsigned getStackOffset() const { return std::get<unsigned>(Val); }
unsigned getMask() const {
// None of the target SGPRs or VGPRs are expected to have a 'zero' mask.
assert(Mask && "Invalid mask.");
return Mask;
}
bool isMasked() const {
return Mask != ~0u;
}
void print(raw_ostream &OS, const TargetRegisterInfo *TRI = nullptr) const;
};
inline raw_ostream &operator<<(raw_ostream &OS, const ArgDescriptor &Arg) {
Arg.print(OS);
return OS;
}
struct KernArgPreloadDescriptor : public ArgDescriptor {
KernArgPreloadDescriptor() = default;
SmallVector<MCRegister> Regs;
};
struct AMDGPUFunctionArgInfo {
// clang-format off
enum PreloadedValue {
// SGPRS:
PRIVATE_SEGMENT_BUFFER = 0,
DISPATCH_PTR = 1,
QUEUE_PTR = 2,
KERNARG_SEGMENT_PTR = 3,
DISPATCH_ID = 4,
FLAT_SCRATCH_INIT = 5,
LDS_KERNEL_ID = 6, // LLVM internal, not part of the ABI
WORKGROUP_ID_X = 10, // Also used for cluster ID X.
WORKGROUP_ID_Y = 11, // Also used for cluster ID Y.
WORKGROUP_ID_Z = 12, // Also used for cluster ID Z.
PRIVATE_SEGMENT_WAVE_BYTE_OFFSET = 14,
IMPLICIT_BUFFER_PTR = 15,
IMPLICIT_ARG_PTR = 16,
PRIVATE_SEGMENT_SIZE = 17,
CLUSTER_WORKGROUP_ID_X = 21,
CLUSTER_WORKGROUP_ID_Y = 22,
CLUSTER_WORKGROUP_ID_Z = 23,
CLUSTER_WORKGROUP_MAX_ID_X = 24,
CLUSTER_WORKGROUP_MAX_ID_Y = 25,
CLUSTER_WORKGROUP_MAX_ID_Z = 26,
CLUSTER_WORKGROUP_MAX_FLAT_ID = 27,
// VGPRS:
WORKITEM_ID_X = 28,
WORKITEM_ID_Y = 29,
WORKITEM_ID_Z = 30,
FIRST_VGPR_VALUE = WORKITEM_ID_X
};
// clang-format on
// Kernel input registers setup for the HSA ABI in allocation order.
// User SGPRs in kernels
// XXX - Can these require argument spills?
ArgDescriptor PrivateSegmentBuffer;
ArgDescriptor DispatchPtr;
ArgDescriptor QueuePtr;
ArgDescriptor KernargSegmentPtr;
ArgDescriptor DispatchID;
ArgDescriptor FlatScratchInit;
ArgDescriptor PrivateSegmentSize;
ArgDescriptor LDSKernelId;
// System SGPRs in kernels.
ArgDescriptor WorkGroupIDX;
ArgDescriptor WorkGroupIDY;
ArgDescriptor WorkGroupIDZ;
ArgDescriptor WorkGroupInfo;
ArgDescriptor PrivateSegmentWaveByteOffset;
// Pointer with offset from kernargsegmentptr to where special ABI arguments
// are passed to callable functions.
ArgDescriptor ImplicitArgPtr;
// Input registers for non-HSA ABI
ArgDescriptor ImplicitBufferPtr;
// VGPRs inputs. For entry functions these are either v0, v1 and v2 or packed
// into v0, 10 bits per dimension if packed-tid is set.
ArgDescriptor WorkItemIDX;
ArgDescriptor WorkItemIDY;
ArgDescriptor WorkItemIDZ;
// Map the index of preloaded kernel arguments to its descriptor.
SmallDenseMap<int, KernArgPreloadDescriptor> PreloadKernArgs{};
// The first user SGPR allocated for kernarg preloading.
Register FirstKernArgPreloadReg;
std::tuple<const ArgDescriptor *, const TargetRegisterClass *, LLT>
getPreloadedValue(PreloadedValue Value) const;
static AMDGPUFunctionArgInfo fixedABILayout();
};
class AMDGPUArgumentUsageInfo {
private:
DenseMap<const Function *, AMDGPUFunctionArgInfo> ArgInfoMap;
public:
static const AMDGPUFunctionArgInfo ExternFunctionInfo;
static const AMDGPUFunctionArgInfo FixedABIFunctionInfo;
void print(raw_ostream &OS, const Module *M = nullptr) const;
void clear() { ArgInfoMap.clear(); }
void setFuncArgInfo(const Function &F, const AMDGPUFunctionArgInfo &ArgInfo) {
ArgInfoMap[&F] = ArgInfo;
}
const AMDGPUFunctionArgInfo &lookupFuncArgInfo(const Function &F) const;
bool invalidate(Module &M, const PreservedAnalyses &PA,
ModuleAnalysisManager::Invalidator &Inv);
};
class AMDGPUArgumentUsageInfoWrapperLegacy : public ImmutablePass {
std::unique_ptr<AMDGPUArgumentUsageInfo> AUIP;
public:
static char ID;
AMDGPUArgumentUsageInfoWrapperLegacy() : ImmutablePass(ID) {
initializeAMDGPUArgumentUsageInfoWrapperLegacyPass(
*PassRegistry::getPassRegistry());
}
AMDGPUArgumentUsageInfo &getArgUsageInfo() { return *AUIP; }
const AMDGPUArgumentUsageInfo &getArgUsageInfo() const { return *AUIP; }
void getAnalysisUsage(AnalysisUsage &AU) const override {
AU.setPreservesAll();
}
bool doInitialization(Module &M) override {
AUIP = std::make_unique<AMDGPUArgumentUsageInfo>();
return false;
}
bool doFinalization(Module &M) override {
AUIP->clear();
return false;
}
void print(raw_ostream &OS, const Module *M = nullptr) const override {
AUIP->print(OS, M);
}
};
class AMDGPUArgumentUsageAnalysis
: public AnalysisInfoMixin<AMDGPUArgumentUsageAnalysis> {
friend AnalysisInfoMixin<AMDGPUArgumentUsageAnalysis>;
static AnalysisKey Key;
public:
using Result = AMDGPUArgumentUsageInfo;
AMDGPUArgumentUsageInfo run(Module &M, ModuleAnalysisManager &);
};
} // end namespace llvm
#endif