30#define DEBUG_TYPE "si-pre-allocate-wwm-regs"
38class SIPreAllocateWWMRegs {
48 std::vector<unsigned> RegsToRewrite;
59 bool run(MachineFunction &MF);
66 SIPreAllocateWWMRegsLegacy() : MachineFunctionPass(ID) {}
68 bool runOnMachineFunction(MachineFunction &MF)
override;
70 void getAnalysisUsage(AnalysisUsage &AU)
const override {
82 "SI Pre-allocate WWM Registers",
false,
false)
89char SIPreAllocateWWMRegsLegacy::
ID = 0;
94 return new SIPreAllocateWWMRegsLegacy();
111 if (!
MRI->isPhysRegUsed(PhysReg,
true) &&
113 Matrix->assign(LI, PhysReg);
115 RegsToRewrite.push_back(
Reg);
123void SIPreAllocateWWMRegs::rewriteRegs(MachineFunction &MF) {
124 for (MachineBasicBlock &
MBB : MF) {
125 for (MachineInstr &
MI :
MBB) {
126 for (MachineOperand &MO :
MI.operands()) {
143 PhysReg =
TRI->getSubReg(PhysReg,
SubReg);
153 SIMachineFunctionInfo *MFI = MF.getInfo<SIMachineFunctionInfo>();
155 for (
unsigned Reg : RegsToRewrite) {
164 RegsToRewrite.clear();
167 MRI->freezeReservedRegs();
172SIPreAllocateWWMRegs::printWWMInfo(
const MachineInstr &
MI) {
174 unsigned Opc =
MI.getOpcode();
176 if (
Opc == AMDGPU::ENTER_STRICT_WWM ||
Opc == AMDGPU::ENTER_STRICT_WQM) {
177 dbgs() <<
"Entering ";
179 assert(
Opc == AMDGPU::EXIT_STRICT_WWM ||
Opc == AMDGPU::EXIT_STRICT_WQM);
180 dbgs() <<
"Exiting ";
183 if (
Opc == AMDGPU::ENTER_STRICT_WWM ||
Opc == AMDGPU::EXIT_STRICT_WWM) {
184 dbgs() <<
"Strict WWM ";
186 assert(
Opc == AMDGPU::ENTER_STRICT_WQM ||
Opc == AMDGPU::EXIT_STRICT_WQM);
187 dbgs() <<
"Strict WQM ";
190 dbgs() <<
"region: " <<
MI;
195bool SIPreAllocateWWMRegsLegacy::runOnMachineFunction(MachineFunction &MF) {
196 auto *LIS = &getAnalysis<LiveIntervalsWrapperPass>().getLIS();
197 auto *
Matrix = &getAnalysis<LiveRegMatrixWrapperLegacy>().getLRM();
198 auto *VRM = &getAnalysis<VirtRegMapWrapperLegacy>().getVRM();
199 return SIPreAllocateWWMRegs(LIS,
Matrix, VRM).run(MF);
202bool SIPreAllocateWWMRegs::run(MachineFunction &MF) {
207 TII =
ST.getInstrInfo();
208 TRI = &
TII->getRegisterInfo();
213 bool PreallocateSGPRSpillVGPRs =
217 bool RegsAssigned =
false;
224 ReversePostOrderTraversal<MachineFunction*> RPOT(&MF);
226 for (MachineBasicBlock *
MBB : RPOT) {
228 for (MachineInstr &
MI : *
MBB) {
229 if (
MI.getOpcode() == AMDGPU::SI_SPILL_S32_TO_VGPR) {
230 if (PreallocateSGPRSpillVGPRs)
231 RegsAssigned |= processDef(
MI.getOperand(0));
235 if (
MI.getOpcode() == AMDGPU::ENTER_STRICT_WWM ||
236 MI.getOpcode() == AMDGPU::ENTER_STRICT_WQM) {
242 if (
MI.getOpcode() == AMDGPU::EXIT_STRICT_WWM ||
243 MI.getOpcode() == AMDGPU::EXIT_STRICT_WQM) {
253 for (MachineOperand &DefOpnd :
MI.defs()) {
254 RegsAssigned |= processDef(DefOpnd);
272 SIPreAllocateWWMRegs(LIS,
Matrix, VRM).
run(MF);
unsigned const MachineRegisterInfo * MRI
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
Provides AMDGPU specific target descriptions.
#define LLVM_DUMP_METHOD
Mark debug helper function definitions like dump() that should not be stripped from debug builds.
AMD GCN specific subclass of TargetSubtarget.
const HexagonInstrInfo * TII
Register const TargetRegisterInfo * TRI
Promote Memory to Register
#define INITIALIZE_PASS_DEPENDENCY(depName)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
This file builds on the ADT/GraphTraits.h file to build a generic graph post order iterator.
static cl::opt< bool > EnablePreallocateSGPRSpillVGPRs("amdgpu-prealloc-sgpr-spill-vgprs", cl::init(false), cl::Hidden)
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
AnalysisUsage & addRequired()
void setPreservesAll()
Set by analyses that do not transform their input at all.
FunctionPass class - This class is used to implement most global optimizations.
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
LiveInterval - This class represents the liveness of a register, or stack slot.
LiveInterval & getInterval(Register Reg)
void removeInterval(Register Reg)
Interval removal.
@ IK_Free
No interference, go ahead and assign.
Wrapper class representing physical registers. Should be passed by value.
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
Representation of each machine instruction.
MachineOperand class - Representation of each machine instruction operand.
void setSubReg(unsigned subReg)
unsigned getSubReg() const
LLVM_ABI void setIsRenamable(bool Val=true)
bool isReg() const
isReg - Tests if this is a MO_Register operand.
LLVM_ABI void setReg(Register Reg)
Change the register this operand corresponds to.
Register getReg() const
getReg - Returns the register number.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
LLVM_ABI void runOnMachineFunction(const MachineFunction &MF, bool Rev=false)
runOnFunction - Prepare to answer questions about MF.
ArrayRef< MCPhysReg > getOrder(const TargetRegisterClass *RC) const
getOrder - Returns the preferred allocation order for RC.
Wrapper class representing virtual and physical registers.
constexpr bool isValid() const
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
void reserveWWMRegister(Register Reg)
PreservedAnalyses run(MachineFunction &MF, MachineFunctionAnalysisManager &MFAM)
LLVM_ABI VirtRegMap run(MachineFunction &MF, MachineFunctionAnalysisManager &MAM)
MCRegister getPhys(Register virtReg) const
returns the physical register mapped to the specified virtual register
bool hasPhys(Register virtReg) const
returns true if the specified virtual register is mapped to a physical register
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
initializer< Ty > init(const Ty &Val)
PointerTypeMap run(const Module &M)
Compute the PointerTypeMap for the module M.
This is an optimization pass for GlobalISel generic memory operations.
AnalysisManager< MachineFunction > MachineFunctionAnalysisManager
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
FunctionPass * createSIPreAllocateWWMRegsLegacyPass()
char & SIPreAllocateWWMRegsLegacyID