xref: /llvm-project/llvm/lib/MCA/HardwareUnits/RegisterFile.cpp (revision 4a5b191703978a56ff6dcbae0e0bcb6b8933adfc)
1 //===--------------------- RegisterFile.cpp ---------------------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 /// \file
9 ///
10 /// This file defines a register mapping file class.  This class is responsible
11 /// for managing hardware register files and the tracking of data dependencies
12 /// between registers.
13 ///
14 //===----------------------------------------------------------------------===//
15 
16 #include "llvm/MCA/HardwareUnits/RegisterFile.h"
17 #include "llvm/MCA/Instruction.h"
18 #include "llvm/Support/Debug.h"
19 
20 #define DEBUG_TYPE "llvm-mca"
21 
22 namespace llvm {
23 namespace mca {
24 
25 const unsigned WriteRef::INVALID_IID = std::numeric_limits<unsigned>::max();
26 
27 WriteRef::WriteRef(unsigned SourceIndex, WriteState *WS)
28     : IID(SourceIndex), WriteBackCycle(), WriteResID(), RegisterID(),
29       Write(WS) {}
30 
31 void WriteRef::commit() {
32   assert(Write && Write->isExecuted() && "Cannot commit before write back!");
33   RegisterID = Write->getRegisterID();
34   WriteResID = Write->getWriteResourceID();
35   Write = nullptr;
36 }
37 
38 void WriteRef::notifyExecuted(unsigned Cycle) {
39   assert(Write && Write->isExecuted() && "Not executed!");
40   WriteBackCycle = Cycle;
41 }
42 
43 bool WriteRef::hasKnownWriteBackCycle() const {
44   return isValid() && (!Write || Write->isExecuted());
45 }
46 
47 bool WriteRef::isWriteZero() const {
48   assert(isValid() && "Invalid null WriteState found!");
49   return getWriteState()->isWriteZero();
50 }
51 
52 unsigned WriteRef::getWriteResourceID() const {
53   if (Write)
54     return Write->getWriteResourceID();
55   return WriteResID;
56 }
57 
58 MCPhysReg WriteRef::getRegisterID() const {
59   if (Write)
60     return Write->getRegisterID();
61   return RegisterID;
62 }
63 
64 RegisterFile::RegisterFile(const MCSchedModel &SM, const MCRegisterInfo &mri,
65                            unsigned NumRegs)
66     : MRI(mri),
67       RegisterMappings(mri.getNumRegs(), {WriteRef(), RegisterRenamingInfo()}),
68       ZeroRegisters(mri.getNumRegs(), false), CurrentCycle() {
69   initialize(SM, NumRegs);
70 }
71 
72 void RegisterFile::initialize(const MCSchedModel &SM, unsigned NumRegs) {
73   // Create a default register file that "sees" all the machine registers
74   // declared by the target. The number of physical registers in the default
75   // register file is set equal to `NumRegs`. A value of zero for `NumRegs`
76   // means: this register file has an unbounded number of physical registers.
77   RegisterFiles.emplace_back(NumRegs);
78   if (!SM.hasExtraProcessorInfo())
79     return;
80 
81   // For each user defined register file, allocate a RegisterMappingTracker
82   // object. The size of every register file, as well as the mapping between
83   // register files and register classes is specified via tablegen.
84   const MCExtraProcessorInfo &Info = SM.getExtraProcessorInfo();
85 
86   // Skip invalid register file at index 0.
87   for (unsigned I = 1, E = Info.NumRegisterFiles; I < E; ++I) {
88     const MCRegisterFileDesc &RF = Info.RegisterFiles[I];
89     assert(RF.NumPhysRegs && "Invalid PRF with zero physical registers!");
90 
91     // The cost of a register definition is equivalent to the number of
92     // physical registers that are allocated at register renaming stage.
93     unsigned Length = RF.NumRegisterCostEntries;
94     const MCRegisterCostEntry *FirstElt =
95         &Info.RegisterCostTable[RF.RegisterCostEntryIdx];
96     addRegisterFile(RF, ArrayRef<MCRegisterCostEntry>(FirstElt, Length));
97   }
98 }
99 
100 void RegisterFile::cycleStart() {
101   for (RegisterMappingTracker &RMT : RegisterFiles)
102     RMT.NumMoveEliminated = 0;
103 }
104 
105 void RegisterFile::onInstructionExecuted(Instruction *IS) {
106   assert(IS && IS->isExecuted() && "Unexpected internal state found!");
107   for (WriteState &WS : IS->getDefs()) {
108     if (WS.isEliminated())
109       return;
110 
111     MCPhysReg RegID = WS.getRegisterID();
112 
113     // This allows InstrPostProcess to remove register Defs
114     // by setting their RegisterID to 0.
115     if (!RegID)
116       continue;
117 
118     assert(WS.getCyclesLeft() != UNKNOWN_CYCLES &&
119            "The number of cycles should be known at this point!");
120     assert(WS.getCyclesLeft() <= 0 && "Invalid cycles left for this write!");
121 
122     MCPhysReg RenameAs = RegisterMappings[RegID].second.RenameAs;
123     if (RenameAs && RenameAs != RegID)
124       RegID = RenameAs;
125 
126     WriteRef &WR = RegisterMappings[RegID].first;
127     if (WR.getWriteState() == &WS)
128       WR.notifyExecuted(CurrentCycle);
129 
130     for (MCSubRegIterator I(RegID, &MRI); I.isValid(); ++I) {
131       WriteRef &OtherWR = RegisterMappings[*I].first;
132       if (OtherWR.getWriteState() == &WS)
133         OtherWR.notifyExecuted(CurrentCycle);
134     }
135 
136     if (!WS.clearsSuperRegisters())
137       continue;
138 
139     for (MCSuperRegIterator I(RegID, &MRI); I.isValid(); ++I) {
140       WriteRef &OtherWR = RegisterMappings[*I].first;
141       if (OtherWR.getWriteState() == &WS)
142         OtherWR.notifyExecuted(CurrentCycle);
143     }
144   }
145 }
146 
147 void RegisterFile::addRegisterFile(const MCRegisterFileDesc &RF,
148                                    ArrayRef<MCRegisterCostEntry> Entries) {
149   // A default register file is always allocated at index #0. That register file
150   // is mainly used to count the total number of mappings created by all
151   // register files at runtime. Users can limit the number of available physical
152   // registers in register file #0 through the command line flag
153   // `-register-file-size`.
154   unsigned RegisterFileIndex = RegisterFiles.size();
155   RegisterFiles.emplace_back(RF.NumPhysRegs, RF.MaxMovesEliminatedPerCycle,
156                              RF.AllowZeroMoveEliminationOnly);
157 
158   // Special case where there is no register class identifier in the set.
159   // An empty set of register classes means: this register file contains all
160   // the physical registers specified by the target.
161   // We optimistically assume that a register can be renamed at the cost of a
162   // single physical register. The constructor of RegisterFile ensures that
163   // a RegisterMapping exists for each logical register defined by the Target.
164   if (Entries.empty())
165     return;
166 
167   // Now update the cost of individual registers.
168   for (const MCRegisterCostEntry &RCE : Entries) {
169     const MCRegisterClass &RC = MRI.getRegClass(RCE.RegisterClassID);
170     for (const MCPhysReg Reg : RC) {
171       RegisterRenamingInfo &Entry = RegisterMappings[Reg].second;
172       IndexPlusCostPairTy &IPC = Entry.IndexPlusCost;
173       if (IPC.first && IPC.first != RegisterFileIndex) {
174         // The only register file that is allowed to overlap is the default
175         // register file at index #0. The analysis is inaccurate if register
176         // files overlap.
177         errs() << "warning: register " << MRI.getName(Reg)
178                << " defined in multiple register files.";
179       }
180       IPC = std::make_pair(RegisterFileIndex, RCE.Cost);
181       Entry.RenameAs = Reg;
182       Entry.AllowMoveElimination = RCE.AllowMoveElimination;
183 
184       // Assume the same cost for each sub-register.
185       for (MCSubRegIterator I(Reg, &MRI); I.isValid(); ++I) {
186         RegisterRenamingInfo &OtherEntry = RegisterMappings[*I].second;
187         if (!OtherEntry.IndexPlusCost.first &&
188             (!OtherEntry.RenameAs ||
189              MRI.isSuperRegister(*I, OtherEntry.RenameAs))) {
190           OtherEntry.IndexPlusCost = IPC;
191           OtherEntry.RenameAs = Reg;
192         }
193       }
194     }
195   }
196 }
197 
198 void RegisterFile::allocatePhysRegs(const RegisterRenamingInfo &Entry,
199                                     MutableArrayRef<unsigned> UsedPhysRegs) {
200   unsigned RegisterFileIndex = Entry.IndexPlusCost.first;
201   unsigned Cost = Entry.IndexPlusCost.second;
202   if (RegisterFileIndex) {
203     RegisterMappingTracker &RMT = RegisterFiles[RegisterFileIndex];
204     RMT.NumUsedPhysRegs += Cost;
205     UsedPhysRegs[RegisterFileIndex] += Cost;
206   }
207 
208   // Now update the default register mapping tracker.
209   RegisterFiles[0].NumUsedPhysRegs += Cost;
210   UsedPhysRegs[0] += Cost;
211 }
212 
213 void RegisterFile::freePhysRegs(const RegisterRenamingInfo &Entry,
214                                 MutableArrayRef<unsigned> FreedPhysRegs) {
215   unsigned RegisterFileIndex = Entry.IndexPlusCost.first;
216   unsigned Cost = Entry.IndexPlusCost.second;
217   if (RegisterFileIndex) {
218     RegisterMappingTracker &RMT = RegisterFiles[RegisterFileIndex];
219     RMT.NumUsedPhysRegs -= Cost;
220     FreedPhysRegs[RegisterFileIndex] += Cost;
221   }
222 
223   // Now update the default register mapping tracker.
224   RegisterFiles[0].NumUsedPhysRegs -= Cost;
225   FreedPhysRegs[0] += Cost;
226 }
227 
228 void RegisterFile::addRegisterWrite(WriteRef Write,
229                                     MutableArrayRef<unsigned> UsedPhysRegs) {
230   WriteState &WS = *Write.getWriteState();
231   MCPhysReg RegID = WS.getRegisterID();
232 
233   // This allows InstrPostProcess to remove register Defs
234   // by setting their RegisterID to 0.
235   if (!RegID)
236     return;
237 
238   LLVM_DEBUG({
239     dbgs() << "[PRF] addRegisterWrite [ " << Write.getSourceIndex() << ", "
240            << MRI.getName(RegID) << "]\n";
241   });
242 
243   // If RenameAs is equal to RegID, then RegID is subject to register renaming
244   // and false dependencies on RegID are all eliminated.
245 
246   // If RenameAs references the invalid register, then we optimistically assume
247   // that it can be renamed. In the absence of tablegen descriptors for register
248   // files, RenameAs is always set to the invalid register ID.  In all other
249   // cases, RenameAs must be either equal to RegID, or it must reference a
250   // super-register of RegID.
251 
252   // If RenameAs is a super-register of RegID, then a write to RegID has always
253   // a false dependency on RenameAs. The only exception is for when the write
254   // implicitly clears the upper portion of the underlying register.
255   // If a write clears its super-registers, then it is renamed as `RenameAs`.
256   bool IsWriteZero = WS.isWriteZero();
257   bool IsEliminated = WS.isEliminated();
258   bool ShouldAllocatePhysRegs = !IsWriteZero && !IsEliminated;
259   const RegisterRenamingInfo &RRI = RegisterMappings[RegID].second;
260   WS.setPRF(RRI.IndexPlusCost.first);
261 
262   if (RRI.RenameAs && RRI.RenameAs != RegID) {
263     RegID = RRI.RenameAs;
264     WriteRef &OtherWrite = RegisterMappings[RegID].first;
265 
266     if (!WS.clearsSuperRegisters()) {
267       // The processor keeps the definition of `RegID` together with register
268       // `RenameAs`. Since this partial write is not renamed, no physical
269       // register is allocated.
270       ShouldAllocatePhysRegs = false;
271 
272       WriteState *OtherWS = OtherWrite.getWriteState();
273       if (OtherWS && (OtherWrite.getSourceIndex() != Write.getSourceIndex())) {
274         // This partial write has a false dependency on RenameAs.
275         assert(!IsEliminated && "Unexpected partial update!");
276         OtherWS->addUser(OtherWrite.getSourceIndex(), &WS);
277       }
278     }
279   }
280 
281   // Update zero registers.
282   MCPhysReg ZeroRegisterID =
283       WS.clearsSuperRegisters() ? RegID : WS.getRegisterID();
284   ZeroRegisters.setBitVal(ZeroRegisterID, IsWriteZero);
285   for (MCSubRegIterator I(ZeroRegisterID, &MRI); I.isValid(); ++I)
286     ZeroRegisters.setBitVal(*I, IsWriteZero);
287 
288   // If this move has been eliminated, then method tryEliminateMoveOrSwap should
289   // have already updated all the register mappings.
290   if (!IsEliminated) {
291     // Check if this is one of multiple writes performed by this
292     // instruction to register RegID.
293     const WriteRef &OtherWrite = RegisterMappings[RegID].first;
294     const WriteState *OtherWS = OtherWrite.getWriteState();
295     if (OtherWS && OtherWrite.getSourceIndex() == Write.getSourceIndex()) {
296       if (OtherWS->getLatency() > WS.getLatency()) {
297         // Conservatively keep the slowest write to RegID.
298         return;
299       }
300     }
301 
302     // Update the mapping for register RegID including its sub-registers.
303     RegisterMappings[RegID].first = Write;
304     RegisterMappings[RegID].second.AliasRegID = 0U;
305     for (MCSubRegIterator I(RegID, &MRI); I.isValid(); ++I) {
306       RegisterMappings[*I].first = Write;
307       RegisterMappings[*I].second.AliasRegID = 0U;
308     }
309 
310     // No physical registers are allocated for instructions that are optimized
311     // in hardware. For example, zero-latency data-dependency breaking
312     // instructions don't consume physical registers.
313     if (ShouldAllocatePhysRegs)
314       allocatePhysRegs(RegisterMappings[RegID].second, UsedPhysRegs);
315   }
316 
317   if (!WS.clearsSuperRegisters())
318     return;
319 
320   for (MCSuperRegIterator I(RegID, &MRI); I.isValid(); ++I) {
321     if (!IsEliminated) {
322       RegisterMappings[*I].first = Write;
323       RegisterMappings[*I].second.AliasRegID = 0U;
324     }
325 
326     ZeroRegisters.setBitVal(*I, IsWriteZero);
327   }
328 }
329 
330 void RegisterFile::removeRegisterWrite(
331     const WriteState &WS, MutableArrayRef<unsigned> FreedPhysRegs) {
332   // Early exit if this write was eliminated. A write eliminated at register
333   // renaming stage generates an alias, and it is not added to the PRF.
334   if (WS.isEliminated())
335     return;
336 
337   MCPhysReg RegID = WS.getRegisterID();
338 
339   // This allows InstrPostProcess to remove register Defs
340   // by setting their RegisterID to 0.
341   if (!RegID)
342     return;
343 
344   assert(WS.getCyclesLeft() != UNKNOWN_CYCLES &&
345          "Invalidating a write of unknown cycles!");
346   assert(WS.getCyclesLeft() <= 0 && "Invalid cycles left for this write!");
347 
348   bool ShouldFreePhysRegs = !WS.isWriteZero();
349   MCPhysReg RenameAs = RegisterMappings[RegID].second.RenameAs;
350   if (RenameAs && RenameAs != RegID) {
351     RegID = RenameAs;
352 
353     if (!WS.clearsSuperRegisters()) {
354       // Keep the definition of `RegID` together with register `RenameAs`.
355       ShouldFreePhysRegs = false;
356     }
357   }
358 
359   if (ShouldFreePhysRegs)
360     freePhysRegs(RegisterMappings[RegID].second, FreedPhysRegs);
361 
362   WriteRef &WR = RegisterMappings[RegID].first;
363   if (WR.getWriteState() == &WS)
364     WR.commit();
365 
366   for (MCSubRegIterator I(RegID, &MRI); I.isValid(); ++I) {
367     WriteRef &OtherWR = RegisterMappings[*I].first;
368     if (OtherWR.getWriteState() == &WS)
369       OtherWR.commit();
370   }
371 
372   if (!WS.clearsSuperRegisters())
373     return;
374 
375   for (MCSuperRegIterator I(RegID, &MRI); I.isValid(); ++I) {
376     WriteRef &OtherWR = RegisterMappings[*I].first;
377     if (OtherWR.getWriteState() == &WS)
378       OtherWR.commit();
379   }
380 }
381 
382 bool RegisterFile::canEliminateMove(const WriteState &WS, const ReadState &RS,
383                                     unsigned RegisterFileIndex) const {
384   const RegisterMapping &RMFrom = RegisterMappings[RS.getRegisterID()];
385   const RegisterMapping &RMTo = RegisterMappings[WS.getRegisterID()];
386   const RegisterMappingTracker &RMT = RegisterFiles[RegisterFileIndex];
387 
388   // From and To must be owned by the PRF at index `RegisterFileIndex`.
389   const RegisterRenamingInfo &RRIFrom = RMFrom.second;
390   if (RRIFrom.IndexPlusCost.first != RegisterFileIndex)
391     return false;
392 
393   const RegisterRenamingInfo &RRITo = RMTo.second;
394   if (RRITo.IndexPlusCost.first != RegisterFileIndex)
395     return false;
396 
397   // Early exit if the destination register is from a register class that
398   // doesn't allow move elimination.
399   if (!RegisterMappings[RRITo.RenameAs].second.AllowMoveElimination)
400     return false;
401 
402   // We only allow move elimination for writes that update a full physical
403   // register. On X86, move elimination is possible with 32-bit general purpose
404   // registers because writes to those registers are not partial writes.  If a
405   // register move is a partial write, then we conservatively assume that move
406   // elimination fails, since it would either trigger a partial update, or the
407   // issue of a merge opcode.
408   //
409   // Note that this constraint may be lifted in future.  For example, we could
410   // make this model more flexible, and let users customize the set of registers
411   // (i.e. register classes) that allow move elimination.
412   //
413   // For now, we assume that there is a strong correlation between registers
414   // that allow move elimination, and how those same registers are renamed in
415   // hardware.
416   if (RRITo.RenameAs && RRITo.RenameAs != WS.getRegisterID())
417     if (!WS.clearsSuperRegisters())
418       return false;
419 
420   bool IsZeroMove = ZeroRegisters[RS.getRegisterID()];
421   return (!RMT.AllowZeroMoveEliminationOnly || IsZeroMove);
422 }
423 
424 bool RegisterFile::tryEliminateMoveOrSwap(MutableArrayRef<WriteState> Writes,
425                                           MutableArrayRef<ReadState> Reads) {
426   if (Writes.size() != Reads.size())
427     return false;
428 
429   // This logic assumes that writes and reads are contributed by a register move
430   // or a register swap operation. In particular, it assumes a simple register
431   // move if there is only one write.  It assumes a swap operation if there are
432   // exactly two writes.
433   if (Writes.empty() || Writes.size() > 2)
434     return false;
435 
436   // All registers must be owned by the same PRF.
437   const RegisterRenamingInfo &RRInfo =
438       RegisterMappings[Writes[0].getRegisterID()].second;
439   unsigned RegisterFileIndex = RRInfo.IndexPlusCost.first;
440   RegisterMappingTracker &RMT = RegisterFiles[RegisterFileIndex];
441 
442   // Early exit if the PRF cannot eliminate more moves/xchg in this cycle.
443   if (RMT.MaxMoveEliminatedPerCycle &&
444       (RMT.NumMoveEliminated + Writes.size()) > RMT.MaxMoveEliminatedPerCycle)
445     return false;
446 
447   for (size_t I = 0, E = Writes.size(); I < E; ++I) {
448     const ReadState &RS = Reads[I];
449     const WriteState &WS = Writes[E - (I + 1)];
450     if (!canEliminateMove(WS, RS, RegisterFileIndex))
451       return false;
452   }
453 
454   for (size_t I = 0, E = Writes.size(); I < E; ++I) {
455     ReadState &RS = Reads[I];
456     WriteState &WS = Writes[E - (I + 1)];
457 
458     const RegisterMapping &RMFrom = RegisterMappings[RS.getRegisterID()];
459     const RegisterMapping &RMTo = RegisterMappings[WS.getRegisterID()];
460     const RegisterRenamingInfo &RRIFrom = RMFrom.second;
461     const RegisterRenamingInfo &RRITo = RMTo.second;
462 
463     // Construct an alias.
464     MCPhysReg AliasedReg =
465         RRIFrom.RenameAs ? RRIFrom.RenameAs : RS.getRegisterID();
466     MCPhysReg AliasReg = RRITo.RenameAs ? RRITo.RenameAs : WS.getRegisterID();
467 
468     const RegisterRenamingInfo &RMAlias = RegisterMappings[AliasedReg].second;
469     if (RMAlias.AliasRegID)
470       AliasedReg = RMAlias.AliasRegID;
471 
472     RegisterMappings[AliasReg].second.AliasRegID = AliasedReg;
473     for (MCSubRegIterator I(AliasReg, &MRI); I.isValid(); ++I)
474       RegisterMappings[*I].second.AliasRegID = AliasedReg;
475 
476     if (ZeroRegisters[RS.getRegisterID()]) {
477       WS.setWriteZero();
478       RS.setReadZero();
479     }
480 
481     WS.setEliminated();
482     RMT.NumMoveEliminated++;
483   }
484 
485   return true;
486 }
487 
488 unsigned WriteRef::getWriteBackCycle() const {
489   assert(hasKnownWriteBackCycle() && "Instruction not executed!");
490   assert((!Write || Write->getCyclesLeft() <= 0) &&
491          "Inconsistent state found!");
492   return WriteBackCycle;
493 }
494 
495 unsigned RegisterFile::getElapsedCyclesFromWriteBack(const WriteRef &WR) const {
496   assert(WR.hasKnownWriteBackCycle() && "Write hasn't been committed yet!");
497   return CurrentCycle - WR.getWriteBackCycle();
498 }
499 
500 void RegisterFile::collectWrites(
501     const MCSubtargetInfo &STI, const ReadState &RS,
502     SmallVectorImpl<WriteRef> &Writes,
503     SmallVectorImpl<WriteRef> &CommittedWrites) const {
504   const ReadDescriptor &RD = RS.getDescriptor();
505   const MCSchedModel &SM = STI.getSchedModel();
506   const MCSchedClassDesc *SC = SM.getSchedClassDesc(RD.SchedClassID);
507   MCPhysReg RegID = RS.getRegisterID();
508   assert(RegID && RegID < RegisterMappings.size());
509   LLVM_DEBUG(dbgs() << "[PRF] collecting writes for register "
510                     << MRI.getName(RegID) << '\n');
511 
512   // Check if this is an alias.
513   const RegisterRenamingInfo &RRI = RegisterMappings[RegID].second;
514   if (RRI.AliasRegID)
515     RegID = RRI.AliasRegID;
516 
517   const WriteRef &WR = RegisterMappings[RegID].first;
518   if (WR.getWriteState()) {
519     Writes.push_back(WR);
520   } else if (WR.hasKnownWriteBackCycle()) {
521     unsigned WriteResID = WR.getWriteResourceID();
522     int ReadAdvance = STI.getReadAdvanceCycles(SC, RD.UseIndex, WriteResID);
523     if (ReadAdvance < 0) {
524       unsigned Elapsed = getElapsedCyclesFromWriteBack(WR);
525       if (Elapsed < static_cast<unsigned>(-ReadAdvance))
526         CommittedWrites.push_back(WR);
527     }
528   }
529 
530   // Handle potential partial register updates.
531   for (MCSubRegIterator I(RegID, &MRI); I.isValid(); ++I) {
532     const WriteRef &WR = RegisterMappings[*I].first;
533     if (WR.getWriteState()) {
534       Writes.push_back(WR);
535     } else if (WR.hasKnownWriteBackCycle()) {
536       unsigned WriteResID = WR.getWriteResourceID();
537       int ReadAdvance = STI.getReadAdvanceCycles(SC, RD.UseIndex, WriteResID);
538       if (ReadAdvance < 0) {
539         unsigned Elapsed = getElapsedCyclesFromWriteBack(WR);
540         if (Elapsed < static_cast<unsigned>(-ReadAdvance))
541           CommittedWrites.push_back(WR);
542       }
543     }
544   }
545 
546   // Remove duplicate entries and resize the input vector.
547   if (Writes.size() > 1) {
548     sort(Writes, [](const WriteRef &Lhs, const WriteRef &Rhs) {
549       return Lhs.getWriteState() < Rhs.getWriteState();
550     });
551     auto It = std::unique(Writes.begin(), Writes.end());
552     Writes.resize(std::distance(Writes.begin(), It));
553   }
554 
555   LLVM_DEBUG({
556     for (const WriteRef &WR : Writes) {
557       const WriteState &WS = *WR.getWriteState();
558       dbgs() << "[PRF] Found a dependent use of Register "
559              << MRI.getName(WS.getRegisterID()) << " (defined by instruction #"
560              << WR.getSourceIndex() << ")\n";
561     }
562   });
563 }
564 
565 RegisterFile::RAWHazard
566 RegisterFile::checkRAWHazards(const MCSubtargetInfo &STI,
567                               const ReadState &RS) const {
568   RAWHazard Hazard;
569   SmallVector<WriteRef, 4> Writes;
570   SmallVector<WriteRef, 4> CommittedWrites;
571 
572   const MCSchedModel &SM = STI.getSchedModel();
573   const ReadDescriptor &RD = RS.getDescriptor();
574   const MCSchedClassDesc *SC = SM.getSchedClassDesc(RD.SchedClassID);
575 
576   collectWrites(STI, RS, Writes, CommittedWrites);
577   for (const WriteRef &WR : Writes) {
578     const WriteState *WS = WR.getWriteState();
579     unsigned WriteResID = WS->getWriteResourceID();
580     int ReadAdvance = STI.getReadAdvanceCycles(SC, RD.UseIndex, WriteResID);
581 
582     if (WS->getCyclesLeft() == UNKNOWN_CYCLES) {
583       if (Hazard.isValid())
584         continue;
585 
586       Hazard.RegisterID = WR.getRegisterID();
587       Hazard.CyclesLeft = UNKNOWN_CYCLES;
588       continue;
589     }
590 
591     int CyclesLeft = WS->getCyclesLeft() - ReadAdvance;
592     if (CyclesLeft > 0) {
593       if (Hazard.CyclesLeft < CyclesLeft) {
594         Hazard.RegisterID = WR.getRegisterID();
595         Hazard.CyclesLeft = CyclesLeft;
596       }
597     }
598   }
599   Writes.clear();
600 
601   for (const WriteRef &WR : CommittedWrites) {
602     unsigned WriteResID = WR.getWriteResourceID();
603     int NegReadAdvance = -STI.getReadAdvanceCycles(SC, RD.UseIndex, WriteResID);
604     int Elapsed = static_cast<int>(getElapsedCyclesFromWriteBack(WR));
605     int CyclesLeft = NegReadAdvance - Elapsed;
606     assert(CyclesLeft > 0 && "Write should not be in the CommottedWrites set!");
607     if (Hazard.CyclesLeft < CyclesLeft) {
608       Hazard.RegisterID = WR.getRegisterID();
609       Hazard.CyclesLeft = CyclesLeft;
610     }
611   }
612 
613   return Hazard;
614 }
615 
616 void RegisterFile::addRegisterRead(ReadState &RS,
617                                    const MCSubtargetInfo &STI) const {
618   MCPhysReg RegID = RS.getRegisterID();
619   const RegisterRenamingInfo &RRI = RegisterMappings[RegID].second;
620   RS.setPRF(RRI.IndexPlusCost.first);
621   if (RS.isIndependentFromDef())
622     return;
623 
624   if (ZeroRegisters[RS.getRegisterID()])
625     RS.setReadZero();
626 
627   SmallVector<WriteRef, 4> DependentWrites;
628   SmallVector<WriteRef, 4> CompletedWrites;
629   collectWrites(STI, RS, DependentWrites, CompletedWrites);
630   RS.setDependentWrites(DependentWrites.size() + CompletedWrites.size());
631 
632   // We know that this read depends on all the writes in DependentWrites.
633   // For each write, check if we have ReadAdvance information, and use it
634   // to figure out in how many cycles this read will be available.
635   const ReadDescriptor &RD = RS.getDescriptor();
636   const MCSchedModel &SM = STI.getSchedModel();
637   const MCSchedClassDesc *SC = SM.getSchedClassDesc(RD.SchedClassID);
638   for (WriteRef &WR : DependentWrites) {
639     unsigned WriteResID = WR.getWriteResourceID();
640     WriteState &WS = *WR.getWriteState();
641     int ReadAdvance = STI.getReadAdvanceCycles(SC, RD.UseIndex, WriteResID);
642     WS.addUser(WR.getSourceIndex(), &RS, ReadAdvance);
643   }
644 
645   for (WriteRef &WR : CompletedWrites) {
646     unsigned WriteResID = WR.getWriteResourceID();
647     assert(WR.hasKnownWriteBackCycle() && "Invalid write!");
648     assert(STI.getReadAdvanceCycles(SC, RD.UseIndex, WriteResID) < 0);
649     unsigned ReadAdvance = static_cast<unsigned>(
650         -STI.getReadAdvanceCycles(SC, RD.UseIndex, WriteResID));
651     unsigned Elapsed = getElapsedCyclesFromWriteBack(WR);
652     assert(Elapsed < ReadAdvance && "Should not have been added to the set!");
653     RS.writeStartEvent(WR.getSourceIndex(), WR.getRegisterID(),
654                        ReadAdvance - Elapsed);
655   }
656 }
657 
658 unsigned RegisterFile::isAvailable(ArrayRef<MCPhysReg> Regs) const {
659   SmallVector<unsigned, 4> NumPhysRegs(getNumRegisterFiles());
660 
661   // Find how many new mappings must be created for each register file.
662   for (const MCPhysReg RegID : Regs) {
663     const RegisterRenamingInfo &RRI = RegisterMappings[RegID].second;
664     const IndexPlusCostPairTy &Entry = RRI.IndexPlusCost;
665     if (Entry.first)
666       NumPhysRegs[Entry.first] += Entry.second;
667     NumPhysRegs[0] += Entry.second;
668   }
669 
670   unsigned Response = 0;
671   for (unsigned I = 0, E = getNumRegisterFiles(); I < E; ++I) {
672     unsigned NumRegs = NumPhysRegs[I];
673     if (!NumRegs)
674       continue;
675 
676     const RegisterMappingTracker &RMT = RegisterFiles[I];
677     if (!RMT.NumPhysRegs) {
678       // The register file has an unbounded number of microarchitectural
679       // registers.
680       continue;
681     }
682 
683     if (RMT.NumPhysRegs < NumRegs) {
684       // The current register file is too small. This may occur if the number of
685       // microarchitectural registers in register file #0 was changed by the
686       // users via flag -reg-file-size. Alternatively, the scheduling model
687       // specified a too small number of registers for this register file.
688       LLVM_DEBUG(
689           dbgs() << "[PRF] Not enough registers in the register file.\n");
690 
691       // FIXME: Normalize the instruction register count to match the
692       // NumPhysRegs value.  This is a highly unusual case, and is not expected
693       // to occur.  This normalization is hiding an inconsistency in either the
694       // scheduling model or in the value that the user might have specified
695       // for NumPhysRegs.
696       NumRegs = RMT.NumPhysRegs;
697     }
698 
699     if (RMT.NumPhysRegs < (RMT.NumUsedPhysRegs + NumRegs))
700       Response |= (1U << I);
701   }
702 
703   return Response;
704 }
705 
706 #ifndef NDEBUG
707 void WriteRef::dump() const {
708   dbgs() << "IID=" << getSourceIndex() << ' ';
709   if (isValid())
710     getWriteState()->dump();
711   else
712     dbgs() << "(null)";
713 }
714 
715 void RegisterFile::dump() const {
716   for (unsigned I = 0, E = MRI.getNumRegs(); I < E; ++I) {
717     const RegisterMapping &RM = RegisterMappings[I];
718     const RegisterRenamingInfo &RRI = RM.second;
719     if (ZeroRegisters[I]) {
720       dbgs() << MRI.getName(I) << ", " << I
721              << ", PRF=" << RRI.IndexPlusCost.first
722              << ", Cost=" << RRI.IndexPlusCost.second
723              << ", RenameAs=" << RRI.RenameAs << ", IsZero=" << ZeroRegisters[I]
724              << ",";
725       RM.first.dump();
726       dbgs() << '\n';
727     }
728   }
729 
730   for (unsigned I = 0, E = getNumRegisterFiles(); I < E; ++I) {
731     dbgs() << "Register File #" << I;
732     const RegisterMappingTracker &RMT = RegisterFiles[I];
733     dbgs() << "\n  TotalMappings:        " << RMT.NumPhysRegs
734            << "\n  NumUsedMappings:      " << RMT.NumUsedPhysRegs << '\n';
735   }
736 }
737 #endif
738 
739 } // namespace mca
740 } // namespace llvm
741