//===-- InterferenceCache.cpp - Caching per-block interference ---------*--===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// InterferenceCache remembers per-block interference in LiveIntervalUnions.
//
//===----------------------------------------------------------------------===//
1391cbcaf9SJakob Stoklund Olesen 
#include "InterferenceCache.h"
#include "llvm/CodeGen/LiveIntervalAnalysis.h"
#include "llvm/Support/ErrorHandling.h"
#include "llvm/Target/TargetRegisterInfo.h"
#include <cstdlib>

using namespace llvm;
2091cbcaf9SJakob Stoklund Olesen 
211b9dde08SChandler Carruth #define DEBUG_TYPE "regalloc"
221b9dde08SChandler Carruth 
23cacefc7dSJakob Stoklund Olesen // Static member used for null interference cursors.
2457a3d084SBenjamin Kramer const InterferenceCache::BlockInterference
2557a3d084SBenjamin Kramer     InterferenceCache::Cursor::NoInterference;
26cacefc7dSJakob Stoklund Olesen 
275eb10048SPuyan Lotfi // Initializes PhysRegEntries (instead of a SmallVector, PhysRegEntries is a
285eb10048SPuyan Lotfi // buffer of size NumPhysRegs to speed up alloc/clear for targets with large
295eb10048SPuyan Lotfi // reg files). Calloced memory is used for good form, and quites tools like
305eb10048SPuyan Lotfi // Valgrind too, but zero initialized memory is not required by the algorithm:
315eb10048SPuyan Lotfi // this is because PhysRegEntries works like a SparseSet and its entries are
325eb10048SPuyan Lotfi // only valid when there is a corresponding CacheEntries assignment. There is
335eb10048SPuyan Lotfi // also support for when pass managers are reused for targets with different
345eb10048SPuyan Lotfi // numbers of PhysRegs: in this case PhysRegEntries is freed and reinitialized.
355eb10048SPuyan Lotfi void InterferenceCache::reinitPhysRegEntries() {
365eb10048SPuyan Lotfi   if (PhysRegEntriesCount == TRI->getNumRegs()) return;
375eb10048SPuyan Lotfi   free(PhysRegEntries);
385eb10048SPuyan Lotfi   PhysRegEntriesCount = TRI->getNumRegs();
395eb10048SPuyan Lotfi   PhysRegEntries = (unsigned char*)
405eb10048SPuyan Lotfi     calloc(PhysRegEntriesCount, sizeof(unsigned char));
415eb10048SPuyan Lotfi }
425eb10048SPuyan Lotfi 
4391cbcaf9SJakob Stoklund Olesen void InterferenceCache::init(MachineFunction *mf,
4491cbcaf9SJakob Stoklund Olesen                              LiveIntervalUnion *liuarray,
4591cbcaf9SJakob Stoklund Olesen                              SlotIndexes *indexes,
46a16ae597SJakob Stoklund Olesen                              LiveIntervals *lis,
4791cbcaf9SJakob Stoklund Olesen                              const TargetRegisterInfo *tri) {
4891cbcaf9SJakob Stoklund Olesen   MF = mf;
4991cbcaf9SJakob Stoklund Olesen   LIUArray = liuarray;
5091cbcaf9SJakob Stoklund Olesen   TRI = tri;
515eb10048SPuyan Lotfi   reinitPhysRegEntries();
5291cbcaf9SJakob Stoklund Olesen   for (unsigned i = 0; i != CacheEntries; ++i)
53a16ae597SJakob Stoklund Olesen     Entries[i].clear(mf, indexes, lis);
5491cbcaf9SJakob Stoklund Olesen }
5591cbcaf9SJakob Stoklund Olesen 
5691cbcaf9SJakob Stoklund Olesen InterferenceCache::Entry *InterferenceCache::get(unsigned PhysReg) {
5791cbcaf9SJakob Stoklund Olesen   unsigned E = PhysRegEntries[PhysReg];
5891cbcaf9SJakob Stoklund Olesen   if (E < CacheEntries && Entries[E].getPhysReg() == PhysReg) {
5991cbcaf9SJakob Stoklund Olesen     if (!Entries[E].valid(LIUArray, TRI))
6096eebf0bSJakob Stoklund Olesen       Entries[E].revalidate(LIUArray, TRI);
6191cbcaf9SJakob Stoklund Olesen     return &Entries[E];
6291cbcaf9SJakob Stoklund Olesen   }
6391cbcaf9SJakob Stoklund Olesen   // No valid entry exists, pick the next round-robin entry.
6491cbcaf9SJakob Stoklund Olesen   E = RoundRobin;
6591cbcaf9SJakob Stoklund Olesen   if (++RoundRobin == CacheEntries)
6691cbcaf9SJakob Stoklund Olesen     RoundRobin = 0;
67a153ca58SJakob Stoklund Olesen   for (unsigned i = 0; i != CacheEntries; ++i) {
68a153ca58SJakob Stoklund Olesen     // Skip entries that are in use.
69a153ca58SJakob Stoklund Olesen     if (Entries[E].hasRefs()) {
70a153ca58SJakob Stoklund Olesen       if (++E == CacheEntries)
71a153ca58SJakob Stoklund Olesen         E = 0;
72a153ca58SJakob Stoklund Olesen       continue;
73a153ca58SJakob Stoklund Olesen     }
7491cbcaf9SJakob Stoklund Olesen     Entries[E].reset(PhysReg, LIUArray, TRI, MF);
7591cbcaf9SJakob Stoklund Olesen     PhysRegEntries[PhysReg] = E;
7691cbcaf9SJakob Stoklund Olesen     return &Entries[E];
7791cbcaf9SJakob Stoklund Olesen   }
78a153ca58SJakob Stoklund Olesen   llvm_unreachable("Ran out of interference cache entries.");
79a153ca58SJakob Stoklund Olesen }
8091cbcaf9SJakob Stoklund Olesen 
8191cbcaf9SJakob Stoklund Olesen /// revalidate - LIU contents have changed, update tags.
8296eebf0bSJakob Stoklund Olesen void InterferenceCache::Entry::revalidate(LiveIntervalUnion *LIUArray,
8396eebf0bSJakob Stoklund Olesen                                           const TargetRegisterInfo *TRI) {
8491cbcaf9SJakob Stoklund Olesen   // Invalidate all block entries.
8591cbcaf9SJakob Stoklund Olesen   ++Tag;
8691cbcaf9SJakob Stoklund Olesen   // Invalidate all iterators.
8791cbcaf9SJakob Stoklund Olesen   PrevPos = SlotIndex();
8896eebf0bSJakob Stoklund Olesen   unsigned i = 0;
8996eebf0bSJakob Stoklund Olesen   for (MCRegUnitIterator Units(PhysReg, TRI); Units.isValid(); ++Units, ++i)
9096eebf0bSJakob Stoklund Olesen     RegUnits[i].VirtTag = LIUArray[*Units].getTag();
9191cbcaf9SJakob Stoklund Olesen }
9291cbcaf9SJakob Stoklund Olesen 
9391cbcaf9SJakob Stoklund Olesen void InterferenceCache::Entry::reset(unsigned physReg,
9491cbcaf9SJakob Stoklund Olesen                                      LiveIntervalUnion *LIUArray,
9591cbcaf9SJakob Stoklund Olesen                                      const TargetRegisterInfo *TRI,
9691cbcaf9SJakob Stoklund Olesen                                      const MachineFunction *MF) {
97a153ca58SJakob Stoklund Olesen   assert(!hasRefs() && "Cannot reset cache entry with references");
9891cbcaf9SJakob Stoklund Olesen   // LIU's changed, invalidate cache.
9991cbcaf9SJakob Stoklund Olesen   ++Tag;
10091cbcaf9SJakob Stoklund Olesen   PhysReg = physReg;
10191cbcaf9SJakob Stoklund Olesen   Blocks.resize(MF->getNumBlockIDs());
10291cbcaf9SJakob Stoklund Olesen 
10391cbcaf9SJakob Stoklund Olesen   // Reset iterators.
10491cbcaf9SJakob Stoklund Olesen   PrevPos = SlotIndex();
10596eebf0bSJakob Stoklund Olesen   RegUnits.clear();
10696eebf0bSJakob Stoklund Olesen   for (MCRegUnitIterator Units(PhysReg, TRI); Units.isValid(); ++Units) {
10796eebf0bSJakob Stoklund Olesen     RegUnits.push_back(LIUArray[*Units]);
10896eebf0bSJakob Stoklund Olesen     RegUnits.back().Fixed = &LIS->getRegUnit(*Units);
10996eebf0bSJakob Stoklund Olesen   }
11091cbcaf9SJakob Stoklund Olesen }
11191cbcaf9SJakob Stoklund Olesen 
11291cbcaf9SJakob Stoklund Olesen bool InterferenceCache::Entry::valid(LiveIntervalUnion *LIUArray,
11391cbcaf9SJakob Stoklund Olesen                                      const TargetRegisterInfo *TRI) {
11496eebf0bSJakob Stoklund Olesen   unsigned i = 0, e = RegUnits.size();
11596eebf0bSJakob Stoklund Olesen   for (MCRegUnitIterator Units(PhysReg, TRI); Units.isValid(); ++Units, ++i) {
11696eebf0bSJakob Stoklund Olesen     if (i == e)
11791cbcaf9SJakob Stoklund Olesen       return false;
11896eebf0bSJakob Stoklund Olesen     if (LIUArray[*Units].changedSince(RegUnits[i].VirtTag))
11991cbcaf9SJakob Stoklund Olesen       return false;
12091cbcaf9SJakob Stoklund Olesen   }
12191cbcaf9SJakob Stoklund Olesen   return i == e;
12291cbcaf9SJakob Stoklund Olesen }
12391cbcaf9SJakob Stoklund Olesen 
12491cbcaf9SJakob Stoklund Olesen void InterferenceCache::Entry::update(unsigned MBBNum) {
12591cbcaf9SJakob Stoklund Olesen   SlotIndex Start, Stop;
126d6f1f84fSBenjamin Kramer   std::tie(Start, Stop) = Indexes->getMBBRange(MBBNum);
12791cbcaf9SJakob Stoklund Olesen 
12891cbcaf9SJakob Stoklund Olesen   // Use advanceTo only when possible.
129994c1683SJakob Stoklund Olesen   if (PrevPos != Start) {
13096eebf0bSJakob Stoklund Olesen     if (!PrevPos.isValid() || Start < PrevPos) {
13196eebf0bSJakob Stoklund Olesen       for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
13296eebf0bSJakob Stoklund Olesen         RegUnitInfo &RUI = RegUnits[i];
13396eebf0bSJakob Stoklund Olesen         RUI.VirtI.find(Start);
13496eebf0bSJakob Stoklund Olesen         RUI.FixedI = RUI.Fixed->find(Start);
13596eebf0bSJakob Stoklund Olesen       }
13696eebf0bSJakob Stoklund Olesen     } else {
13796eebf0bSJakob Stoklund Olesen       for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
13896eebf0bSJakob Stoklund Olesen         RegUnitInfo &RUI = RegUnits[i];
13996eebf0bSJakob Stoklund Olesen         RUI.VirtI.advanceTo(Start);
14096eebf0bSJakob Stoklund Olesen         if (RUI.FixedI != RUI.Fixed->end())
14196eebf0bSJakob Stoklund Olesen           RUI.FixedI = RUI.Fixed->advanceTo(RUI.FixedI, Start);
14296eebf0bSJakob Stoklund Olesen       }
14396eebf0bSJakob Stoklund Olesen     }
14491cbcaf9SJakob Stoklund Olesen     PrevPos = Start;
145994c1683SJakob Stoklund Olesen   }
14691cbcaf9SJakob Stoklund Olesen 
147*5ae5939fSDuncan P. N. Exon Smith   MachineFunction::const_iterator MFI =
148*5ae5939fSDuncan P. N. Exon Smith       MF->getBlockNumbered(MBBNum)->getIterator();
1494ad6c160SJakob Stoklund Olesen   BlockInterference *BI = &Blocks[MBBNum];
150a16ae597SJakob Stoklund Olesen   ArrayRef<SlotIndex> RegMaskSlots;
151a16ae597SJakob Stoklund Olesen   ArrayRef<const uint32_t*> RegMaskBits;
1524ad6c160SJakob Stoklund Olesen   for (;;) {
1534ad6c160SJakob Stoklund Olesen     BI->Tag = Tag;
1544ad6c160SJakob Stoklund Olesen     BI->First = BI->Last = SlotIndex();
1554ad6c160SJakob Stoklund Olesen 
15696eebf0bSJakob Stoklund Olesen     // Check for first interference from virtregs.
15796eebf0bSJakob Stoklund Olesen     for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
15896eebf0bSJakob Stoklund Olesen       LiveIntervalUnion::SegmentIter &I = RegUnits[i].VirtI;
15991cbcaf9SJakob Stoklund Olesen       if (!I.valid())
16091cbcaf9SJakob Stoklund Olesen         continue;
16191cbcaf9SJakob Stoklund Olesen       SlotIndex StartI = I.start();
16291cbcaf9SJakob Stoklund Olesen       if (StartI >= Stop)
16391cbcaf9SJakob Stoklund Olesen         continue;
16491cbcaf9SJakob Stoklund Olesen       if (!BI->First.isValid() || StartI < BI->First)
16591cbcaf9SJakob Stoklund Olesen         BI->First = StartI;
16691cbcaf9SJakob Stoklund Olesen     }
16791cbcaf9SJakob Stoklund Olesen 
16896eebf0bSJakob Stoklund Olesen     // Same thing for fixed interference.
16996eebf0bSJakob Stoklund Olesen     for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
17096eebf0bSJakob Stoklund Olesen       LiveInterval::const_iterator I = RegUnits[i].FixedI;
17196eebf0bSJakob Stoklund Olesen       LiveInterval::const_iterator E = RegUnits[i].Fixed->end();
17296eebf0bSJakob Stoklund Olesen       if (I == E)
17396eebf0bSJakob Stoklund Olesen         continue;
17496eebf0bSJakob Stoklund Olesen       SlotIndex StartI = I->start;
17596eebf0bSJakob Stoklund Olesen       if (StartI >= Stop)
17696eebf0bSJakob Stoklund Olesen         continue;
17796eebf0bSJakob Stoklund Olesen       if (!BI->First.isValid() || StartI < BI->First)
17896eebf0bSJakob Stoklund Olesen         BI->First = StartI;
17996eebf0bSJakob Stoklund Olesen     }
18096eebf0bSJakob Stoklund Olesen 
181a16ae597SJakob Stoklund Olesen     // Also check for register mask interference.
182a16ae597SJakob Stoklund Olesen     RegMaskSlots = LIS->getRegMaskSlotsInBlock(MBBNum);
183a16ae597SJakob Stoklund Olesen     RegMaskBits = LIS->getRegMaskBitsInBlock(MBBNum);
184a16ae597SJakob Stoklund Olesen     SlotIndex Limit = BI->First.isValid() ? BI->First : Stop;
185a16ae597SJakob Stoklund Olesen     for (unsigned i = 0, e = RegMaskSlots.size();
186a16ae597SJakob Stoklund Olesen          i != e && RegMaskSlots[i] < Limit; ++i)
187024d7ae1SJakob Stoklund Olesen       if (MachineOperand::clobbersPhysReg(RegMaskBits[i], PhysReg)) {
188a16ae597SJakob Stoklund Olesen         // Register mask i clobbers PhysReg before the LIU interference.
189a16ae597SJakob Stoklund Olesen         BI->First = RegMaskSlots[i];
190a16ae597SJakob Stoklund Olesen         break;
191a16ae597SJakob Stoklund Olesen       }
192a16ae597SJakob Stoklund Olesen 
1934ad6c160SJakob Stoklund Olesen     PrevPos = Stop;
1944ad6c160SJakob Stoklund Olesen     if (BI->First.isValid())
1954ad6c160SJakob Stoklund Olesen       break;
19691cbcaf9SJakob Stoklund Olesen 
1974ad6c160SJakob Stoklund Olesen     // No interference in this block? Go ahead and precompute the next block.
1984ad6c160SJakob Stoklund Olesen     if (++MFI == MF->end())
1994ad6c160SJakob Stoklund Olesen       return;
2004ad6c160SJakob Stoklund Olesen     MBBNum = MFI->getNumber();
2014ad6c160SJakob Stoklund Olesen     BI = &Blocks[MBBNum];
2024ad6c160SJakob Stoklund Olesen     if (BI->Tag == Tag)
2034ad6c160SJakob Stoklund Olesen       return;
204d6f1f84fSBenjamin Kramer     std::tie(Start, Stop) = Indexes->getMBBRange(MBBNum);
2054ad6c160SJakob Stoklund Olesen   }
2064ad6c160SJakob Stoklund Olesen 
2074ad6c160SJakob Stoklund Olesen   // Check for last interference in block.
20896eebf0bSJakob Stoklund Olesen   for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
20996eebf0bSJakob Stoklund Olesen     LiveIntervalUnion::SegmentIter &I = RegUnits[i].VirtI;
21091cbcaf9SJakob Stoklund Olesen     if (!I.valid() || I.start() >= Stop)
21191cbcaf9SJakob Stoklund Olesen       continue;
21291cbcaf9SJakob Stoklund Olesen     I.advanceTo(Stop);
213994c1683SJakob Stoklund Olesen     bool Backup = !I.valid() || I.start() >= Stop;
214994c1683SJakob Stoklund Olesen     if (Backup)
21591cbcaf9SJakob Stoklund Olesen       --I;
21691cbcaf9SJakob Stoklund Olesen     SlotIndex StopI = I.stop();
21791cbcaf9SJakob Stoklund Olesen     if (!BI->Last.isValid() || StopI > BI->Last)
21891cbcaf9SJakob Stoklund Olesen       BI->Last = StopI;
219994c1683SJakob Stoklund Olesen     if (Backup)
220994c1683SJakob Stoklund Olesen       ++I;
22191cbcaf9SJakob Stoklund Olesen   }
222a16ae597SJakob Stoklund Olesen 
22396eebf0bSJakob Stoklund Olesen   // Fixed interference.
22496eebf0bSJakob Stoklund Olesen   for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
22596eebf0bSJakob Stoklund Olesen     LiveInterval::iterator &I = RegUnits[i].FixedI;
22634e1be94SMatthias Braun     LiveRange *LR = RegUnits[i].Fixed;
22734e1be94SMatthias Braun     if (I == LR->end() || I->start >= Stop)
22896eebf0bSJakob Stoklund Olesen       continue;
22934e1be94SMatthias Braun     I = LR->advanceTo(I, Stop);
23034e1be94SMatthias Braun     bool Backup = I == LR->end() || I->start >= Stop;
23196eebf0bSJakob Stoklund Olesen     if (Backup)
23296eebf0bSJakob Stoklund Olesen       --I;
23396eebf0bSJakob Stoklund Olesen     SlotIndex StopI = I->end;
23496eebf0bSJakob Stoklund Olesen     if (!BI->Last.isValid() || StopI > BI->Last)
23596eebf0bSJakob Stoklund Olesen       BI->Last = StopI;
23696eebf0bSJakob Stoklund Olesen     if (Backup)
23796eebf0bSJakob Stoklund Olesen       ++I;
23896eebf0bSJakob Stoklund Olesen   }
23996eebf0bSJakob Stoklund Olesen 
240a16ae597SJakob Stoklund Olesen   // Also check for register mask interference.
241a16ae597SJakob Stoklund Olesen   SlotIndex Limit = BI->Last.isValid() ? BI->Last : Start;
242c4cf13f7SJakob Stoklund Olesen   for (unsigned i = RegMaskSlots.size();
243c4cf13f7SJakob Stoklund Olesen        i && RegMaskSlots[i-1].getDeadSlot() > Limit; --i)
244024d7ae1SJakob Stoklund Olesen     if (MachineOperand::clobbersPhysReg(RegMaskBits[i-1], PhysReg)) {
245a16ae597SJakob Stoklund Olesen       // Register mask i-1 clobbers PhysReg after the LIU interference.
246a16ae597SJakob Stoklund Olesen       // Model the regmask clobber as a dead def.
247a16ae597SJakob Stoklund Olesen       BI->Last = RegMaskSlots[i-1].getDeadSlot();
248a16ae597SJakob Stoklund Olesen       break;
249a16ae597SJakob Stoklund Olesen     }
25091cbcaf9SJakob Stoklund Olesen }
251