1 //===- DFAPacketizerEmitter.cpp - Packetization DFA for a VLIW machine ----===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This class parses the Schedule.td file and produces an API that can be used
11 // to reason about whether an instruction can be added to a packet on a VLIW
12 // architecture. The class internally generates a deterministic finite
13 // automaton (DFA) that models all possible mappings of machine instructions
14 // to functional units as instructions are added to a packet.
15 //
16 //===----------------------------------------------------------------------===//
17 
18 #define DEBUG_TYPE "dfa-emitter"
19 
20 #include "CodeGenTarget.h"
21 #include "llvm/ADT/DenseSet.h"
22 #include "llvm/ADT/STLExtras.h"
23 #include "llvm/ADT/StringExtras.h"
24 #include "llvm/TableGen/Record.h"
25 #include "llvm/TableGen/TableGenBackend.h"
26 #include "llvm/Support/Debug.h"
27 #include <map>
28 #include <string>
29 #include <queue>
30 
31 using namespace llvm;
32 
33 // --------------------------------------------------------------------
34 // Definitions shared between DFAPacketizer.cpp and DFAPacketizerEmitter.cpp
35 
36 // DFA_MAX_RESTERMS * DFA_MAX_RESOURCES must fit within sizeof DFAInput.
37 // This is verified in DFAPacketizer.cpp:DFAPacketizer::DFAPacketizer.
38 //
39 // e.g. terms x resource bit combinations that fit in uint32_t:
40 //      4 terms x 8  bits = 32 bits
41 //      3 terms x 10 bits = 30 bits
42 //      2 terms x 16 bits = 32 bits
43 //
44 // e.g. terms x resource bit combinations that fit in uint64_t:
45 //      8 terms x 8  bits = 64 bits
46 //      7 terms x 9  bits = 63 bits
47 //      6 terms x 10 bits = 60 bits
48 //      5 terms x 12 bits = 60 bits
49 //      4 terms x 16 bits = 64 bits <--- current
50 //      3 terms x 21 bits = 63 bits
51 //      2 terms x 32 bits = 64 bits
52 //
53 #define DFA_MAX_RESTERMS        4   // The max # of AND'ed resource terms.
54 #define DFA_MAX_RESOURCES       16  // The max # of resource bits in one term.
55 
56 typedef uint64_t                DFAInput;
57 typedef int64_t                 DFAStateInput;
58 #define DFA_TBLTYPE             "int64_t" // For generating DFAStateInputTable.
59 
60 namespace {
addDFAFuncUnits(DFAInput Inp,unsigned FuncUnits)61   DFAInput addDFAFuncUnits(DFAInput Inp, unsigned FuncUnits) {
62     return (Inp << DFA_MAX_RESOURCES) | FuncUnits;
63   }
64 
65   /// Return the DFAInput for an instruction class input vector.
66   /// This function is used in both DFAPacketizer.cpp and in
67   /// DFAPacketizerEmitter.cpp.
getDFAInsnInput(const std::vector<unsigned> & InsnClass)68   DFAInput getDFAInsnInput(const std::vector<unsigned> &InsnClass) {
69     DFAInput InsnInput = 0;
70     assert ((InsnClass.size() <= DFA_MAX_RESTERMS) &&
71             "Exceeded maximum number of DFA terms");
72     for (auto U : InsnClass)
73       InsnInput = addDFAFuncUnits(InsnInput, U);
74     return InsnInput;
75   }
76 } // end anonymous namespace
77 
78 // --------------------------------------------------------------------
79 
80 #ifndef NDEBUG
81 // To enable debugging, run llvm-tblgen with: "-debug-only dfa-emitter".
82 //
83 // dbgsInsnClass - When debugging, print instruction class stages.
84 //
85 void dbgsInsnClass(const std::vector<unsigned> &InsnClass);
86 //
87 // dbgsStateInfo - When debugging, print the set of state info.
88 //
89 void dbgsStateInfo(const std::set<unsigned> &stateInfo);
90 //
91 // dbgsIndent - When debugging, indent by the specified amount.
92 //
93 void dbgsIndent(unsigned indent);
94 #endif
95 
96 //
97 // class DFAPacketizerEmitter: class that generates and prints out the DFA
98 // for resource tracking.
99 //
100 namespace {
101 class DFAPacketizerEmitter {
102 private:
103   std::string TargetName;
104   //
105   // allInsnClasses is the set of all possible resources consumed by an
106   // InstrStage.
107   //
108   std::vector<std::vector<unsigned>> allInsnClasses;
109   RecordKeeper &Records;
110 
111 public:
112   DFAPacketizerEmitter(RecordKeeper &R);
113 
114   //
115   // collectAllFuncUnits - Construct a map of function unit names to bits.
116   //
117   int collectAllFuncUnits(std::vector<Record*> &ProcItinList,
118                            std::map<std::string, unsigned> &FUNameToBitsMap,
119                            int &maxResources,
120                            raw_ostream &OS);
121 
122   //
123   // collectAllComboFuncs - Construct a map from a combo function unit bit to
124   //                        the bits of all included functional units.
125   //
126   int collectAllComboFuncs(std::vector<Record*> &ComboFuncList,
127                            std::map<std::string, unsigned> &FUNameToBitsMap,
128                            std::map<unsigned, unsigned> &ComboBitToBitsMap,
129                            raw_ostream &OS);
130 
131   //
132   // collectOneInsnClass - Populate allInsnClasses with one instruction class.
133   //
134   int collectOneInsnClass(const std::string &ProcName,
135                            std::vector<Record*> &ProcItinList,
136                            std::map<std::string, unsigned> &FUNameToBitsMap,
137                            Record *ItinData,
138                            raw_ostream &OS);
139 
140   //
141   // collectAllInsnClasses - Populate allInsnClasses which is a set of units
142   // used in each stage.
143   //
144   int collectAllInsnClasses(const std::string &ProcName,
145                            std::vector<Record*> &ProcItinList,
146                            std::map<std::string, unsigned> &FUNameToBitsMap,
147                            std::vector<Record*> &ItinDataList,
148                            int &maxStages,
149                            raw_ostream &OS);
150 
151   void run(raw_ostream &OS);
152 };
153 } // end anonymous namespace
154 
155 //
156 //
157 // State represents the usage of machine resources if the packet contains
158 // a set of instruction classes.
159 //
160 // Specifically, currentState is a set of bit-masks.
161 // The nth bit in a bit-mask indicates whether the nth resource is being used
162 // by this state. The set of bit-masks in a state represent the different
163 // possible outcomes of transitioning to this state.
164 // For example: consider a two resource architecture: resource L and resource M
165 // with three instruction classes: L, M, and L_or_M.
166 // From the initial state (currentState = 0x00), if we add instruction class
167 // L_or_M we will transition to a state with currentState = [0x01, 0x10]. This
168 // represents the possible resource states that can result from adding a L_or_M
169 // instruction
170 //
171 // Another way of thinking about this transition is we are mapping a NDFA with
172 // two states [0x01] and [0x10] into a DFA with a single state [0x01, 0x10].
173 //
174 // A State instance also contains a collection of transitions from that state:
175 // a map from inputs to new states.
176 //
177 namespace {
178 class State {
179  public:
180   static int currentStateNum;
181   // stateNum is the only member used for equality/ordering, all other members
182   // can be mutated even in const State objects.
183   const int stateNum;
184   mutable bool isInitial;
185   mutable std::set<unsigned> stateInfo;
186   typedef std::map<std::vector<unsigned>, const State *> TransitionMap;
187   mutable TransitionMap Transitions;
188 
189   State();
190 
operator <(const State & s) const191   bool operator<(const State &s) const {
192     return stateNum < s.stateNum;
193   }
194 
195   //
196   // canMaybeAddInsnClass - Quickly verifies if an instruction of type InsnClass
197   // may be a valid transition from this state i.e., can an instruction of type
198   // InsnClass be added to the packet represented by this state.
199   //
200   // Note that for multiple stages, this quick check does not take into account
201   // any possible resource competition between the stages themselves.  That is
202   // enforced in AddInsnClassStages which checks the cross product of all
203   // stages for resource availability (which is a more involved check).
204   //
205   bool canMaybeAddInsnClass(std::vector<unsigned> &InsnClass,
206                         std::map<unsigned, unsigned> &ComboBitToBitsMap) const;
207   //
208   // AddInsnClass - Return all combinations of resource reservation
209   // which are possible from this state (PossibleStates).
210   //
211   // PossibleStates is the set of valid resource states that ensue from valid
212   // transitions.
213   //
214   void AddInsnClass(std::vector<unsigned> &InsnClass,
215                         std::map<unsigned, unsigned> &ComboBitToBitsMap,
216                         std::set<unsigned> &PossibleStates) const;
217   //
218   // AddInsnClassStages - Return all combinations of resource reservation
219   // resulting from the cross product of all stages for this InsnClass
220   // which are possible from this state (PossibleStates).
221   //
222   void AddInsnClassStages(std::vector<unsigned> &InsnClass,
223                         std::map<unsigned, unsigned> &ComboBitToBitsMap,
224                         unsigned chkstage, unsigned numstages,
225                         unsigned prevState, unsigned origState,
226                         DenseSet<unsigned> &VisitedResourceStates,
227                         std::set<unsigned> &PossibleStates) const;
228   //
229   // addTransition - Add a transition from this state given the input InsnClass
230   //
231   void addTransition(std::vector<unsigned> InsnClass, const State *To) const;
232   //
233   // hasTransition - Returns true if there is a transition from this state
234   // given the input InsnClass
235   //
236   bool hasTransition(std::vector<unsigned> InsnClass) const;
237 };
238 } // end anonymous namespace
239 
240 //
241 // class DFA: deterministic finite automaton for processor resource tracking.
242 //
243 namespace {
244 class DFA {
245 public:
246   DFA();
247 
248   // Set of states. Need to keep this sorted to emit the transition table.
249   typedef std::set<State> StateSet;
250   StateSet states;
251 
252   State *currentState;
253 
254   //
255   // Modify the DFA.
256   //
257   const State &newState();
258 
259   //
260   // writeTable: Print out a table representing the DFA.
261   //
262   void writeTableAndAPI(raw_ostream &OS, const std::string &ClassName,
263                  int numInsnClasses = 0,
264                  int maxResources = 0, int numCombos = 0, int maxStages = 0);
265 };
266 } // end anonymous namespace
267 
268 #ifndef NDEBUG
269 // To enable debugging, run llvm-tblgen with: "-debug-only dfa-emitter".
270 //
271 // dbgsInsnClass - When debugging, print instruction class stages.
272 //
dbgsInsnClass(const std::vector<unsigned> & InsnClass)273 void dbgsInsnClass(const std::vector<unsigned> &InsnClass) {
274   DEBUG(dbgs() << "InsnClass: ");
275   for (unsigned i = 0; i < InsnClass.size(); ++i) {
276     if (i > 0) {
277       DEBUG(dbgs() << ", ");
278     }
279     DEBUG(dbgs() << "0x" << utohexstr(InsnClass[i]));
280   }
281   DFAInput InsnInput = getDFAInsnInput(InsnClass);
282   DEBUG(dbgs() << " (input: 0x" << utohexstr(InsnInput) << ")");
283 }
284 
285 //
286 // dbgsStateInfo - When debugging, print the set of state info.
287 //
dbgsStateInfo(const std::set<unsigned> & stateInfo)288 void dbgsStateInfo(const std::set<unsigned> &stateInfo) {
289   DEBUG(dbgs() << "StateInfo: ");
290   unsigned i = 0;
291   for (std::set<unsigned>::iterator SI = stateInfo.begin();
292        SI != stateInfo.end(); ++SI, ++i) {
293     unsigned thisState = *SI;
294     if (i > 0) {
295       DEBUG(dbgs() << ", ");
296     }
297     DEBUG(dbgs() << "0x" << utohexstr(thisState));
298   }
299 }
300 
301 //
302 // dbgsIndent - When debugging, indent by the specified amount.
303 //
dbgsIndent(unsigned indent)304 void dbgsIndent(unsigned indent) {
305   for (unsigned i = 0; i < indent; ++i) {
306     DEBUG(dbgs() << " ");
307   }
308 }
309 #endif // NDEBUG
310 
311 //
312 // Constructors and destructors for State and DFA
313 //
State()314 State::State() :
315   stateNum(currentStateNum++), isInitial(false) {}
316 
DFA()317 DFA::DFA(): currentState(nullptr) {}
318 
319 //
320 // addTransition - Add a transition from this state given the input InsnClass
321 //
addTransition(std::vector<unsigned> InsnClass,const State * To) const322 void State::addTransition(std::vector<unsigned> InsnClass, const State *To)
323       const {
324   assert(!Transitions.count(InsnClass) &&
325       "Cannot have multiple transitions for the same input");
326   Transitions[InsnClass] = To;
327 }
328 
329 //
330 // hasTransition - Returns true if there is a transition from this state
331 // given the input InsnClass
332 //
hasTransition(std::vector<unsigned> InsnClass) const333 bool State::hasTransition(std::vector<unsigned> InsnClass) const {
334   return Transitions.count(InsnClass) > 0;
335 }
336 
337 //
338 // AddInsnClass - Return all combinations of resource reservation
339 // which are possible from this state (PossibleStates).
340 //
341 // PossibleStates is the set of valid resource states that ensue from valid
342 // transitions.
343 //
AddInsnClass(std::vector<unsigned> & InsnClass,std::map<unsigned,unsigned> & ComboBitToBitsMap,std::set<unsigned> & PossibleStates) const344 void State::AddInsnClass(std::vector<unsigned> &InsnClass,
345                         std::map<unsigned, unsigned> &ComboBitToBitsMap,
346                         std::set<unsigned> &PossibleStates) const {
347   //
348   // Iterate over all resource states in currentState.
349   //
350   unsigned numstages = InsnClass.size();
351   assert((numstages > 0) && "InsnClass has no stages");
352 
353   for (std::set<unsigned>::iterator SI = stateInfo.begin();
354        SI != stateInfo.end(); ++SI) {
355     unsigned thisState = *SI;
356 
357     DenseSet<unsigned> VisitedResourceStates;
358 
359     DEBUG(dbgs() << "  thisState: 0x" << utohexstr(thisState) << "\n");
360     AddInsnClassStages(InsnClass, ComboBitToBitsMap,
361                                 numstages - 1, numstages,
362                                 thisState, thisState,
363                                 VisitedResourceStates, PossibleStates);
364   }
365 }
366 
AddInsnClassStages(std::vector<unsigned> & InsnClass,std::map<unsigned,unsigned> & ComboBitToBitsMap,unsigned chkstage,unsigned numstages,unsigned prevState,unsigned origState,DenseSet<unsigned> & VisitedResourceStates,std::set<unsigned> & PossibleStates) const367 void State::AddInsnClassStages(std::vector<unsigned> &InsnClass,
368                         std::map<unsigned, unsigned> &ComboBitToBitsMap,
369                         unsigned chkstage, unsigned numstages,
370                         unsigned prevState, unsigned origState,
371                         DenseSet<unsigned> &VisitedResourceStates,
372                         std::set<unsigned> &PossibleStates) const {
373 
374   assert((chkstage < numstages) && "AddInsnClassStages: stage out of range");
375   unsigned thisStage = InsnClass[chkstage];
376 
377   DEBUG({
378     dbgsIndent((1 + numstages - chkstage) << 1);
379     dbgs() << "AddInsnClassStages " << chkstage << " (0x"
380            << utohexstr(thisStage) << ") from ";
381     dbgsInsnClass(InsnClass);
382     dbgs() << "\n";
383   });
384 
385   //
386   // Iterate over all possible resources used in thisStage.
387   // For ex: for thisStage = 0x11, all resources = {0x01, 0x10}.
388   //
389   for (unsigned int j = 0; j < DFA_MAX_RESOURCES; ++j) {
390     unsigned resourceMask = (0x1 << j);
391     if (resourceMask & thisStage) {
392       unsigned combo = ComboBitToBitsMap[resourceMask];
393       if (combo && ((~prevState & combo) != combo)) {
394         DEBUG(dbgs() << "\tSkipped Add 0x" << utohexstr(prevState)
395                      << " - combo op 0x" << utohexstr(resourceMask)
396                      << " (0x" << utohexstr(combo) <<") cannot be scheduled\n");
397         continue;
398       }
399       //
400       // For each possible resource used in thisStage, generate the
401       // resource state if that resource was used.
402       //
403       unsigned ResultingResourceState = prevState | resourceMask | combo;
404       DEBUG({
405         dbgsIndent((2 + numstages - chkstage) << 1);
406         dbgs() << "0x" << utohexstr(prevState)
407                << " | 0x" << utohexstr(resourceMask);
408         if (combo)
409           dbgs() << " | 0x" << utohexstr(combo);
410         dbgs() << " = 0x" << utohexstr(ResultingResourceState) << " ";
411       });
412 
413       //
414       // If this is the final stage for this class
415       //
416       if (chkstage == 0) {
417         //
418         // Check if the resulting resource state can be accommodated in this
419         // packet.
420         // We compute resource OR prevState (originally started as origState).
421         // If the result of the OR is different than origState, it implies
422         // that there is at least one resource that can be used to schedule
423         // thisStage in the current packet.
424         // Insert ResultingResourceState into PossibleStates only if we haven't
425         // processed ResultingResourceState before.
426         //
427         if (ResultingResourceState != prevState) {
428           if (VisitedResourceStates.count(ResultingResourceState) == 0) {
429             VisitedResourceStates.insert(ResultingResourceState);
430             PossibleStates.insert(ResultingResourceState);
431             DEBUG(dbgs() << "\tResultingResourceState: 0x"
432                          << utohexstr(ResultingResourceState) << "\n");
433           } else {
434             DEBUG(dbgs() << "\tSkipped Add - state already seen\n");
435           }
436         } else {
437           DEBUG(dbgs() << "\tSkipped Add - no final resources available\n");
438         }
439       } else {
440         //
441         // If the current resource can be accommodated, check the next
442         // stage in InsnClass for available resources.
443         //
444         if (ResultingResourceState != prevState) {
445           DEBUG(dbgs() << "\n");
446           AddInsnClassStages(InsnClass, ComboBitToBitsMap,
447                                 chkstage - 1, numstages,
448                                 ResultingResourceState, origState,
449                                 VisitedResourceStates, PossibleStates);
450         } else {
451           DEBUG(dbgs() << "\tSkipped Add - no resources available\n");
452         }
453       }
454     }
455   }
456 }
457 
458 //
459 // canMaybeAddInsnClass - Quickly verifies if an instruction of type InsnClass
460 // may be a valid transition from this state i.e., can an instruction of type
461 // InsnClass be added to the packet represented by this state.
462 //
463 // Note that this routine is performing conservative checks that can be
464 // quickly executed acting as a filter before calling AddInsnClassStages.
465 // Any cases allowed through here will be caught later in AddInsnClassStages
466 // which performs the more expensive exact check.
467 //
canMaybeAddInsnClass(std::vector<unsigned> & InsnClass,std::map<unsigned,unsigned> & ComboBitToBitsMap) const468 bool State::canMaybeAddInsnClass(std::vector<unsigned> &InsnClass,
469                     std::map<unsigned, unsigned> &ComboBitToBitsMap) const {
470   for (std::set<unsigned>::const_iterator SI = stateInfo.begin();
471        SI != stateInfo.end(); ++SI) {
472 
473     // Check to see if all required resources are available.
474     bool available = true;
475 
476     // Inspect each stage independently.
477     // note: This is a conservative check as we aren't checking for
478     //       possible resource competition between the stages themselves
479     //       The full cross product is examined later in AddInsnClass.
480     for (unsigned i = 0; i < InsnClass.size(); ++i) {
481       unsigned resources = *SI;
482       if ((~resources & InsnClass[i]) == 0) {
483         available = false;
484         break;
485       }
486       // Make sure _all_ resources for a combo function are available.
487       // note: This is a quick conservative check as it won't catch an
488       //       unscheduleable combo if this stage is an OR expression
489       //       containing a combo.
490       //       These cases are caught later in AddInsnClass.
491       unsigned combo = ComboBitToBitsMap[InsnClass[i]];
492       if (combo && ((~resources & combo) != combo)) {
493         DEBUG(dbgs() << "\tSkipped canMaybeAdd 0x" << utohexstr(resources)
494                      << " - combo op 0x" << utohexstr(InsnClass[i])
495                      << " (0x" << utohexstr(combo) <<") cannot be scheduled\n");
496         available = false;
497         break;
498       }
499     }
500 
501     if (available) {
502       return true;
503     }
504   }
505   return false;
506 }
507 
newState()508 const State &DFA::newState() {
509   auto IterPair = states.insert(State());
510   assert(IterPair.second && "State already exists");
511   return *IterPair.first;
512 }
513 
514 int State::currentStateNum = 0;
515 
DFAPacketizerEmitter(RecordKeeper & R)516 DFAPacketizerEmitter::DFAPacketizerEmitter(RecordKeeper &R):
517   TargetName(CodeGenTarget(R).getName()),
518   allInsnClasses(), Records(R) {}
519 
520 //
521 // writeTableAndAPI - Print out a table representing the DFA and the
522 // associated API to create a DFA packetizer.
523 //
524 // Format:
525 // DFAStateInputTable[][2] = pairs of <Input, Transition> for all valid
526 //                           transitions.
527 // DFAStateEntryTable[i] = Index of the first entry in DFAStateInputTable for
528 //                         the ith state.
529 //
530 //
writeTableAndAPI(raw_ostream & OS,const std::string & TargetName,int numInsnClasses,int maxResources,int numCombos,int maxStages)531 void DFA::writeTableAndAPI(raw_ostream &OS, const std::string &TargetName,
532                            int numInsnClasses,
533                            int maxResources, int numCombos, int maxStages) {
534 
535   unsigned numStates = states.size();
536 
537   DEBUG(dbgs() << "-----------------------------------------------------------------------------\n");
538   DEBUG(dbgs() << "writeTableAndAPI\n");
539   DEBUG(dbgs() << "Total states: " << numStates << "\n");
540 
541   OS << "namespace llvm {\n";
542 
543   OS << "\n// Input format:\n";
544   OS << "#define DFA_MAX_RESTERMS        " << DFA_MAX_RESTERMS
545      << "\t// maximum AND'ed resource terms\n";
546   OS << "#define DFA_MAX_RESOURCES       " << DFA_MAX_RESOURCES
547      << "\t// maximum resource bits in one term\n";
548 
549   OS << "\n// " << TargetName << "DFAStateInputTable[][2] = "
550      << "pairs of <Input, NextState> for all valid\n";
551   OS << "//                           transitions.\n";
552   OS << "// " << numStates << "\tstates\n";
553   OS << "// " << numInsnClasses << "\tinstruction classes\n";
554   OS << "// " << maxResources << "\tresources max\n";
555   OS << "// " << numCombos << "\tcombo resources\n";
556   OS << "// " << maxStages << "\tstages max\n";
557   OS << "const " << DFA_TBLTYPE << " "
558      << TargetName << "DFAStateInputTable[][2] = {\n";
559 
560   // This table provides a map to the beginning of the transitions for State s
561   // in DFAStateInputTable.
562   std::vector<int> StateEntry(numStates+1);
563   static const std::string SentinelEntry = "{-1, -1}";
564 
565   // Tracks the total valid transitions encountered so far. It is used
566   // to construct the StateEntry table.
567   int ValidTransitions = 0;
568   DFA::StateSet::iterator SI = states.begin();
569   for (unsigned i = 0; i < numStates; ++i, ++SI) {
570     assert ((SI->stateNum == (int) i) && "Mismatch in state numbers");
571     StateEntry[i] = ValidTransitions;
572     for (State::TransitionMap::iterator
573         II = SI->Transitions.begin(), IE = SI->Transitions.end();
574         II != IE; ++II) {
575       OS << "{0x" << utohexstr(getDFAInsnInput(II->first)) << ", "
576          << II->second->stateNum
577          << "},\t";
578     }
579     ValidTransitions += SI->Transitions.size();
580 
581     // If there are no valid transitions from this stage, we need a sentinel
582     // transition.
583     if (ValidTransitions == StateEntry[i]) {
584       OS << SentinelEntry << ",\t";
585       ++ValidTransitions;
586     }
587 
588     OS << " // state " << i << ": " << StateEntry[i];
589     if (StateEntry[i] != (ValidTransitions-1)) {   // More than one transition.
590        OS << "-" << (ValidTransitions-1);
591     }
592     OS << "\n";
593   }
594 
595   // Print out a sentinel entry at the end of the StateInputTable. This is
596   // needed to iterate over StateInputTable in DFAPacketizer::ReadTable()
597   OS << SentinelEntry << "\t";
598   OS << " // state " << numStates << ": " << ValidTransitions;
599   OS << "\n";
600 
601   OS << "};\n\n";
602   OS << "// " << TargetName << "DFAStateEntryTable[i] = "
603      << "Index of the first entry in DFAStateInputTable for\n";
604   OS << "//                         "
605      << "the ith state.\n";
606   OS << "// " << numStates << " states\n";
607   OS << "const unsigned int " << TargetName << "DFAStateEntryTable[] = {\n";
608 
609   // Multiply i by 2 since each entry in DFAStateInputTable is a set of
610   // two numbers.
611   unsigned lastState = 0;
612   for (unsigned i = 0; i < numStates; ++i) {
613     if (i && ((i % 10) == 0)) {
614         lastState = i-1;
615         OS << "   // states " << (i-10) << ":" << lastState << "\n";
616     }
617     OS << StateEntry[i] << ", ";
618   }
619 
620   // Print out the index to the sentinel entry in StateInputTable
621   OS << ValidTransitions << ", ";
622   OS << "   // states " << (lastState+1) << ":" << numStates << "\n";
623 
624   OS << "};\n";
625   OS << "} // namespace\n";
626 
627   //
628   // Emit DFA Packetizer tables if the target is a VLIW machine.
629   //
630   std::string SubTargetClassName = TargetName + "GenSubtargetInfo";
631   OS << "\n" << "#include \"llvm/CodeGen/DFAPacketizer.h\"\n";
632   OS << "namespace llvm {\n";
633   OS << "DFAPacketizer *" << SubTargetClassName << "::"
634      << "createDFAPacketizer(const InstrItineraryData *IID) const {\n"
635      << "   return new DFAPacketizer(IID, " << TargetName
636      << "DFAStateInputTable, " << TargetName << "DFAStateEntryTable);\n}\n\n";
637   OS << "} // End llvm namespace \n";
638 }
639 
640 //
641 // collectAllFuncUnits - Construct a map of function unit names to bits.
642 //
collectAllFuncUnits(std::vector<Record * > & ProcItinList,std::map<std::string,unsigned> & FUNameToBitsMap,int & maxFUs,raw_ostream & OS)643 int DFAPacketizerEmitter::collectAllFuncUnits(
644                             std::vector<Record*> &ProcItinList,
645                             std::map<std::string, unsigned> &FUNameToBitsMap,
646                             int &maxFUs,
647                             raw_ostream &OS) {
648   DEBUG(dbgs() << "-----------------------------------------------------------------------------\n");
649   DEBUG(dbgs() << "collectAllFuncUnits");
650   DEBUG(dbgs() << " (" << ProcItinList.size() << " itineraries)\n");
651 
652   int totalFUs = 0;
653   // Parse functional units for all the itineraries.
654   for (unsigned i = 0, N = ProcItinList.size(); i < N; ++i) {
655     Record *Proc = ProcItinList[i];
656     std::vector<Record*> FUs = Proc->getValueAsListOfDefs("FU");
657 
658     DEBUG(dbgs() << "    FU:" << i
659                  << " (" << FUs.size() << " FUs) "
660                  << Proc->getName());
661 
662 
663     // Convert macros to bits for each stage.
664     unsigned numFUs = FUs.size();
665     for (unsigned j = 0; j < numFUs; ++j) {
666       assert ((j < DFA_MAX_RESOURCES) &&
667                       "Exceeded maximum number of representable resources");
668       unsigned FuncResources = (unsigned) (1U << j);
669       FUNameToBitsMap[FUs[j]->getName()] = FuncResources;
670       DEBUG(dbgs() << " " << FUs[j]->getName()
671                    << ":0x" << utohexstr(FuncResources));
672     }
673     if (((int) numFUs) > maxFUs) {
674       maxFUs = numFUs;
675     }
676     totalFUs += numFUs;
677     DEBUG(dbgs() << "\n");
678   }
679   return totalFUs;
680 }
681 
682 //
683 // collectAllComboFuncs - Construct a map from a combo function unit bit to
684 //                        the bits of all included functional units.
685 //
collectAllComboFuncs(std::vector<Record * > & ComboFuncList,std::map<std::string,unsigned> & FUNameToBitsMap,std::map<unsigned,unsigned> & ComboBitToBitsMap,raw_ostream & OS)686 int DFAPacketizerEmitter::collectAllComboFuncs(
687                             std::vector<Record*> &ComboFuncList,
688                             std::map<std::string, unsigned> &FUNameToBitsMap,
689                             std::map<unsigned, unsigned> &ComboBitToBitsMap,
690                             raw_ostream &OS) {
691   DEBUG(dbgs() << "-----------------------------------------------------------------------------\n");
692   DEBUG(dbgs() << "collectAllComboFuncs");
693   DEBUG(dbgs() << " (" << ComboFuncList.size() << " sets)\n");
694 
695   int numCombos = 0;
696   for (unsigned i = 0, N = ComboFuncList.size(); i < N; ++i) {
697     Record *Func = ComboFuncList[i];
698     std::vector<Record*> FUs = Func->getValueAsListOfDefs("CFD");
699 
700     DEBUG(dbgs() << "    CFD:" << i
701                  << " (" << FUs.size() << " combo FUs) "
702                  << Func->getName() << "\n");
703 
704     // Convert macros to bits for each stage.
705     for (unsigned j = 0, N = FUs.size(); j < N; ++j) {
706       assert ((j < DFA_MAX_RESOURCES) &&
707                       "Exceeded maximum number of DFA resources");
708       Record *FuncData = FUs[j];
709       Record *ComboFunc = FuncData->getValueAsDef("TheComboFunc");
710       const std::vector<Record*> &FuncList =
711                                    FuncData->getValueAsListOfDefs("FuncList");
712       const std::string &ComboFuncName = ComboFunc->getName();
713       unsigned ComboBit = FUNameToBitsMap[ComboFuncName];
714       unsigned ComboResources = ComboBit;
715       DEBUG(dbgs() << "      combo: " << ComboFuncName
716                    << ":0x" << utohexstr(ComboResources) << "\n");
717       for (unsigned k = 0, M = FuncList.size(); k < M; ++k) {
718         std::string FuncName = FuncList[k]->getName();
719         unsigned FuncResources = FUNameToBitsMap[FuncName];
720         DEBUG(dbgs() << "        " << FuncName
721                      << ":0x" << utohexstr(FuncResources) << "\n");
722         ComboResources |= FuncResources;
723       }
724       ComboBitToBitsMap[ComboBit] = ComboResources;
725       numCombos++;
726       DEBUG(dbgs() << "          => combo bits: " << ComboFuncName << ":0x"
727                    << utohexstr(ComboBit) << " = 0x"
728                    << utohexstr(ComboResources) << "\n");
729     }
730   }
731   return numCombos;
732 }
733 
734 //
735 // collectOneInsnClass - Populate allInsnClasses with one instruction class
736 //
collectOneInsnClass(const std::string & ProcName,std::vector<Record * > & ProcItinList,std::map<std::string,unsigned> & FUNameToBitsMap,Record * ItinData,raw_ostream & OS)737 int DFAPacketizerEmitter::collectOneInsnClass(const std::string &ProcName,
738                         std::vector<Record*> &ProcItinList,
739                         std::map<std::string, unsigned> &FUNameToBitsMap,
740                         Record *ItinData,
741                         raw_ostream &OS) {
742   const std::vector<Record*> &StageList =
743     ItinData->getValueAsListOfDefs("Stages");
744 
745   // The number of stages.
746   unsigned NStages = StageList.size();
747 
748   DEBUG(dbgs() << "    " << ItinData->getValueAsDef("TheClass")->getName()
749                << "\n");
750 
751   std::vector<unsigned> UnitBits;
752 
753   // Compute the bitwise or of each unit used in this stage.
754   for (unsigned i = 0; i < NStages; ++i) {
755     const Record *Stage = StageList[i];
756 
757     // Get unit list.
758     const std::vector<Record*> &UnitList =
759       Stage->getValueAsListOfDefs("Units");
760 
761     DEBUG(dbgs() << "        stage:" << i
762                  << " [" << UnitList.size() << " units]:");
763     unsigned dbglen = 26;  // cursor after stage dbgs
764 
765     // Compute the bitwise or of each unit used in this stage.
766     unsigned UnitBitValue = 0;
767     for (unsigned j = 0, M = UnitList.size(); j < M; ++j) {
768       // Conduct bitwise or.
769       std::string UnitName = UnitList[j]->getName();
770       DEBUG(dbgs() << " " << j << ":" << UnitName);
771       dbglen += 3 + UnitName.length();
772       assert(FUNameToBitsMap.count(UnitName));
773       UnitBitValue |= FUNameToBitsMap[UnitName];
774     }
775 
776     if (UnitBitValue != 0)
777       UnitBits.push_back(UnitBitValue);
778 
779     while (dbglen <= 64) {   // line up bits dbgs
780         dbglen += 8;
781         DEBUG(dbgs() << "\t");
782     }
783     DEBUG(dbgs() << " (bits: 0x" << utohexstr(UnitBitValue) << ")\n");
784   }
785 
786   if (UnitBits.size() > 0)
787     allInsnClasses.push_back(UnitBits);
788 
789   DEBUG({
790     dbgs() << "        ";
791     dbgsInsnClass(UnitBits);
792     dbgs() << "\n";
793   });
794 
795   return NStages;
796 }
797 
798 //
799 // collectAllInsnClasses - Populate allInsnClasses which is a set of units
800 // used in each stage.
801 //
collectAllInsnClasses(const std::string & ProcName,std::vector<Record * > & ProcItinList,std::map<std::string,unsigned> & FUNameToBitsMap,std::vector<Record * > & ItinDataList,int & maxStages,raw_ostream & OS)802 int DFAPacketizerEmitter::collectAllInsnClasses(const std::string &ProcName,
803                             std::vector<Record*> &ProcItinList,
804                             std::map<std::string, unsigned> &FUNameToBitsMap,
805                             std::vector<Record*> &ItinDataList,
806                             int &maxStages,
807                             raw_ostream &OS) {
808   // Collect all instruction classes.
809   unsigned M = ItinDataList.size();
810 
811   int numInsnClasses = 0;
812   DEBUG(dbgs() << "-----------------------------------------------------------------------------\n"
813                << "collectAllInsnClasses "
814                << ProcName
815                << " (" << M << " classes)\n");
816 
817   // Collect stages for each instruction class for all itinerary data
818   for (unsigned j = 0; j < M; j++) {
819     Record *ItinData = ItinDataList[j];
820     int NStages = collectOneInsnClass(ProcName, ProcItinList,
821                                       FUNameToBitsMap, ItinData, OS);
822     if (NStages > maxStages) {
823       maxStages = NStages;
824     }
825     numInsnClasses++;
826   }
827   return numInsnClasses;
828 }
829 
830 //
831 // Run the worklist algorithm to generate the DFA.
832 //
run(raw_ostream & OS)833 void DFAPacketizerEmitter::run(raw_ostream &OS) {
834 
835   // Collect processor iteraries.
836   std::vector<Record*> ProcItinList =
837     Records.getAllDerivedDefinitions("ProcessorItineraries");
838 
839   //
840   // Collect the Functional units.
841   //
842   std::map<std::string, unsigned> FUNameToBitsMap;
843   int maxResources = 0;
844   collectAllFuncUnits(ProcItinList,
845                               FUNameToBitsMap, maxResources, OS);
846 
847   //
848   // Collect the Combo Functional units.
849   //
850   std::map<unsigned, unsigned> ComboBitToBitsMap;
851   std::vector<Record*> ComboFuncList =
852     Records.getAllDerivedDefinitions("ComboFuncUnits");
853   int numCombos = collectAllComboFuncs(ComboFuncList,
854                               FUNameToBitsMap, ComboBitToBitsMap, OS);
855 
856   //
857   // Collect the itineraries.
858   //
859   int maxStages = 0;
860   int numInsnClasses = 0;
861   for (unsigned i = 0, N = ProcItinList.size(); i < N; i++) {
862     Record *Proc = ProcItinList[i];
863 
864     // Get processor itinerary name.
865     const std::string &ProcName = Proc->getName();
866 
867     // Skip default.
868     if (ProcName == "NoItineraries")
869       continue;
870 
871     // Sanity check for at least one instruction itinerary class.
872     unsigned NItinClasses =
873       Records.getAllDerivedDefinitions("InstrItinClass").size();
874     if (NItinClasses == 0)
875       return;
876 
877     // Get itinerary data list.
878     std::vector<Record*> ItinDataList = Proc->getValueAsListOfDefs("IID");
879 
880     // Collect all instruction classes
881     numInsnClasses += collectAllInsnClasses(ProcName, ProcItinList,
882                           FUNameToBitsMap, ItinDataList, maxStages, OS);
883   }
884 
885   //
886   // Run a worklist algorithm to generate the DFA.
887   //
888   DFA D;
889   const State *Initial = &D.newState();
890   Initial->isInitial = true;
891   Initial->stateInfo.insert(0x0);
892   SmallVector<const State*, 32> WorkList;
893 //  std::queue<State*> WorkList;
894   std::map<std::set<unsigned>, const State*> Visited;
895 
896   WorkList.push_back(Initial);
897 
898   //
899   // Worklist algorithm to create a DFA for processor resource tracking.
900   // C = {set of InsnClasses}
901   // Begin with initial node in worklist. Initial node does not have
902   // any consumed resources,
903   //     ResourceState = 0x0
904   // Visited = {}
905   // While worklist != empty
906   //    S = first element of worklist
907   //    For every instruction class C
908   //      if we can accommodate C in S:
909   //          S' = state with resource states = {S Union C}
910   //          Add a new transition: S x C -> S'
911   //          If S' is not in Visited:
912   //             Add S' to worklist
913   //             Add S' to Visited
914   //
915   while (!WorkList.empty()) {
916     const State *current = WorkList.pop_back_val();
917     DEBUG({
918       dbgs() << "---------------------\n";
919       dbgs() << "Processing state: " << current->stateNum << " - ";
920       dbgsStateInfo(current->stateInfo);
921       dbgs() << "\n";
922     });
923     for (unsigned i = 0; i < allInsnClasses.size(); i++) {
924       std::vector<unsigned> InsnClass = allInsnClasses[i];
925       DEBUG({
926         dbgs() << i << " ";
927         dbgsInsnClass(InsnClass);
928         dbgs() << "\n";
929       });
930 
931       std::set<unsigned> NewStateResources;
932       //
933       // If we haven't already created a transition for this input
934       // and the state can accommodate this InsnClass, create a transition.
935       //
936       if (!current->hasTransition(InsnClass) &&
937           current->canMaybeAddInsnClass(InsnClass, ComboBitToBitsMap)) {
938         const State *NewState = nullptr;
939         current->AddInsnClass(InsnClass, ComboBitToBitsMap, NewStateResources);
940         if (NewStateResources.size() == 0) {
941           DEBUG(dbgs() << "  Skipped - no new states generated\n");
942           continue;
943         }
944 
945         DEBUG({
946           dbgs() << "\t";
947           dbgsStateInfo(NewStateResources);
948           dbgs() << "\n";
949         });
950 
951         //
952         // If we have seen this state before, then do not create a new state.
953         //
954         auto VI = Visited.find(NewStateResources);
955         if (VI != Visited.end()) {
956           NewState = VI->second;
957           DEBUG({
958             dbgs() << "\tFound existing state: " << NewState->stateNum
959                    << " - ";
960             dbgsStateInfo(NewState->stateInfo);
961             dbgs() << "\n";
962           });
963         } else {
964           NewState = &D.newState();
965           NewState->stateInfo = NewStateResources;
966           Visited[NewStateResources] = NewState;
967           WorkList.push_back(NewState);
968           DEBUG({
969             dbgs() << "\tAccepted new state: " << NewState->stateNum << " - ";
970             dbgsStateInfo(NewState->stateInfo);
971             dbgs() << "\n";
972           });
973         }
974 
975         current->addTransition(InsnClass, NewState);
976       }
977     }
978   }
979 
980   // Print out the table.
981   D.writeTableAndAPI(OS, TargetName,
982                numInsnClasses, maxResources, numCombos, maxStages);
983 }
984 
985 namespace llvm {
986 
EmitDFAPacketizer(RecordKeeper & RK,raw_ostream & OS)987 void EmitDFAPacketizer(RecordKeeper &RK, raw_ostream &OS) {
988   emitSourceFileHeader("Target DFA Packetizer Tables", OS);
989   DFAPacketizerEmitter(RK).run(OS);
990 }
991 
992 } // end namespaec llvm
993