1 //===-- llvm/CodeGen/AsmPrinter.h - AsmPrinter Framework --------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file contains a class to be used as the base class for target specific
11 // asm writers.  This class primarily handles common functionality used by
12 // all asm writers.
13 //
14 //===----------------------------------------------------------------------===//
15 
16 #ifndef LLVM_CODEGEN_ASMPRINTER_H
17 #define LLVM_CODEGEN_ASMPRINTER_H
18 
19 #include "llvm/ADT/MapVector.h"
20 #include "llvm/ADT/Twine.h"
21 #include "llvm/CodeGen/MachineFunctionPass.h"
22 #include "llvm/CodeGen/DwarfStringPoolEntry.h"
23 #include "llvm/IR/InlineAsm.h"
24 #include "llvm/Support/DataTypes.h"
25 #include "llvm/Support/ErrorHandling.h"
26 
27 namespace llvm {
28 class AsmPrinterHandler;
29 class BlockAddress;
30 class ByteStreamer;
31 class GCStrategy;
32 class Constant;
33 class ConstantArray;
34 class DIE;
35 class DIEAbbrev;
36 class GCMetadataPrinter;
37 class GlobalValue;
38 class GlobalVariable;
39 class MachineBasicBlock;
40 class MachineFunction;
41 class MachineInstr;
42 class MachineLocation;
43 class MachineLoopInfo;
44 class MachineLoop;
45 class MachineConstantPoolValue;
46 class MachineJumpTableInfo;
47 class MachineModuleInfo;
48 class MCAsmInfo;
49 class MCCFIInstruction;
50 class MCContext;
51 class MCExpr;
52 class MCInst;
53 class MCSection;
54 class MCStreamer;
55 class MCSubtargetInfo;
56 class MCSymbol;
57 class MCTargetOptions;
58 class MDNode;
59 class DwarfDebug;
60 class Mangler;
61 class TargetLoweringObjectFile;
62 class DataLayout;
63 class TargetMachine;
64 
65 /// This class is intended to be used as a driving class for all asm writers.
66 class AsmPrinter : public MachineFunctionPass {
67 public:
68   /// Target machine description.
69   ///
70   TargetMachine &TM;
71 
72   /// Target Asm Printer information.
73   ///
74   const MCAsmInfo *MAI;
75 
76   /// This is the context for the output file that we are streaming. This owns
77   /// all of the global MC-related objects for the generated translation unit.
78   MCContext &OutContext;
79 
80   /// This is the MCStreamer object for the file we are generating. This
81   /// contains the transient state for the current translation unit that we are
82   /// generating (such as the current section etc).
83   std::unique_ptr<MCStreamer> OutStreamer;
84 
85   /// The current machine function.
86   const MachineFunction *MF;
87 
88   /// This is a pointer to the current MachineModuleInfo.
89   MachineModuleInfo *MMI;
90 
91   /// Name-mangler for global names.
92   ///
93   Mangler *Mang;
94 
95   /// The symbol for the current function. This is recalculated at the beginning
96   /// of each call to runOnMachineFunction().
97   ///
98   MCSymbol *CurrentFnSym;
99 
100   /// The symbol used to represent the start of the current function for the
101   /// purpose of calculating its size (e.g. using the .size directive). By
102   /// default, this is equal to CurrentFnSym.
103   MCSymbol *CurrentFnSymForSize;
104 
105   /// Map global GOT equivalent MCSymbols to GlobalVariables and keep track of
106   /// its number of uses by other globals.
107   typedef std::pair<const GlobalVariable *, unsigned> GOTEquivUsePair;
108   MapVector<const MCSymbol *, GOTEquivUsePair> GlobalGOTEquivs;
109 
110 private:
111   MCSymbol *CurrentFnBegin;
112   MCSymbol *CurrentFnEnd;
113   MCSymbol *CurExceptionSym;
114 
115   // The garbage collection metadata printer table.
116   void *GCMetadataPrinters; // Really a DenseMap.
117 
118   /// Emit comments in assembly output if this is true.
119   ///
120   bool VerboseAsm;
121   static char ID;
122 
123   /// If VerboseAsm is set, a pointer to the loop info for this function.
124   MachineLoopInfo *LI;
125 
126   struct HandlerInfo {
127     AsmPrinterHandler *Handler;
128     const char *TimerName, *TimerGroupName;
HandlerInfoHandlerInfo129     HandlerInfo(AsmPrinterHandler *Handler, const char *TimerName,
130                 const char *TimerGroupName)
131         : Handler(Handler), TimerName(TimerName),
132           TimerGroupName(TimerGroupName) {}
133   };
134   /// A vector of all debug/EH info emitters we should use. This vector
135   /// maintains ownership of the emitters.
136   SmallVector<HandlerInfo, 1> Handlers;
137 
138   /// If the target supports dwarf debug info, this pointer is non-null.
139   DwarfDebug *DD;
140 
141 protected:
142   explicit AsmPrinter(TargetMachine &TM, std::unique_ptr<MCStreamer> Streamer);
143 
144 public:
145   ~AsmPrinter() override;
146 
getDwarfDebug()147   DwarfDebug *getDwarfDebug() { return DD; }
getDwarfDebug()148   DwarfDebug *getDwarfDebug() const { return DD; }
149 
150   /// Return true if assembly output should contain comments.
151   ///
isVerbose()152   bool isVerbose() const { return VerboseAsm; }
153 
154   /// Return a unique ID for the current function.
155   ///
156   unsigned getFunctionNumber() const;
157 
getFunctionBegin()158   MCSymbol *getFunctionBegin() const { return CurrentFnBegin; }
getFunctionEnd()159   MCSymbol *getFunctionEnd() const { return CurrentFnEnd; }
160   MCSymbol *getCurExceptionSym();
161 
162   /// Return information about object file lowering.
163   const TargetLoweringObjectFile &getObjFileLowering() const;
164 
165   /// Return information about data layout.
166   const DataLayout &getDataLayout() const;
167 
168   /// Return the pointer size from the TargetMachine
169   unsigned getPointerSize() const;
170 
171   /// Return information about subtarget.
172   const MCSubtargetInfo &getSubtargetInfo() const;
173 
174   void EmitToStreamer(MCStreamer &S, const MCInst &Inst);
175 
176   /// Return the target triple string.
177   StringRef getTargetTriple() const;
178 
179   /// Return the current section we are emitting to.
180   const MCSection *getCurrentSection() const;
181 
182   void getNameWithPrefix(SmallVectorImpl<char> &Name,
183                          const GlobalValue *GV) const;
184 
185   MCSymbol *getSymbol(const GlobalValue *GV) const;
186 
187   //===------------------------------------------------------------------===//
188   // MachineFunctionPass Implementation.
189   //===------------------------------------------------------------------===//
190 
191   /// Record analysis usage.
192   ///
193   void getAnalysisUsage(AnalysisUsage &AU) const override;
194 
195   /// Set up the AsmPrinter when we are working on a new module. If your pass
196   /// overrides this, it must make sure to explicitly call this implementation.
197   bool doInitialization(Module &M) override;
198 
199   /// Shut down the asmprinter. If you override this in your pass, you must make
200   /// sure to call it explicitly.
201   bool doFinalization(Module &M) override;
202 
203   /// Emit the specified function out to the OutStreamer.
runOnMachineFunction(MachineFunction & MF)204   bool runOnMachineFunction(MachineFunction &MF) override {
205     SetupMachineFunction(MF);
206     EmitFunctionBody();
207     return false;
208   }
209 
210   //===------------------------------------------------------------------===//
211   // Coarse grained IR lowering routines.
212   //===------------------------------------------------------------------===//
213 
214   /// This should be called when a new MachineFunction is being processed from
215   /// runOnMachineFunction.
216   void SetupMachineFunction(MachineFunction &MF);
217 
218   /// This method emits the body and trailer for a function.
219   void EmitFunctionBody();
220 
221   void emitCFIInstruction(const MachineInstr &MI);
222 
223   void emitFrameAlloc(const MachineInstr &MI);
224 
225   enum CFIMoveType { CFI_M_None, CFI_M_EH, CFI_M_Debug };
226   CFIMoveType needsCFIMoves();
227 
228   bool needsSEHMoves();
229 
230   /// Print to the current output stream assembly representations of the
231   /// constants in the constant pool MCP. This is used to print out constants
232   /// which have been "spilled to memory" by the code generator.
233   ///
234   virtual void EmitConstantPool();
235 
236   /// Print assembly representations of the jump tables used by the current
237   /// function to the current output stream.
238   ///
239   virtual void EmitJumpTableInfo();
240 
241   /// Emit the specified global variable to the .s file.
242   virtual void EmitGlobalVariable(const GlobalVariable *GV);
243 
244   /// Check to see if the specified global is a special global used by LLVM. If
245   /// so, emit it and return true, otherwise do nothing and return false.
246   bool EmitSpecialLLVMGlobal(const GlobalVariable *GV);
247 
248   /// Emit an alignment directive to the specified power of two boundary. For
249   /// example, if you pass in 3 here, you will get an 8 byte alignment. If a
250   /// global value is specified, and if that global has an explicit alignment
251   /// requested, it will override the alignment request if required for
252   /// correctness.
253   ///
254   void EmitAlignment(unsigned NumBits, const GlobalObject *GO = nullptr) const;
255 
256   /// Lower the specified LLVM Constant to an MCExpr.
257   const MCExpr *lowerConstant(const Constant *CV);
258 
259   /// \brief Print a general LLVM constant to the .s file.
260   void EmitGlobalConstant(const DataLayout &DL, const Constant *CV);
261 
262   /// \brief Unnamed constant global variables solely contaning a pointer to
263   /// another globals variable act like a global variable "proxy", or GOT
264   /// equivalents, i.e., it's only used to hold the address of the latter. One
265   /// optimization is to replace accesses to these proxies by using the GOT
266   /// entry for the final global instead. Hence, we select GOT equivalent
267   /// candidates among all the module global variables, avoid emitting them
268   /// unnecessarily and finally replace references to them by pc relative
269   /// accesses to GOT entries.
270   void computeGlobalGOTEquivs(Module &M);
271 
272   /// \brief Constant expressions using GOT equivalent globals may not be
273   /// eligible for PC relative GOT entry conversion, in such cases we need to
274   /// emit the proxies we previously omitted in EmitGlobalVariable.
275   void emitGlobalGOTEquivs();
276 
277   //===------------------------------------------------------------------===//
278   // Overridable Hooks
279   //===------------------------------------------------------------------===//
280 
281   // Targets can, or in the case of EmitInstruction, must implement these to
282   // customize output.
283 
284   /// This virtual method can be overridden by targets that want to emit
285   /// something at the start of their file.
EmitStartOfAsmFile(Module &)286   virtual void EmitStartOfAsmFile(Module &) {}
287 
288   /// This virtual method can be overridden by targets that want to emit
289   /// something at the end of their file.
EmitEndOfAsmFile(Module &)290   virtual void EmitEndOfAsmFile(Module &) {}
291 
292   /// Targets can override this to emit stuff before the first basic block in
293   /// the function.
EmitFunctionBodyStart()294   virtual void EmitFunctionBodyStart() {}
295 
296   /// Targets can override this to emit stuff after the last basic block in the
297   /// function.
EmitFunctionBodyEnd()298   virtual void EmitFunctionBodyEnd() {}
299 
300   /// Targets can override this to emit stuff at the start of a basic block.
301   /// By default, this method prints the label for the specified
302   /// MachineBasicBlock, an alignment (if present) and a comment describing it
303   /// if appropriate.
304   virtual void EmitBasicBlockStart(const MachineBasicBlock &MBB) const;
305 
306   /// Targets can override this to emit stuff at the end of a basic block.
EmitBasicBlockEnd(const MachineBasicBlock & MBB)307   virtual void EmitBasicBlockEnd(const MachineBasicBlock &MBB) {}
308 
309   /// Targets should implement this to emit instructions.
EmitInstruction(const MachineInstr *)310   virtual void EmitInstruction(const MachineInstr *) {
311     llvm_unreachable("EmitInstruction not implemented");
312   }
313 
314   /// Return the symbol for the specified constant pool entry.
315   virtual MCSymbol *GetCPISymbol(unsigned CPID) const;
316 
317   virtual void EmitFunctionEntryLabel();
318 
319   virtual void EmitMachineConstantPoolValue(MachineConstantPoolValue *MCPV);
320 
321   /// Targets can override this to change how global constants that are part of
322   /// a C++ static/global constructor list are emitted.
EmitXXStructor(const DataLayout & DL,const Constant * CV)323   virtual void EmitXXStructor(const DataLayout &DL, const Constant *CV) {
324     EmitGlobalConstant(DL, CV);
325   }
326 
327   /// Return true if the basic block has exactly one predecessor and the control
328   /// transfer mechanism between the predecessor and this block is a
329   /// fall-through.
330   virtual bool
331   isBlockOnlyReachableByFallthrough(const MachineBasicBlock *MBB) const;
332 
333   /// Targets can override this to customize the output of IMPLICIT_DEF
334   /// instructions in verbose mode.
335   virtual void emitImplicitDef(const MachineInstr *MI) const;
336 
337   //===------------------------------------------------------------------===//
338   // Symbol Lowering Routines.
339   //===------------------------------------------------------------------===//
340 public:
341   MCSymbol *createTempSymbol(const Twine &Name) const;
342 
343   /// Return the MCSymbol for a private symbol with global value name as its
344   /// base, with the specified suffix.
345   MCSymbol *getSymbolWithGlobalValueBase(const GlobalValue *GV,
346                                          StringRef Suffix) const;
347 
348   /// Return the MCSymbol for the specified ExternalSymbol.
349   MCSymbol *GetExternalSymbolSymbol(StringRef Sym) const;
350 
351   /// Return the symbol for the specified jump table entry.
352   MCSymbol *GetJTISymbol(unsigned JTID, bool isLinkerPrivate = false) const;
353 
354   /// Return the symbol for the specified jump table .set
355   /// FIXME: privatize to AsmPrinter.
356   MCSymbol *GetJTSetSymbol(unsigned UID, unsigned MBBID) const;
357 
358   /// Return the MCSymbol used to satisfy BlockAddress uses of the specified
359   /// basic block.
360   MCSymbol *GetBlockAddressSymbol(const BlockAddress *BA) const;
361   MCSymbol *GetBlockAddressSymbol(const BasicBlock *BB) const;
362 
363   //===------------------------------------------------------------------===//
364   // Emission Helper Routines.
365   //===------------------------------------------------------------------===//
366 public:
367   /// This is just convenient handler for printing offsets.
368   void printOffset(int64_t Offset, raw_ostream &OS) const;
369 
370   /// Emit a byte directive and value.
371   ///
372   void EmitInt8(int Value) const;
373 
374   /// Emit a short directive and value.
375   ///
376   void EmitInt16(int Value) const;
377 
378   /// Emit a long directive and value.
379   ///
380   void EmitInt32(int Value) const;
381 
382   /// Emit something like ".long Hi-Lo" where the size in bytes of the directive
383   /// is specified by Size and Hi/Lo specify the labels.  This implicitly uses
384   /// .set if it is available.
385   void EmitLabelDifference(const MCSymbol *Hi, const MCSymbol *Lo,
386                            unsigned Size) const;
387 
388   /// Emit something like ".long Label+Offset" where the size in bytes of the
389   /// directive is specified by Size and Label specifies the label.  This
390   /// implicitly uses .set if it is available.
391   void EmitLabelPlusOffset(const MCSymbol *Label, uint64_t Offset,
392                            unsigned Size, bool IsSectionRelative = false) const;
393 
394   /// Emit something like ".long Label" where the size in bytes of the directive
395   /// is specified by Size and Label specifies the label.
396   void EmitLabelReference(const MCSymbol *Label, unsigned Size,
397                           bool IsSectionRelative = false) const {
398     EmitLabelPlusOffset(Label, 0, Size, IsSectionRelative);
399   }
400 
401   //===------------------------------------------------------------------===//
402   // Dwarf Emission Helper Routines
403   //===------------------------------------------------------------------===//
404 
405   /// Emit the specified signed leb128 value.
406   void EmitSLEB128(int64_t Value, const char *Desc = nullptr) const;
407 
408   /// Emit the specified unsigned leb128 value.
409   void EmitULEB128(uint64_t Value, const char *Desc = nullptr,
410                    unsigned PadTo = 0) const;
411 
412   /// Emit a .byte 42 directive that corresponds to an encoding.  If verbose
413   /// assembly output is enabled, we output comments describing the encoding.
414   /// Desc is a string saying what the encoding is specifying (e.g. "LSDA").
415   void EmitEncodingByte(unsigned Val, const char *Desc = nullptr) const;
416 
417   /// Return the size of the encoding in bytes.
418   unsigned GetSizeOfEncodedValue(unsigned Encoding) const;
419 
420   /// Emit reference to a ttype global with a specified encoding.
421   void EmitTTypeReference(const GlobalValue *GV, unsigned Encoding) const;
422 
423   /// Emit a reference to a symbol for use in dwarf. Different object formats
424   /// represent this in different ways. Some use a relocation others encode
425   /// the label offset in its section.
426   void emitDwarfSymbolReference(const MCSymbol *Label,
427                                 bool ForceOffset = false) const;
428 
429   /// Emit the 4-byte offset of a string from the start of its section.
430   ///
431   /// When possible, emit a DwarfStringPool section offset without any
432   /// relocations, and without using the symbol.  Otherwise, defers to \a
433   /// emitDwarfSymbolReference().
434   void emitDwarfStringOffset(DwarfStringPoolEntryRef S) const;
435 
436   /// Get the value for DW_AT_APPLE_isa. Zero if no isa encoding specified.
getISAEncoding()437   virtual unsigned getISAEncoding() { return 0; }
438 
439   /// EmitDwarfRegOp - Emit a dwarf register operation.
440   virtual void EmitDwarfRegOp(ByteStreamer &BS,
441                               const MachineLocation &MLoc) const;
442 
443   //===------------------------------------------------------------------===//
444   // Dwarf Lowering Routines
445   //===------------------------------------------------------------------===//
446 
447   /// \brief Emit frame instruction to describe the layout of the frame.
448   void emitCFIInstruction(const MCCFIInstruction &Inst) const;
449 
450   /// \brief Emit Dwarf abbreviation table.
emitDwarfAbbrevs(const T & Abbrevs)451   template <typename T> void emitDwarfAbbrevs(const T &Abbrevs) const {
452     // For each abbreviation.
453     for (const auto &Abbrev : Abbrevs)
454       emitDwarfAbbrev(*Abbrev);
455 
456     // Mark end of abbreviations.
457     EmitULEB128(0, "EOM(3)");
458   }
459 
460   void emitDwarfAbbrev(const DIEAbbrev &Abbrev) const;
461 
462   /// \brief Recursively emit Dwarf DIE tree.
463   void emitDwarfDIE(const DIE &Die) const;
464 
465   //===------------------------------------------------------------------===//
466   // Inline Asm Support
467   //===------------------------------------------------------------------===//
468 public:
469   // These are hooks that targets can override to implement inline asm
470   // support.  These should probably be moved out of AsmPrinter someday.
471 
472   /// Print information related to the specified machine instr that is
473   /// independent of the operand, and may be independent of the instr itself.
474   /// This can be useful for portably encoding the comment character or other
475   /// bits of target-specific knowledge into the asmstrings.  The syntax used is
476   /// ${:comment}.  Targets can override this to add support for their own
477   /// strange codes.
478   virtual void PrintSpecial(const MachineInstr *MI, raw_ostream &OS,
479                             const char *Code) const;
480 
481   /// Print the specified operand of MI, an INLINEASM instruction, using the
482   /// specified assembler variant.  Targets should override this to format as
483   /// appropriate.  This method can return true if the operand is erroneous.
484   virtual bool PrintAsmOperand(const MachineInstr *MI, unsigned OpNo,
485                                unsigned AsmVariant, const char *ExtraCode,
486                                raw_ostream &OS);
487 
488   /// Print the specified operand of MI, an INLINEASM instruction, using the
489   /// specified assembler variant as an address. Targets should override this to
490   /// format as appropriate.  This method can return true if the operand is
491   /// erroneous.
492   virtual bool PrintAsmMemoryOperand(const MachineInstr *MI, unsigned OpNo,
493                                      unsigned AsmVariant, const char *ExtraCode,
494                                      raw_ostream &OS);
495 
496   /// Let the target do anything it needs to do before emitting inlineasm.
497   /// \p StartInfo - the subtarget info before parsing inline asm
498   virtual void emitInlineAsmStart() const;
499 
500   /// Let the target do anything it needs to do after emitting inlineasm.
501   /// This callback can be used restore the original mode in case the
502   /// inlineasm contains directives to switch modes.
503   /// \p StartInfo - the original subtarget info before inline asm
504   /// \p EndInfo   - the final subtarget info after parsing the inline asm,
505   ///                or NULL if the value is unknown.
506   virtual void emitInlineAsmEnd(const MCSubtargetInfo &StartInfo,
507                                 const MCSubtargetInfo *EndInfo) const;
508 
509 private:
510   /// Private state for PrintSpecial()
511   // Assign a unique ID to this machine instruction.
512   mutable const MachineInstr *LastMI;
513   mutable unsigned LastFn;
514   mutable unsigned Counter;
515 
516   /// This method emits the header for the current function.
517   virtual void EmitFunctionHeader();
518 
519   /// Emit a blob of inline asm to the output streamer.
520   void
521   EmitInlineAsm(StringRef Str, const MCSubtargetInfo &STI,
522                 const MCTargetOptions &MCOptions,
523                 const MDNode *LocMDNode = nullptr,
524                 InlineAsm::AsmDialect AsmDialect = InlineAsm::AD_ATT) const;
525 
526   /// This method formats and emits the specified machine instruction that is an
527   /// inline asm.
528   void EmitInlineAsm(const MachineInstr *MI) const;
529 
530   //===------------------------------------------------------------------===//
531   // Internal Implementation Details
532   //===------------------------------------------------------------------===//
533 
534   /// This emits visibility information about symbol, if this is suported by the
535   /// target.
536   void EmitVisibility(MCSymbol *Sym, unsigned Visibility,
537                       bool IsDefinition = true) const;
538 
539   void EmitLinkage(const GlobalValue *GV, MCSymbol *GVSym) const;
540 
541   void EmitJumpTableEntry(const MachineJumpTableInfo *MJTI,
542                           const MachineBasicBlock *MBB, unsigned uid) const;
543   void EmitLLVMUsedList(const ConstantArray *InitList);
544   /// Emit llvm.ident metadata in an '.ident' directive.
545   void EmitModuleIdents(Module &M);
546   void EmitXXStructorList(const DataLayout &DL, const Constant *List,
547                           bool isCtor);
548   GCMetadataPrinter *GetOrCreateGCPrinter(GCStrategy &C);
549 };
550 }
551 
552 #endif
553