1 //===- ObjectFile.h - File format independent object file -------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file declares a file format independent ObjectFile class.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #ifndef LLVM_OBJECT_OBJECT_FILE_H
15 #define LLVM_OBJECT_OBJECT_FILE_H
16 
17 #include "llvm/Object/Binary.h"
18 #include "llvm/ADT/StringRef.h"
19 #include "llvm/Support/DataTypes.h"
20 #include "llvm/Support/ErrorHandling.h"
21 #include "llvm/Support/MemoryBuffer.h"
22 #include <cstring>
23 
24 namespace llvm {
25 namespace object {
26 
27 class ObjectFile;
28 
/// DataRefImpl - Opaque handle stored inside SymbolRef, SectionRef and
/// RelocationRef. The same storage can be viewed as two 16-bit fields plus a
/// 32-bit field (w), as two 32-bit fields (d), or as a pointer-sized integer
/// (p). Which view is meaningful is decided by the code that fills it in.
///
/// Handles are compared bytewise elsewhere in this file, so code that creates
/// one should zero the whole union before setting a member.
union DataRefImpl {
  struct {
    // ELF needs this for relocations. This entire union should probably be a
    // char[max(8, sizeof(uintptr_t))] and require the impl to cast.
    uint16_t a, b;
    uint32_t c;
  } w;
  struct {
    uint32_t a, b;
  } d;
  uintptr_t p;
};
41 
42 template<class content_type>
43 class content_iterator {
44   content_type Current;
45 public:
content_iterator(content_type symb)46   content_iterator(content_type symb)
47     : Current(symb) {}
48 
49   const content_type* operator->() const {
50     return &Current;
51   }
52 
53   const content_type &operator*() const {
54     return Current;
55   }
56 
57   bool operator==(const content_iterator &other) const {
58     return Current == other.Current;
59   }
60 
61   bool operator!=(const content_iterator &other) const {
62     return !(*this == other);
63   }
64 
increment(error_code & err)65   content_iterator& increment(error_code &err) {
66     content_type next;
67     if (error_code ec = Current.getNext(next))
68       err = ec;
69     else
70       Current = next;
71     return *this;
72   }
73 };
74 
75 static bool operator ==(const DataRefImpl &a, const DataRefImpl &b) {
76   // Check bitwise identical. This is the only legal way to compare a union w/o
77   // knowing which member is in use.
78   return std::memcmp(&a, &b, sizeof(DataRefImpl)) == 0;
79 }
80 
81 /// SymbolRef - This is a value type class that represents a single symbol in
82 /// the list of symbols in the object file.
83 class SymbolRef {
84   friend class SectionRef;
85   DataRefImpl SymbolPimpl;
86   const ObjectFile *OwningObject;
87 
88 public:
SymbolRef()89   SymbolRef() : OwningObject(NULL) {
90     std::memset(&SymbolPimpl, 0, sizeof(SymbolPimpl));
91   }
92 
93   enum SymbolType {
94     ST_Function,
95     ST_Data,
96     ST_External,    // Defined in another object file
97     ST_Other
98   };
99 
100   SymbolRef(DataRefImpl SymbolP, const ObjectFile *Owner);
101 
102   bool operator==(const SymbolRef &Other) const;
103 
104   error_code getNext(SymbolRef &Result) const;
105 
106   error_code getName(StringRef &Result) const;
107   error_code getAddress(uint64_t &Result) const;
108   error_code getOffset(uint64_t &Result) const;
109   error_code getSize(uint64_t &Result) const;
110   error_code getSymbolType(SymbolRef::SymbolType &Result) const;
111 
112   /// Returns the ascii char that should be displayed in a symbol table dump via
113   /// nm for this symbol.
114   error_code getNMTypeChar(char &Result) const;
115 
116   /// Returns true for symbols that are internal to the object file format such
117   /// as section symbols.
118   error_code isInternal(bool &Result) const;
119 
120   /// Returns true for symbols that can be used in another objects,
121   /// such as library functions
122   error_code isGlobal(bool &Result) const;
123 
124   DataRefImpl getRawDataRefImpl() const;
125 };
126 typedef content_iterator<SymbolRef> symbol_iterator;
127 
128 /// RelocationRef - This is a value type class that represents a single
129 /// relocation in the list of relocations in the object file.
130 class RelocationRef {
131   DataRefImpl RelocationPimpl;
132   const ObjectFile *OwningObject;
133 
134 public:
RelocationRef()135   RelocationRef() : OwningObject(NULL) {
136     std::memset(&RelocationPimpl, 0, sizeof(RelocationPimpl));
137   }
138 
139   RelocationRef(DataRefImpl RelocationP, const ObjectFile *Owner);
140 
141   bool operator==(const RelocationRef &Other) const;
142 
143   error_code getNext(RelocationRef &Result) const;
144 
145   error_code getAddress(uint64_t &Result) const;
146   error_code getSymbol(SymbolRef &Result) const;
147   error_code getType(uint32_t &Result) const;
148 
149   /// @brief Get a string that represents the type of this relocation.
150   ///
151   /// This is for display purposes only.
152   error_code getTypeName(SmallVectorImpl<char> &Result) const;
153   error_code getAdditionalInfo(int64_t &Result) const;
154 
155   /// @brief Get a string that represents the calculation of the value of this
156   ///        relocation.
157   ///
158   /// This is for display purposes only.
159   error_code getValueString(SmallVectorImpl<char> &Result) const;
160 };
161 typedef content_iterator<RelocationRef> relocation_iterator;
162 
163 /// SectionRef - This is a value type class that represents a single section in
164 /// the list of sections in the object file.
165 class SectionRef {
166   friend class SymbolRef;
167   DataRefImpl SectionPimpl;
168   const ObjectFile *OwningObject;
169 
170 public:
SectionRef()171   SectionRef() : OwningObject(NULL) {
172     std::memset(&SectionPimpl, 0, sizeof(SectionPimpl));
173   }
174 
175   SectionRef(DataRefImpl SectionP, const ObjectFile *Owner);
176 
177   bool operator==(const SectionRef &Other) const;
178 
179   error_code getNext(SectionRef &Result) const;
180 
181   error_code getName(StringRef &Result) const;
182   error_code getAddress(uint64_t &Result) const;
183   error_code getSize(uint64_t &Result) const;
184   error_code getContents(StringRef &Result) const;
185 
186   /// @brief Get the alignment of this section as the actual value (not log 2).
187   error_code getAlignment(uint64_t &Result) const;
188 
189   // FIXME: Move to the normalization layer when it's created.
190   error_code isText(bool &Result) const;
191   error_code isData(bool &Result) const;
192   error_code isBSS(bool &Result) const;
193 
194   error_code containsSymbol(SymbolRef S, bool &Result) const;
195 
196   relocation_iterator begin_relocations() const;
197   relocation_iterator end_relocations() const;
198 };
199 typedef content_iterator<SectionRef> section_iterator;
200 
/// Sentinel with every bit set (the largest uint64_t value).
/// NOTE(review): by its name, presumably reported when an address or size
/// cannot be determined -- confirm against the format implementations.
const uint64_t UnknownAddressOrSize = ~0ULL;
202 
203 /// ObjectFile - This class is the base class for all object file types.
204 /// Concrete instances of this object are created by createObjectFile, which
205 /// figure out which type to create.
206 class ObjectFile : public Binary {
207 private:
208   ObjectFile(); // = delete
209   ObjectFile(const ObjectFile &other); // = delete
210 
211 protected:
212   ObjectFile(unsigned int Type, MemoryBuffer *source, error_code &ec);
213 
base()214   const uint8_t *base() const {
215     return reinterpret_cast<const uint8_t *>(Data->getBufferStart());
216   }
217 
218   // These functions are for SymbolRef to call internally. The main goal of
219   // this is to allow SymbolRef::SymbolPimpl to point directly to the symbol
220   // entry in the memory mapped object file. SymbolPimpl cannot contain any
221   // virtual functions because then it could not point into the memory mapped
222   // file.
223   //
224   // Implementations assume that the DataRefImpl is valid and has not been
225   // modified externally. It's UB otherwise.
226   friend class SymbolRef;
227   virtual error_code getSymbolNext(DataRefImpl Symb, SymbolRef &Res) const = 0;
228   virtual error_code getSymbolName(DataRefImpl Symb, StringRef &Res) const = 0;
229   virtual error_code getSymbolAddress(DataRefImpl Symb, uint64_t &Res) const =0;
230   virtual error_code getSymbolOffset(DataRefImpl Symb, uint64_t &Res) const =0;
231   virtual error_code getSymbolSize(DataRefImpl Symb, uint64_t &Res) const = 0;
232   virtual error_code getSymbolNMTypeChar(DataRefImpl Symb, char &Res) const = 0;
233   virtual error_code isSymbolInternal(DataRefImpl Symb, bool &Res) const = 0;
234   virtual error_code isSymbolGlobal(DataRefImpl Symb, bool &Res) const = 0;
235   virtual error_code getSymbolType(DataRefImpl Symb, SymbolRef::SymbolType &Res) const = 0;
236 
237   // Same as above for SectionRef.
238   friend class SectionRef;
239   virtual error_code getSectionNext(DataRefImpl Sec, SectionRef &Res) const = 0;
240   virtual error_code getSectionName(DataRefImpl Sec, StringRef &Res) const = 0;
241   virtual error_code getSectionAddress(DataRefImpl Sec, uint64_t &Res) const =0;
242   virtual error_code getSectionSize(DataRefImpl Sec, uint64_t &Res) const = 0;
243   virtual error_code getSectionContents(DataRefImpl Sec, StringRef &Res)const=0;
244   virtual error_code getSectionAlignment(DataRefImpl Sec, uint64_t &Res)const=0;
245   virtual error_code isSectionText(DataRefImpl Sec, bool &Res) const = 0;
246   virtual error_code isSectionData(DataRefImpl Sec, bool &Res) const = 0;
247   virtual error_code isSectionBSS(DataRefImpl Sec, bool &Res) const = 0;
248   virtual error_code sectionContainsSymbol(DataRefImpl Sec, DataRefImpl Symb,
249                                            bool &Result) const = 0;
250   virtual relocation_iterator getSectionRelBegin(DataRefImpl Sec) const = 0;
251   virtual relocation_iterator getSectionRelEnd(DataRefImpl Sec) const = 0;
252 
253 
254   // Same as above for RelocationRef.
255   friend class RelocationRef;
256   virtual error_code getRelocationNext(DataRefImpl Rel,
257                                        RelocationRef &Res) const = 0;
258   virtual error_code getRelocationAddress(DataRefImpl Rel,
259                                           uint64_t &Res) const =0;
260   virtual error_code getRelocationSymbol(DataRefImpl Rel,
261                                          SymbolRef &Res) const = 0;
262   virtual error_code getRelocationType(DataRefImpl Rel,
263                                        uint32_t &Res) const = 0;
264   virtual error_code getRelocationTypeName(DataRefImpl Rel,
265                                        SmallVectorImpl<char> &Result) const = 0;
266   virtual error_code getRelocationAdditionalInfo(DataRefImpl Rel,
267                                                  int64_t &Res) const = 0;
268   virtual error_code getRelocationValueString(DataRefImpl Rel,
269                                        SmallVectorImpl<char> &Result) const = 0;
270 
271 public:
272 
273   virtual symbol_iterator begin_symbols() const = 0;
274   virtual symbol_iterator end_symbols() const = 0;
275 
276   virtual section_iterator begin_sections() const = 0;
277   virtual section_iterator end_sections() const = 0;
278 
279   /// @brief The number of bytes used to represent an address in this object
280   ///        file format.
281   virtual uint8_t getBytesInAddress() const = 0;
282 
283   virtual StringRef getFileFormatName() const = 0;
284   virtual /* Triple::ArchType */ unsigned getArch() const = 0;
285 
286   /// @returns Pointer to ObjectFile subclass to handle this type of object.
287   /// @param ObjectPath The path to the object file. ObjectPath.isObject must
288   ///        return true.
289   /// @brief Create ObjectFile from path.
290   static ObjectFile *createObjectFile(StringRef ObjectPath);
291   static ObjectFile *createObjectFile(MemoryBuffer *Object);
292 
classof(const Binary * v)293   static inline bool classof(const Binary *v) {
294     return v->getType() >= isObject &&
295            v->getType() < lastObject;
296   }
classof(const ObjectFile * v)297   static inline bool classof(const ObjectFile *v) { return true; }
298 
299 public:
300   static ObjectFile *createCOFFObjectFile(MemoryBuffer *Object);
301   static ObjectFile *createELFObjectFile(MemoryBuffer *Object);
302   static ObjectFile *createMachOObjectFile(MemoryBuffer *Object);
303 };
304 
305 // Inline function definitions.
SymbolRef(DataRefImpl SymbolP,const ObjectFile * Owner)306 inline SymbolRef::SymbolRef(DataRefImpl SymbolP, const ObjectFile *Owner)
307   : SymbolPimpl(SymbolP)
308   , OwningObject(Owner) {}
309 
310 inline bool SymbolRef::operator==(const SymbolRef &Other) const {
311   return SymbolPimpl == Other.SymbolPimpl;
312 }
313 
getNext(SymbolRef & Result)314 inline error_code SymbolRef::getNext(SymbolRef &Result) const {
315   return OwningObject->getSymbolNext(SymbolPimpl, Result);
316 }
317 
getName(StringRef & Result)318 inline error_code SymbolRef::getName(StringRef &Result) const {
319   return OwningObject->getSymbolName(SymbolPimpl, Result);
320 }
321 
getAddress(uint64_t & Result)322 inline error_code SymbolRef::getAddress(uint64_t &Result) const {
323   return OwningObject->getSymbolAddress(SymbolPimpl, Result);
324 }
325 
getOffset(uint64_t & Result)326 inline error_code SymbolRef::getOffset(uint64_t &Result) const {
327   return OwningObject->getSymbolOffset(SymbolPimpl, Result);
328 }
329 
getSize(uint64_t & Result)330 inline error_code SymbolRef::getSize(uint64_t &Result) const {
331   return OwningObject->getSymbolSize(SymbolPimpl, Result);
332 }
333 
getNMTypeChar(char & Result)334 inline error_code SymbolRef::getNMTypeChar(char &Result) const {
335   return OwningObject->getSymbolNMTypeChar(SymbolPimpl, Result);
336 }
337 
isInternal(bool & Result)338 inline error_code SymbolRef::isInternal(bool &Result) const {
339   return OwningObject->isSymbolInternal(SymbolPimpl, Result);
340 }
341 
isGlobal(bool & Result)342 inline error_code SymbolRef::isGlobal(bool &Result) const {
343   return OwningObject->isSymbolGlobal(SymbolPimpl, Result);
344 }
345 
getSymbolType(SymbolRef::SymbolType & Result)346 inline error_code SymbolRef::getSymbolType(SymbolRef::SymbolType &Result) const {
347   return OwningObject->getSymbolType(SymbolPimpl, Result);
348 }
349 
getRawDataRefImpl()350 inline DataRefImpl SymbolRef::getRawDataRefImpl() const {
351   return SymbolPimpl;
352 }
353 
354 
355 /// SectionRef
SectionRef(DataRefImpl SectionP,const ObjectFile * Owner)356 inline SectionRef::SectionRef(DataRefImpl SectionP,
357                               const ObjectFile *Owner)
358   : SectionPimpl(SectionP)
359   , OwningObject(Owner) {}
360 
361 inline bool SectionRef::operator==(const SectionRef &Other) const {
362   return SectionPimpl == Other.SectionPimpl;
363 }
364 
getNext(SectionRef & Result)365 inline error_code SectionRef::getNext(SectionRef &Result) const {
366   return OwningObject->getSectionNext(SectionPimpl, Result);
367 }
368 
getName(StringRef & Result)369 inline error_code SectionRef::getName(StringRef &Result) const {
370   return OwningObject->getSectionName(SectionPimpl, Result);
371 }
372 
getAddress(uint64_t & Result)373 inline error_code SectionRef::getAddress(uint64_t &Result) const {
374   return OwningObject->getSectionAddress(SectionPimpl, Result);
375 }
376 
getSize(uint64_t & Result)377 inline error_code SectionRef::getSize(uint64_t &Result) const {
378   return OwningObject->getSectionSize(SectionPimpl, Result);
379 }
380 
getContents(StringRef & Result)381 inline error_code SectionRef::getContents(StringRef &Result) const {
382   return OwningObject->getSectionContents(SectionPimpl, Result);
383 }
384 
getAlignment(uint64_t & Result)385 inline error_code SectionRef::getAlignment(uint64_t &Result) const {
386   return OwningObject->getSectionAlignment(SectionPimpl, Result);
387 }
388 
isText(bool & Result)389 inline error_code SectionRef::isText(bool &Result) const {
390   return OwningObject->isSectionText(SectionPimpl, Result);
391 }
392 
isData(bool & Result)393 inline error_code SectionRef::isData(bool &Result) const {
394   return OwningObject->isSectionData(SectionPimpl, Result);
395 }
396 
isBSS(bool & Result)397 inline error_code SectionRef::isBSS(bool &Result) const {
398   return OwningObject->isSectionBSS(SectionPimpl, Result);
399 }
400 
containsSymbol(SymbolRef S,bool & Result)401 inline error_code SectionRef::containsSymbol(SymbolRef S, bool &Result) const {
402   return OwningObject->sectionContainsSymbol(SectionPimpl, S.SymbolPimpl,
403                                              Result);
404 }
405 
begin_relocations()406 inline relocation_iterator SectionRef::begin_relocations() const {
407   return OwningObject->getSectionRelBegin(SectionPimpl);
408 }
409 
end_relocations()410 inline relocation_iterator SectionRef::end_relocations() const {
411   return OwningObject->getSectionRelEnd(SectionPimpl);
412 }
413 
414 
415 /// RelocationRef
RelocationRef(DataRefImpl RelocationP,const ObjectFile * Owner)416 inline RelocationRef::RelocationRef(DataRefImpl RelocationP,
417                               const ObjectFile *Owner)
418   : RelocationPimpl(RelocationP)
419   , OwningObject(Owner) {}
420 
421 inline bool RelocationRef::operator==(const RelocationRef &Other) const {
422   return RelocationPimpl == Other.RelocationPimpl;
423 }
424 
getNext(RelocationRef & Result)425 inline error_code RelocationRef::getNext(RelocationRef &Result) const {
426   return OwningObject->getRelocationNext(RelocationPimpl, Result);
427 }
428 
getAddress(uint64_t & Result)429 inline error_code RelocationRef::getAddress(uint64_t &Result) const {
430   return OwningObject->getRelocationAddress(RelocationPimpl, Result);
431 }
432 
getSymbol(SymbolRef & Result)433 inline error_code RelocationRef::getSymbol(SymbolRef &Result) const {
434   return OwningObject->getRelocationSymbol(RelocationPimpl, Result);
435 }
436 
getType(uint32_t & Result)437 inline error_code RelocationRef::getType(uint32_t &Result) const {
438   return OwningObject->getRelocationType(RelocationPimpl, Result);
439 }
440 
getTypeName(SmallVectorImpl<char> & Result)441 inline error_code RelocationRef::getTypeName(SmallVectorImpl<char> &Result)
442   const {
443   return OwningObject->getRelocationTypeName(RelocationPimpl, Result);
444 }
445 
getAdditionalInfo(int64_t & Result)446 inline error_code RelocationRef::getAdditionalInfo(int64_t &Result) const {
447   return OwningObject->getRelocationAdditionalInfo(RelocationPimpl, Result);
448 }
449 
getValueString(SmallVectorImpl<char> & Result)450 inline error_code RelocationRef::getValueString(SmallVectorImpl<char> &Result)
451   const {
452   return OwningObject->getRelocationValueString(RelocationPimpl, Result);
453 }
454 
455 } // end namespace object
456 } // end namespace llvm
457 
458 #endif
459