1 /*
2  * Copyright (C) 2012 The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *      http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 #include "elf_file.h"
18 
19 #include <inttypes.h>
20 #include <sys/mman.h>  // For the PROT_* and MAP_* constants.
21 #include <sys/types.h>
22 #include <unistd.h>
23 
24 #include "android-base/stringprintf.h"
25 #include "android-base/strings.h"
26 
27 #include "arch/instruction_set.h"
28 #include "base/leb128.h"
29 #include "base/stl_util.h"
30 #include "base/unix_file/fd_file.h"
31 #include "base/utils.h"
32 #include "elf/elf_utils.h"
33 #include "elf_file_impl.h"
34 
35 namespace art {
36 
37 using android::base::StringPrintf;
38 
39 template <typename ElfTypes>
ElfFileImpl(File * file,bool writable,bool program_header_only)40 ElfFileImpl<ElfTypes>::ElfFileImpl(File* file, bool writable, bool program_header_only)
41   : writable_(writable),
42     program_header_only_(program_header_only),
43     header_(nullptr),
44     base_address_(nullptr),
45     program_headers_start_(nullptr),
46     section_headers_start_(nullptr),
47     dynamic_program_header_(nullptr),
48     dynamic_section_start_(nullptr),
49     symtab_section_start_(nullptr),
50     dynsym_section_start_(nullptr),
51     strtab_section_start_(nullptr),
52     dynstr_section_start_(nullptr),
53     hash_section_start_(nullptr),
54     symtab_symbol_table_(nullptr),
55     dynsym_symbol_table_(nullptr) {
56   CHECK(file != nullptr);
57 }
58 
59 template <typename ElfTypes>
Open(File * file,bool writable,bool program_header_only,bool low_4gb,std::string * error_msg)60 ElfFileImpl<ElfTypes>* ElfFileImpl<ElfTypes>::Open(File* file,
61                                                    bool writable,
62                                                    bool program_header_only,
63                                                    bool low_4gb,
64                                                    std::string* error_msg) {
65   std::unique_ptr<ElfFileImpl<ElfTypes>> elf_file(
66       new ElfFileImpl<ElfTypes>(file, writable, program_header_only));
67   int prot;
68   int flags;
69   if (writable) {
70     prot = PROT_READ | PROT_WRITE;
71     flags = MAP_SHARED;
72   } else {
73     prot = PROT_READ;
74     flags = MAP_PRIVATE;
75   }
76   if (!elf_file->Setup(file, prot, flags, low_4gb, error_msg)) {
77     return nullptr;
78   }
79   return elf_file.release();
80 }
81 
82 template <typename ElfTypes>
Open(File * file,int prot,int flags,bool low_4gb,std::string * error_msg)83 ElfFileImpl<ElfTypes>* ElfFileImpl<ElfTypes>::Open(File* file,
84                                                    int prot,
85                                                    int flags,
86                                                    bool low_4gb,
87                                                    std::string* error_msg) {
88   std::unique_ptr<ElfFileImpl<ElfTypes>> elf_file(
89       new ElfFileImpl<ElfTypes>(file, (prot & PROT_WRITE) != 0, /* program_header_only= */ false));
90   if (!elf_file->Setup(file, prot, flags, low_4gb, error_msg)) {
91     return nullptr;
92   }
93   return elf_file.release();
94 }
95 
96 template <typename ElfTypes>
Setup(File * file,int prot,int flags,bool low_4gb,std::string * error_msg)97 bool ElfFileImpl<ElfTypes>::Setup(File* file,
98                                   int prot,
99                                   int flags,
100                                   bool low_4gb,
101                                   std::string* error_msg) {
102   int64_t temp_file_length = file->GetLength();
103   if (temp_file_length < 0) {
104     errno = -temp_file_length;
105     *error_msg = StringPrintf("Failed to get length of file: '%s' fd=%d: %s",
106                               file->GetPath().c_str(), file->Fd(), strerror(errno));
107     return false;
108   }
109   size_t file_length = static_cast<size_t>(temp_file_length);
110   if (file_length < sizeof(Elf_Ehdr)) {
111     *error_msg = StringPrintf("File size of %zd bytes not large enough to contain ELF header of "
112                               "%zd bytes: '%s'", file_length, sizeof(Elf_Ehdr),
113                               file->GetPath().c_str());
114     return false;
115   }
116 
117   if (program_header_only_) {
118     // first just map ELF header to get program header size information
119     size_t elf_header_size = sizeof(Elf_Ehdr);
120     if (!SetMap(file,
121                 MemMap::MapFile(elf_header_size,
122                                 prot,
123                                 flags,
124                                 file->Fd(),
125                                 0,
126                                 low_4gb,
127                                 file->GetPath().c_str(),
128                                 error_msg),
129                 error_msg)) {
130       return false;
131     }
132     // then remap to cover program header
133     size_t program_header_size = header_->e_phoff + (header_->e_phentsize * header_->e_phnum);
134     if (file_length < program_header_size) {
135       *error_msg = StringPrintf("File size of %zd bytes not large enough to contain ELF program "
136                                 "header of %zd bytes: '%s'", file_length,
137                                 sizeof(Elf_Ehdr), file->GetPath().c_str());
138       return false;
139     }
140     if (!SetMap(file,
141                 MemMap::MapFile(program_header_size,
142                                 prot,
143                                 flags,
144                                 file->Fd(),
145                                 0,
146                                 low_4gb,
147                                 file->GetPath().c_str(),
148                                 error_msg),
149                 error_msg)) {
150       *error_msg = StringPrintf("Failed to map ELF program headers: %s", error_msg->c_str());
151       return false;
152     }
153   } else {
154     // otherwise map entire file
155     if (!SetMap(file,
156                 MemMap::MapFile(file->GetLength(),
157                                 prot,
158                                 flags,
159                                 file->Fd(),
160                                 0,
161                                 low_4gb,
162                                 file->GetPath().c_str(),
163                                 error_msg),
164                 error_msg)) {
165       *error_msg = StringPrintf("Failed to map ELF file: %s", error_msg->c_str());
166       return false;
167     }
168   }
169 
170   if (program_header_only_) {
171     program_headers_start_ = Begin() + GetHeader().e_phoff;
172   } else {
173     if (!CheckAndSet(GetHeader().e_phoff, "program headers", &program_headers_start_, error_msg)) {
174       return false;
175     }
176 
177     // Setup section headers.
178     if (!CheckAndSet(GetHeader().e_shoff, "section headers", &section_headers_start_, error_msg)) {
179       return false;
180     }
181 
182     // Find shstrtab.
183     Elf_Shdr* shstrtab_section_header = GetSectionNameStringSection();
184     if (shstrtab_section_header == nullptr) {
185       *error_msg = StringPrintf("Failed to find shstrtab section header in ELF file: '%s'",
186                                 file->GetPath().c_str());
187       return false;
188     }
189 
190     // Find .dynamic section info from program header
191     dynamic_program_header_ = FindProgamHeaderByType(PT_DYNAMIC);
192     if (dynamic_program_header_ == nullptr) {
193       *error_msg = StringPrintf("Failed to find PT_DYNAMIC program header in ELF file: '%s'",
194                                 file->GetPath().c_str());
195       return false;
196     }
197 
198     if (!CheckAndSet(GetDynamicProgramHeader().p_offset, "dynamic section",
199                      reinterpret_cast<uint8_t**>(&dynamic_section_start_), error_msg)) {
200       return false;
201     }
202 
203     // Find other sections from section headers
204     for (Elf_Word i = 0; i < GetSectionHeaderNum(); i++) {
205       Elf_Shdr* section_header = GetSectionHeader(i);
206       if (section_header == nullptr) {
207         *error_msg = StringPrintf("Failed to find section header for section %d in ELF file: '%s'",
208                                   i, file->GetPath().c_str());
209         return false;
210       }
211       switch (section_header->sh_type) {
212         case SHT_SYMTAB: {
213           if (!CheckAndSet(section_header->sh_offset, "symtab",
214                            reinterpret_cast<uint8_t**>(&symtab_section_start_), error_msg)) {
215             return false;
216           }
217           break;
218         }
219         case SHT_DYNSYM: {
220           if (!CheckAndSet(section_header->sh_offset, "dynsym",
221                            reinterpret_cast<uint8_t**>(&dynsym_section_start_), error_msg)) {
222             return false;
223           }
224           break;
225         }
226         case SHT_STRTAB: {
227           // TODO: base these off of sh_link from .symtab and .dynsym above
228           if ((section_header->sh_flags & SHF_ALLOC) != 0) {
229             // Check that this is named ".dynstr" and ignore otherwise.
230             const char* header_name = GetString(*shstrtab_section_header, section_header->sh_name);
231             if (strncmp(".dynstr", header_name, 8) == 0) {
232               if (!CheckAndSet(section_header->sh_offset, "dynstr",
233                                reinterpret_cast<uint8_t**>(&dynstr_section_start_), error_msg)) {
234                 return false;
235               }
236             }
237           } else {
238             // Check that this is named ".strtab" and ignore otherwise.
239             const char* header_name = GetString(*shstrtab_section_header, section_header->sh_name);
240             if (strncmp(".strtab", header_name, 8) == 0) {
241               if (!CheckAndSet(section_header->sh_offset, "strtab",
242                                reinterpret_cast<uint8_t**>(&strtab_section_start_), error_msg)) {
243                 return false;
244               }
245             }
246           }
247           break;
248         }
249         case SHT_DYNAMIC: {
250           if (reinterpret_cast<uint8_t*>(dynamic_section_start_) !=
251               Begin() + section_header->sh_offset) {
252             LOG(WARNING) << "Failed to find matching SHT_DYNAMIC for PT_DYNAMIC in "
253                          << file->GetPath() << ": " << std::hex
254                          << reinterpret_cast<void*>(dynamic_section_start_)
255                          << " != " << reinterpret_cast<void*>(Begin() + section_header->sh_offset);
256             return false;
257           }
258           break;
259         }
260         case SHT_HASH: {
261           if (!CheckAndSet(section_header->sh_offset, "hash section",
262                            reinterpret_cast<uint8_t**>(&hash_section_start_), error_msg)) {
263             return false;
264           }
265           break;
266         }
267       }
268     }
269 
270     // Check for the existence of some sections.
271     if (!CheckSectionsExist(file, error_msg)) {
272       return false;
273     }
274   }
275 
276   return true;
277 }
278 
279 template <typename ElfTypes>
~ElfFileImpl()280 ElfFileImpl<ElfTypes>::~ElfFileImpl() {
281   delete symtab_symbol_table_;
282   delete dynsym_symbol_table_;
283 }
284 
285 template <typename ElfTypes>
CheckAndSet(Elf32_Off offset,const char * label,uint8_t ** target,std::string * error_msg)286 bool ElfFileImpl<ElfTypes>::CheckAndSet(Elf32_Off offset, const char* label,
287                                         uint8_t** target, std::string* error_msg) {
288   if (Begin() + offset >= End()) {
289     *error_msg = StringPrintf("Offset %d is out of range for %s in ELF file: '%s'", offset, label,
290                               file_path_.c_str());
291     return false;
292   }
293   *target = Begin() + offset;
294   return true;
295 }
296 
297 template <typename ElfTypes>
CheckSectionsLinked(const uint8_t * source,const uint8_t * target) const298 bool ElfFileImpl<ElfTypes>::CheckSectionsLinked(const uint8_t* source,
299                                                 const uint8_t* target) const {
300   // Only works in whole-program mode, as we need to iterate over the sections.
301   // Note that we normally can't search by type, as duplicates are allowed for most section types.
302   if (program_header_only_) {
303     return true;
304   }
305 
306   Elf_Shdr* source_section = nullptr;
307   Elf_Word target_index = 0;
308   bool target_found = false;
309   for (Elf_Word i = 0; i < GetSectionHeaderNum(); i++) {
310     Elf_Shdr* section_header = GetSectionHeader(i);
311 
312     if (Begin() + section_header->sh_offset == source) {
313       // Found the source.
314       source_section = section_header;
315       if (target_index) {
316         break;
317       }
318     } else if (Begin() + section_header->sh_offset == target) {
319       target_index = i;
320       target_found = true;
321       if (source_section != nullptr) {
322         break;
323       }
324     }
325   }
326 
327   return target_found && source_section != nullptr && source_section->sh_link == target_index;
328 }
329 
330 template <typename ElfTypes>
CheckSectionsExist(File * file,std::string * error_msg) const331   bool ElfFileImpl<ElfTypes>::CheckSectionsExist(File* file, std::string* error_msg) const {
332   if (!program_header_only_) {
333     // If in full mode, need section headers.
334     if (section_headers_start_ == nullptr) {
335       *error_msg = StringPrintf("No section headers in ELF file: '%s'", file->GetPath().c_str());
336       return false;
337     }
338   }
339 
340   // This is redundant, but defensive.
341   if (dynamic_program_header_ == nullptr) {
342     *error_msg = StringPrintf("Failed to find PT_DYNAMIC program header in ELF file: '%s'",
343                               file->GetPath().c_str());
344     return false;
345   }
346 
347   // Need a dynamic section. This is redundant, but defensive.
348   if (dynamic_section_start_ == nullptr) {
349     *error_msg = StringPrintf("Failed to find dynamic section in ELF file: '%s'",
350                               file->GetPath().c_str());
351     return false;
352   }
353 
354   // Symtab validation. These is not really a hard failure, as we are currently not using the
355   // symtab internally, but it's nice to be defensive.
356   if (symtab_section_start_ != nullptr) {
357     // When there's a symtab, there should be a strtab.
358     if (strtab_section_start_ == nullptr) {
359       *error_msg = StringPrintf("No strtab for symtab in ELF file: '%s'", file->GetPath().c_str());
360       return false;
361     }
362 
363     // The symtab should link to the strtab.
364     if (!CheckSectionsLinked(reinterpret_cast<const uint8_t*>(symtab_section_start_),
365                              reinterpret_cast<const uint8_t*>(strtab_section_start_))) {
366       *error_msg = StringPrintf("Symtab is not linked to the strtab in ELF file: '%s'",
367                                 file->GetPath().c_str());
368       return false;
369     }
370   }
371 
372   // We always need a dynstr & dynsym.
373   if (dynstr_section_start_ == nullptr) {
374     *error_msg = StringPrintf("No dynstr in ELF file: '%s'", file->GetPath().c_str());
375     return false;
376   }
377   if (dynsym_section_start_ == nullptr) {
378     *error_msg = StringPrintf("No dynsym in ELF file: '%s'", file->GetPath().c_str());
379     return false;
380   }
381 
382   // Need a hash section for dynamic symbol lookup.
383   if (hash_section_start_ == nullptr) {
384     *error_msg = StringPrintf("Failed to find hash section in ELF file: '%s'",
385                               file->GetPath().c_str());
386     return false;
387   }
388 
389   // And the hash section should be linking to the dynsym.
390   if (!CheckSectionsLinked(reinterpret_cast<const uint8_t*>(hash_section_start_),
391                            reinterpret_cast<const uint8_t*>(dynsym_section_start_))) {
392     *error_msg = StringPrintf("Hash section is not linked to the dynstr in ELF file: '%s'",
393                               file->GetPath().c_str());
394     return false;
395   }
396 
397   // We'd also like to confirm a shstrtab in program_header_only_ mode (else Open() does this for
398   // us). This is usually the last in an oat file, and a good indicator of whether writing was
399   // successful (or the process crashed and left garbage).
400   if (program_header_only_) {
401     // It might not be mapped, but we can compare against the file size.
402     int64_t offset = static_cast<int64_t>(GetHeader().e_shoff +
403                                           (GetHeader().e_shstrndx * GetHeader().e_shentsize));
404     if (offset >= file->GetLength()) {
405       *error_msg = StringPrintf("Shstrtab is not in the mapped ELF file: '%s'",
406                                 file->GetPath().c_str());
407       return false;
408     }
409   }
410 
411   return true;
412 }
413 
414 template <typename ElfTypes>
SetMap(File * file,MemMap && map,std::string * error_msg)415 bool ElfFileImpl<ElfTypes>::SetMap(File* file, MemMap&& map, std::string* error_msg) {
416   if (!map.IsValid()) {
417     // MemMap::Open should have already set an error.
418     DCHECK(!error_msg->empty());
419     return false;
420   }
421   map_ = std::move(map);
422   CHECK(map_.IsValid()) << file->GetPath();
423   CHECK(map_.Begin() != nullptr) << file->GetPath();
424 
425   header_ = reinterpret_cast<Elf_Ehdr*>(map_.Begin());
426   if ((ELFMAG0 != header_->e_ident[EI_MAG0])
427       || (ELFMAG1 != header_->e_ident[EI_MAG1])
428       || (ELFMAG2 != header_->e_ident[EI_MAG2])
429       || (ELFMAG3 != header_->e_ident[EI_MAG3])) {
430     *error_msg = StringPrintf("Failed to find ELF magic value %d %d %d %d in %s, found %d %d %d %d",
431                               ELFMAG0, ELFMAG1, ELFMAG2, ELFMAG3,
432                               file->GetPath().c_str(),
433                               header_->e_ident[EI_MAG0],
434                               header_->e_ident[EI_MAG1],
435                               header_->e_ident[EI_MAG2],
436                               header_->e_ident[EI_MAG3]);
437     return false;
438   }
439   uint8_t elf_class = (sizeof(Elf_Addr) == sizeof(Elf64_Addr)) ? ELFCLASS64 : ELFCLASS32;
440   if (elf_class != header_->e_ident[EI_CLASS]) {
441     *error_msg = StringPrintf("Failed to find expected EI_CLASS value %d in %s, found %d",
442                               elf_class,
443                               file->GetPath().c_str(),
444                               header_->e_ident[EI_CLASS]);
445     return false;
446   }
447   if (ELFDATA2LSB != header_->e_ident[EI_DATA]) {
448     *error_msg = StringPrintf("Failed to find expected EI_DATA value %d in %s, found %d",
449                               ELFDATA2LSB,
450                               file->GetPath().c_str(),
451                               header_->e_ident[EI_CLASS]);
452     return false;
453   }
454   if (EV_CURRENT != header_->e_ident[EI_VERSION]) {
455     *error_msg = StringPrintf("Failed to find expected EI_VERSION value %d in %s, found %d",
456                               EV_CURRENT,
457                               file->GetPath().c_str(),
458                               header_->e_ident[EI_CLASS]);
459     return false;
460   }
461   if (ET_DYN != header_->e_type) {
462     *error_msg = StringPrintf("Failed to find expected e_type value %d in %s, found %d",
463                               ET_DYN,
464                               file->GetPath().c_str(),
465                               header_->e_type);
466     return false;
467   }
468   if (EV_CURRENT != header_->e_version) {
469     *error_msg = StringPrintf("Failed to find expected e_version value %d in %s, found %d",
470                               EV_CURRENT,
471                               file->GetPath().c_str(),
472                               header_->e_version);
473     return false;
474   }
475   if (0 != header_->e_entry) {
476     *error_msg = StringPrintf("Failed to find expected e_entry value %d in %s, found %d",
477                               0,
478                               file->GetPath().c_str(),
479                               static_cast<int32_t>(header_->e_entry));
480     return false;
481   }
482   if (0 == header_->e_phoff) {
483     *error_msg = StringPrintf("Failed to find non-zero e_phoff value in %s",
484                               file->GetPath().c_str());
485     return false;
486   }
487   if (0 == header_->e_shoff) {
488     *error_msg = StringPrintf("Failed to find non-zero e_shoff value in %s",
489                               file->GetPath().c_str());
490     return false;
491   }
492   if (0 == header_->e_ehsize) {
493     *error_msg = StringPrintf("Failed to find non-zero e_ehsize value in %s",
494                               file->GetPath().c_str());
495     return false;
496   }
497   if (0 == header_->e_phentsize) {
498     *error_msg = StringPrintf("Failed to find non-zero e_phentsize value in %s",
499                               file->GetPath().c_str());
500     return false;
501   }
502   if (0 == header_->e_phnum) {
503     *error_msg = StringPrintf("Failed to find non-zero e_phnum value in %s",
504                               file->GetPath().c_str());
505     return false;
506   }
507   if (0 == header_->e_shentsize) {
508     *error_msg = StringPrintf("Failed to find non-zero e_shentsize value in %s",
509                               file->GetPath().c_str());
510     return false;
511   }
512   if (0 == header_->e_shnum) {
513     *error_msg = StringPrintf("Failed to find non-zero e_shnum value in %s",
514                               file->GetPath().c_str());
515     return false;
516   }
517   if (0 == header_->e_shstrndx) {
518     *error_msg = StringPrintf("Failed to find non-zero e_shstrndx value in %s",
519                               file->GetPath().c_str());
520     return false;
521   }
522   if (header_->e_shstrndx >= header_->e_shnum) {
523     *error_msg = StringPrintf("Failed to find e_shnum value %d less than %d in %s",
524                               header_->e_shstrndx,
525                               header_->e_shnum,
526                               file->GetPath().c_str());
527     return false;
528   }
529 
530   if (!program_header_only_) {
531     if (header_->e_phoff >= Size()) {
532       *error_msg = StringPrintf("Failed to find e_phoff value %" PRIu64 " less than %zd in %s",
533                                 static_cast<uint64_t>(header_->e_phoff),
534                                 Size(),
535                                 file->GetPath().c_str());
536       return false;
537     }
538     if (header_->e_shoff >= Size()) {
539       *error_msg = StringPrintf("Failed to find e_shoff value %" PRIu64 " less than %zd in %s",
540                                 static_cast<uint64_t>(header_->e_shoff),
541                                 Size(),
542                                 file->GetPath().c_str());
543       return false;
544     }
545   }
546   return true;
547 }
548 
549 template <typename ElfTypes>
GetHeader() const550 typename ElfTypes::Ehdr& ElfFileImpl<ElfTypes>::GetHeader() const {
551   CHECK(header_ != nullptr);  // Header has been checked in SetMap
552   return *header_;
553 }
554 
555 template <typename ElfTypes>
GetProgramHeadersStart() const556 uint8_t* ElfFileImpl<ElfTypes>::GetProgramHeadersStart() const {
557   CHECK(program_headers_start_ != nullptr);  // Header has been set in Setup
558   return program_headers_start_;
559 }
560 
561 template <typename ElfTypes>
GetSectionHeadersStart() const562 uint8_t* ElfFileImpl<ElfTypes>::GetSectionHeadersStart() const {
563   CHECK(!program_header_only_);              // Only used in "full" mode.
564   CHECK(section_headers_start_ != nullptr);  // Is checked in CheckSectionsExist
565   return section_headers_start_;
566 }
567 
568 template <typename ElfTypes>
GetDynamicProgramHeader() const569 typename ElfTypes::Phdr& ElfFileImpl<ElfTypes>::GetDynamicProgramHeader() const {
570   CHECK(dynamic_program_header_ != nullptr);  // Is checked in CheckSectionsExist
571   return *dynamic_program_header_;
572 }
573 
574 template <typename ElfTypes>
GetDynamicSectionStart() const575 typename ElfTypes::Dyn* ElfFileImpl<ElfTypes>::GetDynamicSectionStart() const {
576   CHECK(dynamic_section_start_ != nullptr);  // Is checked in CheckSectionsExist
577   return dynamic_section_start_;
578 }
579 
580 template <typename ElfTypes>
GetSymbolSectionStart(Elf_Word section_type) const581 typename ElfTypes::Sym* ElfFileImpl<ElfTypes>::GetSymbolSectionStart(
582     Elf_Word section_type) const {
583   CHECK(IsSymbolSectionType(section_type)) << file_path_ << " " << section_type;
584   switch (section_type) {
585     case SHT_SYMTAB: {
586       return symtab_section_start_;
587       break;
588     }
589     case SHT_DYNSYM: {
590       return dynsym_section_start_;
591       break;
592     }
593     default: {
594       LOG(FATAL) << section_type;
595       return nullptr;
596     }
597   }
598 }
599 
600 template <typename ElfTypes>
GetStringSectionStart(Elf_Word section_type) const601 const char* ElfFileImpl<ElfTypes>::GetStringSectionStart(
602     Elf_Word section_type) const {
603   CHECK(IsSymbolSectionType(section_type)) << file_path_ << " " << section_type;
604   switch (section_type) {
605     case SHT_SYMTAB: {
606       return strtab_section_start_;
607     }
608     case SHT_DYNSYM: {
609       return dynstr_section_start_;
610     }
611     default: {
612       LOG(FATAL) << section_type;
613       return nullptr;
614     }
615   }
616 }
617 
618 template <typename ElfTypes>
GetString(Elf_Word section_type,Elf_Word i) const619 const char* ElfFileImpl<ElfTypes>::GetString(Elf_Word section_type,
620                                              Elf_Word i) const {
621   CHECK(IsSymbolSectionType(section_type)) << file_path_ << " " << section_type;
622   if (i == 0) {
623     return nullptr;
624   }
625   const char* string_section_start = GetStringSectionStart(section_type);
626   if (string_section_start == nullptr) {
627     return nullptr;
628   }
629   return string_section_start + i;
630 }
631 
632 // WARNING: The following methods do not check for an error condition (non-existent hash section).
633 //          It is the caller's job to do this.
634 
635 template <typename ElfTypes>
GetHashSectionStart() const636 typename ElfTypes::Word* ElfFileImpl<ElfTypes>::GetHashSectionStart() const {
637   return hash_section_start_;
638 }
639 
640 template <typename ElfTypes>
GetHashBucketNum() const641 typename ElfTypes::Word ElfFileImpl<ElfTypes>::GetHashBucketNum() const {
642   return GetHashSectionStart()[0];
643 }
644 
645 template <typename ElfTypes>
GetHashChainNum() const646 typename ElfTypes::Word ElfFileImpl<ElfTypes>::GetHashChainNum() const {
647   return GetHashSectionStart()[1];
648 }
649 
650 template <typename ElfTypes>
GetHashBucket(size_t i,bool * ok) const651 typename ElfTypes::Word ElfFileImpl<ElfTypes>::GetHashBucket(size_t i, bool* ok) const {
652   if (i >= GetHashBucketNum()) {
653     *ok = false;
654     return 0;
655   }
656   *ok = true;
657   // 0 is nbucket, 1 is nchain
658   return GetHashSectionStart()[2 + i];
659 }
660 
661 template <typename ElfTypes>
GetHashChain(size_t i,bool * ok) const662 typename ElfTypes::Word ElfFileImpl<ElfTypes>::GetHashChain(size_t i, bool* ok) const {
663   if (i >= GetHashChainNum()) {
664     *ok = false;
665     return 0;
666   }
667   *ok = true;
668   // 0 is nbucket, 1 is nchain, & chains are after buckets
669   return GetHashSectionStart()[2 + GetHashBucketNum() + i];
670 }
671 
672 template <typename ElfTypes>
GetProgramHeaderNum() const673 typename ElfTypes::Word ElfFileImpl<ElfTypes>::GetProgramHeaderNum() const {
674   return GetHeader().e_phnum;
675 }
676 
677 template <typename ElfTypes>
GetProgramHeader(Elf_Word i) const678 typename ElfTypes::Phdr* ElfFileImpl<ElfTypes>::GetProgramHeader(Elf_Word i) const {
679   CHECK_LT(i, GetProgramHeaderNum()) << file_path_;  // Validity check for caller.
680   uint8_t* program_header = GetProgramHeadersStart() + (i * GetHeader().e_phentsize);
681   CHECK_LT(program_header, End());
682   return reinterpret_cast<Elf_Phdr*>(program_header);
683 }
684 
685 template <typename ElfTypes>
FindProgamHeaderByType(Elf_Word type) const686 typename ElfTypes::Phdr* ElfFileImpl<ElfTypes>::FindProgamHeaderByType(Elf_Word type) const {
687   for (Elf_Word i = 0; i < GetProgramHeaderNum(); i++) {
688     Elf_Phdr* program_header = GetProgramHeader(i);
689     if (program_header->p_type == type) {
690       return program_header;
691     }
692   }
693   return nullptr;
694 }
695 
696 template <typename ElfTypes>
GetSectionHeaderNum() const697 typename ElfTypes::Word ElfFileImpl<ElfTypes>::GetSectionHeaderNum() const {
698   return GetHeader().e_shnum;
699 }
700 
701 template <typename ElfTypes>
GetSectionHeader(Elf_Word i) const702 typename ElfTypes::Shdr* ElfFileImpl<ElfTypes>::GetSectionHeader(Elf_Word i) const {
703   // Can only access arbitrary sections when we have the whole file, not just program header.
704   // Even if we Load(), it doesn't bring in all the sections.
705   CHECK(!program_header_only_) << file_path_;
706   if (i >= GetSectionHeaderNum()) {
707     return nullptr;  // Failure condition.
708   }
709   uint8_t* section_header = GetSectionHeadersStart() + (i * GetHeader().e_shentsize);
710   if (section_header >= End()) {
711     return nullptr;  // Failure condition.
712   }
713   return reinterpret_cast<Elf_Shdr*>(section_header);
714 }
715 
716 template <typename ElfTypes>
FindSectionByType(Elf_Word type) const717 typename ElfTypes::Shdr* ElfFileImpl<ElfTypes>::FindSectionByType(Elf_Word type) const {
718   // Can only access arbitrary sections when we have the whole file, not just program header.
719   // We could change this to switch on known types if they were detected during loading.
720   CHECK(!program_header_only_) << file_path_;
721   for (Elf_Word i = 0; i < GetSectionHeaderNum(); i++) {
722     Elf_Shdr* section_header = GetSectionHeader(i);
723     if (section_header->sh_type == type) {
724       return section_header;
725     }
726   }
727   return nullptr;
728 }
729 
730 // from bionic
elfhash(const char * _name)731 static unsigned elfhash(const char *_name) {
732   const unsigned char *name = (const unsigned char *) _name;
733   unsigned h = 0, g;
734 
735   while (*name) {
736     h = (h << 4) + *name++;
737     g = h & 0xf0000000;
738     h ^= g;
739     h ^= g >> 24;
740   }
741   return h;
742 }
743 
744 template <typename ElfTypes>
GetSectionNameStringSection() const745 typename ElfTypes::Shdr* ElfFileImpl<ElfTypes>::GetSectionNameStringSection() const {
746   return GetSectionHeader(GetHeader().e_shstrndx);
747 }
748 
749 template <typename ElfTypes>
FindDynamicSymbolAddress(const std::string & symbol_name) const750 const uint8_t* ElfFileImpl<ElfTypes>::FindDynamicSymbolAddress(
751     const std::string& symbol_name) const {
752   // Check that we have a hash section.
753   if (GetHashSectionStart() == nullptr) {
754     return nullptr;  // Failure condition.
755   }
756   const Elf_Sym* sym = FindDynamicSymbol(symbol_name);
757   if (sym != nullptr) {
758     // TODO: we need to change this to calculate base_address_ in ::Open,
759     // otherwise it will be wrongly 0 if ::Load has not yet been called.
760     return base_address_ + sym->st_value;
761   } else {
762     return nullptr;
763   }
764 }
765 
766 // WARNING: Only called from FindDynamicSymbolAddress. Elides check for hash section.
767 template <typename ElfTypes>
FindDynamicSymbol(const std::string & symbol_name) const768 const typename ElfTypes::Sym* ElfFileImpl<ElfTypes>::FindDynamicSymbol(
769     const std::string& symbol_name) const {
770   if (GetHashBucketNum() == 0) {
771     // No dynamic symbols at all.
772     return nullptr;
773   }
774   Elf_Word hash = elfhash(symbol_name.c_str());
775   Elf_Word bucket_index = hash % GetHashBucketNum();
776   bool ok;
777   Elf_Word symbol_and_chain_index = GetHashBucket(bucket_index, &ok);
778   if (!ok) {
779     return nullptr;
780   }
781   while (symbol_and_chain_index != 0 /* STN_UNDEF */) {
782     Elf_Sym* symbol = GetSymbol(SHT_DYNSYM, symbol_and_chain_index);
783     if (symbol == nullptr) {
784       return nullptr;  // Failure condition.
785     }
786     const char* name = GetString(SHT_DYNSYM, symbol->st_name);
787     if (symbol_name == name) {
788       return symbol;
789     }
790     symbol_and_chain_index = GetHashChain(symbol_and_chain_index, &ok);
791     if (!ok) {
792       return nullptr;
793     }
794   }
795   return nullptr;
796 }
797 
798 template <typename ElfTypes>
IsSymbolSectionType(Elf_Word section_type)799 bool ElfFileImpl<ElfTypes>::IsSymbolSectionType(Elf_Word section_type) {
800   return ((section_type == SHT_SYMTAB) || (section_type == SHT_DYNSYM));
801 }
802 
803 template <typename ElfTypes>
GetSymbolNum(Elf_Shdr & section_header) const804 typename ElfTypes::Word ElfFileImpl<ElfTypes>::GetSymbolNum(Elf_Shdr& section_header) const {
805   CHECK(IsSymbolSectionType(section_header.sh_type))
806       << file_path_ << " " << section_header.sh_type;
807   CHECK_NE(0U, section_header.sh_entsize) << file_path_;
808   return section_header.sh_size / section_header.sh_entsize;
809 }
810 
811 template <typename ElfTypes>
GetSymbol(Elf_Word section_type,Elf_Word i) const812 typename ElfTypes::Sym* ElfFileImpl<ElfTypes>::GetSymbol(Elf_Word section_type, Elf_Word i) const {
813   Elf_Sym* sym_start = GetSymbolSectionStart(section_type);
814   if (sym_start == nullptr) {
815     return nullptr;
816   }
817   return sym_start + i;
818 }
819 
820 template <typename ElfTypes>
821 typename ElfFileImpl<ElfTypes>::SymbolTable**
GetSymbolTable(Elf_Word section_type)822 ElfFileImpl<ElfTypes>::GetSymbolTable(Elf_Word section_type) {
823   CHECK(IsSymbolSectionType(section_type)) << file_path_ << " " << section_type;
824   switch (section_type) {
825     case SHT_SYMTAB: {
826       return &symtab_symbol_table_;
827     }
828     case SHT_DYNSYM: {
829       return &dynsym_symbol_table_;
830     }
831     default: {
832       LOG(FATAL) << section_type;
833       return nullptr;
834     }
835   }
836 }
837 
838 template <typename ElfTypes>
FindSymbolByName(Elf_Word section_type,const std::string & symbol_name,bool build_map)839 typename ElfTypes::Sym* ElfFileImpl<ElfTypes>::FindSymbolByName(
840     Elf_Word section_type, const std::string& symbol_name, bool build_map) {
841   CHECK(!program_header_only_) << file_path_;
842   CHECK(IsSymbolSectionType(section_type)) << file_path_ << " " << section_type;
843 
844   SymbolTable** symbol_table = GetSymbolTable(section_type);
845   if (*symbol_table != nullptr || build_map) {
846     if (*symbol_table == nullptr) {
847       DCHECK(build_map);
848       *symbol_table = new SymbolTable;
849       Elf_Shdr* symbol_section = FindSectionByType(section_type);
850       if (symbol_section == nullptr) {
851         return nullptr;  // Failure condition.
852       }
853       Elf_Shdr* string_section = GetSectionHeader(symbol_section->sh_link);
854       if (string_section == nullptr) {
855         return nullptr;  // Failure condition.
856       }
857       for (uint32_t i = 0; i < GetSymbolNum(*symbol_section); i++) {
858         Elf_Sym* symbol = GetSymbol(section_type, i);
859         if (symbol == nullptr) {
860           return nullptr;  // Failure condition.
861         }
862         unsigned char type = (sizeof(Elf_Addr) == sizeof(Elf64_Addr))
863                              ? ELF64_ST_TYPE(symbol->st_info)
864                              : ELF32_ST_TYPE(symbol->st_info);
865         if (type == STT_NOTYPE) {
866           continue;
867         }
868         const char* name = GetString(*string_section, symbol->st_name);
869         if (name == nullptr) {
870           continue;
871         }
872         std::pair<typename SymbolTable::iterator, bool> result =
873             (*symbol_table)->insert(std::make_pair(name, symbol));
874         if (!result.second) {
875           // If a duplicate, make sure it has the same logical value. Seen on x86.
876           if ((symbol->st_value != result.first->second->st_value) ||
877               (symbol->st_size != result.first->second->st_size) ||
878               (symbol->st_info != result.first->second->st_info) ||
879               (symbol->st_other != result.first->second->st_other) ||
880               (symbol->st_shndx != result.first->second->st_shndx)) {
881             return nullptr;  // Failure condition.
882           }
883         }
884       }
885     }
886     CHECK(*symbol_table != nullptr);
887     typename SymbolTable::const_iterator it = (*symbol_table)->find(symbol_name);
888     if (it == (*symbol_table)->end()) {
889       return nullptr;
890     }
891     return it->second;
892   }
893 
894   // Fall back to linear search
895   Elf_Shdr* symbol_section = FindSectionByType(section_type);
896   if (symbol_section == nullptr) {
897     return nullptr;
898   }
899   Elf_Shdr* string_section = GetSectionHeader(symbol_section->sh_link);
900   if (string_section == nullptr) {
901     return nullptr;
902   }
903   for (uint32_t i = 0; i < GetSymbolNum(*symbol_section); i++) {
904     Elf_Sym* symbol = GetSymbol(section_type, i);
905     if (symbol == nullptr) {
906       return nullptr;  // Failure condition.
907     }
908     const char* name = GetString(*string_section, symbol->st_name);
909     if (name == nullptr) {
910       continue;
911     }
912     if (symbol_name == name) {
913       return symbol;
914     }
915   }
916   return nullptr;
917 }
918 
919 template <typename ElfTypes>
FindSymbolAddress(Elf_Word section_type,const std::string & symbol_name,bool build_map)920 typename ElfTypes::Addr ElfFileImpl<ElfTypes>::FindSymbolAddress(
921     Elf_Word section_type, const std::string& symbol_name, bool build_map) {
922   Elf_Sym* symbol = FindSymbolByName(section_type, symbol_name, build_map);
923   if (symbol == nullptr) {
924     return 0;
925   }
926   return symbol->st_value;
927 }
928 
929 template <typename ElfTypes>
GetString(Elf_Shdr & string_section,Elf_Word i) const930 const char* ElfFileImpl<ElfTypes>::GetString(Elf_Shdr& string_section,
931                                              Elf_Word i) const {
932   CHECK(!program_header_only_) << file_path_;
933   // TODO: remove this static_cast from enum when using -std=gnu++0x
934   if (static_cast<Elf_Word>(SHT_STRTAB) != string_section.sh_type) {
935     return nullptr;  // Failure condition.
936   }
937   if (i >= string_section.sh_size) {
938     return nullptr;
939   }
940   if (i == 0) {
941     return nullptr;
942   }
943   uint8_t* strings = Begin() + string_section.sh_offset;
944   uint8_t* string = strings + i;
945   if (string >= End()) {
946     return nullptr;
947   }
948   return reinterpret_cast<const char*>(string);
949 }
950 
951 template <typename ElfTypes>
GetDynamicNum() const952 typename ElfTypes::Word ElfFileImpl<ElfTypes>::GetDynamicNum() const {
953   return GetDynamicProgramHeader().p_filesz / sizeof(Elf_Dyn);
954 }
955 
956 template <typename ElfTypes>
GetDynamic(Elf_Word i) const957 typename ElfTypes::Dyn& ElfFileImpl<ElfTypes>::GetDynamic(Elf_Word i) const {
958   CHECK_LT(i, GetDynamicNum()) << file_path_;
959   return *(GetDynamicSectionStart() + i);
960 }
961 
962 template <typename ElfTypes>
FindDynamicByType(Elf_Sword type) const963 typename ElfTypes::Dyn* ElfFileImpl<ElfTypes>::FindDynamicByType(Elf_Sword type) const {
964   for (Elf_Word i = 0; i < GetDynamicNum(); i++) {
965     Elf_Dyn* dyn = &GetDynamic(i);
966     if (dyn->d_tag == type) {
967       return dyn;
968     }
969   }
970   return nullptr;
971 }
972 
973 template <typename ElfTypes>
FindDynamicValueByType(Elf_Sword type) const974 typename ElfTypes::Word ElfFileImpl<ElfTypes>::FindDynamicValueByType(Elf_Sword type) const {
975   Elf_Dyn* dyn = FindDynamicByType(type);
976   if (dyn == nullptr) {
977     return 0;
978   } else {
979     return dyn->d_un.d_val;
980   }
981 }
982 
983 template <typename ElfTypes>
GetRelSectionStart(Elf_Shdr & section_header) const984 typename ElfTypes::Rel* ElfFileImpl<ElfTypes>::GetRelSectionStart(Elf_Shdr& section_header) const {
985   CHECK(SHT_REL == section_header.sh_type) << file_path_ << " " << section_header.sh_type;
986   return reinterpret_cast<Elf_Rel*>(Begin() + section_header.sh_offset);
987 }
988 
989 template <typename ElfTypes>
GetRelNum(Elf_Shdr & section_header) const990 typename ElfTypes::Word ElfFileImpl<ElfTypes>::GetRelNum(Elf_Shdr& section_header) const {
991   CHECK(SHT_REL == section_header.sh_type) << file_path_ << " " << section_header.sh_type;
992   CHECK_NE(0U, section_header.sh_entsize) << file_path_;
993   return section_header.sh_size / section_header.sh_entsize;
994 }
995 
996 template <typename ElfTypes>
GetRel(Elf_Shdr & section_header,Elf_Word i) const997 typename ElfTypes::Rel& ElfFileImpl<ElfTypes>::GetRel(Elf_Shdr& section_header, Elf_Word i) const {
998   CHECK(SHT_REL == section_header.sh_type) << file_path_ << " " << section_header.sh_type;
999   CHECK_LT(i, GetRelNum(section_header)) << file_path_;
1000   return *(GetRelSectionStart(section_header) + i);
1001 }
1002 
1003 template <typename ElfTypes>
GetRelaSectionStart(Elf_Shdr & section_header) const1004 typename ElfTypes::Rela* ElfFileImpl<ElfTypes>::GetRelaSectionStart(Elf_Shdr& section_header) const {
1005   CHECK(SHT_RELA == section_header.sh_type) << file_path_ << " " << section_header.sh_type;
1006   return reinterpret_cast<Elf_Rela*>(Begin() + section_header.sh_offset);
1007 }
1008 
1009 template <typename ElfTypes>
GetRelaNum(Elf_Shdr & section_header) const1010 typename ElfTypes::Word ElfFileImpl<ElfTypes>::GetRelaNum(Elf_Shdr& section_header) const {
1011   CHECK(SHT_RELA == section_header.sh_type) << file_path_ << " " << section_header.sh_type;
1012   return section_header.sh_size / section_header.sh_entsize;
1013 }
1014 
1015 template <typename ElfTypes>
GetRela(Elf_Shdr & section_header,Elf_Word i) const1016 typename ElfTypes::Rela& ElfFileImpl<ElfTypes>::GetRela(Elf_Shdr& section_header, Elf_Word i) const {
1017   CHECK(SHT_RELA == section_header.sh_type) << file_path_ << " " << section_header.sh_type;
1018   CHECK_LT(i, GetRelaNum(section_header)) << file_path_;
1019   return *(GetRelaSectionStart(section_header) + i);
1020 }
1021 
1022 template <typename ElfTypes>
GetLoadedSize(size_t * size,std::string * error_msg) const1023 bool ElfFileImpl<ElfTypes>::GetLoadedSize(size_t* size, std::string* error_msg) const {
1024   uint8_t* vaddr_begin;
1025   return GetLoadedAddressRange(&vaddr_begin, size, error_msg);
1026 }
1027 
1028 // Base on bionic phdr_table_get_load_size
1029 template <typename ElfTypes>
GetLoadedAddressRange(uint8_t ** vaddr_begin,size_t * vaddr_size,std::string * error_msg) const1030 bool ElfFileImpl<ElfTypes>::GetLoadedAddressRange(/*out*/uint8_t** vaddr_begin,
1031                                                   /*out*/size_t* vaddr_size,
1032                                                   /*out*/std::string* error_msg) const {
1033   Elf_Addr min_vaddr = static_cast<Elf_Addr>(-1);
1034   Elf_Addr max_vaddr = 0u;
1035   for (Elf_Word i = 0; i < GetProgramHeaderNum(); i++) {
1036     Elf_Phdr* program_header = GetProgramHeader(i);
1037     if (program_header->p_type != PT_LOAD) {
1038       continue;
1039     }
1040     Elf_Addr begin_vaddr = program_header->p_vaddr;
1041     if (begin_vaddr < min_vaddr) {
1042        min_vaddr = begin_vaddr;
1043     }
1044     Elf_Addr end_vaddr = program_header->p_vaddr + program_header->p_memsz;
1045     if (UNLIKELY(begin_vaddr > end_vaddr)) {
1046       std::ostringstream oss;
1047       oss << "Program header #" << i << " has overflow in p_vaddr+p_memsz: 0x" << std::hex
1048           << program_header->p_vaddr << "+0x" << program_header->p_memsz << "=0x" << end_vaddr
1049           << " in ELF file \"" << file_path_ << "\"";
1050       *error_msg = oss.str();
1051       *vaddr_begin = nullptr;
1052       *vaddr_size = static_cast<size_t>(-1);
1053       return false;
1054     }
1055     if (end_vaddr > max_vaddr) {
1056       max_vaddr = end_vaddr;
1057     }
1058   }
1059   min_vaddr = RoundDown(min_vaddr, kPageSize);
1060   max_vaddr = RoundUp(max_vaddr, kPageSize);
1061   CHECK_LT(min_vaddr, max_vaddr) << file_path_;
1062   // Check that the range fits into the runtime address space.
1063   if (UNLIKELY(max_vaddr - 1u > std::numeric_limits<size_t>::max())) {
1064     std::ostringstream oss;
1065     oss << "Loaded range is 0x" << std::hex << min_vaddr << "-0x" << max_vaddr
1066         << " but maximum size_t is 0x" << std::numeric_limits<size_t>::max()
1067         << " for ELF file \"" << file_path_ << "\"";
1068     *error_msg = oss.str();
1069     *vaddr_begin = nullptr;
1070     *vaddr_size = static_cast<size_t>(-1);
1071     return false;
1072   }
1073   *vaddr_begin = reinterpret_cast<uint8_t*>(min_vaddr);
1074   *vaddr_size = dchecked_integral_cast<size_t>(max_vaddr - min_vaddr);
1075   return true;
1076 }
1077 
GetInstructionSetFromELF(uint16_t e_machine,uint32_t e_flags ATTRIBUTE_UNUSED)1078 static InstructionSet GetInstructionSetFromELF(uint16_t e_machine,
1079                                                uint32_t e_flags ATTRIBUTE_UNUSED) {
1080   switch (e_machine) {
1081     case EM_ARM:
1082       return InstructionSet::kArm;
1083     case EM_AARCH64:
1084       return InstructionSet::kArm64;
1085     case EM_386:
1086       return InstructionSet::kX86;
1087     case EM_X86_64:
1088       return InstructionSet::kX86_64;
1089   }
1090   return InstructionSet::kNone;
1091 }
1092 
1093 template <typename ElfTypes>
Load(File * file,bool executable,bool low_4gb,MemMap * reservation,std::string * error_msg)1094 bool ElfFileImpl<ElfTypes>::Load(File* file,
1095                                  bool executable,
1096                                  bool low_4gb,
1097                                  /*inout*/MemMap* reservation,
1098                                  /*out*/std::string* error_msg) {
1099   CHECK(program_header_only_) << file->GetPath();
1100 
1101   if (executable) {
1102     InstructionSet elf_ISA = GetInstructionSetFromELF(GetHeader().e_machine, GetHeader().e_flags);
1103     if (elf_ISA != kRuntimeISA) {
1104       std::ostringstream oss;
1105       oss << "Expected ISA " << kRuntimeISA << " but found " << elf_ISA;
1106       *error_msg = oss.str();
1107       return false;
1108     }
1109   }
1110 
1111   bool reserved = false;
1112   for (Elf_Word i = 0; i < GetProgramHeaderNum(); i++) {
1113     Elf_Phdr* program_header = GetProgramHeader(i);
1114 
1115     // Record .dynamic header information for later use
1116     if (program_header->p_type == PT_DYNAMIC) {
1117       dynamic_program_header_ = program_header;
1118       continue;
1119     }
1120 
1121     // Not something to load, move on.
1122     if (program_header->p_type != PT_LOAD) {
1123       continue;
1124     }
1125 
1126     // Found something to load.
1127 
1128     // Before load the actual segments, reserve a contiguous chunk
1129     // of required size and address for all segments, but with no
1130     // permissions. We'll then carve that up with the proper
1131     // permissions as we load the actual segments. If p_vaddr is
1132     // non-zero, the segments require the specific address specified,
1133     // which either was specified in the file because we already set
1134     // base_address_ after the first zero segment).
1135     int64_t temp_file_length = file->GetLength();
1136     if (temp_file_length < 0) {
1137       errno = -temp_file_length;
1138       *error_msg = StringPrintf("Failed to get length of file: '%s' fd=%d: %s",
1139                                 file->GetPath().c_str(), file->Fd(), strerror(errno));
1140       return false;
1141     }
1142     size_t file_length = static_cast<size_t>(temp_file_length);
1143     if (!reserved) {
1144       uint8_t* vaddr_begin;
1145       size_t vaddr_size;
1146       if (!GetLoadedAddressRange(&vaddr_begin, &vaddr_size, error_msg)) {
1147         DCHECK(!error_msg->empty());
1148         return false;
1149       }
1150       std::string reservation_name = "ElfFile reservation for " + file->GetPath();
1151       MemMap local_reservation = MemMap::MapAnonymous(
1152           reservation_name.c_str(),
1153           (reservation != nullptr) ? reservation->Begin() : nullptr,
1154           vaddr_size,
1155           PROT_NONE,
1156           low_4gb,
1157           /* reuse= */ false,
1158           reservation,
1159           error_msg);
1160       if (!local_reservation.IsValid()) {
1161         *error_msg = StringPrintf("Failed to allocate %s: %s",
1162                                   reservation_name.c_str(),
1163                                   error_msg->c_str());
1164         return false;
1165       }
1166       reserved = true;
1167 
1168       // Base address is the difference of actual mapped location and the vaddr_begin.
1169       base_address_ = reinterpret_cast<uint8_t*>(
1170           static_cast<uintptr_t>(local_reservation.Begin() - vaddr_begin));
1171       // By adding the p_vaddr of a section/symbol to base_address_ we will always get the
1172       // dynamic memory address of where that object is actually mapped
1173       //
1174       // TODO: base_address_ needs to be calculated in ::Open, otherwise
1175       // FindDynamicSymbolAddress returns the wrong values until Load is called.
1176       segments_.push_back(std::move(local_reservation));
1177     }
1178     // empty segment, nothing to map
1179     if (program_header->p_memsz == 0) {
1180       continue;
1181     }
1182     uint8_t* p_vaddr = base_address_ + program_header->p_vaddr;
1183     int prot = 0;
1184     if (executable && ((program_header->p_flags & PF_X) != 0)) {
1185       prot |= PROT_EXEC;
1186     }
1187     if ((program_header->p_flags & PF_W) != 0) {
1188       prot |= PROT_WRITE;
1189     }
1190     if ((program_header->p_flags & PF_R) != 0) {
1191       prot |= PROT_READ;
1192     }
1193     int flags = 0;
1194     if (writable_) {
1195       prot |= PROT_WRITE;
1196       flags |= MAP_SHARED;
1197     } else {
1198       flags |= MAP_PRIVATE;
1199     }
1200     if (program_header->p_filesz > program_header->p_memsz) {
1201       *error_msg = StringPrintf("Invalid p_filesz > p_memsz (%" PRIu64 " > %" PRIu64 "): %s",
1202                                 static_cast<uint64_t>(program_header->p_filesz),
1203                                 static_cast<uint64_t>(program_header->p_memsz),
1204                                 file->GetPath().c_str());
1205       return false;
1206     }
1207     if (program_header->p_filesz < program_header->p_memsz &&
1208         !IsAligned<kPageSize>(program_header->p_filesz)) {
1209       *error_msg = StringPrintf("Unsupported unaligned p_filesz < p_memsz (%" PRIu64
1210                                 " < %" PRIu64 "): %s",
1211                                 static_cast<uint64_t>(program_header->p_filesz),
1212                                 static_cast<uint64_t>(program_header->p_memsz),
1213                                 file->GetPath().c_str());
1214       return false;
1215     }
1216     if (file_length < (program_header->p_offset + program_header->p_filesz)) {
1217       *error_msg = StringPrintf("File size of %zd bytes not large enough to contain ELF segment "
1218                                 "%d of %" PRIu64 " bytes: '%s'", file_length, i,
1219                                 static_cast<uint64_t>(program_header->p_offset + program_header->p_filesz),
1220                                 file->GetPath().c_str());
1221       return false;
1222     }
1223     if (program_header->p_filesz != 0u) {
1224       MemMap segment =
1225           MemMap::MapFileAtAddress(p_vaddr,
1226                                    program_header->p_filesz,
1227                                    prot,
1228                                    flags,
1229                                    file->Fd(),
1230                                    program_header->p_offset,
1231                                    /* low_4gb= */ false,
1232                                    file->GetPath().c_str(),
1233                                    /* reuse= */ true,  // implies MAP_FIXED
1234                                    /* reservation= */ nullptr,
1235                                    error_msg);
1236       if (!segment.IsValid()) {
1237         *error_msg = StringPrintf("Failed to map ELF file segment %d from %s: %s",
1238                                   i, file->GetPath().c_str(), error_msg->c_str());
1239         return false;
1240       }
1241       if (segment.Begin() != p_vaddr) {
1242         *error_msg = StringPrintf("Failed to map ELF file segment %d from %s at expected address %p, "
1243                                   "instead mapped to %p",
1244                                   i, file->GetPath().c_str(), p_vaddr, segment.Begin());
1245         return false;
1246       }
1247       segments_.push_back(std::move(segment));
1248     }
1249     if (program_header->p_filesz < program_header->p_memsz) {
1250       std::string name = StringPrintf("Zero-initialized segment %" PRIu64 " of ELF file %s",
1251                                       static_cast<uint64_t>(i), file->GetPath().c_str());
1252       MemMap segment = MemMap::MapAnonymous(name.c_str(),
1253                                             p_vaddr + program_header->p_filesz,
1254                                             program_header->p_memsz - program_header->p_filesz,
1255                                             prot,
1256                                             /* low_4gb= */ false,
1257                                             /* reuse= */ true,
1258                                             /* reservation= */ nullptr,
1259                                             error_msg);
1260       if (!segment.IsValid()) {
1261         *error_msg = StringPrintf("Failed to map zero-initialized ELF file segment %d from %s: %s",
1262                                   i, file->GetPath().c_str(), error_msg->c_str());
1263         return false;
1264       }
1265       if (segment.Begin() != p_vaddr) {
1266         *error_msg = StringPrintf("Failed to map zero-initialized ELF file segment %d from %s "
1267                                   "at expected address %p, instead mapped to %p",
1268                                   i, file->GetPath().c_str(), p_vaddr, segment.Begin());
1269         return false;
1270       }
1271       segments_.push_back(std::move(segment));
1272     }
1273   }
1274 
1275   // Now that we are done loading, .dynamic should be in memory to find .dynstr, .dynsym, .hash
1276   uint8_t* dsptr = base_address_ + GetDynamicProgramHeader().p_vaddr;
1277   if ((dsptr < Begin() || dsptr >= End()) && !ValidPointer(dsptr)) {
1278     *error_msg = StringPrintf("dynamic section address invalid in ELF file %s",
1279                               file->GetPath().c_str());
1280     return false;
1281   }
1282   dynamic_section_start_ = reinterpret_cast<Elf_Dyn*>(dsptr);
1283 
1284   for (Elf_Word i = 0; i < GetDynamicNum(); i++) {
1285     Elf_Dyn& elf_dyn = GetDynamic(i);
1286     uint8_t* d_ptr = base_address_ + elf_dyn.d_un.d_ptr;
1287     switch (elf_dyn.d_tag) {
1288       case DT_HASH: {
1289         if (!ValidPointer(d_ptr)) {
1290           *error_msg = StringPrintf("DT_HASH value %p does not refer to a loaded ELF segment of %s",
1291                                     d_ptr, file->GetPath().c_str());
1292           return false;
1293         }
1294         hash_section_start_ = reinterpret_cast<Elf_Word*>(d_ptr);
1295         break;
1296       }
1297       case DT_STRTAB: {
1298         if (!ValidPointer(d_ptr)) {
1299           *error_msg = StringPrintf("DT_HASH value %p does not refer to a loaded ELF segment of %s",
1300                                     d_ptr, file->GetPath().c_str());
1301           return false;
1302         }
1303         dynstr_section_start_ = reinterpret_cast<char*>(d_ptr);
1304         break;
1305       }
1306       case DT_SYMTAB: {
1307         if (!ValidPointer(d_ptr)) {
1308           *error_msg = StringPrintf("DT_HASH value %p does not refer to a loaded ELF segment of %s",
1309                                     d_ptr, file->GetPath().c_str());
1310           return false;
1311         }
1312         dynsym_section_start_ = reinterpret_cast<Elf_Sym*>(d_ptr);
1313         break;
1314       }
1315       case DT_NULL: {
1316         if (GetDynamicNum() != i+1) {
1317           *error_msg = StringPrintf("DT_NULL found after %d .dynamic entries, "
1318                                     "expected %d as implied by size of PT_DYNAMIC segment in %s",
1319                                     i + 1, GetDynamicNum(), file->GetPath().c_str());
1320           return false;
1321         }
1322         break;
1323       }
1324     }
1325   }
1326 
1327   // Check for the existence of some sections.
1328   if (!CheckSectionsExist(file, error_msg)) {
1329     return false;
1330   }
1331 
1332   return true;
1333 }
1334 
1335 template <typename ElfTypes>
ValidPointer(const uint8_t * start) const1336 bool ElfFileImpl<ElfTypes>::ValidPointer(const uint8_t* start) const {
1337   for (const MemMap& segment : segments_) {
1338     if (segment.Begin() <= start && start < segment.End()) {
1339       return true;
1340     }
1341   }
1342   return false;
1343 }
1344 
1345 
1346 template <typename ElfTypes>
FindSectionByName(const std::string & name) const1347 typename ElfTypes::Shdr* ElfFileImpl<ElfTypes>::FindSectionByName(
1348     const std::string& name) const {
1349   CHECK(!program_header_only_);
1350   Elf_Shdr* shstrtab_sec = GetSectionNameStringSection();
1351   if (shstrtab_sec == nullptr) {
1352     return nullptr;
1353   }
1354   for (uint32_t i = 0; i < GetSectionHeaderNum(); i++) {
1355     Elf_Shdr* shdr = GetSectionHeader(i);
1356     if (shdr == nullptr) {
1357       return nullptr;
1358     }
1359     const char* sec_name = GetString(*shstrtab_sec, shdr->sh_name);
1360     if (sec_name == nullptr) {
1361       continue;
1362     }
1363     if (name == sec_name) {
1364       return shdr;
1365     }
1366   }
1367   return nullptr;
1368 }
1369 
1370 template <typename ElfTypes>
Strip(File * file,std::string * error_msg)1371 bool ElfFileImpl<ElfTypes>::Strip(File* file, std::string* error_msg) {
1372   // ELF files produced by MCLinker look roughly like this
1373   //
1374   // +------------+
1375   // | Elf_Ehdr   | contains number of Elf_Shdr and offset to first
1376   // +------------+
1377   // | Elf_Phdr   | program headers
1378   // | Elf_Phdr   |
1379   // | ...        |
1380   // | Elf_Phdr   |
1381   // +------------+
1382   // | section    | mixture of needed and unneeded sections
1383   // +------------+
1384   // | section    |
1385   // +------------+
1386   // | ...        |
1387   // +------------+
1388   // | section    |
1389   // +------------+
1390   // | Elf_Shdr   | section headers
1391   // | Elf_Shdr   |
1392   // | ...        | contains offset to section start
1393   // | Elf_Shdr   |
1394   // +------------+
1395   //
1396   // To strip:
1397   // - leave the Elf_Ehdr and Elf_Phdr values in place.
1398   // - walk the sections making a new set of Elf_Shdr section headers for what we want to keep
1399   // - move the sections are keeping up to fill in gaps of sections we want to strip
1400   // - write new Elf_Shdr section headers to end of file, updating Elf_Ehdr
1401   // - truncate rest of file
1402   //
1403 
1404   std::vector<Elf_Shdr> section_headers;
1405   std::vector<Elf_Word> section_headers_original_indexes;
1406   section_headers.reserve(GetSectionHeaderNum());
1407 
1408 
1409   Elf_Shdr* string_section = GetSectionNameStringSection();
1410   CHECK(string_section != nullptr);
1411   for (Elf_Word i = 0; i < GetSectionHeaderNum(); i++) {
1412     Elf_Shdr* sh = GetSectionHeader(i);
1413     CHECK(sh != nullptr);
1414     const char* name = GetString(*string_section, sh->sh_name);
1415     if (name == nullptr) {
1416       CHECK_EQ(0U, i);
1417       section_headers.push_back(*sh);
1418       section_headers_original_indexes.push_back(0);
1419       continue;
1420     }
1421     if (android::base::StartsWith(name, ".debug")
1422         || (strcmp(name, ".strtab") == 0)
1423         || (strcmp(name, ".symtab") == 0)) {
1424       continue;
1425     }
1426     section_headers.push_back(*sh);
1427     section_headers_original_indexes.push_back(i);
1428   }
1429   CHECK_NE(0U, section_headers.size());
1430   CHECK_EQ(section_headers.size(), section_headers_original_indexes.size());
1431 
1432   // section 0 is the null section, sections start at offset of first section
1433   CHECK(GetSectionHeader(1) != nullptr);
1434   Elf_Off offset = GetSectionHeader(1)->sh_offset;
1435   for (size_t i = 1; i < section_headers.size(); i++) {
1436     Elf_Shdr& new_sh = section_headers[i];
1437     Elf_Shdr* old_sh = GetSectionHeader(section_headers_original_indexes[i]);
1438     CHECK(old_sh != nullptr);
1439     CHECK_EQ(new_sh.sh_name, old_sh->sh_name);
1440     if (old_sh->sh_addralign > 1) {
1441       offset = RoundUp(offset, old_sh->sh_addralign);
1442     }
1443     if (old_sh->sh_offset == offset) {
1444       // already in place
1445       offset += old_sh->sh_size;
1446       continue;
1447     }
1448     // shift section earlier
1449     memmove(Begin() + offset,
1450             Begin() + old_sh->sh_offset,
1451             old_sh->sh_size);
1452     new_sh.sh_offset = offset;
1453     offset += old_sh->sh_size;
1454   }
1455 
1456   Elf_Off shoff = offset;
1457   size_t section_headers_size_in_bytes = section_headers.size() * sizeof(Elf_Shdr);
1458   memcpy(Begin() + offset, &section_headers[0], section_headers_size_in_bytes);
1459   offset += section_headers_size_in_bytes;
1460 
1461   GetHeader().e_shnum = section_headers.size();
1462   GetHeader().e_shoff = shoff;
1463   int result = ftruncate(file->Fd(), offset);
1464   if (result != 0) {
1465     *error_msg = StringPrintf("Failed to truncate while stripping ELF file: '%s': %s",
1466                               file->GetPath().c_str(), strerror(errno));
1467     return false;
1468   }
1469   return true;
1470 }
1471 
1472 // Explicit instantiations
1473 template class ElfFileImpl<ElfTypes32>;
1474 template class ElfFileImpl<ElfTypes64>;
1475 
ElfFile(ElfFileImpl32 * elf32)1476 ElfFile::ElfFile(ElfFileImpl32* elf32) : elf32_(elf32), elf64_(nullptr) {
1477 }
1478 
ElfFile(ElfFileImpl64 * elf64)1479 ElfFile::ElfFile(ElfFileImpl64* elf64) : elf32_(nullptr), elf64_(elf64) {
1480 }
1481 
~ElfFile()1482 ElfFile::~ElfFile() {
1483   // Should never have 32 and 64-bit impls.
1484   CHECK_NE(elf32_.get() == nullptr, elf64_.get() == nullptr);
1485 }
1486 
Open(File * file,bool writable,bool program_header_only,bool low_4gb,std::string * error_msg)1487 ElfFile* ElfFile::Open(File* file,
1488                        bool writable,
1489                        bool program_header_only,
1490                        bool low_4gb,
1491                        /*out*/std::string* error_msg) {
1492   if (file->GetLength() < EI_NIDENT) {
1493     *error_msg = StringPrintf("File %s is too short to be a valid ELF file",
1494                               file->GetPath().c_str());
1495     return nullptr;
1496   }
1497   MemMap map = MemMap::MapFile(EI_NIDENT,
1498                                PROT_READ,
1499                                MAP_PRIVATE,
1500                                file->Fd(),
1501                                0,
1502                                low_4gb,
1503                                file->GetPath().c_str(),
1504                                error_msg);
1505   if (!map.IsValid() || map.Size() != EI_NIDENT) {
1506     return nullptr;
1507   }
1508   uint8_t* header = map.Begin();
1509   if (header[EI_CLASS] == ELFCLASS64) {
1510     ElfFileImpl64* elf_file_impl = ElfFileImpl64::Open(file,
1511                                                        writable,
1512                                                        program_header_only,
1513                                                        low_4gb,
1514                                                        error_msg);
1515     if (elf_file_impl == nullptr) {
1516       return nullptr;
1517     }
1518     return new ElfFile(elf_file_impl);
1519   } else if (header[EI_CLASS] == ELFCLASS32) {
1520     ElfFileImpl32* elf_file_impl = ElfFileImpl32::Open(file,
1521                                                        writable,
1522                                                        program_header_only,
1523                                                        low_4gb,
1524                                                        error_msg);
1525     if (elf_file_impl == nullptr) {
1526       return nullptr;
1527     }
1528     return new ElfFile(elf_file_impl);
1529   } else {
1530     *error_msg = StringPrintf("Failed to find expected EI_CLASS value %d or %d in %s, found %d",
1531                               ELFCLASS32, ELFCLASS64,
1532                               file->GetPath().c_str(),
1533                               header[EI_CLASS]);
1534     return nullptr;
1535   }
1536 }
1537 
Open(File * file,int mmap_prot,int mmap_flags,std::string * error_msg)1538 ElfFile* ElfFile::Open(File* file, int mmap_prot, int mmap_flags, /*out*/std::string* error_msg) {
1539   // low_4gb support not required for this path.
1540   constexpr bool low_4gb = false;
1541   if (file->GetLength() < EI_NIDENT) {
1542     *error_msg = StringPrintf("File %s is too short to be a valid ELF file",
1543                               file->GetPath().c_str());
1544     return nullptr;
1545   }
1546   MemMap map = MemMap::MapFile(EI_NIDENT,
1547                                PROT_READ,
1548                                MAP_PRIVATE,
1549                                file->Fd(),
1550                                /* start= */ 0,
1551                                low_4gb,
1552                                file->GetPath().c_str(),
1553                                error_msg);
1554   if (!map.IsValid() || map.Size() != EI_NIDENT) {
1555     return nullptr;
1556   }
1557   uint8_t* header = map.Begin();
1558   if (header[EI_CLASS] == ELFCLASS64) {
1559     ElfFileImpl64* elf_file_impl = ElfFileImpl64::Open(file,
1560                                                        mmap_prot,
1561                                                        mmap_flags,
1562                                                        low_4gb,
1563                                                        error_msg);
1564     if (elf_file_impl == nullptr) {
1565       return nullptr;
1566     }
1567     return new ElfFile(elf_file_impl);
1568   } else if (header[EI_CLASS] == ELFCLASS32) {
1569     ElfFileImpl32* elf_file_impl = ElfFileImpl32::Open(file,
1570                                                        mmap_prot,
1571                                                        mmap_flags,
1572                                                        low_4gb,
1573                                                        error_msg);
1574     if (elf_file_impl == nullptr) {
1575       return nullptr;
1576     }
1577     return new ElfFile(elf_file_impl);
1578   } else {
1579     *error_msg = StringPrintf("Failed to find expected EI_CLASS value %d or %d in %s, found %d",
1580                               ELFCLASS32, ELFCLASS64,
1581                               file->GetPath().c_str(),
1582                               header[EI_CLASS]);
1583     return nullptr;
1584   }
1585 }
1586 
1587 #define DELEGATE_TO_IMPL(func, ...) \
1588   if (elf64_.get() != nullptr) { \
1589     return elf64_->func(__VA_ARGS__); \
1590   } else { \
1591     DCHECK(elf32_.get() != nullptr); \
1592     return elf32_->func(__VA_ARGS__); \
1593   }
1594 
Load(File * file,bool executable,bool low_4gb,MemMap * reservation,std::string * error_msg)1595 bool ElfFile::Load(File* file,
1596                    bool executable,
1597                    bool low_4gb,
1598                    /*inout*/MemMap* reservation,
1599                    /*out*/std::string* error_msg) {
1600   DELEGATE_TO_IMPL(Load, file, executable, low_4gb, reservation, error_msg);
1601 }
1602 
FindDynamicSymbolAddress(const std::string & symbol_name) const1603 const uint8_t* ElfFile::FindDynamicSymbolAddress(const std::string& symbol_name) const {
1604   DELEGATE_TO_IMPL(FindDynamicSymbolAddress, symbol_name);
1605 }
1606 
Size() const1607 size_t ElfFile::Size() const {
1608   DELEGATE_TO_IMPL(Size);
1609 }
1610 
Begin() const1611 uint8_t* ElfFile::Begin() const {
1612   DELEGATE_TO_IMPL(Begin);
1613 }
1614 
End() const1615 uint8_t* ElfFile::End() const {
1616   DELEGATE_TO_IMPL(End);
1617 }
1618 
GetFilePath() const1619 const std::string& ElfFile::GetFilePath() const {
1620   DELEGATE_TO_IMPL(GetFilePath);
1621 }
1622 
GetSectionOffsetAndSize(const char * section_name,uint64_t * offset,uint64_t * size) const1623 bool ElfFile::GetSectionOffsetAndSize(const char* section_name, uint64_t* offset,
1624                                       uint64_t* size) const {
1625   if (elf32_.get() == nullptr) {
1626     CHECK(elf64_.get() != nullptr);
1627 
1628     Elf64_Shdr *shdr = elf64_->FindSectionByName(section_name);
1629     if (shdr == nullptr) {
1630       return false;
1631     }
1632     if (offset != nullptr) {
1633       *offset = shdr->sh_offset;
1634     }
1635     if (size != nullptr) {
1636       *size = shdr->sh_size;
1637     }
1638     return true;
1639   } else {
1640     Elf32_Shdr *shdr = elf32_->FindSectionByName(section_name);
1641     if (shdr == nullptr) {
1642       return false;
1643     }
1644     if (offset != nullptr) {
1645       *offset = shdr->sh_offset;
1646     }
1647     if (size != nullptr) {
1648       *size = shdr->sh_size;
1649     }
1650     return true;
1651   }
1652 }
1653 
HasSection(const std::string & name) const1654 bool ElfFile::HasSection(const std::string& name) const {
1655   if (elf64_.get() != nullptr) {
1656     return elf64_->FindSectionByName(name) != nullptr;
1657   } else {
1658     return elf32_->FindSectionByName(name) != nullptr;
1659   }
1660 }
1661 
FindSymbolAddress(unsigned section_type,const std::string & symbol_name,bool build_map)1662 uint64_t ElfFile::FindSymbolAddress(unsigned section_type,
1663                                     const std::string& symbol_name,
1664                                     bool build_map) {
1665   DELEGATE_TO_IMPL(FindSymbolAddress, section_type, symbol_name, build_map);
1666 }
1667 
GetLoadedSize(size_t * size,std::string * error_msg) const1668 bool ElfFile::GetLoadedSize(size_t* size, std::string* error_msg) const {
1669   DELEGATE_TO_IMPL(GetLoadedSize, size, error_msg);
1670 }
1671 
Strip(File * file,std::string * error_msg)1672 bool ElfFile::Strip(File* file, std::string* error_msg) {
1673   std::unique_ptr<ElfFile> elf_file(ElfFile::Open(file, true, false, /*low_4gb=*/false, error_msg));
1674   if (elf_file.get() == nullptr) {
1675     return false;
1676   }
1677 
1678   if (elf_file->elf64_.get() != nullptr) {
1679     return elf_file->elf64_->Strip(file, error_msg);
1680   } else {
1681     return elf_file->elf32_->Strip(file, error_msg);
1682   }
1683 }
1684 
1685 }  // namespace art
1686