1 //===-- ubsan_type_hash.cc ------------------------------------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // Implementation of a hash table for fast checking of inheritance
11 // relationships. This file is only linked into C++ compilations, and is
12 // permitted to use language features which require a C++ ABI library.
13 //
14 //===----------------------------------------------------------------------===//
15 
16 #include "ubsan_platform.h"
17 #if CAN_SANITIZE_UB
18 #include "ubsan_type_hash.h"
19 
20 #include "sanitizer_common/sanitizer_common.h"
21 
22 // The following are intended to be binary compatible with the definitions
23 // given in the Itanium ABI. We make no attempt to be ODR-compatible with
24 // those definitions, since existing ABI implementations aren't.
25 
namespace std {

/// Local stand-in for std::type_info. It declares only what this file reads:
/// a virtual destructor (which makes the class polymorphic, so dynamic_cast
/// can be applied to it) followed by the name pointer.
class type_info {
public:
  virtual ~type_info();

  /// Name pointer for the described type; read directly by the code below.
  const char *__type_name;
};

} // namespace std
34 
namespace __cxxabiv1 {

/// Type info for a class without bases; also the common base of the type info
/// classes used for classes that do have bases.
class __class_type_info : public std::type_info {
  // No access specifier precedes this declaration, so it has the class
  // default (private) access.
  ~__class_type_info() override;
};

/// Type info for a class with simple single public inheritance: it records
/// just the one base class.
class __si_class_type_info : public __class_type_info {
public:
  ~__si_class_type_info() override;

  /// Type info of the single base class.
  const __class_type_info *__base_type;
};

/// One entry of the base list stored in a __vmi_class_type_info.
struct __base_class_type_info {
  /// Type info of this base class.
  const __class_type_info *__base_type;
  /// Flag bits in the low byte, offset in the bits above __offset_shift.
  long __offset_flags;

  enum __offset_flags_masks {
    __virtual_mask = 1 << 0,
    __public_mask = 1 << 1,
    __offset_shift = 8
  };
};

/// Type info for a class with multiple, virtual, or non-public inheritance.
class __vmi_class_type_info : public __class_type_info {
public:
  ~__vmi_class_type_info() override;

  unsigned int flags;
  /// Number of entries in base_info.
  unsigned int base_count;
  /// Declared with one element but indexed up to base_count by the code
  /// below.
  __base_class_type_info base_info[1];
};

} // namespace __cxxabiv1
74 
75 namespace abi = __cxxabiv1;
76 
77 // We implement a simple two-level cache for type-checking results. For each
78 // (vptr,type) pair, a hash is computed. This hash is assumed to be globally
79 // unique; if it collides, we will get false negatives, but:
80 //  * such a collision would have to occur on the *first* bad access,
81 //  * the probability of such a collision is low (and for a 64-bit target, is
82 //    negligible), and
83 //  * the vptr, and thus the hash, can be affected by ASLR, so multiple runs
84 //    give better coverage.
85 //
// The first caching layer is a small hash table with no chaining; buckets are
// reused as needed. The second caching layer is a large hash table with open
// addressing and a short, bounded probe sequence. We can freely evict from
// either layer since this is just a cache.
89 //
90 // FIXME: Make these hash table accesses thread-safe. The races here are benign:
91 //        assuming the unsequenced loads and stores don't misbehave too badly,
92 //        the worst case is false negatives or poor cache behavior, not false
93 //        positives or crashes.
94 
95 /// Find a bucket to store the given hash value in.
getTypeCacheHashTableBucket(__ubsan::HashValue V)96 static __ubsan::HashValue *getTypeCacheHashTableBucket(__ubsan::HashValue V) {
97   static const unsigned HashTableSize = 65537;
98   static __ubsan::HashValue __ubsan_vptr_hash_set[HashTableSize];
99 
100   unsigned First = (V & 65535) ^ 1;
101   unsigned Probe = First;
102   for (int Tries = 5; Tries; --Tries) {
103     if (!__ubsan_vptr_hash_set[Probe] || __ubsan_vptr_hash_set[Probe] == V)
104       return &__ubsan_vptr_hash_set[Probe];
105     Probe += ((V >> 16) & 65535) + 1;
106     if (Probe >= HashTableSize)
107       Probe -= HashTableSize;
108   }
109   // FIXME: Pick a random entry from the probe sequence to evict rather than
110   //        just taking the first.
111   return &__ubsan_vptr_hash_set[First];
112 }
113 
114 /// A cache of recently-checked hashes. Mini hash table with "random" evictions.
115 __ubsan::HashValue
116 __ubsan::__ubsan_vptr_type_cache[__ubsan::VptrTypeCacheSize];
117 
118 /// \brief Determine whether \p Derived has a \p Base base class subobject at
119 /// offset \p Offset.
isDerivedFromAtOffset(const abi::__class_type_info * Derived,const abi::__class_type_info * Base,sptr Offset)120 static bool isDerivedFromAtOffset(const abi::__class_type_info *Derived,
121                                   const abi::__class_type_info *Base,
122                                   sptr Offset) {
123   if (Derived->__type_name == Base->__type_name)
124     return Offset == 0;
125 
126   if (const abi::__si_class_type_info *SI =
127         dynamic_cast<const abi::__si_class_type_info*>(Derived))
128     return isDerivedFromAtOffset(SI->__base_type, Base, Offset);
129 
130   const abi::__vmi_class_type_info *VTI =
131     dynamic_cast<const abi::__vmi_class_type_info*>(Derived);
132   if (!VTI)
133     // No base class subobjects.
134     return false;
135 
136   // Look for a base class which is derived from \p Base at the right offset.
137   for (unsigned int base = 0; base != VTI->base_count; ++base) {
138     // FIXME: Curtail the recursion if this base can't possibly contain the
139     //        given offset.
140     sptr OffsetHere = VTI->base_info[base].__offset_flags >>
141                       abi::__base_class_type_info::__offset_shift;
142     if (VTI->base_info[base].__offset_flags &
143           abi::__base_class_type_info::__virtual_mask)
144       // For now, just punt on virtual bases and say 'yes'.
145       // FIXME: OffsetHere is the offset in the vtable of the virtual base
146       //        offset. Read the vbase offset out of the vtable and use it.
147       return true;
148     if (isDerivedFromAtOffset(VTI->base_info[base].__base_type,
149                               Base, Offset - OffsetHere))
150       return true;
151   }
152 
153   return false;
154 }
155 
156 /// \brief Find the derived-most dynamic base class of \p Derived at offset
157 /// \p Offset.
findBaseAtOffset(const abi::__class_type_info * Derived,sptr Offset)158 static const abi::__class_type_info *findBaseAtOffset(
159     const abi::__class_type_info *Derived, sptr Offset) {
160   if (!Offset)
161     return Derived;
162 
163   if (const abi::__si_class_type_info *SI =
164         dynamic_cast<const abi::__si_class_type_info*>(Derived))
165     return findBaseAtOffset(SI->__base_type, Offset);
166 
167   const abi::__vmi_class_type_info *VTI =
168     dynamic_cast<const abi::__vmi_class_type_info*>(Derived);
169   if (!VTI)
170     // No base class subobjects.
171     return 0;
172 
173   for (unsigned int base = 0; base != VTI->base_count; ++base) {
174     sptr OffsetHere = VTI->base_info[base].__offset_flags >>
175                       abi::__base_class_type_info::__offset_shift;
176     if (VTI->base_info[base].__offset_flags &
177           abi::__base_class_type_info::__virtual_mask)
178       // FIXME: Can't handle virtual bases yet.
179       continue;
180     if (const abi::__class_type_info *Base =
181           findBaseAtOffset(VTI->base_info[base].__base_type,
182                            Offset - OffsetHere))
183       return Base;
184   }
185 
186   return 0;
187 }
188 
189 namespace {
190 
191 struct VtablePrefix {
192   /// The offset from the vptr to the start of the most-derived object.
193   /// This should never be greater than zero, and will usually be exactly
194   /// zero.
195   sptr Offset;
196   /// The type_info object describing the most-derived class type.
197   std::type_info *TypeInfo;
198 };
getVtablePrefix(void * Object)199 VtablePrefix *getVtablePrefix(void *Object) {
200   VtablePrefix **VptrPtr = reinterpret_cast<VtablePrefix**>(Object);
201   if (!*VptrPtr)
202     return 0;
203   VtablePrefix *Prefix = *VptrPtr - 1;
204   if (Prefix->Offset > 0 || !Prefix->TypeInfo)
205     // This can't possibly be a valid vtable.
206     return 0;
207   return Prefix;
208 }
209 
210 }
211 
checkDynamicType(void * Object,void * Type,HashValue Hash)212 bool __ubsan::checkDynamicType(void *Object, void *Type, HashValue Hash) {
213   // A crash anywhere within this function probably means the vptr is corrupted.
214   // FIXME: Perform these checks more cautiously.
215 
216   // Check whether this is something we've evicted from the cache.
217   HashValue *Bucket = getTypeCacheHashTableBucket(Hash);
218   if (*Bucket == Hash) {
219     __ubsan_vptr_type_cache[Hash % VptrTypeCacheSize] = Hash;
220     return true;
221   }
222 
223   VtablePrefix *Vtable = getVtablePrefix(Object);
224   if (!Vtable)
225     return false;
226 
227   // Check that this is actually a type_info object for a class type.
228   abi::__class_type_info *Derived =
229     dynamic_cast<abi::__class_type_info*>(Vtable->TypeInfo);
230   if (!Derived)
231     return false;
232 
233   abi::__class_type_info *Base = (abi::__class_type_info*)Type;
234   if (!isDerivedFromAtOffset(Derived, Base, -Vtable->Offset))
235     return false;
236 
237   // Success. Cache this result.
238   __ubsan_vptr_type_cache[Hash % VptrTypeCacheSize] = Hash;
239   *Bucket = Hash;
240   return true;
241 }
242 
getDynamicTypeInfo(void * Object)243 __ubsan::DynamicTypeInfo __ubsan::getDynamicTypeInfo(void *Object) {
244   VtablePrefix *Vtable = getVtablePrefix(Object);
245   if (!Vtable)
246     return DynamicTypeInfo(0, 0, 0);
247   const abi::__class_type_info *ObjectType = findBaseAtOffset(
248     static_cast<const abi::__class_type_info*>(Vtable->TypeInfo),
249     -Vtable->Offset);
250   return DynamicTypeInfo(Vtable->TypeInfo->__type_name, -Vtable->Offset,
251                          ObjectType ? ObjectType->__type_name : "<unknown>");
252 }
253 
254 #endif  // CAN_SANITIZE_UB
255