1 /*
2  * Copyright (C) 2017 The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *      http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 #ifndef ART_RUNTIME_CLASS_LOADER_CONTEXT_H_
18 #define ART_RUNTIME_CLASS_LOADER_CONTEXT_H_
19 
#include <cstddef>
#include <cstdint>
#include <map>
#include <memory>
#include <set>
#include <sstream>
#include <string>
#include <vector>

#include "arch/instruction_set.h"
#include "base/dchecked_vector.h"
#include "dex/dex_file.h"
#include "handle_scope.h"
#include "mirror/class_loader.h"
#include "oat_file.h"
#include "scoped_thread_state_change.h"
31 
32 namespace art {
33 
34 class DexFile;
35 class OatFile;
36 
37 // Utility class which holds the class loader context used during compilation/verification.
38 class ClassLoaderContext {
39  public:
40   enum class VerificationResult {
41     kVerifies,
42     kMismatch,
43   };
44 
45   enum ClassLoaderType {
46     kInvalidClassLoader = 0,
47     kPathClassLoader = 1,
48     kDelegateLastClassLoader = 2,
49     kInMemoryDexClassLoader = 3
50   };
51 
52   // Special encoding used to denote a foreign ClassLoader was found when trying to encode class
53   // loader contexts for each classpath element in a ClassLoader. See
54   // EncodeClassPathContextsForClassLoader. Keep in sync with PackageDexUsage in the framework.
55   static constexpr const char* kUnsupportedClassLoaderContextEncoding =
56       "=UnsupportedClassLoaderContext=";
57 
58   ~ClassLoaderContext();
59 
60   // Opens requested class path files and appends them to ClassLoaderInfo::opened_dex_files.
61   // If the dex files have been stripped, the method opens them from their oat files which are added
62   // to ClassLoaderInfo::opened_oat_files. The 'classpath_dir' argument specifies the directory to
63   // use for the relative class paths.
64   // Returns true if all dex files where successfully opened.
65   // It may be called only once per ClassLoaderContext. Subsequent calls will return the same
66   // result without doing anything.
67   // If `context_fds` is an empty vector, files will be opened using the class path locations as
68   // filenames. Otherwise `context_fds` is expected to contain file descriptors to class path dex
69   // files, following the order of dex file locations in a flattened class loader context. If their
70   // number (size of `context_fds`) does not match the number of dex files, OpenDexFiles will fail.
71   //
72   // This will replace the class path locations with the locations of the opened dex files.
73   // (Note that one dex file can contain multidexes. Each multidex will be added to the classpath
74   // separately.)
75   //
76   // only_read_checksums controls whether or not we only read the dex locations and the checksums
77   // from the apk instead of fully opening the dex files.
78   //
79   // This method is not thread safe.
80   //
81   // Note that a "false" return could mean that either an apk/jar contained no dex files or
82   // that we hit a I/O or checksum mismatch error.
83   // TODO(calin): Currently there's no easy way to tell the difference.
84   //
85   // TODO(calin): we're forced to complicate the flow in this class with a different
86   // OpenDexFiles step because the current dex2oat flow requires the dex files be opened before
87   // the class loader is created. Consider reworking the dex2oat part.
88   bool OpenDexFiles(const std::string& classpath_dir = "",
89                     const std::vector<int>& context_fds = std::vector<int>(),
90                     bool only_read_checksums = false);
91 
92   // Remove the specified compilation sources from all classpaths present in this context.
93   // Should only be called before the first call to OpenDexFiles().
94   bool RemoveLocationsFromClassPaths(const dchecked_vector<std::string>& compilation_sources);
95 
96   // Creates the entire class loader hierarchy according to the current context.
97   // Returns the first class loader from the chain.
98   //
99   // For example: if the context was built from the spec
100   // "ClassLoaderType1[ClasspathElem1:ClasspathElem2...];ClassLoaderType2[...]..."
101   // the method returns the class loader correponding to ClassLoader1. The parent chain will be
102   // ClassLoader1 --> ClassLoader2 --> ... --> BootClassLoader.
103   //
104   // The compilation sources are appended to the classpath of the first class loader (in the above
105   // example ClassLoader1).
106   //
107   // If the context is empty, this method only creates a single PathClassLoader with the
108   // given compilation_sources.
109   //
110   // Shared libraries found in the chain will be canonicalized based on the dex files they
111   // contain.
112   //
113   // Implementation notes:
114   //   1) the objects are not completely set up. Do not use this outside of tests and the compiler.
115   //   2) should only be called before the first call to OpenDexFiles().
116   jobject CreateClassLoader(const std::vector<const DexFile*>& compilation_sources) const;
117 
118   // Encodes the context as a string suitable to be added in oat files.
119   // (so that it can be read and verified at runtime against the actual class
120   // loader hierarchy).
121   // Should only be called if OpenDexFiles() returned true.
122   // If stored context is non-null, the stored names are overwritten by the class path from the
123   // stored context.
124   // E.g. if the context is PCL[a.dex:b.dex] this will return
125   // "PCL[a.dex*a_checksum*b.dex*a_checksum]".
126   std::string EncodeContextForOatFile(const std::string& base_dir,
127                                       ClassLoaderContext* stored_context = nullptr) const;
128 
129   // Encodes the context as a string suitable to be passed to dex2oat.
130   // This is the same as EncodeContextForOatFile but without adding the checksums
131   // and only adding each dex files once (no multidex).
132   // Should only be called if OpenDexFiles() returned true.
133   std::string EncodeContextForDex2oat(const std::string& base_dir) const;
134 
135   // Encodes the contexts for each of the classpath elements in the child-most
136   // classloader. Under the hood EncodeContextForDex2oat is used, so no checksums
137   // will be encoded.
138   // Should only be called if the dex files are opened (either via OpenDexFiles() or by creating the
139   // context from a live class loader).
140   // Notably, for each classpath element the encoded classloader context will contain only the
141   // elements that appear before it in the containing classloader. E.g. if `this` contains
142   // (from child to parent):
143   //
144   // PathClassLoader { multidex.apk!classes.dex, multidex.apk!classes2.dex, foo.dex, bar.dex } ->
145   //    PathClassLoader { baz.dex } -> BootClassLoader
146   //
147   // then the return value will look like:
148   //
149   // `{ "multidex.apk": "PCL[];PCL[baz.dex]",
150   //    "foo.dex"     : "PCL[multidex.apk];PCL[baz.dex]",
151   //    "bar.dex"     : "PCL[multidex.apk:foo.dex];PCL[baz.dex]" }`
152   std::map<std::string, std::string> EncodeClassPathContexts(const std::string& base_dir) const;
153 
154   // Flattens the opened dex files into the given vector.
155   // Should only be called if OpenDexFiles() returned true.
156   std::vector<const DexFile*> FlattenOpenedDexFiles() const;
157 
158   // Return a colon-separated list of dex file locations from this class loader
159   // context after flattening.
160   std::string FlattenDexPaths() const;
161 
162   // Verifies that the current context is identical to the context encoded as `context_spec`.
163   // Identical means:
164   //    - the number and type of the class loaders from the chain matches
165   //    - the class loader from the same position have the same classpath
166   //      (the order and checksum of the dex files matches)
167   // This should be called after OpenDexFiles() with only_read_checksums=true. There's no
168   // need to fully open the dex files if the only thing that needs to be done is to verify
169   // the context.
170   //
171   // Names are only verified if verify_names is true.
172   // Checksums are only verified if verify_checksums is true.
173   VerificationResult VerifyClassLoaderContextMatch(const std::string& context_spec,
174                                                    bool verify_names = true,
175                                                    bool verify_checksums = true) const;
176 
177   // Checks if any of the given dex files is already loaded in the current class loader context.
178   // It only checks the first class loader.
179   // Returns the list of duplicate dex files (empty if there are no duplicates).
180   std::set<const DexFile*> CheckForDuplicateDexFiles(
181       const std::vector<const DexFile*>& dex_files);
182 
183   // Creates the class loader context from the given string.
184   // The format: ClassLoaderType1[ClasspathElem1:ClasspathElem2...];ClassLoaderType2[...]...
185   // ClassLoaderType is either "PCL" (PathClassLoader) or "DLC" (DelegateLastClassLoader).
186   // ClasspathElem is the path of dex/jar/apk file.
187   //
188   // The spec represents a class loader chain with the natural interpretation:
189   // ClassLoader1 has ClassLoader2 as parent which has ClassLoader3 as a parent and so on.
190   // The last class loader is assumed to have the BootClassLoader as a parent.
191   //
192   // Note that we allowed class loaders with an empty class path in order to support a custom
193   // class loader for the source dex files.
194   static std::unique_ptr<ClassLoaderContext> Create(const std::string& spec);
195 
196   // Creates a context for the given class_loader and dex_elements.
197   // The method will walk the parent chain starting from `class_loader` and add their dex files
198   // to the current class loaders chain. The `dex_elements` will be added at the end of the
199   // classpath belonging to the `class_loader` argument.
200   // The ownership of the opened dex files will be retained by the given `class_loader`.
201   // If there are errors in processing the class loader chain (e.g. unsupported elements) the
202   // method returns null.
203   static std::unique_ptr<ClassLoaderContext> CreateContextForClassLoader(jobject class_loader,
204                                                                          jobjectArray dex_elements);
205 
206   // Returns the default class loader context to be used when none is specified.
207   // This will return a context with a single and empty PathClassLoader.
208   static std::unique_ptr<ClassLoaderContext> Default();
209 
210   // Encodes the contexts for each of the classpath elements in `class_loader`. See
211   // ClassLoaderContext::EncodeClassPathContexts for more information about the return value.
212   //
213   // If `class_loader` does not derive from BaseDexClassLoader then an empty map is returned.
214   // Otherwise if a foreign ClassLoader is found in the class loader chain then the results values
215   // will all be ClassLoaderContext::kUnsupportedClassLoaderContextEncoding.
216   static std::map<std::string, std::string> EncodeClassPathContextsForClassLoader(
217       jobject class_loader);
218 
219   // Returns whether `encoded_class_loader_context` is a valid encoded ClassLoaderContext or
220   // EncodedUnsupportedClassLoaderContext.
221   static bool IsValidEncoding(const std::string& possible_encoded_class_loader_context);
222 
223   struct ClassLoaderInfo {
224     // The type of this class loader.
225     ClassLoaderType type;
226     // Shared libraries this context has.
227     std::vector<std::unique_ptr<ClassLoaderInfo>> shared_libraries;
228     // The list of class path elements that this loader loads.
229     // Note that this list may contain relative paths.
230     std::vector<std::string> classpath;
231     // Original opened class path (ignoring multidex).
232     std::vector<std::string> original_classpath;
233     // The list of class path elements checksums.
234     // May be empty if the checksums are not given when the context is created.
235     std::vector<uint32_t> checksums;
236     // After OpenDexFiles is called this holds the opened dex files.
237     std::vector<std::unique_ptr<const DexFile>> opened_dex_files;
238     // After OpenDexFiles, in case some of the dex files were opened from their oat files
239     // this holds the list of opened oat files.
240     std::vector<std::unique_ptr<OatFile>> opened_oat_files;
241     // The parent class loader.
242     std::unique_ptr<ClassLoaderInfo> parent;
243 
ClassLoaderInfoClassLoaderInfo244     explicit ClassLoaderInfo(ClassLoaderType cl_type) : type(cl_type) {}
245   };
246 
247  private:
248   // Creates an empty context (with no class loaders).
249   ClassLoaderContext();
250 
251   // Get the parent of the class loader chain at depth `index`.
GetParent(size_t index)252   ClassLoaderInfo* GetParent(size_t index) const {
253     ClassLoaderInfo* result = class_loader_chain_.get();
254     while ((result != nullptr) && (index-- != 0)) {
255       result = result->parent.get();
256     }
257     return result;
258   }
259 
GetParentChainSize()260   size_t GetParentChainSize() const {
261     size_t result = 0;
262     ClassLoaderInfo* info = class_loader_chain_.get();
263     while (info != nullptr) {
264       ++result;
265       info = info->parent.get();
266     }
267     return result;
268   }
269 
270   // Constructs an empty context.
271   // `owns_the_dex_files` specifies whether or not the context will own the opened dex files
272   // present in the class loader chain. If `owns_the_dex_files` is true then OpenDexFiles cannot
273   // be called on this context (dex_files_open_attempted_ and dex_files_open_result_ will be set
274   // to true as well)
275   explicit ClassLoaderContext(bool owns_the_dex_files);
276 
277   // Reads the class loader spec in place and returns true if the spec is valid and the
278   // compilation context was constructed.
279   bool Parse(const std::string& spec, bool parse_checksums = false);
280   ClassLoaderInfo* ParseInternal(const std::string& spec, bool parse_checksums);
281 
282   // Attempts to parse a single class loader spec.
283   // Returns the ClassLoaderInfo abstraction for this spec, or null if it cannot be parsed.
284   std::unique_ptr<ClassLoaderInfo> ParseClassLoaderSpec(
285       const std::string& class_loader_spec,
286       bool parse_checksums = false);
287 
288   // CHECKs that the dex files were opened (OpenDexFiles was called and set dex_files_open_result_
289   // to true). Aborts if not. The `calling_method` is used in the log message to identify the source
290   // of the call.
291   void CheckDexFilesOpened(const std::string& calling_method) const;
292 
293   // Creates the `ClassLoaderInfo` representing`class_loader` and attach it to `this`.
294   // The dex file present in `dex_elements` array (if not null) will be added at the end of
295   // the classpath.
296   bool CreateInfoFromClassLoader(ScopedObjectAccessAlreadyRunnable& soa,
297                                  Handle<mirror::ClassLoader> class_loader,
298                                  Handle<mirror::ObjectArray<mirror::Object>> dex_elements,
299                                  ClassLoaderInfo* child_info,
300                                  bool is_shared_library)
301     REQUIRES_SHARED(Locks::mutator_lock_);
302 
303   // Encodes the context as a string suitable to be passed to dex2oat or to be added to the
304   // oat file as the class path key.
305   // If for_dex2oat is true, the encoding adds each file once (i.e. it does not add multidex
306   // location). Otherwise, for oat files, the encoding adds all the dex files (including multidex)
307   // together with their checksums.
308   // Should only be called if OpenDexFiles() returned true.
309   std::string EncodeContext(const std::string& base_dir,
310                             bool for_dex2oat,
311                             ClassLoaderContext* stored_context) const;
312 
313   // Internal version of `EncodeContext`, which will be called recursively
314   // on the parent and shared libraries.
315   void EncodeContextInternal(const ClassLoaderInfo& info,
316                              const std::string& base_dir,
317                              bool for_dex2oat,
318                              ClassLoaderInfo* stored_info,
319                              std::ostringstream& out) const;
320 
321   // Encodes e.g. PCL[foo.dex:bar.dex]
322   void EncodeClassPath(const std::string& base_dir,
323                        const std::vector<std::string>& dex_locations,
324                        const std::vector<uint32_t>& checksums,
325                        ClassLoaderType type,
326                        std::ostringstream& out) const;
327 
328   // Encodes the shared libraries classloaders and the parent classloader if
329   // either are present in info, e.g. {PCL[foo.dex]#PCL[bar.dex]};PCL[baz.dex]
330   void EncodeSharedLibAndParent(const ClassLoaderInfo& info,
331                                 const std::string& base_dir,
332                                 bool for_dex2oat,
333                                 ClassLoaderInfo* stored_info,
334                                 std::ostringstream& out) const;
335 
336   bool ClassLoaderInfoMatch(const ClassLoaderInfo& info,
337                             const ClassLoaderInfo& expected_info,
338                             const std::string& context_spec,
339                             bool verify_names,
340                             bool verify_checksums) const;
341 
342   // Extracts the class loader type from the given spec.
343   // Return ClassLoaderContext::kInvalidClassLoader if the class loader type is not
344   // recognized.
345   static ClassLoaderType ExtractClassLoaderType(const std::string& class_loader_spec);
346 
347   // Returns the string representation of the class loader type.
348   // The returned format can be used when parsing a context spec.
349   static const char* GetClassLoaderTypeName(ClassLoaderType type);
350 
351   // Encodes the state of processing the dex files associated with the context.
352   enum ContextDexFilesState {
353     // The dex files are not opened.
354     kDexFilesNotOpened = 1,
355     // The dex checksums/locations were read from the apk/dex but the dex files were not opened.
356     kDexFilesChecksumsRead = 2,
357     // The dex files are opened (either because we called OpenDexFiles, or we used a class loader
358     // to create the context). This implies kDexFilesChecksumsRead.
359     kDexFilesOpened = 3,
360     // We failed to open the dex files or read the checksums.
361     kDexFilesOpenFailed = 4
362   };
363 
364   // The class loader chain.
365   std::unique_ptr<ClassLoaderInfo> class_loader_chain_;
366 
367   // The opening state of the dex files.
368   ContextDexFilesState dex_files_state_;
369 
370   // Whether or not the context owns the opened dex and oat files.
371   // If true, the opened dex files will be de-allocated when the context is destructed.
372   // If false, the objects will continue to be alive.
373   // Note that for convenience the the opened dex/oat files are stored as unique pointers
374   // which will release their ownership in the destructor based on this flag.
375   const bool owns_the_dex_files_;
376 
377   friend class ClassLoaderContextTest;
378 
379   DISALLOW_COPY_AND_ASSIGN(ClassLoaderContext);
380 };
381 
382 }  // namespace art
383 #endif  // ART_RUNTIME_CLASS_LOADER_CONTEXT_H_
384