1 /*
2 * Copyright (C) 2008 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
/*
 * Preparation and completion of hprof data generation. Some of the data
 * (strings and classes) is only discovered while we dump the heap, but some
 * analysis tools require that the class and string data appear first. The
 * dump is therefore processed twice: a first pass only measures the output
 * (with the header tables emitted last), and a second pass writes the header
 * tables followed by the heap data.
 */
24
25 #include "hprof.h"
26
27 #include <cutils/open_memstream.h>
28 #include <errno.h>
29 #include <fcntl.h>
30 #include <stdio.h>
31 #include <string.h>
32 #include <sys/time.h>
33 #include <sys/uio.h>
34 #include <time.h>
35 #include <unistd.h>
36
37 #include <set>
38
39 #include <android-base/logging.h>
40 #include <android-base/stringprintf.h>
41
42 #include "art_field-inl.h"
43 #include "art_method-inl.h"
44 #include "base/array_ref.h"
45 #include "base/macros.h"
46 #include "base/mutex.h"
47 #include "base/os.h"
48 #include "base/safe_map.h"
49 #include "base/time_utils.h"
50 #include "base/unix_file/fd_file.h"
51 #include "class_linker.h"
52 #include "common_throws.h"
53 #include "debugger.h"
54 #include "dex/dex_file-inl.h"
55 #include "gc/accounting/heap_bitmap.h"
56 #include "gc/allocation_record.h"
57 #include "gc/heap-visit-objects-inl.h"
58 #include "gc/heap.h"
59 #include "gc/scoped_gc_critical_section.h"
60 #include "gc/space/space.h"
61 #include "gc_root.h"
62 #include "globals.h"
63 #include "jdwp/jdwp.h"
64 #include "jdwp/jdwp_priv.h"
65 #include "mirror/class-inl.h"
66 #include "mirror/class.h"
67 #include "mirror/object-refvisitor-inl.h"
68 #include "scoped_thread_state_change-inl.h"
69 #include "thread_list.h"
70
71 namespace art {
72
73 namespace hprof {
74
// Selects between the direct and the buffered DDMS dump paths in Hprof::Dump().
static constexpr bool kDirectStream{true};

// Value written into the time field of every record header.
static constexpr uint32_t kHprofTime{0};
// Thread serial number used when no real thread applies (e.g. the dummy stack trace record).
static constexpr uint32_t kHprofNullThread{0};

// A new heap dump segment is started once the current one reaches either of these limits.
static constexpr size_t kMaxObjectsPerSegment{128};
static constexpr size_t kMaxBytesPerSegment{4096};

// The static field-name for the synthetic object generated to account for class static overhead.
static constexpr const char* kClassOverheadName{"$classOverhead"};
85
// Tags of top-level hprof records (the U1 written first by StartNewRecord()), in numeric order.
enum HprofTag {
  HPROF_TAG_STRING            = 0x01,
  HPROF_TAG_LOAD_CLASS        = 0x02,
  HPROF_TAG_UNLOAD_CLASS      = 0x03,
  HPROF_TAG_STACK_FRAME       = 0x04,
  HPROF_TAG_STACK_TRACE       = 0x05,
  HPROF_TAG_ALLOC_SITES       = 0x06,
  HPROF_TAG_HEAP_SUMMARY      = 0x07,
  HPROF_TAG_START_THREAD      = 0x0A,
  HPROF_TAG_END_THREAD        = 0x0B,
  HPROF_TAG_HEAP_DUMP         = 0x0C,
  HPROF_TAG_CPU_SAMPLES       = 0x0D,
  HPROF_TAG_CONTROL_SETTINGS  = 0x0E,
  HPROF_TAG_HEAP_DUMP_SEGMENT = 0x1C,
  HPROF_TAG_HEAP_DUMP_END     = 0x2C,
};
102
// Sub-record tags: the first byte of each entry inside a HEAP_DUMP or
// HEAP_DUMP_SEGMENT record. Entries are listed in numeric order within each group.
enum HprofHeapTag {
  // Traditional.
  HPROF_ROOT_JNI_GLOBAL             = 0x01,
  HPROF_ROOT_JNI_LOCAL              = 0x02,
  HPROF_ROOT_JAVA_FRAME             = 0x03,
  HPROF_ROOT_NATIVE_STACK           = 0x04,
  HPROF_ROOT_STICKY_CLASS           = 0x05,
  HPROF_ROOT_THREAD_BLOCK           = 0x06,
  HPROF_ROOT_MONITOR_USED           = 0x07,
  HPROF_ROOT_THREAD_OBJECT          = 0x08,
  HPROF_CLASS_DUMP                  = 0x20,
  HPROF_INSTANCE_DUMP               = 0x21,
  HPROF_OBJECT_ARRAY_DUMP           = 0x22,
  HPROF_PRIMITIVE_ARRAY_DUMP        = 0x23,
  HPROF_ROOT_UNKNOWN                = 0xFF,

  // Android.
  HPROF_ROOT_INTERNED_STRING        = 0x89,
  HPROF_ROOT_FINALIZING             = 0x8a,  // Obsolete.
  HPROF_ROOT_DEBUGGER               = 0x8b,
  HPROF_ROOT_REFERENCE_CLEANUP      = 0x8c,  // Obsolete.
  HPROF_ROOT_VM_INTERNAL            = 0x8d,
  HPROF_ROOT_JNI_MONITOR            = 0x8e,
  HPROF_UNREACHABLE                 = 0x90,  // Obsolete.
  HPROF_PRIMITIVE_ARRAY_NODATA_DUMP = 0xc3,  // Obsolete.
  HPROF_HEAP_DUMP_INFO              = 0xfe,
};
131
// Identifies which heap the objects currently being dumped belong to. Apart from the default
// heap, each ID is the ASCII code of the heap name's initial.
enum HprofHeapId {
  HPROF_HEAP_DEFAULT = 0,
  HPROF_HEAP_APP     = 'A',
  HPROF_HEAP_IMAGE   = 'I',
  HPROF_HEAP_ZYGOTE  = 'Z',
};
138
// Type codes used for fields and array elements in the dump. Note that the numbering has a gap:
// there are no codes 0, 1 or 3.
enum HprofBasicType {
  hprof_basic_object  = 2,
  hprof_basic_boolean = 4,
  hprof_basic_char    = 5,
  hprof_basic_float   = 6,
  hprof_basic_double  = 7,
  hprof_basic_byte    = 8,
  hprof_basic_short   = 9,
  hprof_basic_int     = 10,
  hprof_basic_long    = 11,
};
150
// All identifiers and serial numbers in the dump are 32 bits wide.
using HprofStringId = uint32_t;
using HprofClassObjectId = uint32_t;
using HprofClassSerialNumber = uint32_t;
using HprofStackTraceSerialNumber = uint32_t;
using HprofStackFrameId = uint32_t;

// Serial number meaning "no stack trace"; also used for the dummy stack trace record.
static constexpr HprofStackTraceSerialNumber kHprofNullStackTrace = 0;
157
158 class EndianOutput {
159 public:
EndianOutput()160 EndianOutput() : length_(0), sum_length_(0), max_length_(0), started_(false) {}
~EndianOutput()161 virtual ~EndianOutput() {}
162
StartNewRecord(uint8_t tag,uint32_t time)163 void StartNewRecord(uint8_t tag, uint32_t time) {
164 if (length_ > 0) {
165 EndRecord();
166 }
167 DCHECK_EQ(length_, 0U);
168 AddU1(tag);
169 AddU4(time);
170 AddU4(0xdeaddead); // Length, replaced on flush.
171 started_ = true;
172 }
173
EndRecord()174 void EndRecord() {
175 // Replace length in header.
176 if (started_) {
177 UpdateU4(sizeof(uint8_t) + sizeof(uint32_t),
178 length_ - sizeof(uint8_t) - 2 * sizeof(uint32_t));
179 }
180
181 HandleEndRecord();
182
183 sum_length_ += length_;
184 max_length_ = std::max(max_length_, length_);
185 length_ = 0;
186 started_ = false;
187 }
188
AddU1(uint8_t value)189 void AddU1(uint8_t value) {
190 AddU1List(&value, 1);
191 }
AddU2(uint16_t value)192 void AddU2(uint16_t value) {
193 AddU2List(&value, 1);
194 }
AddU4(uint32_t value)195 void AddU4(uint32_t value) {
196 AddU4List(&value, 1);
197 }
198
AddU8(uint64_t value)199 void AddU8(uint64_t value) {
200 AddU8List(&value, 1);
201 }
202
AddObjectId(const mirror::Object * value)203 void AddObjectId(const mirror::Object* value) {
204 AddU4(PointerToLowMemUInt32(value));
205 }
206
AddStackTraceSerialNumber(HprofStackTraceSerialNumber value)207 void AddStackTraceSerialNumber(HprofStackTraceSerialNumber value) {
208 AddU4(value);
209 }
210
211 // The ID for the synthetic object generated to account for class static overhead.
AddClassStaticsId(const mirror::Class * value)212 void AddClassStaticsId(const mirror::Class* value) {
213 AddU4(1 | PointerToLowMemUInt32(value));
214 }
215
AddJniGlobalRefId(jobject value)216 void AddJniGlobalRefId(jobject value) {
217 AddU4(PointerToLowMemUInt32(value));
218 }
219
AddClassId(HprofClassObjectId value)220 void AddClassId(HprofClassObjectId value) {
221 AddU4(value);
222 }
223
AddStringId(HprofStringId value)224 void AddStringId(HprofStringId value) {
225 AddU4(value);
226 }
227
AddU1List(const uint8_t * values,size_t count)228 void AddU1List(const uint8_t* values, size_t count) {
229 HandleU1List(values, count);
230 length_ += count;
231 }
AddU2List(const uint16_t * values,size_t count)232 void AddU2List(const uint16_t* values, size_t count) {
233 HandleU2List(values, count);
234 length_ += count * sizeof(uint16_t);
235 }
AddU4List(const uint32_t * values,size_t count)236 void AddU4List(const uint32_t* values, size_t count) {
237 HandleU4List(values, count);
238 length_ += count * sizeof(uint32_t);
239 }
UpdateU4(size_t offset,uint32_t new_value ATTRIBUTE_UNUSED)240 virtual void UpdateU4(size_t offset, uint32_t new_value ATTRIBUTE_UNUSED) {
241 DCHECK_LE(offset, length_ - 4);
242 }
AddU8List(const uint64_t * values,size_t count)243 void AddU8List(const uint64_t* values, size_t count) {
244 HandleU8List(values, count);
245 length_ += count * sizeof(uint64_t);
246 }
247
AddIdList(mirror::ObjectArray<mirror::Object> * values)248 void AddIdList(mirror::ObjectArray<mirror::Object>* values)
249 REQUIRES_SHARED(Locks::mutator_lock_) {
250 const int32_t length = values->GetLength();
251 for (int32_t i = 0; i < length; ++i) {
252 AddObjectId(values->GetWithoutChecks(i));
253 }
254 }
255
AddUtf8String(const char * str)256 void AddUtf8String(const char* str) {
257 // The terminating NUL character is NOT written.
258 AddU1List((const uint8_t*)str, strlen(str));
259 }
260
Length() const261 size_t Length() const {
262 return length_;
263 }
264
SumLength() const265 size_t SumLength() const {
266 return sum_length_;
267 }
268
MaxLength() const269 size_t MaxLength() const {
270 return max_length_;
271 }
272
273 protected:
HandleU1List(const uint8_t * values ATTRIBUTE_UNUSED,size_t count ATTRIBUTE_UNUSED)274 virtual void HandleU1List(const uint8_t* values ATTRIBUTE_UNUSED,
275 size_t count ATTRIBUTE_UNUSED) {
276 }
HandleU1AsU2List(const uint8_t * values ATTRIBUTE_UNUSED,size_t count ATTRIBUTE_UNUSED)277 virtual void HandleU1AsU2List(const uint8_t* values ATTRIBUTE_UNUSED,
278 size_t count ATTRIBUTE_UNUSED) {
279 }
HandleU2List(const uint16_t * values ATTRIBUTE_UNUSED,size_t count ATTRIBUTE_UNUSED)280 virtual void HandleU2List(const uint16_t* values ATTRIBUTE_UNUSED,
281 size_t count ATTRIBUTE_UNUSED) {
282 }
HandleU4List(const uint32_t * values ATTRIBUTE_UNUSED,size_t count ATTRIBUTE_UNUSED)283 virtual void HandleU4List(const uint32_t* values ATTRIBUTE_UNUSED,
284 size_t count ATTRIBUTE_UNUSED) {
285 }
HandleU8List(const uint64_t * values ATTRIBUTE_UNUSED,size_t count ATTRIBUTE_UNUSED)286 virtual void HandleU8List(const uint64_t* values ATTRIBUTE_UNUSED,
287 size_t count ATTRIBUTE_UNUSED) {
288 }
HandleEndRecord()289 virtual void HandleEndRecord() {
290 }
291
292 size_t length_; // Current record size.
293 size_t sum_length_; // Size of all data.
294 size_t max_length_; // Maximum seen length.
295 bool started_; // Was StartRecord called?
296 };
297
298 // This keeps things buffered until flushed.
299 class EndianOutputBuffered : public EndianOutput {
300 public:
EndianOutputBuffered(size_t reserve_size)301 explicit EndianOutputBuffered(size_t reserve_size) {
302 buffer_.reserve(reserve_size);
303 }
~EndianOutputBuffered()304 virtual ~EndianOutputBuffered() {}
305
UpdateU4(size_t offset,uint32_t new_value)306 void UpdateU4(size_t offset, uint32_t new_value) OVERRIDE {
307 DCHECK_LE(offset, length_ - 4);
308 buffer_[offset + 0] = static_cast<uint8_t>((new_value >> 24) & 0xFF);
309 buffer_[offset + 1] = static_cast<uint8_t>((new_value >> 16) & 0xFF);
310 buffer_[offset + 2] = static_cast<uint8_t>((new_value >> 8) & 0xFF);
311 buffer_[offset + 3] = static_cast<uint8_t>((new_value >> 0) & 0xFF);
312 }
313
314 protected:
HandleU1List(const uint8_t * values,size_t count)315 void HandleU1List(const uint8_t* values, size_t count) OVERRIDE {
316 DCHECK_EQ(length_, buffer_.size());
317 buffer_.insert(buffer_.end(), values, values + count);
318 }
319
HandleU1AsU2List(const uint8_t * values,size_t count)320 void HandleU1AsU2List(const uint8_t* values, size_t count) OVERRIDE {
321 DCHECK_EQ(length_, buffer_.size());
322 // All 8-bits are grouped in 2 to make 16-bit block like Java Char
323 if (count & 1) {
324 buffer_.push_back(0);
325 }
326 for (size_t i = 0; i < count; ++i) {
327 uint8_t value = *values;
328 buffer_.push_back(value);
329 values++;
330 }
331 }
332
HandleU2List(const uint16_t * values,size_t count)333 void HandleU2List(const uint16_t* values, size_t count) OVERRIDE {
334 DCHECK_EQ(length_, buffer_.size());
335 for (size_t i = 0; i < count; ++i) {
336 uint16_t value = *values;
337 buffer_.push_back(static_cast<uint8_t>((value >> 8) & 0xFF));
338 buffer_.push_back(static_cast<uint8_t>((value >> 0) & 0xFF));
339 values++;
340 }
341 }
342
HandleU4List(const uint32_t * values,size_t count)343 void HandleU4List(const uint32_t* values, size_t count) OVERRIDE {
344 DCHECK_EQ(length_, buffer_.size());
345 for (size_t i = 0; i < count; ++i) {
346 uint32_t value = *values;
347 buffer_.push_back(static_cast<uint8_t>((value >> 24) & 0xFF));
348 buffer_.push_back(static_cast<uint8_t>((value >> 16) & 0xFF));
349 buffer_.push_back(static_cast<uint8_t>((value >> 8) & 0xFF));
350 buffer_.push_back(static_cast<uint8_t>((value >> 0) & 0xFF));
351 values++;
352 }
353 }
354
HandleU8List(const uint64_t * values,size_t count)355 void HandleU8List(const uint64_t* values, size_t count) OVERRIDE {
356 DCHECK_EQ(length_, buffer_.size());
357 for (size_t i = 0; i < count; ++i) {
358 uint64_t value = *values;
359 buffer_.push_back(static_cast<uint8_t>((value >> 56) & 0xFF));
360 buffer_.push_back(static_cast<uint8_t>((value >> 48) & 0xFF));
361 buffer_.push_back(static_cast<uint8_t>((value >> 40) & 0xFF));
362 buffer_.push_back(static_cast<uint8_t>((value >> 32) & 0xFF));
363 buffer_.push_back(static_cast<uint8_t>((value >> 24) & 0xFF));
364 buffer_.push_back(static_cast<uint8_t>((value >> 16) & 0xFF));
365 buffer_.push_back(static_cast<uint8_t>((value >> 8) & 0xFF));
366 buffer_.push_back(static_cast<uint8_t>((value >> 0) & 0xFF));
367 values++;
368 }
369 }
370
HandleEndRecord()371 void HandleEndRecord() OVERRIDE {
372 DCHECK_EQ(buffer_.size(), length_);
373 if (kIsDebugBuild && started_) {
374 uint32_t stored_length =
375 static_cast<uint32_t>(buffer_[5]) << 24 |
376 static_cast<uint32_t>(buffer_[6]) << 16 |
377 static_cast<uint32_t>(buffer_[7]) << 8 |
378 static_cast<uint32_t>(buffer_[8]);
379 DCHECK_EQ(stored_length, length_ - sizeof(uint8_t) - 2 * sizeof(uint32_t));
380 }
381 HandleFlush(buffer_.data(), length_);
382 buffer_.clear();
383 }
384
HandleFlush(const uint8_t * buffer ATTRIBUTE_UNUSED,size_t length ATTRIBUTE_UNUSED)385 virtual void HandleFlush(const uint8_t* buffer ATTRIBUTE_UNUSED, size_t length ATTRIBUTE_UNUSED) {
386 }
387
388 std::vector<uint8_t> buffer_;
389 };
390
391 class FileEndianOutput FINAL : public EndianOutputBuffered {
392 public:
FileEndianOutput(File * fp,size_t reserved_size)393 FileEndianOutput(File* fp, size_t reserved_size)
394 : EndianOutputBuffered(reserved_size), fp_(fp), errors_(false) {
395 DCHECK(fp != nullptr);
396 }
~FileEndianOutput()397 ~FileEndianOutput() {
398 }
399
Errors()400 bool Errors() {
401 return errors_;
402 }
403
404 protected:
HandleFlush(const uint8_t * buffer,size_t length)405 void HandleFlush(const uint8_t* buffer, size_t length) OVERRIDE {
406 if (!errors_) {
407 errors_ = !fp_->WriteFully(buffer, length);
408 }
409 }
410
411 private:
412 File* fp_;
413 bool errors_;
414 };
415
416 class VectorEndianOuputput FINAL : public EndianOutputBuffered {
417 public:
VectorEndianOuputput(std::vector<uint8_t> & data,size_t reserved_size)418 VectorEndianOuputput(std::vector<uint8_t>& data, size_t reserved_size)
419 : EndianOutputBuffered(reserved_size), full_data_(data) {}
~VectorEndianOuputput()420 ~VectorEndianOuputput() {}
421
422 protected:
HandleFlush(const uint8_t * buf,size_t length)423 void HandleFlush(const uint8_t* buf, size_t length) OVERRIDE {
424 size_t old_size = full_data_.size();
425 full_data_.resize(old_size + length);
426 memcpy(full_data_.data() + old_size, buf, length);
427 }
428
429 private:
430 std::vector<uint8_t>& full_data_;
431 };
432
433 #define __ output_->
434
435 class Hprof : public SingleRootVisitor {
436 public:
Hprof(const char * output_filename,int fd,bool direct_to_ddms)437 Hprof(const char* output_filename, int fd, bool direct_to_ddms)
438 : filename_(output_filename),
439 fd_(fd),
440 direct_to_ddms_(direct_to_ddms) {
441 LOG(INFO) << "hprof: heap dump \"" << filename_ << "\" starting...";
442 }
443
Dump()444 void Dump()
445 REQUIRES(Locks::mutator_lock_)
446 REQUIRES(!Locks::heap_bitmap_lock_, !Locks::alloc_tracker_lock_) {
447 {
448 MutexLock mu(Thread::Current(), *Locks::alloc_tracker_lock_);
449 if (Runtime::Current()->GetHeap()->IsAllocTrackingEnabled()) {
450 PopulateAllocationTrackingTraces();
451 }
452 }
453
454 // First pass to measure the size of the dump.
455 size_t overall_size;
456 size_t max_length;
457 {
458 EndianOutput count_output;
459 output_ = &count_output;
460 ProcessHeap(false);
461 overall_size = count_output.SumLength();
462 max_length = count_output.MaxLength();
463 output_ = nullptr;
464 }
465
466 bool okay;
467 visited_objects_.clear();
468 if (direct_to_ddms_) {
469 if (kDirectStream) {
470 okay = DumpToDdmsDirect(overall_size, max_length, CHUNK_TYPE("HPDS"));
471 } else {
472 okay = DumpToDdmsBuffered(overall_size, max_length);
473 }
474 } else {
475 okay = DumpToFile(overall_size, max_length);
476 }
477
478 if (okay) {
479 const uint64_t duration = NanoTime() - start_ns_;
480 LOG(INFO) << "hprof: heap dump completed (" << PrettySize(RoundUp(overall_size, KB))
481 << ") in " << PrettyDuration(duration)
482 << " objects " << total_objects_
483 << " objects with stack traces " << total_objects_with_stack_trace_;
484 }
485 }
486
487 private:
488 void DumpHeapObject(mirror::Object* obj)
489 REQUIRES_SHARED(Locks::mutator_lock_);
490
491 void DumpHeapClass(mirror::Class* klass)
492 REQUIRES_SHARED(Locks::mutator_lock_);
493
494 void DumpHeapArray(mirror::Array* obj, mirror::Class* klass)
495 REQUIRES_SHARED(Locks::mutator_lock_);
496
497 void DumpFakeObjectArray(mirror::Object* obj, const std::set<mirror::Object*>& elements)
498 REQUIRES_SHARED(Locks::mutator_lock_);
499
500 void DumpHeapInstanceObject(mirror::Object* obj,
501 mirror::Class* klass,
502 const std::set<mirror::Object*>& fake_roots)
503 REQUIRES_SHARED(Locks::mutator_lock_);
504
505 bool AddRuntimeInternalObjectsField(mirror::Class* klass) REQUIRES_SHARED(Locks::mutator_lock_);
506
ProcessHeap(bool header_first)507 void ProcessHeap(bool header_first)
508 REQUIRES(Locks::mutator_lock_) {
509 // Reset current heap and object count.
510 current_heap_ = HPROF_HEAP_DEFAULT;
511 objects_in_segment_ = 0;
512
513 if (header_first) {
514 ProcessHeader(true);
515 ProcessBody();
516 } else {
517 ProcessBody();
518 ProcessHeader(false);
519 }
520 }
521
ProcessBody()522 void ProcessBody() REQUIRES(Locks::mutator_lock_) {
523 Runtime* const runtime = Runtime::Current();
524 // Walk the roots and the heap.
525 output_->StartNewRecord(HPROF_TAG_HEAP_DUMP_SEGMENT, kHprofTime);
526
527 simple_roots_.clear();
528 runtime->VisitRoots(this);
529 runtime->VisitImageRoots(this);
530 auto dump_object = [this](mirror::Object* obj) REQUIRES_SHARED(Locks::mutator_lock_) {
531 DCHECK(obj != nullptr);
532 DumpHeapObject(obj);
533 };
534 runtime->GetHeap()->VisitObjectsPaused(dump_object);
535 output_->StartNewRecord(HPROF_TAG_HEAP_DUMP_END, kHprofTime);
536 output_->EndRecord();
537 }
538
ProcessHeader(bool string_first)539 void ProcessHeader(bool string_first) REQUIRES(Locks::mutator_lock_) {
540 // Write the header.
541 WriteFixedHeader();
542 // Write the string and class tables, and any stack traces, to the header.
543 // (jhat requires that these appear before any of the data in the body that refers to them.)
544 // jhat also requires the string table appear before class table and stack traces.
545 // However, WriteStackTraces() can modify the string table, so it's necessary to call
546 // WriteStringTable() last in the first pass, to compute the correct length of the output.
547 if (string_first) {
548 WriteStringTable();
549 }
550 WriteClassTable();
551 WriteStackTraces();
552 if (!string_first) {
553 WriteStringTable();
554 }
555 output_->EndRecord();
556 }
557
WriteClassTable()558 void WriteClassTable() REQUIRES_SHARED(Locks::mutator_lock_) {
559 for (const auto& p : classes_) {
560 mirror::Class* c = p.first;
561 HprofClassSerialNumber sn = p.second;
562 CHECK(c != nullptr);
563 output_->StartNewRecord(HPROF_TAG_LOAD_CLASS, kHprofTime);
564 // LOAD CLASS format:
565 // U4: class serial number (always > 0)
566 // ID: class object ID. We use the address of the class object structure as its ID.
567 // U4: stack trace serial number
568 // ID: class name string ID
569 __ AddU4(sn);
570 __ AddObjectId(c);
571 __ AddStackTraceSerialNumber(LookupStackTraceSerialNumber(c));
572 __ AddStringId(LookupClassNameId(c));
573 }
574 }
575
WriteStringTable()576 void WriteStringTable() {
577 for (const auto& p : strings_) {
578 const std::string& string = p.first;
579 const HprofStringId id = p.second;
580
581 output_->StartNewRecord(HPROF_TAG_STRING, kHprofTime);
582
583 // STRING format:
584 // ID: ID for this string
585 // U1*: UTF8 characters for string (NOT null terminated)
586 // (the record format encodes the length)
587 __ AddU4(id);
588 __ AddUtf8String(string.c_str());
589 }
590 }
591
StartNewHeapDumpSegment()592 void StartNewHeapDumpSegment() {
593 // This flushes the old segment and starts a new one.
594 output_->StartNewRecord(HPROF_TAG_HEAP_DUMP_SEGMENT, kHprofTime);
595 objects_in_segment_ = 0;
596 // Starting a new HEAP_DUMP resets the heap to default.
597 current_heap_ = HPROF_HEAP_DEFAULT;
598 }
599
CheckHeapSegmentConstraints()600 void CheckHeapSegmentConstraints() {
601 if (objects_in_segment_ >= kMaxObjectsPerSegment || output_->Length() >= kMaxBytesPerSegment) {
602 StartNewHeapDumpSegment();
603 }
604 }
605
606 void VisitRoot(mirror::Object* obj, const RootInfo& root_info)
607 OVERRIDE REQUIRES_SHARED(Locks::mutator_lock_);
608 void MarkRootObject(const mirror::Object* obj, jobject jni_obj, HprofHeapTag heap_tag,
609 uint32_t thread_serial);
610
LookupClassId(mirror::Class * c)611 HprofClassObjectId LookupClassId(mirror::Class* c) REQUIRES_SHARED(Locks::mutator_lock_) {
612 if (c != nullptr) {
613 auto it = classes_.find(c);
614 if (it == classes_.end()) {
615 // first time to see this class
616 HprofClassSerialNumber sn = next_class_serial_number_++;
617 classes_.Put(c, sn);
618 // Make sure that we've assigned a string ID for this class' name
619 LookupClassNameId(c);
620 }
621 }
622 return PointerToLowMemUInt32(c);
623 }
624
LookupStackTraceSerialNumber(const mirror::Object * obj)625 HprofStackTraceSerialNumber LookupStackTraceSerialNumber(const mirror::Object* obj)
626 REQUIRES_SHARED(Locks::mutator_lock_) {
627 auto r = allocation_records_.find(obj);
628 if (r == allocation_records_.end()) {
629 return kHprofNullStackTrace;
630 } else {
631 const gc::AllocRecordStackTrace* trace = r->second;
632 auto result = traces_.find(trace);
633 CHECK(result != traces_.end());
634 return result->second;
635 }
636 }
637
LookupStringId(mirror::String * string)638 HprofStringId LookupStringId(mirror::String* string) REQUIRES_SHARED(Locks::mutator_lock_) {
639 return LookupStringId(string->ToModifiedUtf8());
640 }
641
LookupStringId(const char * string)642 HprofStringId LookupStringId(const char* string) {
643 return LookupStringId(std::string(string));
644 }
645
LookupStringId(const std::string & string)646 HprofStringId LookupStringId(const std::string& string) {
647 auto it = strings_.find(string);
648 if (it != strings_.end()) {
649 return it->second;
650 }
651 HprofStringId id = next_string_id_++;
652 strings_.Put(string, id);
653 return id;
654 }
655
LookupClassNameId(mirror::Class * c)656 HprofStringId LookupClassNameId(mirror::Class* c) REQUIRES_SHARED(Locks::mutator_lock_) {
657 return LookupStringId(c->PrettyDescriptor());
658 }
659
WriteFixedHeader()660 void WriteFixedHeader() {
661 // Write the file header.
662 // U1: NUL-terminated magic string.
663 const char magic[] = "JAVA PROFILE 1.0.3";
664 __ AddU1List(reinterpret_cast<const uint8_t*>(magic), sizeof(magic));
665
666 // U4: size of identifiers. We're using addresses as IDs and our heap references are stored
667 // as uint32_t.
668 // Note of warning: hprof-conv hard-codes the size of identifiers to 4.
669 static_assert(sizeof(mirror::HeapReference<mirror::Object>) == sizeof(uint32_t),
670 "Unexpected HeapReference size");
671 __ AddU4(sizeof(uint32_t));
672
673 // The current time, in milliseconds since 0:00 GMT, 1/1/70.
674 timeval now;
675 const uint64_t nowMs = (gettimeofday(&now, nullptr) < 0) ? 0 :
676 (uint64_t)now.tv_sec * 1000 + now.tv_usec / 1000;
677 // TODO: It seems it would be correct to use U8.
678 // U4: high word of the 64-bit time.
679 __ AddU4(static_cast<uint32_t>(nowMs >> 32));
680 // U4: low word of the 64-bit time.
681 __ AddU4(static_cast<uint32_t>(nowMs & 0xFFFFFFFF));
682 }
683
WriteStackTraces()684 void WriteStackTraces() REQUIRES_SHARED(Locks::mutator_lock_) {
685 // Write a dummy stack trace record so the analysis tools don't freak out.
686 output_->StartNewRecord(HPROF_TAG_STACK_TRACE, kHprofTime);
687 __ AddStackTraceSerialNumber(kHprofNullStackTrace);
688 __ AddU4(kHprofNullThread);
689 __ AddU4(0); // no frames
690
691 // TODO: jhat complains "WARNING: Stack trace not found for serial # -1", but no trace should
692 // have -1 as its serial number (as long as HprofStackTraceSerialNumber doesn't overflow).
693 for (const auto& it : traces_) {
694 const gc::AllocRecordStackTrace* trace = it.first;
695 HprofStackTraceSerialNumber trace_sn = it.second;
696 size_t depth = trace->GetDepth();
697
698 // First write stack frames of the trace
699 for (size_t i = 0; i < depth; ++i) {
700 const gc::AllocRecordStackTraceElement* frame = &trace->GetStackElement(i);
701 ArtMethod* method = frame->GetMethod();
702 CHECK(method != nullptr);
703 output_->StartNewRecord(HPROF_TAG_STACK_FRAME, kHprofTime);
704 // STACK FRAME format:
705 // ID: stack frame ID. We use the address of the AllocRecordStackTraceElement object as its ID.
706 // ID: method name string ID
707 // ID: method signature string ID
708 // ID: source file name string ID
709 // U4: class serial number
710 // U4: >0, line number; 0, no line information available; -1, unknown location
711 auto frame_result = frames_.find(frame);
712 CHECK(frame_result != frames_.end());
713 __ AddU4(frame_result->second);
714 __ AddStringId(LookupStringId(method->GetName()));
715 __ AddStringId(LookupStringId(method->GetSignature().ToString()));
716 const char* source_file = method->GetDeclaringClassSourceFile();
717 if (source_file == nullptr) {
718 source_file = "";
719 }
720 __ AddStringId(LookupStringId(source_file));
721 auto class_result = classes_.find(method->GetDeclaringClass());
722 CHECK(class_result != classes_.end());
723 __ AddU4(class_result->second);
724 __ AddU4(frame->ComputeLineNumber());
725 }
726
727 // Then write the trace itself
728 output_->StartNewRecord(HPROF_TAG_STACK_TRACE, kHprofTime);
729 // STACK TRACE format:
730 // U4: stack trace serial number. We use the address of the AllocRecordStackTrace object as its serial number.
731 // U4: thread serial number. We use Thread::GetTid().
732 // U4: number of frames
733 // [ID]*: series of stack frame ID's
734 __ AddStackTraceSerialNumber(trace_sn);
735 __ AddU4(trace->GetTid());
736 __ AddU4(depth);
737 for (size_t i = 0; i < depth; ++i) {
738 const gc::AllocRecordStackTraceElement* frame = &trace->GetStackElement(i);
739 auto frame_result = frames_.find(frame);
740 CHECK(frame_result != frames_.end());
741 __ AddU4(frame_result->second);
742 }
743 }
744 }
745
DumpToDdmsBuffered(size_t overall_size ATTRIBUTE_UNUSED,size_t max_length ATTRIBUTE_UNUSED)746 bool DumpToDdmsBuffered(size_t overall_size ATTRIBUTE_UNUSED, size_t max_length ATTRIBUTE_UNUSED)
747 REQUIRES(Locks::mutator_lock_) {
748 LOG(FATAL) << "Unimplemented";
749 UNREACHABLE();
750 // // Send the data off to DDMS.
751 // iovec iov[2];
752 // iov[0].iov_base = header_data_ptr_;
753 // iov[0].iov_len = header_data_size_;
754 // iov[1].iov_base = body_data_ptr_;
755 // iov[1].iov_len = body_data_size_;
756 // Dbg::DdmSendChunkV(CHUNK_TYPE("HPDS"), iov, 2);
757 }
758
DumpToFile(size_t overall_size,size_t max_length)759 bool DumpToFile(size_t overall_size, size_t max_length)
760 REQUIRES(Locks::mutator_lock_) {
761 // Where exactly are we writing to?
762 int out_fd;
763 if (fd_ >= 0) {
764 out_fd = dup(fd_);
765 if (out_fd < 0) {
766 ThrowRuntimeException("Couldn't dump heap; dup(%d) failed: %s", fd_, strerror(errno));
767 return false;
768 }
769 } else {
770 out_fd = open(filename_.c_str(), O_WRONLY|O_CREAT|O_TRUNC, 0644);
771 if (out_fd < 0) {
772 ThrowRuntimeException("Couldn't dump heap; open(\"%s\") failed: %s", filename_.c_str(),
773 strerror(errno));
774 return false;
775 }
776 }
777
778 std::unique_ptr<File> file(new File(out_fd, filename_, true));
779 bool okay;
780 {
781 FileEndianOutput file_output(file.get(), max_length);
782 output_ = &file_output;
783 ProcessHeap(true);
784 okay = !file_output.Errors();
785
786 if (okay) {
787 // Check for expected size. Output is expected to be less-or-equal than first phase, see
788 // b/23521263.
789 DCHECK_LE(file_output.SumLength(), overall_size);
790 }
791 output_ = nullptr;
792 }
793
794 if (okay) {
795 okay = file->FlushCloseOrErase() == 0;
796 } else {
797 file->Erase();
798 }
799 if (!okay) {
800 std::string msg(android::base::StringPrintf("Couldn't dump heap; writing \"%s\" failed: %s",
801 filename_.c_str(),
802 strerror(errno)));
803 ThrowRuntimeException("%s", msg.c_str());
804 LOG(ERROR) << msg;
805 }
806
807 return okay;
808 }
809
DumpToDdmsDirect(size_t overall_size,size_t max_length,uint32_t chunk_type)810 bool DumpToDdmsDirect(size_t overall_size, size_t max_length, uint32_t chunk_type)
811 REQUIRES(Locks::mutator_lock_) {
812 CHECK(direct_to_ddms_);
813
814 std::vector<uint8_t> out_data;
815
816 // TODO It would be really good to have some streaming thing again. b/73084059
817 VectorEndianOuputput output(out_data, max_length);
818 output_ = &output;
819
820 // Write the dump.
821 ProcessHeap(true);
822
823 Runtime::Current()->GetRuntimeCallbacks()->DdmPublishChunk(
824 chunk_type, ArrayRef<const uint8_t>(out_data.data(), out_data.size()));
825
826 // Check for expected size. See DumpToFile for comment.
827 DCHECK_LE(output.SumLength(), overall_size);
828 output_ = nullptr;
829
830 return true;
831 }
832
PopulateAllocationTrackingTraces()833 void PopulateAllocationTrackingTraces()
834 REQUIRES(Locks::mutator_lock_, Locks::alloc_tracker_lock_) {
835 gc::AllocRecordObjectMap* records = Runtime::Current()->GetHeap()->GetAllocationRecords();
836 CHECK(records != nullptr);
837 HprofStackTraceSerialNumber next_trace_sn = kHprofNullStackTrace + 1;
838 HprofStackFrameId next_frame_id = 0;
839 size_t count = 0;
840
841 for (auto it = records->Begin(), end = records->End(); it != end; ++it) {
842 const mirror::Object* obj = it->first.Read();
843 if (obj == nullptr) {
844 continue;
845 }
846 ++count;
847 const gc::AllocRecordStackTrace* trace = it->second.GetStackTrace();
848
849 // Copy the pair into a real hash map to speed up look up.
850 auto records_result = allocation_records_.emplace(obj, trace);
851 // The insertion should always succeed, i.e. no duplicate object pointers in "records"
852 CHECK(records_result.second);
853
854 // Generate serial numbers for traces, and IDs for frames.
855 auto traces_result = traces_.find(trace);
856 if (traces_result == traces_.end()) {
857 traces_.emplace(trace, next_trace_sn++);
858 // only check frames if the trace is newly discovered
859 for (size_t i = 0, depth = trace->GetDepth(); i < depth; ++i) {
860 const gc::AllocRecordStackTraceElement* frame = &trace->GetStackElement(i);
861 auto frames_result = frames_.find(frame);
862 if (frames_result == frames_.end()) {
863 frames_.emplace(frame, next_frame_id++);
864 }
865 }
866 }
867 }
868 CHECK_EQ(traces_.size(), next_trace_sn - kHprofNullStackTrace - 1);
869 CHECK_EQ(frames_.size(), next_frame_id);
870 total_objects_with_stack_trace_ = count;
871 }
872
873 // If direct_to_ddms_ is set, "filename_" and "fd" will be ignored.
874 // Otherwise, "filename_" must be valid, though if "fd" >= 0 it will
875 // only be used for debug messages.
876 std::string filename_;
877 int fd_;
878 bool direct_to_ddms_;
879
880 uint64_t start_ns_ = NanoTime();
881
882 EndianOutput* output_ = nullptr;
883
884 HprofHeapId current_heap_ = HPROF_HEAP_DEFAULT; // Which heap we're currently dumping.
885 size_t objects_in_segment_ = 0;
886
887 size_t total_objects_ = 0u;
888 size_t total_objects_with_stack_trace_ = 0u;
889
890 HprofStringId next_string_id_ = 0x400000;
891 SafeMap<std::string, HprofStringId> strings_;
892 HprofClassSerialNumber next_class_serial_number_ = 1;
893 SafeMap<mirror::Class*, HprofClassSerialNumber> classes_;
894
895 std::unordered_map<const gc::AllocRecordStackTrace*, HprofStackTraceSerialNumber,
896 gc::HashAllocRecordTypesPtr<gc::AllocRecordStackTrace>,
897 gc::EqAllocRecordTypesPtr<gc::AllocRecordStackTrace>> traces_;
898 std::unordered_map<const gc::AllocRecordStackTraceElement*, HprofStackFrameId,
899 gc::HashAllocRecordTypesPtr<gc::AllocRecordStackTraceElement>,
900 gc::EqAllocRecordTypesPtr<gc::AllocRecordStackTraceElement>> frames_;
901 std::unordered_map<const mirror::Object*, const gc::AllocRecordStackTrace*> allocation_records_;
902
903 // Set used to keep track of what simple root records we have already
904 // emitted, to avoid emitting duplicate entries. The simple root records are
905 // those that contain no other information than the root type and the object
906 // id. A pair of root type and object id is packed into a uint64_t, with
907 // the root type in the upper 32 bits and the object id in the lower 32
908 // bits.
909 std::unordered_set<uint64_t> simple_roots_;
910
911 // To make sure we don't dump the same object multiple times. b/34967844
912 std::unordered_set<mirror::Object*> visited_objects_;
913
914 friend class GcRootVisitor;
915 DISALLOW_COPY_AND_ASSIGN(Hprof);
916 };
917
SignatureToBasicTypeAndSize(const char * sig,size_t * size_out)918 static HprofBasicType SignatureToBasicTypeAndSize(const char* sig, size_t* size_out) {
919 char c = sig[0];
920 HprofBasicType ret;
921 size_t size;
922
923 switch (c) {
924 case '[':
925 case 'L':
926 ret = hprof_basic_object;
927 size = 4;
928 break;
929 case 'Z':
930 ret = hprof_basic_boolean;
931 size = 1;
932 break;
933 case 'C':
934 ret = hprof_basic_char;
935 size = 2;
936 break;
937 case 'F':
938 ret = hprof_basic_float;
939 size = 4;
940 break;
941 case 'D':
942 ret = hprof_basic_double;
943 size = 8;
944 break;
945 case 'B':
946 ret = hprof_basic_byte;
947 size = 1;
948 break;
949 case 'S':
950 ret = hprof_basic_short;
951 size = 2;
952 break;
953 case 'I':
954 ret = hprof_basic_int;
955 size = 4;
956 break;
957 case 'J':
958 ret = hprof_basic_long;
959 size = 8;
960 break;
961 default:
962 LOG(FATAL) << "UNREACHABLE";
963 UNREACHABLE();
964 }
965
966 if (size_out != nullptr) {
967 *size_out = size;
968 }
969
970 return ret;
971 }
972
973 // Always called when marking objects, but only does
974 // something when ctx->gc_scan_state_ is non-zero, which is usually
975 // only true when marking the root set or unreachable
976 // objects. Used to add rootset references to obj.
MarkRootObject(const mirror::Object * obj,jobject jni_obj,HprofHeapTag heap_tag,uint32_t thread_serial)977 void Hprof::MarkRootObject(const mirror::Object* obj, jobject jni_obj, HprofHeapTag heap_tag,
978 uint32_t thread_serial) {
979 if (heap_tag == 0) {
980 return;
981 }
982
983 CheckHeapSegmentConstraints();
984
985 switch (heap_tag) {
986 // ID: object ID
987 case HPROF_ROOT_UNKNOWN:
988 case HPROF_ROOT_STICKY_CLASS:
989 case HPROF_ROOT_MONITOR_USED:
990 case HPROF_ROOT_INTERNED_STRING:
991 case HPROF_ROOT_DEBUGGER:
992 case HPROF_ROOT_VM_INTERNAL: {
993 uint64_t key = (static_cast<uint64_t>(heap_tag) << 32) | PointerToLowMemUInt32(obj);
994 if (simple_roots_.insert(key).second) {
995 __ AddU1(heap_tag);
996 __ AddObjectId(obj);
997 }
998 break;
999 }
1000
1001 // ID: object ID
1002 // ID: JNI global ref ID
1003 case HPROF_ROOT_JNI_GLOBAL:
1004 __ AddU1(heap_tag);
1005 __ AddObjectId(obj);
1006 __ AddJniGlobalRefId(jni_obj);
1007 break;
1008
1009 // ID: object ID
1010 // U4: thread serial number
1011 // U4: frame number in stack trace (-1 for empty)
1012 case HPROF_ROOT_JNI_LOCAL:
1013 case HPROF_ROOT_JNI_MONITOR:
1014 case HPROF_ROOT_JAVA_FRAME:
1015 __ AddU1(heap_tag);
1016 __ AddObjectId(obj);
1017 __ AddU4(thread_serial);
1018 __ AddU4((uint32_t)-1);
1019 break;
1020
1021 // ID: object ID
1022 // U4: thread serial number
1023 case HPROF_ROOT_NATIVE_STACK:
1024 case HPROF_ROOT_THREAD_BLOCK:
1025 __ AddU1(heap_tag);
1026 __ AddObjectId(obj);
1027 __ AddU4(thread_serial);
1028 break;
1029
1030 // ID: thread object ID
1031 // U4: thread serial number
1032 // U4: stack trace serial number
1033 case HPROF_ROOT_THREAD_OBJECT:
1034 __ AddU1(heap_tag);
1035 __ AddObjectId(obj);
1036 __ AddU4(thread_serial);
1037 __ AddU4((uint32_t)-1); // xxx
1038 break;
1039
1040 case HPROF_CLASS_DUMP:
1041 case HPROF_INSTANCE_DUMP:
1042 case HPROF_OBJECT_ARRAY_DUMP:
1043 case HPROF_PRIMITIVE_ARRAY_DUMP:
1044 case HPROF_HEAP_DUMP_INFO:
1045 case HPROF_PRIMITIVE_ARRAY_NODATA_DUMP:
1046 // Ignored.
1047 break;
1048
1049 case HPROF_ROOT_FINALIZING:
1050 case HPROF_ROOT_REFERENCE_CLEANUP:
1051 case HPROF_UNREACHABLE:
1052 LOG(FATAL) << "obsolete tag " << static_cast<int>(heap_tag);
1053 break;
1054 }
1055
1056 ++objects_in_segment_;
1057 }
1058
AddRuntimeInternalObjectsField(mirror::Class * klass)1059 bool Hprof::AddRuntimeInternalObjectsField(mirror::Class* klass) {
1060 if (klass->IsDexCacheClass()) {
1061 return true;
1062 }
1063 // IsClassLoaderClass is true for subclasses of classloader but we only want to add the fake
1064 // field to the java.lang.ClassLoader class.
1065 if (klass->IsClassLoaderClass() && klass->GetSuperClass()->IsObjectClass()) {
1066 return true;
1067 }
1068 return false;
1069 }
1070
DumpHeapObject(mirror::Object * obj)1071 void Hprof::DumpHeapObject(mirror::Object* obj) {
1072 // Ignore classes that are retired.
1073 if (obj->IsClass() && obj->AsClass()->IsRetired()) {
1074 return;
1075 }
1076 DCHECK(visited_objects_.insert(obj).second) << "Already visited " << obj;
1077
1078 ++total_objects_;
1079
1080 class RootCollector {
1081 public:
1082 RootCollector() {}
1083
1084 void operator()(mirror::Object*, MemberOffset, bool) const {}
1085
1086 // Note that these don't have read barriers. Its OK however since the GC is guaranteed to not be
1087 // running during the hprof dumping process.
1088 void VisitRootIfNonNull(mirror::CompressedReference<mirror::Object>* root) const
1089 REQUIRES_SHARED(Locks::mutator_lock_) {
1090 if (!root->IsNull()) {
1091 VisitRoot(root);
1092 }
1093 }
1094
1095 void VisitRoot(mirror::CompressedReference<mirror::Object>* root) const
1096 REQUIRES_SHARED(Locks::mutator_lock_) {
1097 roots_.insert(root->AsMirrorPtr());
1098 }
1099
1100 const std::set<mirror::Object*>& GetRoots() const {
1101 return roots_;
1102 }
1103
1104 private:
1105 // These roots are actually live from the object. Avoid marking them as roots in hprof to make
1106 // it easier to debug class unloading.
1107 mutable std::set<mirror::Object*> roots_;
1108 };
1109
1110 RootCollector visitor;
1111 // Collect all native roots.
1112 if (!obj->IsClass()) {
1113 obj->VisitReferences(visitor, VoidFunctor());
1114 }
1115
1116 gc::Heap* const heap = Runtime::Current()->GetHeap();
1117 const gc::space::ContinuousSpace* const space = heap->FindContinuousSpaceFromObject(obj, true);
1118 HprofHeapId heap_type = HPROF_HEAP_APP;
1119 if (space != nullptr) {
1120 if (space->IsZygoteSpace()) {
1121 heap_type = HPROF_HEAP_ZYGOTE;
1122 VisitRoot(obj, RootInfo(kRootVMInternal));
1123 } else if (space->IsImageSpace() && heap->ObjectIsInBootImageSpace(obj)) {
1124 // Only count objects in the boot image as HPROF_HEAP_IMAGE, this leaves app image objects as
1125 // HPROF_HEAP_APP. b/35762934
1126 heap_type = HPROF_HEAP_IMAGE;
1127 VisitRoot(obj, RootInfo(kRootVMInternal));
1128 }
1129 } else {
1130 const auto* los = heap->GetLargeObjectsSpace();
1131 if (los->Contains(obj) && los->IsZygoteLargeObject(Thread::Current(), obj)) {
1132 heap_type = HPROF_HEAP_ZYGOTE;
1133 VisitRoot(obj, RootInfo(kRootVMInternal));
1134 }
1135 }
1136 CheckHeapSegmentConstraints();
1137
1138 if (heap_type != current_heap_) {
1139 HprofStringId nameId;
1140
1141 // This object is in a different heap than the current one.
1142 // Emit a HEAP_DUMP_INFO tag to change heaps.
1143 __ AddU1(HPROF_HEAP_DUMP_INFO);
1144 __ AddU4(static_cast<uint32_t>(heap_type)); // uint32_t: heap type
1145 switch (heap_type) {
1146 case HPROF_HEAP_APP:
1147 nameId = LookupStringId("app");
1148 break;
1149 case HPROF_HEAP_ZYGOTE:
1150 nameId = LookupStringId("zygote");
1151 break;
1152 case HPROF_HEAP_IMAGE:
1153 nameId = LookupStringId("image");
1154 break;
1155 default:
1156 // Internal error
1157 LOG(ERROR) << "Unexpected desiredHeap";
1158 nameId = LookupStringId("<ILLEGAL>");
1159 break;
1160 }
1161 __ AddStringId(nameId);
1162 current_heap_ = heap_type;
1163 }
1164
1165 mirror::Class* c = obj->GetClass();
1166 if (c == nullptr) {
1167 // This object will bother HprofReader, because it has a null
1168 // class, so just don't dump it. It could be
1169 // gDvm.unlinkedJavaLangClass or it could be an object just
1170 // allocated which hasn't been initialized yet.
1171 } else {
1172 if (obj->IsClass()) {
1173 DumpHeapClass(obj->AsClass());
1174 } else if (c->IsArrayClass()) {
1175 DumpHeapArray(obj->AsArray(), c);
1176 } else {
1177 DumpHeapInstanceObject(obj, c, visitor.GetRoots());
1178 }
1179 }
1180
1181 ++objects_in_segment_;
1182 }
1183
DumpHeapClass(mirror::Class * klass)1184 void Hprof::DumpHeapClass(mirror::Class* klass) {
1185 if (!klass->IsResolved()) {
1186 // Class is allocated but not yet resolved: we cannot access its fields or super class.
1187 return;
1188 }
1189
1190 // Note: We will emit instance fields of Class as synthetic static fields with a prefix of
1191 // "$class$" so the class fields are visible in hprof dumps. For tools to account for that
1192 // correctly, we'll emit an instance size of zero for java.lang.Class, and also emit the
1193 // instance fields of java.lang.Object.
1194 //
1195 // For other overhead (currently only the embedded vtable), we will generate a synthetic
1196 // byte array (or field[s] in case the overhead size is of reference size or less).
1197
1198 const size_t num_static_fields = klass->NumStaticFields();
1199
1200 // Total class size:
1201 // * class instance fields (including Object instance fields)
1202 // * vtable
1203 // * class static fields
1204 const size_t total_class_size = klass->GetClassSize();
1205
1206 // Base class size (common parts of all Class instances):
1207 // * class instance fields (including Object instance fields)
1208 constexpr size_t base_class_size = sizeof(mirror::Class);
1209 CHECK_LE(base_class_size, total_class_size);
1210
1211 // Difference of Total and Base:
1212 // * vtable
1213 // * class static fields
1214 const size_t base_overhead_size = total_class_size - base_class_size;
1215
1216 // Tools (ahat/Studio) will count the static fields and account for them in the class size. We
1217 // must thus subtract them from base_overhead_size or they will be double-counted.
1218 size_t class_static_fields_size = 0;
1219 for (ArtField& class_static_field : klass->GetSFields()) {
1220 size_t size = 0;
1221 SignatureToBasicTypeAndSize(class_static_field.GetTypeDescriptor(), &size);
1222 class_static_fields_size += size;
1223 }
1224
1225 CHECK_GE(base_overhead_size, class_static_fields_size);
1226 // Now we have:
1227 // * vtable
1228 const size_t base_no_statics_overhead_size = base_overhead_size - class_static_fields_size;
1229
1230 // We may decide to display native overhead (the actual IMT, ArtFields and ArtMethods) in the
1231 // future.
1232 const size_t java_heap_overhead_size = base_no_statics_overhead_size;
1233
1234 // For overhead greater 4, we'll allocate a synthetic array.
1235 if (java_heap_overhead_size > 4) {
1236 // Create a byte array to reflect the allocation of the
1237 // StaticField array at the end of this class.
1238 __ AddU1(HPROF_PRIMITIVE_ARRAY_DUMP);
1239 __ AddClassStaticsId(klass);
1240 __ AddStackTraceSerialNumber(LookupStackTraceSerialNumber(klass));
1241 __ AddU4(java_heap_overhead_size - 4);
1242 __ AddU1(hprof_basic_byte);
1243 for (size_t i = 0; i < java_heap_overhead_size - 4; ++i) {
1244 __ AddU1(0);
1245 }
1246 }
1247 const size_t java_heap_overhead_field_count = java_heap_overhead_size > 0
1248 ? (java_heap_overhead_size == 3 ? 2u : 1u)
1249 : 0;
1250
1251 __ AddU1(HPROF_CLASS_DUMP);
1252 __ AddClassId(LookupClassId(klass));
1253 __ AddStackTraceSerialNumber(LookupStackTraceSerialNumber(klass));
1254 __ AddClassId(LookupClassId(klass->GetSuperClass()));
1255 __ AddObjectId(klass->GetClassLoader());
1256 __ AddObjectId(nullptr); // no signer
1257 __ AddObjectId(nullptr); // no prot domain
1258 __ AddObjectId(nullptr); // reserved
1259 __ AddObjectId(nullptr); // reserved
1260 // Instance size.
1261 if (klass->IsClassClass()) {
1262 // As mentioned above, we will emit instance fields as synthetic static fields. So the
1263 // base object is "empty."
1264 __ AddU4(0);
1265 } else if (klass->IsStringClass()) {
1266 // Strings are variable length with character data at the end like arrays.
1267 // This outputs the size of an empty string.
1268 __ AddU4(sizeof(mirror::String));
1269 } else if (klass->IsArrayClass() || klass->IsPrimitive()) {
1270 __ AddU4(0);
1271 } else {
1272 __ AddU4(klass->GetObjectSize()); // instance size
1273 }
1274
1275 __ AddU2(0); // empty const pool
1276
1277 // Static fields
1278 //
1279 // Note: we report Class' and Object's instance fields here, too. This is for visibility reasons.
1280 // (b/38167721)
1281 mirror::Class* class_class = klass->GetClass();
1282
1283 DCHECK(class_class->GetSuperClass()->IsObjectClass());
1284 const size_t static_fields_reported = class_class->NumInstanceFields()
1285 + class_class->GetSuperClass()->NumInstanceFields()
1286 + java_heap_overhead_field_count
1287 + num_static_fields;
1288 __ AddU2(dchecked_integral_cast<uint16_t>(static_fields_reported));
1289
1290 if (java_heap_overhead_size != 0) {
1291 __ AddStringId(LookupStringId(kClassOverheadName));
1292 size_t overhead_fields = 0;
1293 if (java_heap_overhead_size > 4) {
1294 __ AddU1(hprof_basic_object);
1295 __ AddClassStaticsId(klass);
1296 ++overhead_fields;
1297 } else {
1298 switch (java_heap_overhead_size) {
1299 case 4: {
1300 __ AddU1(hprof_basic_int);
1301 __ AddU4(0);
1302 ++overhead_fields;
1303 break;
1304 }
1305
1306 case 2: {
1307 __ AddU1(hprof_basic_short);
1308 __ AddU2(0);
1309 ++overhead_fields;
1310 break;
1311 }
1312
1313 case 3: {
1314 __ AddU1(hprof_basic_short);
1315 __ AddU2(0);
1316 __ AddStringId(LookupStringId(std::string(kClassOverheadName) + "2"));
1317 ++overhead_fields;
1318 }
1319 FALLTHROUGH_INTENDED;
1320
1321 case 1: {
1322 __ AddU1(hprof_basic_byte);
1323 __ AddU1(0);
1324 ++overhead_fields;
1325 break;
1326 }
1327 }
1328 }
1329 DCHECK_EQ(java_heap_overhead_field_count, overhead_fields);
1330 }
1331
1332 // Helper lambda to emit the given static field. The second argument name_fn will be called to
1333 // generate the name to emit. This can be used to emit something else than the field's actual
1334 // name.
1335 auto static_field_writer = [&](ArtField& field, auto name_fn)
1336 REQUIRES_SHARED(Locks::mutator_lock_) {
1337 __ AddStringId(LookupStringId(name_fn(field)));
1338
1339 size_t size;
1340 HprofBasicType t = SignatureToBasicTypeAndSize(field.GetTypeDescriptor(), &size);
1341 __ AddU1(t);
1342 switch (t) {
1343 case hprof_basic_byte:
1344 __ AddU1(field.GetByte(klass));
1345 return;
1346 case hprof_basic_boolean:
1347 __ AddU1(field.GetBoolean(klass));
1348 return;
1349 case hprof_basic_char:
1350 __ AddU2(field.GetChar(klass));
1351 return;
1352 case hprof_basic_short:
1353 __ AddU2(field.GetShort(klass));
1354 return;
1355 case hprof_basic_float:
1356 case hprof_basic_int:
1357 case hprof_basic_object:
1358 __ AddU4(field.Get32(klass));
1359 return;
1360 case hprof_basic_double:
1361 case hprof_basic_long:
1362 __ AddU8(field.Get64(klass));
1363 return;
1364 }
1365 LOG(FATAL) << "Unexpected size " << size;
1366 UNREACHABLE();
1367 };
1368
1369 {
1370 auto class_instance_field_name_fn = [](ArtField& field) REQUIRES_SHARED(Locks::mutator_lock_) {
1371 return std::string("$class$") + field.GetName();
1372 };
1373 for (ArtField& class_instance_field : class_class->GetIFields()) {
1374 static_field_writer(class_instance_field, class_instance_field_name_fn);
1375 }
1376 for (ArtField& object_instance_field : class_class->GetSuperClass()->GetIFields()) {
1377 static_field_writer(object_instance_field, class_instance_field_name_fn);
1378 }
1379 }
1380
1381 {
1382 auto class_static_field_name_fn = [](ArtField& field) REQUIRES_SHARED(Locks::mutator_lock_) {
1383 return field.GetName();
1384 };
1385 for (ArtField& class_static_field : klass->GetSFields()) {
1386 static_field_writer(class_static_field, class_static_field_name_fn);
1387 }
1388 }
1389
1390 // Instance fields for this class (no superclass fields)
1391 int iFieldCount = klass->NumInstanceFields();
1392 // add_internal_runtime_objects is only for classes that may retain objects live through means
1393 // other than fields. It is never the case for strings.
1394 const bool add_internal_runtime_objects = AddRuntimeInternalObjectsField(klass);
1395 if (klass->IsStringClass() || add_internal_runtime_objects) {
1396 __ AddU2((uint16_t)iFieldCount + 1);
1397 } else {
1398 __ AddU2((uint16_t)iFieldCount);
1399 }
1400 for (int i = 0; i < iFieldCount; ++i) {
1401 ArtField* f = klass->GetInstanceField(i);
1402 __ AddStringId(LookupStringId(f->GetName()));
1403 HprofBasicType t = SignatureToBasicTypeAndSize(f->GetTypeDescriptor(), nullptr);
1404 __ AddU1(t);
1405 }
1406 // Add native value character array for strings / byte array for compressed strings.
1407 if (klass->IsStringClass()) {
1408 __ AddStringId(LookupStringId("value"));
1409 __ AddU1(hprof_basic_object);
1410 } else if (add_internal_runtime_objects) {
1411 __ AddStringId(LookupStringId("runtimeInternalObjects"));
1412 __ AddU1(hprof_basic_object);
1413 }
1414 }
1415
DumpFakeObjectArray(mirror::Object * obj,const std::set<mirror::Object * > & elements)1416 void Hprof::DumpFakeObjectArray(mirror::Object* obj, const std::set<mirror::Object*>& elements) {
1417 __ AddU1(HPROF_OBJECT_ARRAY_DUMP);
1418 __ AddObjectId(obj);
1419 __ AddStackTraceSerialNumber(LookupStackTraceSerialNumber(obj));
1420 __ AddU4(elements.size());
1421 __ AddClassId(LookupClassId(
1422 Runtime::Current()->GetClassLinker()->GetClassRoot(ClassLinker::kObjectArrayClass)));
1423 for (mirror::Object* e : elements) {
1424 __ AddObjectId(e);
1425 }
1426 }
1427
DumpHeapArray(mirror::Array * obj,mirror::Class * klass)1428 void Hprof::DumpHeapArray(mirror::Array* obj, mirror::Class* klass) {
1429 uint32_t length = obj->GetLength();
1430
1431 if (obj->IsObjectArray()) {
1432 // obj is an object array.
1433 __ AddU1(HPROF_OBJECT_ARRAY_DUMP);
1434
1435 __ AddObjectId(obj);
1436 __ AddStackTraceSerialNumber(LookupStackTraceSerialNumber(obj));
1437 __ AddU4(length);
1438 __ AddClassId(LookupClassId(klass));
1439
1440 // Dump the elements, which are always objects or null.
1441 __ AddIdList(obj->AsObjectArray<mirror::Object>());
1442 } else {
1443 size_t size;
1444 HprofBasicType t = SignatureToBasicTypeAndSize(
1445 Primitive::Descriptor(klass->GetComponentType()->GetPrimitiveType()), &size);
1446
1447 // obj is a primitive array.
1448 __ AddU1(HPROF_PRIMITIVE_ARRAY_DUMP);
1449
1450 __ AddObjectId(obj);
1451 __ AddStackTraceSerialNumber(LookupStackTraceSerialNumber(obj));
1452 __ AddU4(length);
1453 __ AddU1(t);
1454
1455 // Dump the raw, packed element values.
1456 if (size == 1) {
1457 __ AddU1List(reinterpret_cast<const uint8_t*>(obj->GetRawData(sizeof(uint8_t), 0)), length);
1458 } else if (size == 2) {
1459 __ AddU2List(reinterpret_cast<const uint16_t*>(obj->GetRawData(sizeof(uint16_t), 0)), length);
1460 } else if (size == 4) {
1461 __ AddU4List(reinterpret_cast<const uint32_t*>(obj->GetRawData(sizeof(uint32_t), 0)), length);
1462 } else if (size == 8) {
1463 __ AddU8List(reinterpret_cast<const uint64_t*>(obj->GetRawData(sizeof(uint64_t), 0)), length);
1464 }
1465 }
1466 }
1467
DumpHeapInstanceObject(mirror::Object * obj,mirror::Class * klass,const std::set<mirror::Object * > & fake_roots)1468 void Hprof::DumpHeapInstanceObject(mirror::Object* obj,
1469 mirror::Class* klass,
1470 const std::set<mirror::Object*>& fake_roots) {
1471 // obj is an instance object.
1472 __ AddU1(HPROF_INSTANCE_DUMP);
1473 __ AddObjectId(obj);
1474 __ AddStackTraceSerialNumber(LookupStackTraceSerialNumber(obj));
1475 __ AddClassId(LookupClassId(klass));
1476
1477 // Reserve some space for the length of the instance data, which we won't
1478 // know until we're done writing it.
1479 size_t size_patch_offset = output_->Length();
1480 __ AddU4(0x77777777);
1481
1482 // What we will use for the string value if the object is a string.
1483 mirror::Object* string_value = nullptr;
1484 mirror::Object* fake_object_array = nullptr;
1485
1486 // Write the instance data; fields for this class, followed by super class fields, and so on.
1487 do {
1488 const size_t instance_fields = klass->NumInstanceFields();
1489 for (size_t i = 0; i < instance_fields; ++i) {
1490 ArtField* f = klass->GetInstanceField(i);
1491 size_t size;
1492 HprofBasicType t = SignatureToBasicTypeAndSize(f->GetTypeDescriptor(), &size);
1493 switch (t) {
1494 case hprof_basic_byte:
1495 __ AddU1(f->GetByte(obj));
1496 break;
1497 case hprof_basic_boolean:
1498 __ AddU1(f->GetBoolean(obj));
1499 break;
1500 case hprof_basic_char:
1501 __ AddU2(f->GetChar(obj));
1502 break;
1503 case hprof_basic_short:
1504 __ AddU2(f->GetShort(obj));
1505 break;
1506 case hprof_basic_int:
1507 if (mirror::kUseStringCompression &&
1508 klass->IsStringClass() &&
1509 f->GetOffset().SizeValue() == mirror::String::CountOffset().SizeValue()) {
1510 // Store the string length instead of the raw count field with compression flag.
1511 __ AddU4(obj->AsString()->GetLength());
1512 break;
1513 }
1514 FALLTHROUGH_INTENDED;
1515 case hprof_basic_float:
1516 case hprof_basic_object:
1517 __ AddU4(f->Get32(obj));
1518 break;
1519 case hprof_basic_double:
1520 case hprof_basic_long:
1521 __ AddU8(f->Get64(obj));
1522 break;
1523 }
1524 }
1525 // Add value field for String if necessary.
1526 if (klass->IsStringClass()) {
1527 mirror::String* s = obj->AsString();
1528 if (s->GetLength() == 0) {
1529 // If string is empty, use an object-aligned address within the string for the value.
1530 string_value = reinterpret_cast<mirror::Object*>(
1531 reinterpret_cast<uintptr_t>(s) + kObjectAlignment);
1532 } else {
1533 if (s->IsCompressed()) {
1534 string_value = reinterpret_cast<mirror::Object*>(s->GetValueCompressed());
1535 } else {
1536 string_value = reinterpret_cast<mirror::Object*>(s->GetValue());
1537 }
1538 }
1539 __ AddObjectId(string_value);
1540 } else if (AddRuntimeInternalObjectsField(klass)) {
1541 // We need an id that is guaranteed to not be used, use 1/2 of the object alignment.
1542 fake_object_array = reinterpret_cast<mirror::Object*>(
1543 reinterpret_cast<uintptr_t>(obj) + kObjectAlignment / 2);
1544 __ AddObjectId(fake_object_array);
1545 }
1546 klass = klass->GetSuperClass();
1547 } while (klass != nullptr);
1548
1549 // Patch the instance field length.
1550 __ UpdateU4(size_patch_offset, output_->Length() - (size_patch_offset + 4));
1551
1552 // Output native value character array for strings.
1553 CHECK_EQ(obj->IsString(), string_value != nullptr);
1554 if (string_value != nullptr) {
1555 mirror::String* s = obj->AsString();
1556 __ AddU1(HPROF_PRIMITIVE_ARRAY_DUMP);
1557 __ AddObjectId(string_value);
1558 __ AddStackTraceSerialNumber(LookupStackTraceSerialNumber(obj));
1559 __ AddU4(s->GetLength());
1560 if (s->IsCompressed()) {
1561 __ AddU1(hprof_basic_byte);
1562 __ AddU1List(s->GetValueCompressed(), s->GetLength());
1563 } else {
1564 __ AddU1(hprof_basic_char);
1565 __ AddU2List(s->GetValue(), s->GetLength());
1566 }
1567 } else if (fake_object_array != nullptr) {
1568 DumpFakeObjectArray(fake_object_array, fake_roots);
1569 }
1570 }
1571
VisitRoot(mirror::Object * obj,const RootInfo & info)1572 void Hprof::VisitRoot(mirror::Object* obj, const RootInfo& info) {
1573 static const HprofHeapTag xlate[] = {
1574 HPROF_ROOT_UNKNOWN,
1575 HPROF_ROOT_JNI_GLOBAL,
1576 HPROF_ROOT_JNI_LOCAL,
1577 HPROF_ROOT_JAVA_FRAME,
1578 HPROF_ROOT_NATIVE_STACK,
1579 HPROF_ROOT_STICKY_CLASS,
1580 HPROF_ROOT_THREAD_BLOCK,
1581 HPROF_ROOT_MONITOR_USED,
1582 HPROF_ROOT_THREAD_OBJECT,
1583 HPROF_ROOT_INTERNED_STRING,
1584 HPROF_ROOT_FINALIZING,
1585 HPROF_ROOT_DEBUGGER,
1586 HPROF_ROOT_REFERENCE_CLEANUP,
1587 HPROF_ROOT_VM_INTERNAL,
1588 HPROF_ROOT_JNI_MONITOR,
1589 };
1590 CHECK_LT(info.GetType(), sizeof(xlate) / sizeof(HprofHeapTag));
1591 if (obj == nullptr) {
1592 return;
1593 }
1594 MarkRootObject(obj, 0, xlate[info.GetType()], info.GetThreadId());
1595 }
1596
1597 // If "direct_to_ddms" is true, the other arguments are ignored, and data is
1598 // sent directly to DDMS.
1599 // If "fd" is >= 0, the output will be written to that file descriptor.
1600 // Otherwise, "filename" is used to create an output file.
DumpHeap(const char * filename,int fd,bool direct_to_ddms)1601 void DumpHeap(const char* filename, int fd, bool direct_to_ddms) {
1602 CHECK(filename != nullptr);
1603 Thread* self = Thread::Current();
1604 // Need to take a heap dump while GC isn't running. See the comment in Heap::VisitObjects().
1605 // Also we need the critical section to avoid visiting the same object twice. See b/34967844
1606 gc::ScopedGCCriticalSection gcs(self,
1607 gc::kGcCauseHprof,
1608 gc::kCollectorTypeHprof);
1609 ScopedSuspendAll ssa(__FUNCTION__, true /* long suspend */);
1610 Hprof hprof(filename, fd, direct_to_ddms);
1611 hprof.Dump();
1612 }
1613
1614 } // namespace hprof
1615 } // namespace art
1616