trace.cc revision 9ea02c4f01b079bf6a5f49c62cb59fa5791cbc60
1/* 2 * Copyright (C) 2011 The Android Open Source Project 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 */ 16 17#include "trace.h" 18 19#include <sys/uio.h> 20#include <unistd.h> 21 22#define ATRACE_TAG ATRACE_TAG_DALVIK 23#include "cutils/trace.h" 24 25#include "art_method-inl.h" 26#include "base/casts.h" 27#include "base/stl_util.h" 28#include "base/time_utils.h" 29#include "base/unix_file/fd_file.h" 30#include "class_linker.h" 31#include "common_throws.h" 32#include "debugger.h" 33#include "dex_file-inl.h" 34#include "gc/scoped_gc_critical_section.h" 35#include "instrumentation.h" 36#include "mirror/class-inl.h" 37#include "mirror/dex_cache-inl.h" 38#include "mirror/object_array-inl.h" 39#include "mirror/object-inl.h" 40#include "os.h" 41#include "scoped_thread_state_change.h" 42#include "ScopedLocalRef.h" 43#include "thread.h" 44#include "thread_list.h" 45#include "utils.h" 46#include "entrypoints/quick/quick_entrypoints.h" 47 48namespace art { 49 50static constexpr size_t TraceActionBits = MinimumBitsToStore( 51 static_cast<size_t>(kTraceMethodActionMask)); 52static constexpr uint8_t kOpNewMethod = 1U; 53static constexpr uint8_t kOpNewThread = 2U; 54 55class BuildStackTraceVisitor : public StackVisitor { 56 public: 57 explicit BuildStackTraceVisitor(Thread* thread) 58 : StackVisitor(thread, nullptr, StackVisitor::StackWalkKind::kIncludeInlinedFrames), 59 method_trace_(Trace::AllocStackTrace()) {} 60 61 bool VisitFrame() SHARED_REQUIRES(Locks::mutator_lock_) { 62 ArtMethod* m = GetMethod(); 63 // Ignore runtime frames (in particular callee save). 64 if (!m->IsRuntimeMethod()) { 65 method_trace_->push_back(m); 66 } 67 return true; 68 } 69 70 // Returns a stack trace where the topmost frame corresponds with the first element of the vector. 71 std::vector<ArtMethod*>* GetStackTrace() const { 72 return method_trace_; 73 } 74 75 private: 76 std::vector<ArtMethod*>* const method_trace_; 77 78 DISALLOW_COPY_AND_ASSIGN(BuildStackTraceVisitor); 79}; 80 81static const char kTraceTokenChar = '*'; 82static const uint16_t kTraceHeaderLength = 32; 83static const uint32_t kTraceMagicValue = 0x574f4c53; 84static const uint16_t kTraceVersionSingleClock = 2; 85static const uint16_t kTraceVersionDualClock = 3; 86static const uint16_t kTraceRecordSizeSingleClock = 10; // using v2 87static const uint16_t kTraceRecordSizeDualClock = 14; // using v3 with two timestamps 88 89TraceClockSource Trace::default_clock_source_ = kDefaultTraceClockSource; 90 91Trace* volatile Trace::the_trace_ = nullptr; 92pthread_t Trace::sampling_pthread_ = 0U; 93std::unique_ptr<std::vector<ArtMethod*>> Trace::temp_stack_trace_; 94 95// The key identifying the tracer to update instrumentation. 96static constexpr const char* kTracerInstrumentationKey = "Tracer"; 97 98static TraceAction DecodeTraceAction(uint32_t tmid) { 99 return static_cast<TraceAction>(tmid & kTraceMethodActionMask); 100} 101 102ArtMethod* Trace::DecodeTraceMethod(uint32_t tmid) { 103 MutexLock mu(Thread::Current(), *unique_methods_lock_); 104 return unique_methods_[tmid >> TraceActionBits]; 105} 106 107uint32_t Trace::EncodeTraceMethod(ArtMethod* method) { 108 MutexLock mu(Thread::Current(), *unique_methods_lock_); 109 uint32_t idx; 110 auto it = art_method_id_map_.find(method); 111 if (it != art_method_id_map_.end()) { 112 idx = it->second; 113 } else { 114 unique_methods_.push_back(method); 115 idx = unique_methods_.size() - 1; 116 art_method_id_map_.emplace(method, idx); 117 } 118 DCHECK_LT(idx, unique_methods_.size()); 119 DCHECK_EQ(unique_methods_[idx], method); 120 return idx; 121} 122 123uint32_t Trace::EncodeTraceMethodAndAction(ArtMethod* method, TraceAction action) { 124 uint32_t tmid = (EncodeTraceMethod(method) << TraceActionBits) | action; 125 DCHECK_EQ(method, DecodeTraceMethod(tmid)); 126 return tmid; 127} 128 129std::vector<ArtMethod*>* Trace::AllocStackTrace() { 130 return (temp_stack_trace_.get() != nullptr) ? temp_stack_trace_.release() : 131 new std::vector<ArtMethod*>(); 132} 133 134void Trace::FreeStackTrace(std::vector<ArtMethod*>* stack_trace) { 135 stack_trace->clear(); 136 temp_stack_trace_.reset(stack_trace); 137} 138 139void Trace::SetDefaultClockSource(TraceClockSource clock_source) { 140#if defined(__linux__) 141 default_clock_source_ = clock_source; 142#else 143 if (clock_source != TraceClockSource::kWall) { 144 LOG(WARNING) << "Ignoring tracing request to use CPU time."; 145 } 146#endif 147} 148 149static uint16_t GetTraceVersion(TraceClockSource clock_source) { 150 return (clock_source == TraceClockSource::kDual) ? kTraceVersionDualClock 151 : kTraceVersionSingleClock; 152} 153 154static uint16_t GetRecordSize(TraceClockSource clock_source) { 155 return (clock_source == TraceClockSource::kDual) ? kTraceRecordSizeDualClock 156 : kTraceRecordSizeSingleClock; 157} 158 159bool Trace::UseThreadCpuClock() { 160 return (clock_source_ == TraceClockSource::kThreadCpu) || 161 (clock_source_ == TraceClockSource::kDual); 162} 163 164bool Trace::UseWallClock() { 165 return (clock_source_ == TraceClockSource::kWall) || 166 (clock_source_ == TraceClockSource::kDual); 167} 168 169void Trace::MeasureClockOverhead() { 170 if (UseThreadCpuClock()) { 171 Thread::Current()->GetCpuMicroTime(); 172 } 173 if (UseWallClock()) { 174 MicroTime(); 175 } 176} 177 178// Compute an average time taken to measure clocks. 179uint32_t Trace::GetClockOverheadNanoSeconds() { 180 Thread* self = Thread::Current(); 181 uint64_t start = self->GetCpuMicroTime(); 182 183 for (int i = 4000; i > 0; i--) { 184 MeasureClockOverhead(); 185 MeasureClockOverhead(); 186 MeasureClockOverhead(); 187 MeasureClockOverhead(); 188 MeasureClockOverhead(); 189 MeasureClockOverhead(); 190 MeasureClockOverhead(); 191 MeasureClockOverhead(); 192 } 193 194 uint64_t elapsed_us = self->GetCpuMicroTime() - start; 195 return static_cast<uint32_t>(elapsed_us / 32); 196} 197 198// TODO: put this somewhere with the big-endian equivalent used by JDWP. 199static void Append2LE(uint8_t* buf, uint16_t val) { 200 *buf++ = static_cast<uint8_t>(val); 201 *buf++ = static_cast<uint8_t>(val >> 8); 202} 203 204// TODO: put this somewhere with the big-endian equivalent used by JDWP. 205static void Append4LE(uint8_t* buf, uint32_t val) { 206 *buf++ = static_cast<uint8_t>(val); 207 *buf++ = static_cast<uint8_t>(val >> 8); 208 *buf++ = static_cast<uint8_t>(val >> 16); 209 *buf++ = static_cast<uint8_t>(val >> 24); 210} 211 212// TODO: put this somewhere with the big-endian equivalent used by JDWP. 213static void Append8LE(uint8_t* buf, uint64_t val) { 214 *buf++ = static_cast<uint8_t>(val); 215 *buf++ = static_cast<uint8_t>(val >> 8); 216 *buf++ = static_cast<uint8_t>(val >> 16); 217 *buf++ = static_cast<uint8_t>(val >> 24); 218 *buf++ = static_cast<uint8_t>(val >> 32); 219 *buf++ = static_cast<uint8_t>(val >> 40); 220 *buf++ = static_cast<uint8_t>(val >> 48); 221 *buf++ = static_cast<uint8_t>(val >> 56); 222} 223 224static void GetSample(Thread* thread, void* arg) SHARED_REQUIRES(Locks::mutator_lock_) { 225 BuildStackTraceVisitor build_trace_visitor(thread); 226 build_trace_visitor.WalkStack(); 227 std::vector<ArtMethod*>* stack_trace = build_trace_visitor.GetStackTrace(); 228 Trace* the_trace = reinterpret_cast<Trace*>(arg); 229 the_trace->CompareAndUpdateStackTrace(thread, stack_trace); 230} 231 232static void ClearThreadStackTraceAndClockBase(Thread* thread, void* arg ATTRIBUTE_UNUSED) { 233 thread->SetTraceClockBase(0); 234 std::vector<ArtMethod*>* stack_trace = thread->GetStackTraceSample(); 235 thread->SetStackTraceSample(nullptr); 236 delete stack_trace; 237} 238 239void Trace::CompareAndUpdateStackTrace(Thread* thread, 240 std::vector<ArtMethod*>* stack_trace) { 241 CHECK_EQ(pthread_self(), sampling_pthread_); 242 std::vector<ArtMethod*>* old_stack_trace = thread->GetStackTraceSample(); 243 // Update the thread's stack trace sample. 244 thread->SetStackTraceSample(stack_trace); 245 // Read timer clocks to use for all events in this trace. 246 uint32_t thread_clock_diff = 0; 247 uint32_t wall_clock_diff = 0; 248 ReadClocks(thread, &thread_clock_diff, &wall_clock_diff); 249 if (old_stack_trace == nullptr) { 250 // If there's no previous stack trace sample for this thread, log an entry event for all 251 // methods in the trace. 252 for (auto rit = stack_trace->rbegin(); rit != stack_trace->rend(); ++rit) { 253 LogMethodTraceEvent(thread, *rit, instrumentation::Instrumentation::kMethodEntered, 254 thread_clock_diff, wall_clock_diff); 255 } 256 } else { 257 // If there's a previous stack trace for this thread, diff the traces and emit entry and exit 258 // events accordingly. 259 auto old_rit = old_stack_trace->rbegin(); 260 auto rit = stack_trace->rbegin(); 261 // Iterate bottom-up over both traces until there's a difference between them. 262 while (old_rit != old_stack_trace->rend() && rit != stack_trace->rend() && *old_rit == *rit) { 263 old_rit++; 264 rit++; 265 } 266 // Iterate top-down over the old trace until the point where they differ, emitting exit events. 267 for (auto old_it = old_stack_trace->begin(); old_it != old_rit.base(); ++old_it) { 268 LogMethodTraceEvent(thread, *old_it, instrumentation::Instrumentation::kMethodExited, 269 thread_clock_diff, wall_clock_diff); 270 } 271 // Iterate bottom-up over the new trace from the point where they differ, emitting entry events. 272 for (; rit != stack_trace->rend(); ++rit) { 273 LogMethodTraceEvent(thread, *rit, instrumentation::Instrumentation::kMethodEntered, 274 thread_clock_diff, wall_clock_diff); 275 } 276 FreeStackTrace(old_stack_trace); 277 } 278} 279 280void* Trace::RunSamplingThread(void* arg) { 281 Runtime* runtime = Runtime::Current(); 282 intptr_t interval_us = reinterpret_cast<intptr_t>(arg); 283 CHECK_GE(interval_us, 0); 284 CHECK(runtime->AttachCurrentThread("Sampling Profiler", true, runtime->GetSystemThreadGroup(), 285 !runtime->IsAotCompiler())); 286 287 while (true) { 288 usleep(interval_us); 289 ATRACE_BEGIN("Profile sampling"); 290 Thread* self = Thread::Current(); 291 Trace* the_trace; 292 { 293 MutexLock mu(self, *Locks::trace_lock_); 294 the_trace = the_trace_; 295 if (the_trace == nullptr) { 296 break; 297 } 298 } 299 { 300 ScopedSuspendAll ssa(__FUNCTION__); 301 MutexLock mu(self, *Locks::thread_list_lock_); 302 runtime->GetThreadList()->ForEach(GetSample, the_trace); 303 } 304 ATRACE_END(); 305 } 306 307 runtime->DetachCurrentThread(); 308 return nullptr; 309} 310 311void Trace::Start(const char* trace_filename, int trace_fd, size_t buffer_size, int flags, 312 TraceOutputMode output_mode, TraceMode trace_mode, int interval_us) { 313 Thread* self = Thread::Current(); 314 { 315 MutexLock mu(self, *Locks::trace_lock_); 316 if (the_trace_ != nullptr) { 317 LOG(ERROR) << "Trace already in progress, ignoring this request"; 318 return; 319 } 320 } 321 322 // Check interval if sampling is enabled 323 if (trace_mode == TraceMode::kSampling && interval_us <= 0) { 324 LOG(ERROR) << "Invalid sampling interval: " << interval_us; 325 ScopedObjectAccess soa(self); 326 ThrowRuntimeException("Invalid sampling interval: %d", interval_us); 327 return; 328 } 329 330 // Open trace file if not going directly to ddms. 331 std::unique_ptr<File> trace_file; 332 if (output_mode != TraceOutputMode::kDDMS) { 333 if (trace_fd < 0) { 334 trace_file.reset(OS::CreateEmptyFileWriteOnly(trace_filename)); 335 } else { 336 trace_file.reset(new File(trace_fd, "tracefile")); 337 trace_file->DisableAutoClose(); 338 } 339 if (trace_file.get() == nullptr) { 340 PLOG(ERROR) << "Unable to open trace file '" << trace_filename << "'"; 341 ScopedObjectAccess soa(self); 342 ThrowRuntimeException("Unable to open trace file '%s'", trace_filename); 343 return; 344 } 345 } 346 347 Runtime* runtime = Runtime::Current(); 348 349 // Enable count of allocs if specified in the flags. 350 bool enable_stats = false; 351 352 // Create Trace object. 353 { 354 // Required since EnableMethodTracing calls ConfigureStubs which visits class linker classes. 355 gc::ScopedGCCriticalSection gcs(self, 356 gc::kGcCauseInstrumentation, 357 gc::kCollectorTypeInstrumentation); 358 ScopedSuspendAll ssa(__FUNCTION__); 359 MutexLock mu(self, *Locks::trace_lock_); 360 if (the_trace_ != nullptr) { 361 LOG(ERROR) << "Trace already in progress, ignoring this request"; 362 } else { 363 enable_stats = (flags && kTraceCountAllocs) != 0; 364 the_trace_ = new Trace(trace_file.release(), trace_filename, buffer_size, flags, output_mode, 365 trace_mode); 366 if (trace_mode == TraceMode::kSampling) { 367 CHECK_PTHREAD_CALL(pthread_create, (&sampling_pthread_, nullptr, &RunSamplingThread, 368 reinterpret_cast<void*>(interval_us)), 369 "Sampling profiler thread"); 370 the_trace_->interval_us_ = interval_us; 371 } else { 372 runtime->GetInstrumentation()->AddListener(the_trace_, 373 instrumentation::Instrumentation::kMethodEntered | 374 instrumentation::Instrumentation::kMethodExited | 375 instrumentation::Instrumentation::kMethodUnwind); 376 // TODO: In full-PIC mode, we don't need to fully deopt. 377 runtime->GetInstrumentation()->EnableMethodTracing(kTracerInstrumentationKey); 378 } 379 } 380 } 381 382 // Can't call this when holding the mutator lock. 383 if (enable_stats) { 384 runtime->SetStatsEnabled(true); 385 } 386} 387 388void Trace::StopTracing(bool finish_tracing, bool flush_file) { 389 bool stop_alloc_counting = false; 390 Runtime* const runtime = Runtime::Current(); 391 Trace* the_trace = nullptr; 392 Thread* const self = Thread::Current(); 393 pthread_t sampling_pthread = 0U; 394 { 395 MutexLock mu(self, *Locks::trace_lock_); 396 if (the_trace_ == nullptr) { 397 LOG(ERROR) << "Trace stop requested, but no trace currently running"; 398 } else { 399 the_trace = the_trace_; 400 the_trace_ = nullptr; 401 sampling_pthread = sampling_pthread_; 402 } 403 } 404 // Make sure that we join before we delete the trace since we don't want to have 405 // the sampling thread access a stale pointer. This finishes since the sampling thread exits when 406 // the_trace_ is null. 407 if (sampling_pthread != 0U) { 408 CHECK_PTHREAD_CALL(pthread_join, (sampling_pthread, nullptr), "sampling thread shutdown"); 409 sampling_pthread_ = 0U; 410 } 411 412 { 413 gc::ScopedGCCriticalSection gcs(self, 414 gc::kGcCauseInstrumentation, 415 gc::kCollectorTypeInstrumentation); 416 ScopedSuspendAll ssa(__FUNCTION__); 417 if (the_trace != nullptr) { 418 stop_alloc_counting = (the_trace->flags_ & Trace::kTraceCountAllocs) != 0; 419 if (finish_tracing) { 420 the_trace->FinishTracing(); 421 } 422 423 if (the_trace->trace_mode_ == TraceMode::kSampling) { 424 MutexLock mu(self, *Locks::thread_list_lock_); 425 runtime->GetThreadList()->ForEach(ClearThreadStackTraceAndClockBase, nullptr); 426 } else { 427 runtime->GetInstrumentation()->DisableMethodTracing(kTracerInstrumentationKey); 428 runtime->GetInstrumentation()->RemoveListener( 429 the_trace, instrumentation::Instrumentation::kMethodEntered | 430 instrumentation::Instrumentation::kMethodExited | 431 instrumentation::Instrumentation::kMethodUnwind); 432 } 433 if (the_trace->trace_file_.get() != nullptr) { 434 // Do not try to erase, so flush and close explicitly. 435 if (flush_file) { 436 if (the_trace->trace_file_->Flush() != 0) { 437 PLOG(WARNING) << "Could not flush trace file."; 438 } 439 } else { 440 the_trace->trace_file_->MarkUnchecked(); // Do not trigger guard. 441 } 442 if (the_trace->trace_file_->Close() != 0) { 443 PLOG(ERROR) << "Could not close trace file."; 444 } 445 } 446 delete the_trace; 447 } 448 } 449 if (stop_alloc_counting) { 450 // Can be racy since SetStatsEnabled is not guarded by any locks. 451 runtime->SetStatsEnabled(false); 452 } 453} 454 455void Trace::Abort() { 456 // Do not write anything anymore. 457 StopTracing(false, false); 458} 459 460void Trace::Stop() { 461 // Finish writing. 462 StopTracing(true, true); 463} 464 465void Trace::Shutdown() { 466 if (GetMethodTracingMode() != kTracingInactive) { 467 Stop(); 468 } 469} 470 471void Trace::Pause() { 472 bool stop_alloc_counting = false; 473 Runtime* runtime = Runtime::Current(); 474 Trace* the_trace = nullptr; 475 476 Thread* const self = Thread::Current(); 477 pthread_t sampling_pthread = 0U; 478 { 479 MutexLock mu(self, *Locks::trace_lock_); 480 if (the_trace_ == nullptr) { 481 LOG(ERROR) << "Trace pause requested, but no trace currently running"; 482 return; 483 } else { 484 the_trace = the_trace_; 485 sampling_pthread = sampling_pthread_; 486 } 487 } 488 489 if (sampling_pthread != 0U) { 490 { 491 MutexLock mu(self, *Locks::trace_lock_); 492 the_trace_ = nullptr; 493 } 494 CHECK_PTHREAD_CALL(pthread_join, (sampling_pthread, nullptr), "sampling thread shutdown"); 495 sampling_pthread_ = 0U; 496 { 497 MutexLock mu(self, *Locks::trace_lock_); 498 the_trace_ = the_trace; 499 } 500 } 501 502 if (the_trace != nullptr) { 503 gc::ScopedGCCriticalSection gcs(self, 504 gc::kGcCauseInstrumentation, 505 gc::kCollectorTypeInstrumentation); 506 ScopedSuspendAll ssa(__FUNCTION__); 507 stop_alloc_counting = (the_trace->flags_ & Trace::kTraceCountAllocs) != 0; 508 509 if (the_trace->trace_mode_ == TraceMode::kSampling) { 510 MutexLock mu(self, *Locks::thread_list_lock_); 511 runtime->GetThreadList()->ForEach(ClearThreadStackTraceAndClockBase, nullptr); 512 } else { 513 runtime->GetInstrumentation()->DisableMethodTracing(kTracerInstrumentationKey); 514 runtime->GetInstrumentation()->RemoveListener( 515 the_trace, 516 instrumentation::Instrumentation::kMethodEntered | 517 instrumentation::Instrumentation::kMethodExited | 518 instrumentation::Instrumentation::kMethodUnwind); 519 } 520 } 521 522 if (stop_alloc_counting) { 523 // Can be racy since SetStatsEnabled is not guarded by any locks. 524 Runtime::Current()->SetStatsEnabled(false); 525 } 526} 527 528void Trace::Resume() { 529 Thread* self = Thread::Current(); 530 Trace* the_trace; 531 { 532 MutexLock mu(self, *Locks::trace_lock_); 533 if (the_trace_ == nullptr) { 534 LOG(ERROR) << "No trace to resume (or sampling mode), ignoring this request"; 535 return; 536 } 537 the_trace = the_trace_; 538 } 539 540 Runtime* runtime = Runtime::Current(); 541 542 // Enable count of allocs if specified in the flags. 543 bool enable_stats = (the_trace->flags_ && kTraceCountAllocs) != 0; 544 545 { 546 gc::ScopedGCCriticalSection gcs(self, 547 gc::kGcCauseInstrumentation, 548 gc::kCollectorTypeInstrumentation); 549 ScopedSuspendAll ssa(__FUNCTION__); 550 551 // Reenable. 552 if (the_trace->trace_mode_ == TraceMode::kSampling) { 553 CHECK_PTHREAD_CALL(pthread_create, (&sampling_pthread_, nullptr, &RunSamplingThread, 554 reinterpret_cast<void*>(the_trace->interval_us_)), "Sampling profiler thread"); 555 } else { 556 runtime->GetInstrumentation()->AddListener(the_trace, 557 instrumentation::Instrumentation::kMethodEntered | 558 instrumentation::Instrumentation::kMethodExited | 559 instrumentation::Instrumentation::kMethodUnwind); 560 // TODO: In full-PIC mode, we don't need to fully deopt. 561 runtime->GetInstrumentation()->EnableMethodTracing(kTracerInstrumentationKey); 562 } 563 } 564 565 // Can't call this when holding the mutator lock. 566 if (enable_stats) { 567 runtime->SetStatsEnabled(true); 568 } 569} 570 571TracingMode Trace::GetMethodTracingMode() { 572 MutexLock mu(Thread::Current(), *Locks::trace_lock_); 573 if (the_trace_ == nullptr) { 574 return kTracingInactive; 575 } else { 576 switch (the_trace_->trace_mode_) { 577 case TraceMode::kSampling: 578 return kSampleProfilingActive; 579 case TraceMode::kMethodTracing: 580 return kMethodTracingActive; 581 } 582 LOG(FATAL) << "Unreachable"; 583 UNREACHABLE(); 584 } 585} 586 587static constexpr size_t kMinBufSize = 18U; // Trace header is up to 18B. 588 589Trace::Trace(File* trace_file, const char* trace_name, size_t buffer_size, int flags, 590 TraceOutputMode output_mode, TraceMode trace_mode) 591 : trace_file_(trace_file), 592 buf_(new uint8_t[std::max(kMinBufSize, buffer_size)]()), 593 flags_(flags), trace_output_mode_(output_mode), trace_mode_(trace_mode), 594 clock_source_(default_clock_source_), 595 buffer_size_(std::max(kMinBufSize, buffer_size)), 596 start_time_(MicroTime()), clock_overhead_ns_(GetClockOverheadNanoSeconds()), cur_offset_(0), 597 overflow_(false), interval_us_(0), streaming_lock_(nullptr), 598 unique_methods_lock_(new Mutex("unique methods lock", kTracingUniqueMethodsLock)) { 599 uint16_t trace_version = GetTraceVersion(clock_source_); 600 if (output_mode == TraceOutputMode::kStreaming) { 601 trace_version |= 0xF0U; 602 } 603 // Set up the beginning of the trace. 604 memset(buf_.get(), 0, kTraceHeaderLength); 605 Append4LE(buf_.get(), kTraceMagicValue); 606 Append2LE(buf_.get() + 4, trace_version); 607 Append2LE(buf_.get() + 6, kTraceHeaderLength); 608 Append8LE(buf_.get() + 8, start_time_); 609 if (trace_version >= kTraceVersionDualClock) { 610 uint16_t record_size = GetRecordSize(clock_source_); 611 Append2LE(buf_.get() + 16, record_size); 612 } 613 static_assert(18 <= kMinBufSize, "Minimum buffer size not large enough for trace header"); 614 615 // Update current offset. 616 cur_offset_.StoreRelaxed(kTraceHeaderLength); 617 618 if (output_mode == TraceOutputMode::kStreaming) { 619 streaming_file_name_ = trace_name; 620 streaming_lock_ = new Mutex("tracing lock", LockLevel::kTracingStreamingLock); 621 seen_threads_.reset(new ThreadIDBitSet()); 622 } 623} 624 625Trace::~Trace() { 626 delete streaming_lock_; 627 delete unique_methods_lock_; 628} 629 630static uint64_t ReadBytes(uint8_t* buf, size_t bytes) { 631 uint64_t ret = 0; 632 for (size_t i = 0; i < bytes; ++i) { 633 ret |= static_cast<uint64_t>(buf[i]) << (i * 8); 634 } 635 return ret; 636} 637 638void Trace::DumpBuf(uint8_t* buf, size_t buf_size, TraceClockSource clock_source) { 639 uint8_t* ptr = buf + kTraceHeaderLength; 640 uint8_t* end = buf + buf_size; 641 642 while (ptr < end) { 643 uint32_t tmid = ReadBytes(ptr + 2, sizeof(tmid)); 644 ArtMethod* method = DecodeTraceMethod(tmid); 645 TraceAction action = DecodeTraceAction(tmid); 646 LOG(INFO) << PrettyMethod(method) << " " << static_cast<int>(action); 647 ptr += GetRecordSize(clock_source); 648 } 649} 650 651static void GetVisitedMethodsFromBitSets( 652 const std::map<const DexFile*, DexIndexBitSet*>& seen_methods, 653 std::set<ArtMethod*>* visited_methods) SHARED_REQUIRES(Locks::mutator_lock_) { 654 ClassLinker* class_linker = Runtime::Current()->GetClassLinker(); 655 Thread* const self = Thread::Current(); 656 for (auto& e : seen_methods) { 657 DexIndexBitSet* bit_set = e.second; 658 // TODO: Visit trace methods as roots. 659 mirror::DexCache* dex_cache = class_linker->FindDexCache(self, *e.first, false); 660 for (uint32_t i = 0; i < bit_set->size(); ++i) { 661 if ((*bit_set)[i]) { 662 visited_methods->insert(dex_cache->GetResolvedMethod(i, sizeof(void*))); 663 } 664 } 665 } 666} 667 668void Trace::FinishTracing() { 669 size_t final_offset = 0; 670 671 std::set<ArtMethod*> visited_methods; 672 if (trace_output_mode_ == TraceOutputMode::kStreaming) { 673 // Write the secondary file with all the method names. 674 GetVisitedMethodsFromBitSets(seen_methods_, &visited_methods); 675 676 // Clean up. 677 STLDeleteValues(&seen_methods_); 678 } else { 679 final_offset = cur_offset_.LoadRelaxed(); 680 GetVisitedMethods(final_offset, &visited_methods); 681 } 682 683 // Compute elapsed time. 684 uint64_t elapsed = MicroTime() - start_time_; 685 686 std::ostringstream os; 687 688 os << StringPrintf("%cversion\n", kTraceTokenChar); 689 os << StringPrintf("%d\n", GetTraceVersion(clock_source_)); 690 os << StringPrintf("data-file-overflow=%s\n", overflow_ ? "true" : "false"); 691 if (UseThreadCpuClock()) { 692 if (UseWallClock()) { 693 os << StringPrintf("clock=dual\n"); 694 } else { 695 os << StringPrintf("clock=thread-cpu\n"); 696 } 697 } else { 698 os << StringPrintf("clock=wall\n"); 699 } 700 os << StringPrintf("elapsed-time-usec=%" PRIu64 "\n", elapsed); 701 if (trace_output_mode_ != TraceOutputMode::kStreaming) { 702 size_t num_records = (final_offset - kTraceHeaderLength) / GetRecordSize(clock_source_); 703 os << StringPrintf("num-method-calls=%zd\n", num_records); 704 } 705 os << StringPrintf("clock-call-overhead-nsec=%d\n", clock_overhead_ns_); 706 os << StringPrintf("vm=art\n"); 707 os << StringPrintf("pid=%d\n", getpid()); 708 if ((flags_ & kTraceCountAllocs) != 0) { 709 os << StringPrintf("alloc-count=%d\n", Runtime::Current()->GetStat(KIND_ALLOCATED_OBJECTS)); 710 os << StringPrintf("alloc-size=%d\n", Runtime::Current()->GetStat(KIND_ALLOCATED_BYTES)); 711 os << StringPrintf("gc-count=%d\n", Runtime::Current()->GetStat(KIND_GC_INVOCATIONS)); 712 } 713 os << StringPrintf("%cthreads\n", kTraceTokenChar); 714 DumpThreadList(os); 715 os << StringPrintf("%cmethods\n", kTraceTokenChar); 716 DumpMethodList(os, visited_methods); 717 os << StringPrintf("%cend\n", kTraceTokenChar); 718 std::string header(os.str()); 719 720 if (trace_output_mode_ == TraceOutputMode::kStreaming) { 721 File file; 722 if (!file.Open(streaming_file_name_ + ".sec", O_CREAT | O_WRONLY)) { 723 LOG(WARNING) << "Could not open secondary trace file!"; 724 return; 725 } 726 if (!file.WriteFully(header.c_str(), header.length())) { 727 file.Erase(); 728 std::string detail(StringPrintf("Trace data write failed: %s", strerror(errno))); 729 PLOG(ERROR) << detail; 730 ThrowRuntimeException("%s", detail.c_str()); 731 } 732 if (file.FlushCloseOrErase() != 0) { 733 PLOG(ERROR) << "Could not write secondary file"; 734 } 735 } else { 736 if (trace_file_.get() == nullptr) { 737 iovec iov[2]; 738 iov[0].iov_base = reinterpret_cast<void*>(const_cast<char*>(header.c_str())); 739 iov[0].iov_len = header.length(); 740 iov[1].iov_base = buf_.get(); 741 iov[1].iov_len = final_offset; 742 Dbg::DdmSendChunkV(CHUNK_TYPE("MPSE"), iov, 2); 743 const bool kDumpTraceInfo = false; 744 if (kDumpTraceInfo) { 745 LOG(INFO) << "Trace sent:\n" << header; 746 DumpBuf(buf_.get(), final_offset, clock_source_); 747 } 748 } else { 749 if (!trace_file_->WriteFully(header.c_str(), header.length()) || 750 !trace_file_->WriteFully(buf_.get(), final_offset)) { 751 std::string detail(StringPrintf("Trace data write failed: %s", strerror(errno))); 752 PLOG(ERROR) << detail; 753 ThrowRuntimeException("%s", detail.c_str()); 754 } 755 } 756 } 757} 758 759void Trace::DexPcMoved(Thread* thread ATTRIBUTE_UNUSED, 760 mirror::Object* this_object ATTRIBUTE_UNUSED, 761 ArtMethod* method, 762 uint32_t new_dex_pc) { 763 // We're not recorded to listen to this kind of event, so complain. 764 LOG(ERROR) << "Unexpected dex PC event in tracing " << PrettyMethod(method) << " " << new_dex_pc; 765} 766 767void Trace::FieldRead(Thread* thread ATTRIBUTE_UNUSED, 768 mirror::Object* this_object ATTRIBUTE_UNUSED, 769 ArtMethod* method, 770 uint32_t dex_pc, 771 ArtField* field ATTRIBUTE_UNUSED) 772 SHARED_REQUIRES(Locks::mutator_lock_) { 773 // We're not recorded to listen to this kind of event, so complain. 774 LOG(ERROR) << "Unexpected field read event in tracing " << PrettyMethod(method) << " " << dex_pc; 775} 776 777void Trace::FieldWritten(Thread* thread ATTRIBUTE_UNUSED, 778 mirror::Object* this_object ATTRIBUTE_UNUSED, 779 ArtMethod* method, 780 uint32_t dex_pc, 781 ArtField* field ATTRIBUTE_UNUSED, 782 const JValue& field_value ATTRIBUTE_UNUSED) 783 SHARED_REQUIRES(Locks::mutator_lock_) { 784 // We're not recorded to listen to this kind of event, so complain. 785 LOG(ERROR) << "Unexpected field write event in tracing " << PrettyMethod(method) << " " << dex_pc; 786} 787 788void Trace::MethodEntered(Thread* thread, mirror::Object* this_object ATTRIBUTE_UNUSED, 789 ArtMethod* method, uint32_t dex_pc ATTRIBUTE_UNUSED) { 790 uint32_t thread_clock_diff = 0; 791 uint32_t wall_clock_diff = 0; 792 ReadClocks(thread, &thread_clock_diff, &wall_clock_diff); 793 LogMethodTraceEvent(thread, method, instrumentation::Instrumentation::kMethodEntered, 794 thread_clock_diff, wall_clock_diff); 795} 796 797void Trace::MethodExited(Thread* thread, mirror::Object* this_object ATTRIBUTE_UNUSED, 798 ArtMethod* method, uint32_t dex_pc ATTRIBUTE_UNUSED, 799 const JValue& return_value ATTRIBUTE_UNUSED) { 800 uint32_t thread_clock_diff = 0; 801 uint32_t wall_clock_diff = 0; 802 ReadClocks(thread, &thread_clock_diff, &wall_clock_diff); 803 LogMethodTraceEvent(thread, method, instrumentation::Instrumentation::kMethodExited, 804 thread_clock_diff, wall_clock_diff); 805} 806 807void Trace::MethodUnwind(Thread* thread, mirror::Object* this_object ATTRIBUTE_UNUSED, 808 ArtMethod* method, uint32_t dex_pc ATTRIBUTE_UNUSED) { 809 uint32_t thread_clock_diff = 0; 810 uint32_t wall_clock_diff = 0; 811 ReadClocks(thread, &thread_clock_diff, &wall_clock_diff); 812 LogMethodTraceEvent(thread, method, instrumentation::Instrumentation::kMethodUnwind, 813 thread_clock_diff, wall_clock_diff); 814} 815 816void Trace::ExceptionCaught(Thread* thread ATTRIBUTE_UNUSED, 817 mirror::Throwable* exception_object ATTRIBUTE_UNUSED) 818 SHARED_REQUIRES(Locks::mutator_lock_) { 819 LOG(ERROR) << "Unexpected exception caught event in tracing"; 820} 821 822void Trace::Branch(Thread* /*thread*/, ArtMethod* method, 823 uint32_t /*dex_pc*/, int32_t /*dex_pc_offset*/) 824 SHARED_REQUIRES(Locks::mutator_lock_) { 825 LOG(ERROR) << "Unexpected branch event in tracing" << PrettyMethod(method); 826} 827 828void Trace::InvokeVirtualOrInterface(Thread*, 829 mirror::Object*, 830 ArtMethod* method, 831 uint32_t dex_pc, 832 ArtMethod*) { 833 LOG(ERROR) << "Unexpected invoke event in tracing" << PrettyMethod(method) 834 << " " << dex_pc; 835} 836 837void Trace::ReadClocks(Thread* thread, uint32_t* thread_clock_diff, uint32_t* wall_clock_diff) { 838 if (UseThreadCpuClock()) { 839 uint64_t clock_base = thread->GetTraceClockBase(); 840 if (UNLIKELY(clock_base == 0)) { 841 // First event, record the base time in the map. 842 uint64_t time = thread->GetCpuMicroTime(); 843 thread->SetTraceClockBase(time); 844 } else { 845 *thread_clock_diff = thread->GetCpuMicroTime() - clock_base; 846 } 847 } 848 if (UseWallClock()) { 849 *wall_clock_diff = MicroTime() - start_time_; 850 } 851} 852 853bool Trace::RegisterMethod(ArtMethod* method) { 854 mirror::DexCache* dex_cache = method->GetDexCache(); 855 const DexFile* dex_file = dex_cache->GetDexFile(); 856 auto* resolved_method = dex_cache->GetResolvedMethod(method->GetDexMethodIndex(), sizeof(void*)); 857 if (resolved_method != method) { 858 DCHECK(resolved_method == nullptr); 859 dex_cache->SetResolvedMethod(method->GetDexMethodIndex(), method, sizeof(void*)); 860 } 861 if (seen_methods_.find(dex_file) == seen_methods_.end()) { 862 seen_methods_.insert(std::make_pair(dex_file, new DexIndexBitSet())); 863 } 864 DexIndexBitSet* bit_set = seen_methods_.find(dex_file)->second; 865 if (!(*bit_set)[method->GetDexMethodIndex()]) { 866 bit_set->set(method->GetDexMethodIndex()); 867 return true; 868 } 869 return false; 870} 871 872bool Trace::RegisterThread(Thread* thread) { 873 pid_t tid = thread->GetTid(); 874 CHECK_LT(0U, static_cast<uint32_t>(tid)); 875 CHECK_LT(static_cast<uint32_t>(tid), 65536U); 876 877 if (!(*seen_threads_)[tid]) { 878 seen_threads_->set(tid); 879 return true; 880 } 881 return false; 882} 883 884std::string Trace::GetMethodLine(ArtMethod* method) { 885 method = method->GetInterfaceMethodIfProxy(sizeof(void*)); 886 return StringPrintf("%p\t%s\t%s\t%s\t%s\n", 887 reinterpret_cast<void*>((EncodeTraceMethod(method) << TraceActionBits)), 888 PrettyDescriptor(method->GetDeclaringClassDescriptor()).c_str(), method->GetName(), 889 method->GetSignature().ToString().c_str(), method->GetDeclaringClassSourceFile()); 890} 891 892void Trace::WriteToBuf(const uint8_t* src, size_t src_size) { 893 int32_t old_offset = cur_offset_.LoadRelaxed(); 894 int32_t new_offset = old_offset + static_cast<int32_t>(src_size); 895 if (dchecked_integral_cast<size_t>(new_offset) > buffer_size_) { 896 // Flush buffer. 897 if (!trace_file_->WriteFully(buf_.get(), old_offset)) { 898 PLOG(WARNING) << "Failed streaming a tracing event."; 899 } 900 901 // Check whether the data is too large for the buffer, then write immediately. 902 if (src_size >= buffer_size_) { 903 if (!trace_file_->WriteFully(src, src_size)) { 904 PLOG(WARNING) << "Failed streaming a tracing event."; 905 } 906 cur_offset_.StoreRelease(0); // Buffer is empty now. 907 return; 908 } 909 910 old_offset = 0; 911 new_offset = static_cast<int32_t>(src_size); 912 } 913 cur_offset_.StoreRelease(new_offset); 914 // Fill in data. 915 memcpy(buf_.get() + old_offset, src, src_size); 916} 917 918void Trace::LogMethodTraceEvent(Thread* thread, ArtMethod* method, 919 instrumentation::Instrumentation::InstrumentationEvent event, 920 uint32_t thread_clock_diff, uint32_t wall_clock_diff) { 921 // Advance cur_offset_ atomically. 922 int32_t new_offset; 923 int32_t old_offset = 0; 924 925 // We do a busy loop here trying to acquire the next offset. 926 if (trace_output_mode_ != TraceOutputMode::kStreaming) { 927 do { 928 old_offset = cur_offset_.LoadRelaxed(); 929 new_offset = old_offset + GetRecordSize(clock_source_); 930 if (static_cast<size_t>(new_offset) > buffer_size_) { 931 overflow_ = true; 932 return; 933 } 934 } while (!cur_offset_.CompareExchangeWeakSequentiallyConsistent(old_offset, new_offset)); 935 } 936 937 TraceAction action = kTraceMethodEnter; 938 switch (event) { 939 case instrumentation::Instrumentation::kMethodEntered: 940 action = kTraceMethodEnter; 941 break; 942 case instrumentation::Instrumentation::kMethodExited: 943 action = kTraceMethodExit; 944 break; 945 case instrumentation::Instrumentation::kMethodUnwind: 946 action = kTraceUnroll; 947 break; 948 default: 949 UNIMPLEMENTED(FATAL) << "Unexpected event: " << event; 950 } 951 952 uint32_t method_value = EncodeTraceMethodAndAction(method, action); 953 954 // Write data 955 uint8_t* ptr; 956 static constexpr size_t kPacketSize = 14U; // The maximum size of data in a packet. 957 uint8_t stack_buf[kPacketSize]; // Space to store a packet when in streaming mode. 958 if (trace_output_mode_ == TraceOutputMode::kStreaming) { 959 ptr = stack_buf; 960 } else { 961 ptr = buf_.get() + old_offset; 962 } 963 964 Append2LE(ptr, thread->GetTid()); 965 Append4LE(ptr + 2, method_value); 966 ptr += 6; 967 968 if (UseThreadCpuClock()) { 969 Append4LE(ptr, thread_clock_diff); 970 ptr += 4; 971 } 972 if (UseWallClock()) { 973 Append4LE(ptr, wall_clock_diff); 974 } 975 static_assert(kPacketSize == 2 + 4 + 4 + 4, "Packet size incorrect."); 976 977 if (trace_output_mode_ == TraceOutputMode::kStreaming) { 978 MutexLock mu(Thread::Current(), *streaming_lock_); // To serialize writing. 979 if (RegisterMethod(method)) { 980 // Write a special block with the name. 981 std::string method_line(GetMethodLine(method)); 982 uint8_t buf2[5]; 983 Append2LE(buf2, 0); 984 buf2[2] = kOpNewMethod; 985 Append2LE(buf2 + 3, static_cast<uint16_t>(method_line.length())); 986 WriteToBuf(buf2, sizeof(buf2)); 987 WriteToBuf(reinterpret_cast<const uint8_t*>(method_line.c_str()), method_line.length()); 988 } 989 if (RegisterThread(thread)) { 990 // It might be better to postpone this. Threads might not have received names... 991 std::string thread_name; 992 thread->GetThreadName(thread_name); 993 uint8_t buf2[7]; 994 Append2LE(buf2, 0); 995 buf2[2] = kOpNewThread; 996 Append2LE(buf2 + 3, static_cast<uint16_t>(thread->GetTid())); 997 Append2LE(buf2 + 5, static_cast<uint16_t>(thread_name.length())); 998 WriteToBuf(buf2, sizeof(buf2)); 999 WriteToBuf(reinterpret_cast<const uint8_t*>(thread_name.c_str()), thread_name.length()); 1000 } 1001 WriteToBuf(stack_buf, sizeof(stack_buf)); 1002 } 1003} 1004 1005void Trace::GetVisitedMethods(size_t buf_size, 1006 std::set<ArtMethod*>* visited_methods) { 1007 uint8_t* ptr = buf_.get() + kTraceHeaderLength; 1008 uint8_t* end = buf_.get() + buf_size; 1009 1010 while (ptr < end) { 1011 uint32_t tmid = ReadBytes(ptr + 2, sizeof(tmid)); 1012 ArtMethod* method = DecodeTraceMethod(tmid); 1013 visited_methods->insert(method); 1014 ptr += GetRecordSize(clock_source_); 1015 } 1016} 1017 1018void Trace::DumpMethodList(std::ostream& os, const std::set<ArtMethod*>& visited_methods) { 1019 for (const auto& method : visited_methods) { 1020 os << GetMethodLine(method); 1021 } 1022} 1023 1024static void DumpThread(Thread* t, void* arg) { 1025 std::ostream& os = *reinterpret_cast<std::ostream*>(arg); 1026 std::string name; 1027 t->GetThreadName(name); 1028 os << t->GetTid() << "\t" << name << "\n"; 1029} 1030 1031void Trace::DumpThreadList(std::ostream& os) { 1032 Thread* self = Thread::Current(); 1033 for (auto it : exited_threads_) { 1034 os << it.first << "\t" << it.second << "\n"; 1035 } 1036 Locks::thread_list_lock_->AssertNotHeld(self); 1037 MutexLock mu(self, *Locks::thread_list_lock_); 1038 Runtime::Current()->GetThreadList()->ForEach(DumpThread, &os); 1039} 1040 1041void Trace::StoreExitingThreadInfo(Thread* thread) { 1042 MutexLock mu(thread, *Locks::trace_lock_); 1043 if (the_trace_ != nullptr) { 1044 std::string name; 1045 thread->GetThreadName(name); 1046 // The same thread/tid may be used multiple times. As SafeMap::Put does not allow to override 1047 // a previous mapping, use SafeMap::Overwrite. 1048 the_trace_->exited_threads_.Overwrite(thread->GetTid(), name); 1049 } 1050} 1051 1052Trace::TraceOutputMode Trace::GetOutputMode() { 1053 MutexLock mu(Thread::Current(), *Locks::trace_lock_); 1054 CHECK(the_trace_ != nullptr) << "Trace output mode requested, but no trace currently running"; 1055 return the_trace_->trace_output_mode_; 1056} 1057 1058Trace::TraceMode Trace::GetMode() { 1059 MutexLock mu(Thread::Current(), *Locks::trace_lock_); 1060 CHECK(the_trace_ != nullptr) << "Trace mode requested, but no trace currently running"; 1061 return the_trace_->trace_mode_; 1062} 1063 1064size_t Trace::GetBufferSize() { 1065 MutexLock mu(Thread::Current(), *Locks::trace_lock_); 1066 CHECK(the_trace_ != nullptr) << "Trace mode requested, but no trace currently running"; 1067 return the_trace_->buffer_size_; 1068} 1069 1070bool Trace::IsTracingEnabled() { 1071 MutexLock mu(Thread::Current(), *Locks::trace_lock_); 1072 return the_trace_ != nullptr; 1073} 1074 1075} // namespace art 1076