trace.cc revision 3d21bdf8894e780d349c481e5c9e29fe1556051c
1/*
2 * Copyright (C) 2011 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 *      http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#include "trace.h"
18
19#include <sys/uio.h>
20#include <unistd.h>
21
22#define ATRACE_TAG ATRACE_TAG_DALVIK
23#include "cutils/trace.h"
24
25#include "art_method-inl.h"
26#include "base/casts.h"
27#include "base/stl_util.h"
28#include "base/time_utils.h"
29#include "base/unix_file/fd_file.h"
30#include "class_linker.h"
31#include "common_throws.h"
32#include "debugger.h"
33#include "dex_file-inl.h"
34#include "instrumentation.h"
35#include "mirror/class-inl.h"
36#include "mirror/dex_cache-inl.h"
37#include "mirror/object_array-inl.h"
38#include "mirror/object-inl.h"
39#include "os.h"
40#include "scoped_thread_state_change.h"
41#include "ScopedLocalRef.h"
42#include "thread.h"
43#include "thread_list.h"
44#include "utils.h"
45#include "entrypoints/quick/quick_entrypoints.h"
46
47namespace art {
48
49// File format:
50//     header
51//     record 0
52//     record 1
53//     ...
54//
55// Header format:
56//     u4  magic ('SLOW')
57//     u2  version
58//     u2  offset to data
59//     u8  start date/time in usec
60//     u2  record size in bytes (version >= 2 only)
61//     ... padding to 32 bytes
62//
63// Record format v1:
64//     u1  thread ID
65//     u4  method ID | method action
66//     u4  time delta since start, in usec
67//
68// Record format v2:
69//     u2  thread ID
70//     u4  method ID | method action
71//     u4  time delta since start, in usec
72//
73// Record format v3:
74//     u2  thread ID
75//     u4  method ID | method action
76//     u4  time delta since start, in usec
77//     u4  wall time since start, in usec (when clock == "dual" only)
78//
79// 32 bits of microseconds is 70 minutes.
80//
81// All values are stored in little-endian order.
82
// Action carried in the two low-order bits of an encoded trace method ID; the remaining bits
// hold the method (see kTraceMethodActionMask and its use when encoding/decoding IDs).
enum TraceAction {
    kTraceMethodEnter = 0x00,       // method entry
    kTraceMethodExit = 0x01,        // method exit
    kTraceUnroll = 0x02,            // method exited by exception unrolling
    // 0x03 currently unused
    kTraceMethodActionMask = 0x03,  // two bits
};
90
// Opcode constants. Their users are not visible in this part of the file.
// NOTE(review): presumably these tag "new method" / "new thread" entries in streaming output —
// confirm against the code that writes them.
static constexpr uint8_t kOpNewMethod = 1U;
static constexpr uint8_t kOpNewThread = 2U;
93
94class BuildStackTraceVisitor : public StackVisitor {
95 public:
96  explicit BuildStackTraceVisitor(Thread* thread)
97      : StackVisitor(thread, nullptr, StackVisitor::StackWalkKind::kIncludeInlinedFrames),
98        method_trace_(Trace::AllocStackTrace()) {}
99
100  bool VisitFrame() SHARED_LOCKS_REQUIRED(Locks::mutator_lock_) {
101    ArtMethod* m = GetMethod();
102    // Ignore runtime frames (in particular callee save).
103    if (!m->IsRuntimeMethod()) {
104      method_trace_->push_back(m);
105    }
106    return true;
107  }
108
109  // Returns a stack trace where the topmost frame corresponds with the first element of the vector.
110  std::vector<ArtMethod*>* GetStackTrace() const {
111    return method_trace_;
112  }
113
114 private:
115  std::vector<ArtMethod*>* const method_trace_;
116};
117
// Constants describing the trace output.
static const char     kTraceTokenChar             = '*';         // Prefix of section lines ("*version", "*threads", ...).
static const uint16_t kTraceHeaderLength          = 32;          // Size of the binary header; records start at this offset.
static const uint32_t kTraceMagicValue            = 0x574f4c53;  // 'SLOW' when stored little-endian.
static const uint16_t kTraceVersionSingleClock    = 2;
static const uint16_t kTraceVersionDualClock      = 3;
static const uint16_t kTraceRecordSizeSingleClock = 14;  // using v2
static const uint16_t kTraceRecordSizeDualClock   = 18;  // using v3 with two timestamps
125
// Clock source copied into each new Trace at construction; changed via SetDefaultClockSource().
TraceClockSource Trace::default_clock_source_ = kDefaultTraceClockSource;

// The currently active trace, or null when no trace is running. Read and written under
// Locks::trace_lock_ in the functions of this file.
Trace* volatile Trace::the_trace_ = nullptr;
// Handle of the sampling thread; 0 when there is none.
pthread_t Trace::sampling_pthread_ = 0U;
// A single cached stack-trace vector that AllocStackTrace() hands out and FreeStackTrace() refills.
std::unique_ptr<std::vector<ArtMethod*>> Trace::temp_stack_trace_;

// The key identifying the tracer to update instrumentation.
static constexpr const char* kTracerInstrumentationKey = "Tracer";
134
135static ArtMethod* DecodeTraceMethodId(uint64_t tmid) {
136  return reinterpret_cast<ArtMethod*>(tmid & ~kTraceMethodActionMask);
137}
138
139static TraceAction DecodeTraceAction(uint32_t tmid) {
140  return static_cast<TraceAction>(tmid & kTraceMethodActionMask);
141}
142
143static uint64_t EncodeTraceMethodAndAction(ArtMethod* method, TraceAction action) {
144  auto tmid = static_cast<uint64_t>(reinterpret_cast<uintptr_t>(method)) | action;
145  DCHECK_EQ(method, DecodeTraceMethodId(tmid));
146  return tmid;
147}
148
149std::vector<ArtMethod*>* Trace::AllocStackTrace() {
150  if (temp_stack_trace_.get() != nullptr) {
151    return temp_stack_trace_.release();
152  } else {
153    return new std::vector<ArtMethod*>();
154  }
155}
156
157void Trace::FreeStackTrace(std::vector<ArtMethod*>* stack_trace) {
158  stack_trace->clear();
159  temp_stack_trace_.reset(stack_trace);
160}
161
162void Trace::SetDefaultClockSource(TraceClockSource clock_source) {
163#if defined(__linux__)
164  default_clock_source_ = clock_source;
165#else
166  if (clock_source != TraceClockSource::kWall) {
167    LOG(WARNING) << "Ignoring tracing request to use CPU time.";
168  }
169#endif
170}
171
172static uint16_t GetTraceVersion(TraceClockSource clock_source) {
173  return (clock_source == TraceClockSource::kDual) ? kTraceVersionDualClock
174                                                    : kTraceVersionSingleClock;
175}
176
177static uint16_t GetRecordSize(TraceClockSource clock_source) {
178  return (clock_source == TraceClockSource::kDual) ? kTraceRecordSizeDualClock
179                                                    : kTraceRecordSizeSingleClock;
180}
181
182bool Trace::UseThreadCpuClock() {
183  return (clock_source_ == TraceClockSource::kThreadCpu) ||
184      (clock_source_ == TraceClockSource::kDual);
185}
186
187bool Trace::UseWallClock() {
188  return (clock_source_ == TraceClockSource::kWall) ||
189      (clock_source_ == TraceClockSource::kDual);
190}
191
192void Trace::MeasureClockOverhead() {
193  if (UseThreadCpuClock()) {
194    Thread::Current()->GetCpuMicroTime();
195  }
196  if (UseWallClock()) {
197    MicroTime();
198  }
199}
200
201// Compute an average time taken to measure clocks.
202uint32_t Trace::GetClockOverheadNanoSeconds() {
203  Thread* self = Thread::Current();
204  uint64_t start = self->GetCpuMicroTime();
205
206  for (int i = 4000; i > 0; i--) {
207    MeasureClockOverhead();
208    MeasureClockOverhead();
209    MeasureClockOverhead();
210    MeasureClockOverhead();
211    MeasureClockOverhead();
212    MeasureClockOverhead();
213    MeasureClockOverhead();
214    MeasureClockOverhead();
215  }
216
217  uint64_t elapsed_us = self->GetCpuMicroTime() - start;
218  return static_cast<uint32_t>(elapsed_us / 32);
219}
220
// TODO: put this somewhere with the big-endian equivalent used by JDWP.
// Stores |val| into buf[0..1] in little-endian byte order.
static void Append2LE(uint8_t* buf, uint16_t val) {
  buf[0] = static_cast<uint8_t>(val);
  buf[1] = static_cast<uint8_t>(val >> 8);
}
226
// TODO: put this somewhere with the big-endian equivalent used by JDWP.
// Stores |val| into buf[0..3] in little-endian byte order.
static void Append4LE(uint8_t* buf, uint32_t val) {
  for (unsigned shift = 0; shift < 32; shift += 8) {
    *buf++ = static_cast<uint8_t>(val >> shift);
  }
}
234
// TODO: put this somewhere with the big-endian equivalent used by JDWP.
// Stores |val| into buf[0..7] in little-endian byte order.
static void Append8LE(uint8_t* buf, uint64_t val) {
  for (unsigned shift = 0; shift < 64; shift += 8) {
    *buf++ = static_cast<uint8_t>(val >> shift);
  }
}
246
247static void GetSample(Thread* thread, void* arg) SHARED_LOCKS_REQUIRED(Locks::mutator_lock_) {
248  BuildStackTraceVisitor build_trace_visitor(thread);
249  build_trace_visitor.WalkStack();
250  std::vector<ArtMethod*>* stack_trace = build_trace_visitor.GetStackTrace();
251  Trace* the_trace = reinterpret_cast<Trace*>(arg);
252  the_trace->CompareAndUpdateStackTrace(thread, stack_trace);
253}
254
255static void ClearThreadStackTraceAndClockBase(Thread* thread, void* arg ATTRIBUTE_UNUSED) {
256  thread->SetTraceClockBase(0);
257  std::vector<ArtMethod*>* stack_trace = thread->GetStackTraceSample();
258  thread->SetStackTraceSample(nullptr);
259  delete stack_trace;
260}
261
262void Trace::CompareAndUpdateStackTrace(Thread* thread,
263                                       std::vector<ArtMethod*>* stack_trace) {
264  CHECK_EQ(pthread_self(), sampling_pthread_);
265  std::vector<ArtMethod*>* old_stack_trace = thread->GetStackTraceSample();
266  // Update the thread's stack trace sample.
267  thread->SetStackTraceSample(stack_trace);
268  // Read timer clocks to use for all events in this trace.
269  uint32_t thread_clock_diff = 0;
270  uint32_t wall_clock_diff = 0;
271  ReadClocks(thread, &thread_clock_diff, &wall_clock_diff);
272  if (old_stack_trace == nullptr) {
273    // If there's no previous stack trace sample for this thread, log an entry event for all
274    // methods in the trace.
275    for (std::vector<ArtMethod*>::reverse_iterator rit = stack_trace->rbegin();
276         rit != stack_trace->rend(); ++rit) {
277      LogMethodTraceEvent(thread, *rit, instrumentation::Instrumentation::kMethodEntered,
278                          thread_clock_diff, wall_clock_diff);
279    }
280  } else {
281    // If there's a previous stack trace for this thread, diff the traces and emit entry and exit
282    // events accordingly.
283    std::vector<ArtMethod*>::reverse_iterator old_rit = old_stack_trace->rbegin();
284    std::vector<ArtMethod*>::reverse_iterator rit = stack_trace->rbegin();
285    // Iterate bottom-up over both traces until there's a difference between them.
286    while (old_rit != old_stack_trace->rend() && rit != stack_trace->rend() && *old_rit == *rit) {
287      old_rit++;
288      rit++;
289    }
290    // Iterate top-down over the old trace until the point where they differ, emitting exit events.
291    for (std::vector<ArtMethod*>::iterator old_it = old_stack_trace->begin();
292         old_it != old_rit.base(); ++old_it) {
293      LogMethodTraceEvent(thread, *old_it, instrumentation::Instrumentation::kMethodExited,
294                          thread_clock_diff, wall_clock_diff);
295    }
296    // Iterate bottom-up over the new trace from the point where they differ, emitting entry events.
297    for (; rit != stack_trace->rend(); ++rit) {
298      LogMethodTraceEvent(thread, *rit, instrumentation::Instrumentation::kMethodEntered,
299                          thread_clock_diff, wall_clock_diff);
300    }
301    FreeStackTrace(old_stack_trace);
302  }
303}
304
305void* Trace::RunSamplingThread(void* arg) {
306  Runtime* runtime = Runtime::Current();
307  intptr_t interval_us = reinterpret_cast<intptr_t>(arg);
308  CHECK_GE(interval_us, 0);
309  CHECK(runtime->AttachCurrentThread("Sampling Profiler", true, runtime->GetSystemThreadGroup(),
310                                     !runtime->IsAotCompiler()));
311
312  while (true) {
313    usleep(interval_us);
314    ATRACE_BEGIN("Profile sampling");
315    Thread* self = Thread::Current();
316    Trace* the_trace;
317    {
318      MutexLock mu(self, *Locks::trace_lock_);
319      the_trace = the_trace_;
320      if (the_trace == nullptr) {
321        break;
322      }
323    }
324
325    runtime->GetThreadList()->SuspendAll(__FUNCTION__);
326    {
327      MutexLock mu(self, *Locks::thread_list_lock_);
328      runtime->GetThreadList()->ForEach(GetSample, the_trace);
329    }
330    runtime->GetThreadList()->ResumeAll();
331    ATRACE_END();
332  }
333
334  runtime->DetachCurrentThread();
335  return nullptr;
336}
337
338void Trace::Start(const char* trace_filename, int trace_fd, size_t buffer_size, int flags,
339                  TraceOutputMode output_mode, TraceMode trace_mode, int interval_us) {
340  Thread* self = Thread::Current();
341  {
342    MutexLock mu(self, *Locks::trace_lock_);
343    if (the_trace_ != nullptr) {
344      LOG(ERROR) << "Trace already in progress, ignoring this request";
345      return;
346    }
347  }
348
349  // Check interval if sampling is enabled
350  if (trace_mode == TraceMode::kSampling && interval_us <= 0) {
351    LOG(ERROR) << "Invalid sampling interval: " << interval_us;
352    ScopedObjectAccess soa(self);
353    ThrowRuntimeException("Invalid sampling interval: %d", interval_us);
354    return;
355  }
356
357  // Open trace file if not going directly to ddms.
358  std::unique_ptr<File> trace_file;
359  if (output_mode != TraceOutputMode::kDDMS) {
360    if (trace_fd < 0) {
361      trace_file.reset(OS::CreateEmptyFile(trace_filename));
362    } else {
363      trace_file.reset(new File(trace_fd, "tracefile"));
364      trace_file->DisableAutoClose();
365    }
366    if (trace_file.get() == nullptr) {
367      PLOG(ERROR) << "Unable to open trace file '" << trace_filename << "'";
368      ScopedObjectAccess soa(self);
369      ThrowRuntimeException("Unable to open trace file '%s'", trace_filename);
370      return;
371    }
372  }
373
374  Runtime* runtime = Runtime::Current();
375
376  // Enable count of allocs if specified in the flags.
377  bool enable_stats = false;
378
379  runtime->GetThreadList()->SuspendAll(__FUNCTION__);
380
381  // Create Trace object.
382  {
383    MutexLock mu(self, *Locks::trace_lock_);
384    if (the_trace_ != nullptr) {
385      LOG(ERROR) << "Trace already in progress, ignoring this request";
386    } else {
387      enable_stats = (flags && kTraceCountAllocs) != 0;
388      the_trace_ = new Trace(trace_file.release(), trace_filename, buffer_size, flags, output_mode,
389                             trace_mode);
390      if (trace_mode == TraceMode::kSampling) {
391        CHECK_PTHREAD_CALL(pthread_create, (&sampling_pthread_, nullptr, &RunSamplingThread,
392                                            reinterpret_cast<void*>(interval_us)),
393                                            "Sampling profiler thread");
394        the_trace_->interval_us_ = interval_us;
395      } else {
396        runtime->GetInstrumentation()->AddListener(the_trace_,
397                                                   instrumentation::Instrumentation::kMethodEntered |
398                                                   instrumentation::Instrumentation::kMethodExited |
399                                                   instrumentation::Instrumentation::kMethodUnwind);
400        // TODO: In full-PIC mode, we don't need to fully deopt.
401        runtime->GetInstrumentation()->EnableMethodTracing(kTracerInstrumentationKey);
402      }
403    }
404  }
405
406  runtime->GetThreadList()->ResumeAll();
407
408  // Can't call this when holding the mutator lock.
409  if (enable_stats) {
410    runtime->SetStatsEnabled(true);
411  }
412}
413
414void Trace::StopTracing(bool finish_tracing, bool flush_file) {
415  bool stop_alloc_counting = false;
416  Runtime* const runtime = Runtime::Current();
417  Trace* the_trace = nullptr;
418  pthread_t sampling_pthread = 0U;
419  {
420    MutexLock mu(Thread::Current(), *Locks::trace_lock_);
421    if (the_trace_ == nullptr) {
422      LOG(ERROR) << "Trace stop requested, but no trace currently running";
423    } else {
424      the_trace = the_trace_;
425      the_trace_ = nullptr;
426      sampling_pthread = sampling_pthread_;
427    }
428  }
429  // Make sure that we join before we delete the trace since we don't want to have
430  // the sampling thread access a stale pointer. This finishes since the sampling thread exits when
431  // the_trace_ is null.
432  if (sampling_pthread != 0U) {
433    CHECK_PTHREAD_CALL(pthread_join, (sampling_pthread, nullptr), "sampling thread shutdown");
434    sampling_pthread_ = 0U;
435  }
436  runtime->GetThreadList()->SuspendAll(__FUNCTION__);
437
438  if (the_trace != nullptr) {
439    stop_alloc_counting = (the_trace->flags_ & Trace::kTraceCountAllocs) != 0;
440    if (finish_tracing) {
441      the_trace->FinishTracing();
442    }
443
444    if (the_trace->trace_mode_ == TraceMode::kSampling) {
445      MutexLock mu(Thread::Current(), *Locks::thread_list_lock_);
446      runtime->GetThreadList()->ForEach(ClearThreadStackTraceAndClockBase, nullptr);
447    } else {
448      runtime->GetInstrumentation()->DisableMethodTracing(kTracerInstrumentationKey);
449      runtime->GetInstrumentation()->RemoveListener(
450          the_trace, instrumentation::Instrumentation::kMethodEntered |
451          instrumentation::Instrumentation::kMethodExited |
452          instrumentation::Instrumentation::kMethodUnwind);
453    }
454    if (the_trace->trace_file_.get() != nullptr) {
455      // Do not try to erase, so flush and close explicitly.
456      if (flush_file) {
457        if (the_trace->trace_file_->Flush() != 0) {
458          PLOG(ERROR) << "Could not flush trace file.";
459        }
460      } else {
461        the_trace->trace_file_->MarkUnchecked();  // Do not trigger guard.
462      }
463      if (the_trace->trace_file_->Close() != 0) {
464        PLOG(ERROR) << "Could not close trace file.";
465      }
466    }
467    delete the_trace;
468  }
469  runtime->GetThreadList()->ResumeAll();
470  if (stop_alloc_counting) {
471    // Can be racy since SetStatsEnabled is not guarded by any locks.
472    runtime->SetStatsEnabled(false);
473  }
474}
475
476void Trace::Abort() {
477  // Do not write anything anymore.
478  StopTracing(false, false);
479}
480
481void Trace::Stop() {
482  // Finish writing.
483  StopTracing(true, true);
484}
485
486void Trace::Shutdown() {
487  if (GetMethodTracingMode() != kTracingInactive) {
488    Stop();
489  }
490}
491
492void Trace::Pause() {
493  bool stop_alloc_counting = false;
494  Runtime* runtime = Runtime::Current();
495  Trace* the_trace = nullptr;
496
497  pthread_t sampling_pthread = 0U;
498  {
499    MutexLock mu(Thread::Current(), *Locks::trace_lock_);
500    if (the_trace_ == nullptr) {
501      LOG(ERROR) << "Trace pause requested, but no trace currently running";
502      return;
503    } else {
504      the_trace = the_trace_;
505      sampling_pthread = sampling_pthread_;
506    }
507  }
508
509  if (sampling_pthread != 0U) {
510    {
511      MutexLock mu(Thread::Current(), *Locks::trace_lock_);
512      the_trace_ = nullptr;
513    }
514    CHECK_PTHREAD_CALL(pthread_join, (sampling_pthread, nullptr), "sampling thread shutdown");
515    sampling_pthread_ = 0U;
516    {
517      MutexLock mu(Thread::Current(), *Locks::trace_lock_);
518      the_trace_ = the_trace;
519    }
520  }
521
522  if (the_trace != nullptr) {
523    runtime->GetThreadList()->SuspendAll(__FUNCTION__);
524    stop_alloc_counting = (the_trace->flags_ & Trace::kTraceCountAllocs) != 0;
525
526    if (the_trace->trace_mode_ == TraceMode::kSampling) {
527      MutexLock mu(Thread::Current(), *Locks::thread_list_lock_);
528      runtime->GetThreadList()->ForEach(ClearThreadStackTraceAndClockBase, nullptr);
529    } else {
530      runtime->GetInstrumentation()->DisableMethodTracing(kTracerInstrumentationKey);
531      runtime->GetInstrumentation()->RemoveListener(the_trace,
532                                                    instrumentation::Instrumentation::kMethodEntered |
533                                                    instrumentation::Instrumentation::kMethodExited |
534                                                    instrumentation::Instrumentation::kMethodUnwind);
535    }
536    runtime->GetThreadList()->ResumeAll();
537  }
538
539  if (stop_alloc_counting) {
540    // Can be racy since SetStatsEnabled is not guarded by any locks.
541    Runtime::Current()->SetStatsEnabled(false);
542  }
543}
544
545void Trace::Resume() {
546  Thread* self = Thread::Current();
547  Trace* the_trace;
548  {
549    MutexLock mu(self, *Locks::trace_lock_);
550    if (the_trace_ == nullptr) {
551      LOG(ERROR) << "No trace to resume (or sampling mode), ignoring this request";
552      return;
553    }
554    the_trace = the_trace_;
555  }
556
557  Runtime* runtime = Runtime::Current();
558
559  // Enable count of allocs if specified in the flags.
560  bool enable_stats = (the_trace->flags_ && kTraceCountAllocs) != 0;
561
562  runtime->GetThreadList()->SuspendAll(__FUNCTION__);
563
564  // Reenable.
565  if (the_trace->trace_mode_ == TraceMode::kSampling) {
566    CHECK_PTHREAD_CALL(pthread_create, (&sampling_pthread_, nullptr, &RunSamplingThread,
567        reinterpret_cast<void*>(the_trace->interval_us_)), "Sampling profiler thread");
568  } else {
569    runtime->GetInstrumentation()->AddListener(the_trace,
570                                               instrumentation::Instrumentation::kMethodEntered |
571                                               instrumentation::Instrumentation::kMethodExited |
572                                               instrumentation::Instrumentation::kMethodUnwind);
573    // TODO: In full-PIC mode, we don't need to fully deopt.
574    runtime->GetInstrumentation()->EnableMethodTracing(kTracerInstrumentationKey);
575  }
576
577  runtime->GetThreadList()->ResumeAll();
578
579  // Can't call this when holding the mutator lock.
580  if (enable_stats) {
581    runtime->SetStatsEnabled(true);
582  }
583}
584
585TracingMode Trace::GetMethodTracingMode() {
586  MutexLock mu(Thread::Current(), *Locks::trace_lock_);
587  if (the_trace_ == nullptr) {
588    return kTracingInactive;
589  } else {
590    switch (the_trace_->trace_mode_) {
591      case TraceMode::kSampling:
592        return kSampleProfilingActive;
593      case TraceMode::kMethodTracing:
594        return kMethodTracingActive;
595    }
596    LOG(FATAL) << "Unreachable";
597    UNREACHABLE();
598  }
599}
600
601static constexpr size_t kMinBufSize = 18U;  // Trace header is up to 18B.
602
603Trace::Trace(File* trace_file, const char* trace_name, size_t buffer_size, int flags,
604             TraceOutputMode output_mode, TraceMode trace_mode)
605    : trace_file_(trace_file),
606      buf_(new uint8_t[std::max(kMinBufSize, buffer_size)]()),
607      flags_(flags), trace_output_mode_(output_mode), trace_mode_(trace_mode),
608      clock_source_(default_clock_source_),
609      buffer_size_(std::max(kMinBufSize, buffer_size)),
610      start_time_(MicroTime()), clock_overhead_ns_(GetClockOverheadNanoSeconds()), cur_offset_(0),
611      overflow_(false), interval_us_(0), streaming_lock_(nullptr) {
612  uint16_t trace_version = GetTraceVersion(clock_source_);
613  if (output_mode == TraceOutputMode::kStreaming) {
614    trace_version |= 0xF0U;
615  }
616  // Set up the beginning of the trace.
617  memset(buf_.get(), 0, kTraceHeaderLength);
618  Append4LE(buf_.get(), kTraceMagicValue);
619  Append2LE(buf_.get() + 4, trace_version);
620  Append2LE(buf_.get() + 6, kTraceHeaderLength);
621  Append8LE(buf_.get() + 8, start_time_);
622  if (trace_version >= kTraceVersionDualClock) {
623    uint16_t record_size = GetRecordSize(clock_source_);
624    Append2LE(buf_.get() + 16, record_size);
625  }
626  static_assert(18 <= kMinBufSize, "Minimum buffer size not large enough for trace header");
627
628  // Update current offset.
629  cur_offset_.StoreRelaxed(kTraceHeaderLength);
630
631  if (output_mode == TraceOutputMode::kStreaming) {
632    streaming_file_name_ = trace_name;
633    streaming_lock_ = new Mutex("tracing lock");
634    seen_threads_.reset(new ThreadIDBitSet());
635  }
636}
637
// Releases the streaming lock allocated by the constructor in streaming mode (null, and thus a
// no-op delete, otherwise).
Trace::~Trace() {
  delete streaming_lock_;
}
641
// Assembles the first |bytes| bytes of |buf| into an integer, treating buf[0] as the least
// significant byte (little-endian).
static uint64_t ReadBytes(uint8_t* buf, size_t bytes) {
  uint64_t value = 0;
  size_t shift = 0;
  for (const uint8_t* cursor = buf; cursor != buf + bytes; ++cursor) {
    value |= static_cast<uint64_t>(*cursor) << shift;
    shift += 8;
  }
  return value;
}
649
650static void DumpBuf(uint8_t* buf, size_t buf_size, TraceClockSource clock_source)
651    SHARED_LOCKS_REQUIRED(Locks::mutator_lock_) {
652  uint8_t* ptr = buf + kTraceHeaderLength;
653  uint8_t* end = buf + buf_size;
654
655  while (ptr < end) {
656    uint64_t tmid = ReadBytes(ptr + 2, sizeof(tmid));
657    ArtMethod* method = DecodeTraceMethodId(tmid);
658    TraceAction action = DecodeTraceAction(tmid);
659    LOG(INFO) << PrettyMethod(method) << " " << static_cast<int>(action);
660    ptr += GetRecordSize(clock_source);
661  }
662}
663
664static void GetVisitedMethodsFromBitSets(
665    const std::map<mirror::DexCache*, DexIndexBitSet*>& seen_methods,
666    std::set<ArtMethod*>* visited_methods) SHARED_LOCKS_REQUIRED(Locks::mutator_lock_) {
667  for (auto& e : seen_methods) {
668    DexIndexBitSet* bit_set = e.second;
669    for (uint32_t i = 0; i < bit_set->size(); ++i) {
670      if ((*bit_set)[i]) {
671        visited_methods->insert(e.first->GetResolvedMethod(i, sizeof(void*)));
672      }
673    }
674  }
675}
676
677void Trace::FinishTracing() {
678  size_t final_offset = 0;
679
680  std::set<ArtMethod*> visited_methods;
681  if (trace_output_mode_ == TraceOutputMode::kStreaming) {
682    // Write the secondary file with all the method names.
683    GetVisitedMethodsFromBitSets(seen_methods_, &visited_methods);
684
685    // Clean up.
686    for (auto& e : seen_methods_) {
687      delete e.second;
688    }
689  } else {
690    final_offset = cur_offset_.LoadRelaxed();
691    GetVisitedMethods(final_offset, &visited_methods);
692  }
693
694  // Compute elapsed time.
695  uint64_t elapsed = MicroTime() - start_time_;
696
697  std::ostringstream os;
698
699  os << StringPrintf("%cversion\n", kTraceTokenChar);
700  os << StringPrintf("%d\n", GetTraceVersion(clock_source_));
701  os << StringPrintf("data-file-overflow=%s\n", overflow_ ? "true" : "false");
702  if (UseThreadCpuClock()) {
703    if (UseWallClock()) {
704      os << StringPrintf("clock=dual\n");
705    } else {
706      os << StringPrintf("clock=thread-cpu\n");
707    }
708  } else {
709    os << StringPrintf("clock=wall\n");
710  }
711  os << StringPrintf("elapsed-time-usec=%" PRIu64 "\n", elapsed);
712  if (trace_output_mode_ != TraceOutputMode::kStreaming) {
713    size_t num_records = (final_offset - kTraceHeaderLength) / GetRecordSize(clock_source_);
714    os << StringPrintf("num-method-calls=%zd\n", num_records);
715  }
716  os << StringPrintf("clock-call-overhead-nsec=%d\n", clock_overhead_ns_);
717  os << StringPrintf("vm=art\n");
718  os << StringPrintf("pid=%d\n", getpid());
719  if ((flags_ & kTraceCountAllocs) != 0) {
720    os << StringPrintf("alloc-count=%d\n", Runtime::Current()->GetStat(KIND_ALLOCATED_OBJECTS));
721    os << StringPrintf("alloc-size=%d\n", Runtime::Current()->GetStat(KIND_ALLOCATED_BYTES));
722    os << StringPrintf("gc-count=%d\n", Runtime::Current()->GetStat(KIND_GC_INVOCATIONS));
723  }
724  os << StringPrintf("%cthreads\n", kTraceTokenChar);
725  DumpThreadList(os);
726  os << StringPrintf("%cmethods\n", kTraceTokenChar);
727  DumpMethodList(os, visited_methods);
728  os << StringPrintf("%cend\n", kTraceTokenChar);
729  std::string header(os.str());
730
731  if (trace_output_mode_ == TraceOutputMode::kStreaming) {
732    File file;
733    if (!file.Open(streaming_file_name_ + ".sec", O_CREAT | O_WRONLY)) {
734      LOG(WARNING) << "Could not open secondary trace file!";
735      return;
736    }
737    if (!file.WriteFully(header.c_str(), header.length())) {
738      file.Erase();
739      std::string detail(StringPrintf("Trace data write failed: %s", strerror(errno)));
740      PLOG(ERROR) << detail;
741      ThrowRuntimeException("%s", detail.c_str());
742    }
743    if (file.FlushCloseOrErase() != 0) {
744      PLOG(ERROR) << "Could not write secondary file";
745    }
746  } else {
747    if (trace_file_.get() == nullptr) {
748      iovec iov[2];
749      iov[0].iov_base = reinterpret_cast<void*>(const_cast<char*>(header.c_str()));
750      iov[0].iov_len = header.length();
751      iov[1].iov_base = buf_.get();
752      iov[1].iov_len = final_offset;
753      Dbg::DdmSendChunkV(CHUNK_TYPE("MPSE"), iov, 2);
754      const bool kDumpTraceInfo = false;
755      if (kDumpTraceInfo) {
756        LOG(INFO) << "Trace sent:\n" << header;
757        DumpBuf(buf_.get(), final_offset, clock_source_);
758      }
759    } else {
760      if (!trace_file_->WriteFully(header.c_str(), header.length()) ||
761          !trace_file_->WriteFully(buf_.get(), final_offset)) {
762        std::string detail(StringPrintf("Trace data write failed: %s", strerror(errno)));
763        PLOG(ERROR) << detail;
764        ThrowRuntimeException("%s", detail.c_str());
765      }
766    }
767  }
768}
769
770void Trace::DexPcMoved(Thread* thread, mirror::Object* this_object,
771                       ArtMethod* method, uint32_t new_dex_pc) {
772  UNUSED(thread, this_object, method, new_dex_pc);
773  // We're not recorded to listen to this kind of event, so complain.
774  LOG(ERROR) << "Unexpected dex PC event in tracing " << PrettyMethod(method) << " " << new_dex_pc;
775}
776
777void Trace::FieldRead(Thread* thread, mirror::Object* this_object,
778                       ArtMethod* method, uint32_t dex_pc, ArtField* field)
779    SHARED_LOCKS_REQUIRED(Locks::mutator_lock_) {
780  UNUSED(thread, this_object, method, dex_pc, field);
781  // We're not recorded to listen to this kind of event, so complain.
782  LOG(ERROR) << "Unexpected field read event in tracing " << PrettyMethod(method) << " " << dex_pc;
783}
784
785void Trace::FieldWritten(Thread* thread, mirror::Object* this_object,
786                          ArtMethod* method, uint32_t dex_pc, ArtField* field,
787                          const JValue& field_value)
788    SHARED_LOCKS_REQUIRED(Locks::mutator_lock_) {
789  UNUSED(thread, this_object, method, dex_pc, field, field_value);
790  // We're not recorded to listen to this kind of event, so complain.
791  LOG(ERROR) << "Unexpected field write event in tracing " << PrettyMethod(method) << " " << dex_pc;
792}
793
794void Trace::MethodEntered(Thread* thread, mirror::Object* this_object ATTRIBUTE_UNUSED,
795                          ArtMethod* method, uint32_t dex_pc ATTRIBUTE_UNUSED) {
796  uint32_t thread_clock_diff = 0;
797  uint32_t wall_clock_diff = 0;
798  ReadClocks(thread, &thread_clock_diff, &wall_clock_diff);
799  LogMethodTraceEvent(thread, method, instrumentation::Instrumentation::kMethodEntered,
800                      thread_clock_diff, wall_clock_diff);
801}
802
803void Trace::MethodExited(Thread* thread, mirror::Object* this_object ATTRIBUTE_UNUSED,
804                         ArtMethod* method, uint32_t dex_pc ATTRIBUTE_UNUSED,
805                         const JValue& return_value ATTRIBUTE_UNUSED) {
806  uint32_t thread_clock_diff = 0;
807  uint32_t wall_clock_diff = 0;
808  ReadClocks(thread, &thread_clock_diff, &wall_clock_diff);
809  LogMethodTraceEvent(thread, method, instrumentation::Instrumentation::kMethodExited,
810                      thread_clock_diff, wall_clock_diff);
811}
812
813void Trace::MethodUnwind(Thread* thread, mirror::Object* this_object ATTRIBUTE_UNUSED,
814                         ArtMethod* method, uint32_t dex_pc ATTRIBUTE_UNUSED) {
815  uint32_t thread_clock_diff = 0;
816  uint32_t wall_clock_diff = 0;
817  ReadClocks(thread, &thread_clock_diff, &wall_clock_diff);
818  LogMethodTraceEvent(thread, method, instrumentation::Instrumentation::kMethodUnwind,
819                      thread_clock_diff, wall_clock_diff);
820}
821
822void Trace::ExceptionCaught(Thread* thread, mirror::Throwable* exception_object)
823    SHARED_LOCKS_REQUIRED(Locks::mutator_lock_) {
824  UNUSED(thread, exception_object);
825  LOG(ERROR) << "Unexpected exception caught event in tracing";
826}
827
828void Trace::BackwardBranch(Thread* /*thread*/, ArtMethod* method,
829                           int32_t /*dex_pc_offset*/)
830      SHARED_LOCKS_REQUIRED(Locks::mutator_lock_) {
831  LOG(ERROR) << "Unexpected backward branch event in tracing" << PrettyMethod(method);
832}
833
834void Trace::ReadClocks(Thread* thread, uint32_t* thread_clock_diff, uint32_t* wall_clock_diff) {
835  if (UseThreadCpuClock()) {
836    uint64_t clock_base = thread->GetTraceClockBase();
837    if (UNLIKELY(clock_base == 0)) {
838      // First event, record the base time in the map.
839      uint64_t time = thread->GetCpuMicroTime();
840      thread->SetTraceClockBase(time);
841    } else {
842      *thread_clock_diff = thread->GetCpuMicroTime() - clock_base;
843    }
844  }
845  if (UseWallClock()) {
846    *wall_clock_diff = MicroTime() - start_time_;
847  }
848}
849
850bool Trace::RegisterMethod(ArtMethod* method) {
851  mirror::DexCache* dex_cache = method->GetDexCache();
852  auto* resolved_method = dex_cache->GetResolvedMethod(method->GetDexMethodIndex(), sizeof(void*));
853  if (resolved_method != method) {
854    DCHECK(resolved_method == nullptr);
855    dex_cache->SetResolvedMethod(method->GetDexMethodIndex(), method, sizeof(void*));
856  }
857  if (seen_methods_.find(dex_cache) == seen_methods_.end()) {
858    seen_methods_.insert(std::make_pair(dex_cache, new DexIndexBitSet()));
859  }
860  DexIndexBitSet* bit_set = seen_methods_.find(dex_cache)->second;
861  if (!(*bit_set)[method->GetDexMethodIndex()]) {
862    bit_set->set(method->GetDexMethodIndex());
863    return true;
864  }
865  return false;
866}
867
868bool Trace::RegisterThread(Thread* thread) {
869  pid_t tid = thread->GetTid();
870  CHECK_LT(0U, static_cast<uint32_t>(tid));
871  CHECK_LT(static_cast<uint32_t>(tid), 65536U);
872
873  if (!(*seen_threads_)[tid]) {
874    seen_threads_->set(tid);
875    return true;
876  }
877  return false;
878}
879
880static std::string GetMethodLine(ArtMethod* method)
881    SHARED_LOCKS_REQUIRED(Locks::mutator_lock_) {
882  method = method->GetInterfaceMethodIfProxy(sizeof(void*));
883  return StringPrintf("%p\t%s\t%s\t%s\t%s\n", method,
884      PrettyDescriptor(method->GetDeclaringClassDescriptor()).c_str(), method->GetName(),
885      method->GetSignature().ToString().c_str(), method->GetDeclaringClassSourceFile());
886}
887
888void Trace::WriteToBuf(const uint8_t* src, size_t src_size) {
889  int32_t old_offset = cur_offset_.LoadRelaxed();
890  int32_t new_offset = old_offset + static_cast<int32_t>(src_size);
891  if (dchecked_integral_cast<size_t>(new_offset) > buffer_size_) {
892    // Flush buffer.
893    if (!trace_file_->WriteFully(buf_.get(), old_offset)) {
894      PLOG(WARNING) << "Failed streaming a tracing event.";
895    }
896
897    // Check whether the data is too large for the buffer, then write immediately.
898    if (src_size >= buffer_size_) {
899      if (!trace_file_->WriteFully(src, src_size)) {
900        PLOG(WARNING) << "Failed streaming a tracing event.";
901      }
902      cur_offset_.StoreRelease(0);  // Buffer is empty now.
903      return;
904    }
905
906    old_offset = 0;
907    new_offset = static_cast<int32_t>(src_size);
908  }
909  cur_offset_.StoreRelease(new_offset);
910  // Fill in data.
911  memcpy(buf_.get() + old_offset, src, src_size);
912}
913
914void Trace::LogMethodTraceEvent(Thread* thread, ArtMethod* method,
915                                instrumentation::Instrumentation::InstrumentationEvent event,
916                                uint32_t thread_clock_diff, uint32_t wall_clock_diff) {
917  // Advance cur_offset_ atomically.
918  int32_t new_offset;
919  int32_t old_offset = 0;
920
921  // We do a busy loop here trying to acquire the next offset.
922  if (trace_output_mode_ != TraceOutputMode::kStreaming) {
923    do {
924      old_offset = cur_offset_.LoadRelaxed();
925      new_offset = old_offset + GetRecordSize(clock_source_);
926      if (static_cast<size_t>(new_offset) > buffer_size_) {
927        overflow_ = true;
928        return;
929      }
930    } while (!cur_offset_.CompareExchangeWeakSequentiallyConsistent(old_offset, new_offset));
931  }
932
933  TraceAction action = kTraceMethodEnter;
934  switch (event) {
935    case instrumentation::Instrumentation::kMethodEntered:
936      action = kTraceMethodEnter;
937      break;
938    case instrumentation::Instrumentation::kMethodExited:
939      action = kTraceMethodExit;
940      break;
941    case instrumentation::Instrumentation::kMethodUnwind:
942      action = kTraceUnroll;
943      break;
944    default:
945      UNIMPLEMENTED(FATAL) << "Unexpected event: " << event;
946  }
947
948  uint64_t method_value = EncodeTraceMethodAndAction(method, action);
949
950  // Write data
951  uint8_t* ptr;
952  static constexpr size_t kPacketSize = 18U;  // The maximum size of data in a packet.
953  uint8_t stack_buf[kPacketSize];             // Space to store a packet when in streaming mode.
954  if (trace_output_mode_ == TraceOutputMode::kStreaming) {
955    ptr = stack_buf;
956  } else {
957    ptr = buf_.get() + old_offset;
958  }
959
960  Append2LE(ptr, thread->GetTid());
961  Append8LE(ptr + 2, method_value);
962  ptr += 10;
963
964  if (UseThreadCpuClock()) {
965    Append4LE(ptr, thread_clock_diff);
966    ptr += 4;
967  }
968  if (UseWallClock()) {
969    Append4LE(ptr, wall_clock_diff);
970  }
971  static_assert(kPacketSize == 2 + 8 + 4 + 4, "Packet size incorrect.");
972
973  if (trace_output_mode_ == TraceOutputMode::kStreaming) {
974    MutexLock mu(Thread::Current(), *streaming_lock_);  // To serialize writing.
975    if (RegisterMethod(method)) {
976      // Write a special block with the name.
977      std::string method_line(GetMethodLine(method));
978      uint8_t buf2[5];
979      Append2LE(buf2, 0);
980      buf2[2] = kOpNewMethod;
981      Append2LE(buf2 + 3, static_cast<uint16_t>(method_line.length()));
982      WriteToBuf(buf2, sizeof(buf2));
983      WriteToBuf(reinterpret_cast<const uint8_t*>(method_line.c_str()), method_line.length());
984    }
985    if (RegisterThread(thread)) {
986      // It might be better to postpone this. Threads might not have received names...
987      std::string thread_name;
988      thread->GetThreadName(thread_name);
989      uint8_t buf2[7];
990      Append2LE(buf2, 0);
991      buf2[2] = kOpNewThread;
992      Append2LE(buf2 + 3, static_cast<uint16_t>(thread->GetTid()));
993      Append2LE(buf2 + 5, static_cast<uint16_t>(thread_name.length()));
994      WriteToBuf(buf2, sizeof(buf2));
995      WriteToBuf(reinterpret_cast<const uint8_t*>(thread_name.c_str()), thread_name.length());
996    }
997    WriteToBuf(stack_buf, sizeof(stack_buf));
998  }
999}
1000
1001void Trace::GetVisitedMethods(size_t buf_size,
1002                              std::set<ArtMethod*>* visited_methods) {
1003  uint8_t* ptr = buf_.get() + kTraceHeaderLength;
1004  uint8_t* end = buf_.get() + buf_size;
1005
1006  while (ptr < end) {
1007    uint64_t tmid = ReadBytes(ptr + 2, sizeof(tmid));
1008    ArtMethod* method = DecodeTraceMethodId(tmid);
1009    visited_methods->insert(method);
1010    ptr += GetRecordSize(clock_source_);
1011  }
1012}
1013
1014void Trace::DumpMethodList(std::ostream& os, const std::set<ArtMethod*>& visited_methods) {
1015  for (const auto& method : visited_methods) {
1016    os << GetMethodLine(method);
1017  }
1018}
1019
1020static void DumpThread(Thread* t, void* arg) {
1021  std::ostream& os = *reinterpret_cast<std::ostream*>(arg);
1022  std::string name;
1023  t->GetThreadName(name);
1024  os << t->GetTid() << "\t" << name << "\n";
1025}
1026
1027void Trace::DumpThreadList(std::ostream& os) {
1028  Thread* self = Thread::Current();
1029  for (auto it : exited_threads_) {
1030    os << it.first << "\t" << it.second << "\n";
1031  }
1032  Locks::thread_list_lock_->AssertNotHeld(self);
1033  MutexLock mu(self, *Locks::thread_list_lock_);
1034  Runtime::Current()->GetThreadList()->ForEach(DumpThread, &os);
1035}
1036
1037void Trace::StoreExitingThreadInfo(Thread* thread) {
1038  MutexLock mu(thread, *Locks::trace_lock_);
1039  if (the_trace_ != nullptr) {
1040    std::string name;
1041    thread->GetThreadName(name);
1042    // The same thread/tid may be used multiple times. As SafeMap::Put does not allow to override
1043    // a previous mapping, use SafeMap::Overwrite.
1044    the_trace_->exited_threads_.Overwrite(thread->GetTid(), name);
1045  }
1046}
1047
1048Trace::TraceOutputMode Trace::GetOutputMode() {
1049  MutexLock mu(Thread::Current(), *Locks::trace_lock_);
1050  CHECK(the_trace_ != nullptr) << "Trace output mode requested, but no trace currently running";
1051  return the_trace_->trace_output_mode_;
1052}
1053
1054Trace::TraceMode Trace::GetMode() {
1055  MutexLock mu(Thread::Current(), *Locks::trace_lock_);
1056  CHECK(the_trace_ != nullptr) << "Trace mode requested, but no trace currently running";
1057  return the_trace_->trace_mode_;
1058}
1059
1060size_t Trace::GetBufferSize() {
1061  MutexLock mu(Thread::Current(), *Locks::trace_lock_);
1062  CHECK(the_trace_ != nullptr) << "Trace mode requested, but no trace currently running";
1063  return the_trace_->buffer_size_;
1064}
1065
1066}  // namespace art
1067