| /* |
| * Copyright (C) 2011 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #ifndef ART_RUNTIME_TRACE_H_ |
| #define ART_RUNTIME_TRACE_H_ |
| |
| #include <bitset> |
| #include <map> |
| #include <memory> |
| #include <ostream> |
| #include <set> |
| #include <string> |
| #include <unordered_map> |
| #include <vector> |
| |
| #include "base/atomic.h" |
| #include "base/locks.h" |
| #include "base/macros.h" |
| #include "base/mutex.h" |
| #include "base/os.h" |
| #include "base/safe_map.h" |
| #include "instrumentation.h" |
| #include "runtime_globals.h" |
| #include "thread_pool.h" |
| |
// Forward declaration only: this header names unix_file::FdFile in a function signature and does
// not need the complete type.
namespace unix_file {
class FdFile;
}  // namespace unix_file
| |
| namespace art HIDDEN { |
| |
// Forward declarations; this header does not need the complete types.
class ArtField;
class ArtMethod;
class DexFile;
class ShadowFrame;
class Thread;

struct MethodTraceRecord;

// Fixed-size bit set with 65536 (2^16) bits; presumably one bit per 16-bit dex index.
using DexIndexBitSet = std::bitset<65536>;
| |
// Whether tracing is running and, if so, how the trace data is being collected.
enum TracingMode {
  kTracingInactive,
  kMethodTracingActive,    // Trace activity synchronous with method progress.
  kSampleProfilingActive,  // Trace activity captured by sampling thread.
};
// Writes `rhs` to `os`. Only declared here; the definition is not part of this header.
std::ostream& operator<<(std::ostream& os, TracingMode rhs);
| |
| // File format: |
| // header |
| // record 0 |
| // record 1 |
| // ... |
| // |
| // Header format: |
| // u4 magic ('SLOW') |
| // u2 version |
| // u2 offset to data |
| // u8 start date/time in usec |
| // u2 record size in bytes (version >= 2 only) |
| // ... padding to 32 bytes |
| // |
| // Record format v1: |
| // u1 thread ID |
| // u4 method ID | method action |
| // u4 time delta since start, in usec |
| // |
| // Record format v2: |
| // u2 thread ID |
| // u4 method ID | method action |
| // u4 time delta since start, in usec |
| // |
| // Record format v3: |
| // u2 thread ID |
| // u4 method ID | method action |
| // u4 time delta since start, in usec |
| // u4 wall time since start, in usec (when clock == "dual" only) |
| // |
| // 32 bits of microseconds is 70 minutes. |
| // |
| // All values are stored in little-endian order. |
| |
// Kind of method event stored in a trace record. The value fits in two bits
// (kTraceMethodActionMask) and shares a word with the method ID, see the
// "method ID | method action" field of the record formats described above.
enum TraceAction {
  kTraceMethodEnter = 0x00,       // method entry
  kTraceMethodExit = 0x01,        // method exit
  kTraceUnroll = 0x02,            // method exited by exception unrolling
  // 0x03 currently unused
  kTraceMethodActionMask = 0x03,  // two bits
};
| |
// Where the trace output goes.
enum class TraceOutputMode {
  kFile,      // Written to a trace file.
  kDDMS,      // Sent via DDMS; no trace file is used.
  kStreaming  // Streamed out while tracing is still running.
};
| |
| // We need 3 entries to store 64-bit timestamp counter as two 32-bit values on 32-bit architectures. |
| static constexpr uint32_t kNumEntriesForWallClock = |
| (kRuntimePointerSize == PointerSize::k64) ? 2 : 3; |
| static constexpr uint32_t kNumEntriesForDualClock = kNumEntriesForWallClock + 1; |
| |
| // These define offsets in bytes for the individual fields of a trace entry. These are used by the |
| // JITed code when storing a trace entry. |
| static constexpr int32_t kMethodOffsetInBytes = 0; |
| static constexpr int32_t kTimestampOffsetInBytes = 1 * static_cast<uint32_t>(kRuntimePointerSize); |
| // On 32-bit architectures we store 64-bit timestamp as two 32-bit values. |
| // kHighTimestampOffsetInBytes is only relevant on 32-bit architectures. |
| static constexpr int32_t kHighTimestampOffsetInBytes = |
| 2 * static_cast<uint32_t>(kRuntimePointerSize); |
| |
// Mask that clears the two low bits of a pointer-sized value; two bits is also the width of
// kTraceMethodActionMask. The complement is taken on a uintptr_t operand so that it is computed at
// full pointer width instead of depending on sign-extension of an int.
static constexpr uintptr_t kMaskTraceAction = ~static_cast<uintptr_t>(0b11);
| |
| class TraceWriterThreadPool : public ThreadPool { |
| public: |
| static TraceWriterThreadPool* Create(const char* name) { |
| TraceWriterThreadPool* pool = new TraceWriterThreadPool(name); |
| pool->CreateThreads(); |
| return pool; |
| } |
| |
| uintptr_t* FinishTaskAndClaimBuffer(size_t tid); |
| |
| private: |
| explicit TraceWriterThreadPool(const char* name) |
| : ThreadPool(name, |
| /* num_threads= */ 1, |
| /* create_peers= */ false, |
| /* worker_stack_size= */ ThreadPoolWorker::kDefaultStackSize) {} |
| }; |
| |
| class TraceWriter { |
| public: |
| TraceWriter(File* trace_file, |
| TraceOutputMode output_mode, |
| TraceClockSource clock_source, |
| size_t buffer_size, |
| int num_trace_buffers, |
| int trace_format_version, |
| uint32_t clock_overhead_ns); |
| |
| // This encodes all the events in the per-thread trace buffer and writes it to the trace file / |
| // buffer. This acquires streaming lock to prevent any other threads writing concurrently. It is |
| // required to serialize these since each method is encoded with a unique id which is assigned |
| // when the method is seen for the first time in the recoreded events. So we need to serialize |
| // these flushes across threads. |
| void FlushBuffer(Thread* thread, bool is_sync, bool free_buffer) |
| REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!tracing_lock_); |
| |
| // This is called when the per-thread buffer is full and a new entry needs to be recorded. This |
| // returns a pointer to the new buffer where the entries should be recorded. |
| // In streaming mode, we just flush the per-thread buffer. The buffer is flushed asynchronously |
| // on a thread pool worker. This creates a new buffer and updates the per-thread buffer pointer |
| // and returns a pointer to the newly created buffer. |
| // In non-streaming mode, buffers from all threads are flushed to see if there's enough room |
| // in the centralized buffer before recording new entries. We just flush these buffers |
| // synchronously and reuse the existing buffer. Since this mode is mostly deprecated we want to |
| // keep the implementation simple here. |
| uintptr_t* PrepareBufferForNewEntries(Thread* thread) REQUIRES_SHARED(Locks::mutator_lock_) |
| REQUIRES(!tracing_lock_); |
| |
| // Flushes all per-thread buffer and also write a summary entry. |
| void FinishTracing(int flags, bool flush_entries) REQUIRES(!tracing_lock_) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| void PreProcessTraceForMethodInfos(uintptr_t* buffer, |
| size_t num_entries, |
| std::unordered_map<ArtMethod*, std::string>& method_infos) |
| REQUIRES_SHARED(Locks::mutator_lock_) REQUIRES(!tracing_lock_); |
| |
| // Flush buffer to the file (for streaming) or to the common buffer (for non-streaming). In |
| // non-streaming case it returns false if all the contents couldn't be flushed. |
| void FlushBuffer(uintptr_t* buffer, |
| size_t num_entries, |
| size_t tid, |
| const std::unordered_map<ArtMethod*, std::string>& method_infos) |
| REQUIRES(!tracing_lock_); |
| |
| // This is called when we see the first entry from the thread to record the information about the |
| // thread. |
| void RecordThreadInfo(Thread* thread) REQUIRES(!tracing_lock_); |
| |
| bool HasOverflow() { return overflow_; } |
| TraceOutputMode GetOutputMode() { return trace_output_mode_; } |
| size_t GetBufferSize() { return buffer_size_; } |
| |
| // Performs the initialization for the buffer pool. It marks all buffers as free by storing 0 |
| // as the owner tid. This also allocates the buffer pool. |
| void InitializeTraceBuffers(); |
| |
| // Releases the trace buffer and transfers the ownership to the specified tid. If the tid is 0, |
| // then it means it is free and other threads can claim it. |
| void FetchTraceBufferForThread(int index, size_t tid); |
| |
| // Tries to find a free buffer (which has owner of 0) from the pool. If there are no free buffers |
| // it fetches a task, flushes the contents of the buffer and returns that buffer. |
| uintptr_t* AcquireTraceBuffer(size_t tid); |
| |
| // Returns the index corresponding to the start of the current_buffer. We allocate one large |
| // buffer and assign parts of it for each thread. |
| int GetMethodTraceIndex(uintptr_t* current_buffer); |
| |
| private: |
| void ReadValuesFromRecord(uintptr_t* method_trace_entries, |
| size_t record_index, |
| MethodTraceRecord& record, |
| bool has_thread_cpu_clock, |
| bool has_wall_clock); |
| |
| void FlushEntriesFormatV2(uintptr_t* method_trace_entries, |
| size_t tid, |
| const std::unordered_map<ArtMethod*, std::string>& method_infos, |
| size_t num_records, |
| size_t* current_index, |
| uint8_t* init_buffer_ptr) REQUIRES(tracing_lock_); |
| |
| void FlushEntriesFormatV1(uintptr_t* method_trace_entries, |
| size_t tid, |
| const std::unordered_map<ArtMethod*, std::string>& method_infos, |
| size_t end_offset, |
| size_t* current_index, |
| uint8_t* buffer_ptr) REQUIRES(tracing_lock_); |
| // Get a 32-bit id for the method and specify if the method hasn't been seen before. If this is |
| // the first time we see this method record information (like method name, declaring class etc.,) |
| // about the method. |
| std::pair<uint32_t, bool> GetMethodEncoding(ArtMethod* method) REQUIRES(tracing_lock_); |
| bool HasMethodEncoding(ArtMethod* method) REQUIRES(tracing_lock_); |
| |
| // Get a 16-bit id for the thread. We don't want to use thread ids directly since they can be |
| // more than 16-bit. |
| uint16_t GetThreadEncoding(pid_t thread_id) REQUIRES(tracing_lock_); |
| |
| // Get the information about the method. |
| std::string GetMethodLine(const std::string& method_line, uint32_t method_id); |
| std::string GetMethodInfoLine(ArtMethod* method) REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Helper function to record method information when processing the events. These are used by |
| // streaming output mode. Non-streaming modes dump the methods and threads list at the end of |
| // tracing. |
| void RecordMethodInfo(const std::string& method_line, uint32_t method_id) REQUIRES(tracing_lock_); |
| |
| // Encodes the trace event. This assumes that there is enough space reserved to encode the entry. |
| void EncodeEventEntry(uint8_t* ptr, |
| uint16_t thread_id, |
| uint32_t method_index, |
| TraceAction action, |
| uint32_t thread_clock_diff, |
| uint32_t wall_clock_diff) REQUIRES(tracing_lock_); |
| |
| // Encodes the header for the events block. This assumes that there is enough space reserved to |
| // encode the entry. |
| void EncodeEventBlockHeader(uint8_t* ptr, |
| uint32_t thread_id, |
| uint32_t method_index, |
| uint32_t init_thread_clock_time, |
| uint32_t init_wall_clock_time, |
| uint16_t num_records) REQUIRES(tracing_lock_); |
| |
| // Ensures there is sufficient space in the buffer to record the requested_size. If there is not |
| // enough sufficient space the current contents of the buffer are written to the file and |
| // current_index is reset to 0. This doesn't check if buffer_size is big enough to hold the |
| // requested size. |
| void EnsureSpace(uint8_t* buffer, |
| size_t* current_index, |
| size_t buffer_size, |
| size_t required_size); |
| |
| // Flush tracing buffers from all the threads. |
| void FlushAllThreadBuffers() REQUIRES(!Locks::thread_list_lock_) REQUIRES(!tracing_lock_); |
| |
| |
| // Methods to output traced methods and threads. |
| void DumpMethodList(std::ostream& os) REQUIRES_SHARED(Locks::mutator_lock_) |
| REQUIRES(!tracing_lock_); |
| void DumpThreadList(std::ostream& os) REQUIRES(!Locks::thread_list_lock_, !tracing_lock_); |
| |
| // File to write trace data out to, null if direct to ddms. |
| std::unique_ptr<File> trace_file_; |
| |
| // The kind of output for this tracing. |
| const TraceOutputMode trace_output_mode_; |
| |
| // The clock source for this tracing. |
| const TraceClockSource clock_source_; |
| |
| // Map of thread ids and names. This is used only in non-streaming mode, since we have to dump |
| // information about all threads in one block. In streaming mode, thread info is recorded directly |
| // in the file when we see the first even from this thread. |
| SafeMap<uint16_t, std::string> threads_list_; |
| |
| // Map from ArtMethod* to index. |
| std::unordered_map<ArtMethod*, uint32_t> art_method_id_map_ GUARDED_BY(tracing_lock_); |
| uint32_t current_method_index_ = 0; |
| |
| // Map from thread_id to a 16-bit identifier. |
| std::unordered_map<pid_t, uint16_t> thread_id_map_ GUARDED_BY(tracing_lock_); |
| uint16_t current_thread_index_; |
| |
| // Buffer used when generating trace data from the raw entries. |
| // In streaming mode, the trace data is flushed to file when the per-thread buffer gets full. |
| // In non-streaming mode, this data is flushed at the end of tracing. If the buffer gets full |
| // we stop tracing and following trace events are ignored. The size of this buffer is |
| // specified by the user in non-streaming mode. |
| std::unique_ptr<uint8_t[]> buf_; |
| |
| // The cur_offset_ into the buf_. Accessed only in SuspendAll scope when flushing data from the |
| // thread local buffers to buf_. |
| size_t cur_offset_ GUARDED_BY(tracing_lock_); |
| |
| // Size of buf_. |
| const size_t buffer_size_; |
| |
| // Version of trace output |
| const int trace_format_version_; |
| |
| // Time trace was created. |
| const uint64_t start_time_; |
| |
| // Did we overflow the buffer recording traces? |
| bool overflow_; |
| |
| // Total number of records flushed to file. |
| size_t num_records_; |
| |
| // Clock overhead. |
| const uint32_t clock_overhead_ns_; |
| |
| std::vector<std::atomic<size_t>> owner_tids_; |
| std::unique_ptr<uintptr_t[]> trace_buffer_; |
| |
| // Lock to protect common data structures accessed from multiple threads like |
| // art_method_id_map_, thread_id_map_. |
| Mutex tracing_lock_; |
| |
| // Thread pool to flush the trace entries to file. |
| std::unique_ptr<TraceWriterThreadPool> thread_pool_; |
| }; |
| |
| // Class for recording event traces. Trace data is either collected |
| // synchronously during execution (TracingMode::kMethodTracingActive), |
| // or by a separate sampling thread (TracingMode::kSampleProfilingActive). |
| class Trace final : public instrumentation::InstrumentationListener { |
| public: |
| enum TraceFlag { |
| kTraceCountAllocs = 0x001, |
| kTraceClockSourceWallClock = 0x010, |
| kTraceClockSourceThreadCpu = 0x100, |
| }; |
| |
| static const int kFormatV1 = 0; |
| static const int kFormatV2 = 1; |
| static const int kTraceFormatVersionFlagMask = 0b110; |
| static const int kTraceFormatVersionShift = 1; |
| |
| enum class TraceMode { |
| kMethodTracing, |
| kSampling |
| }; |
| |
| static void SetDefaultClockSource(TraceClockSource clock_source); |
| |
| static void Start(const char* trace_filename, |
| size_t buffer_size, |
| int flags, |
| TraceOutputMode output_mode, |
| TraceMode trace_mode, |
| int interval_us) |
| REQUIRES(!Locks::mutator_lock_, !Locks::thread_list_lock_, !Locks::thread_suspend_count_lock_, |
| !Locks::trace_lock_); |
| static void Start(int trace_fd, |
| size_t buffer_size, |
| int flags, |
| TraceOutputMode output_mode, |
| TraceMode trace_mode, |
| int interval_us) |
| REQUIRES(!Locks::mutator_lock_, !Locks::thread_list_lock_, !Locks::thread_suspend_count_lock_, |
| !Locks::trace_lock_); |
| static void Start(std::unique_ptr<unix_file::FdFile>&& file, |
| size_t buffer_size, |
| int flags, |
| TraceOutputMode output_mode, |
| TraceMode trace_mode, |
| int interval_us) |
| REQUIRES(!Locks::mutator_lock_, !Locks::thread_list_lock_, !Locks::thread_suspend_count_lock_, |
| !Locks::trace_lock_); |
| static void StartDDMS(size_t buffer_size, |
| int flags, |
| TraceMode trace_mode, |
| int interval_us) |
| REQUIRES(!Locks::mutator_lock_, !Locks::thread_list_lock_, !Locks::thread_suspend_count_lock_, |
| !Locks::trace_lock_); |
| |
| // Stop tracing. This will finish the trace and write it to file/send it via DDMS. |
| static void Stop() |
| REQUIRES(!Locks::mutator_lock_, !Locks::thread_list_lock_, !Locks::trace_lock_); |
| // Abort tracing. This will just stop tracing and *not* write/send the collected data. |
| static void Abort() |
| REQUIRES(!Locks::mutator_lock_, !Locks::thread_list_lock_, !Locks::trace_lock_); |
| static void Shutdown() |
| REQUIRES(!Locks::mutator_lock_, !Locks::thread_list_lock_, !Locks::trace_lock_); |
| |
| static TracingMode GetMethodTracingMode() REQUIRES(!Locks::trace_lock_); |
| |
| // Flush the per-thread buffer. This is called when the thread is about to detach. |
| static void FlushThreadBuffer(Thread* thread) REQUIRES_SHARED(Locks::mutator_lock_) |
| REQUIRES(!Locks::trace_lock_) NO_THREAD_SAFETY_ANALYSIS; |
| |
| void MeasureClockOverhead(); |
| uint32_t GetClockOverheadNanoSeconds(); |
| |
| void CompareAndUpdateStackTrace(Thread* thread, std::vector<ArtMethod*>* stack_trace) |
| REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // InstrumentationListener implementation. |
| void MethodEntered(Thread* thread, ArtMethod* method) |
| REQUIRES_SHARED(Locks::mutator_lock_) override; |
| void MethodExited(Thread* thread, |
| ArtMethod* method, |
| instrumentation::OptionalFrame frame, |
| JValue& return_value) REQUIRES_SHARED(Locks::mutator_lock_) override; |
| void MethodUnwind(Thread* thread, ArtMethod* method, uint32_t dex_pc) |
| REQUIRES_SHARED(Locks::mutator_lock_) override; |
| void DexPcMoved(Thread* thread, |
| Handle<mirror::Object> this_object, |
| ArtMethod* method, |
| uint32_t new_dex_pc) REQUIRES_SHARED(Locks::mutator_lock_) override; |
| void FieldRead(Thread* thread, |
| Handle<mirror::Object> this_object, |
| ArtMethod* method, |
| uint32_t dex_pc, |
| ArtField* field) REQUIRES_SHARED(Locks::mutator_lock_) override; |
| void FieldWritten(Thread* thread, |
| Handle<mirror::Object> this_object, |
| ArtMethod* method, |
| uint32_t dex_pc, |
| ArtField* field, |
| const JValue& field_value) REQUIRES_SHARED(Locks::mutator_lock_) override; |
| void ExceptionThrown(Thread* thread, Handle<mirror::Throwable> exception_object) |
| REQUIRES_SHARED(Locks::mutator_lock_) override; |
| void ExceptionHandled(Thread* thread, Handle<mirror::Throwable> exception_object) |
| REQUIRES_SHARED(Locks::mutator_lock_) override; |
| void Branch(Thread* thread, ArtMethod* method, uint32_t dex_pc, int32_t dex_pc_offset) |
| REQUIRES_SHARED(Locks::mutator_lock_) override; |
| void WatchedFramePop(Thread* thread, const ShadowFrame& frame) |
| REQUIRES_SHARED(Locks::mutator_lock_) override; |
| |
| TraceClockSource GetClockSource() { return clock_source_; } |
| |
| // Reuse an old stack trace if it exists, otherwise allocate a new one. |
| static std::vector<ArtMethod*>* AllocStackTrace(); |
| // Clear and store an old stack trace for later use. |
| static void FreeStackTrace(std::vector<ArtMethod*>* stack_trace); |
| |
| static TraceOutputMode GetOutputMode() REQUIRES(!Locks::trace_lock_); |
| static TraceMode GetMode() REQUIRES(!Locks::trace_lock_); |
| static size_t GetBufferSize() REQUIRES(!Locks::trace_lock_); |
| static int GetFlags() REQUIRES(!Locks::trace_lock_); |
| static int GetIntervalInMillis() REQUIRES(!Locks::trace_lock_); |
| |
| // Used by class linker to prevent class unloading. |
| static bool IsTracingEnabled() REQUIRES(!Locks::trace_lock_); |
| |
| private: |
| Trace(File* trace_file, |
| size_t buffer_size, |
| int flags, |
| TraceOutputMode output_mode, |
| TraceMode trace_mode); |
| |
| // The sampling interval in microseconds is passed as an argument. |
| static void* RunSamplingThread(void* arg) REQUIRES(!Locks::trace_lock_); |
| |
| static void StopTracing(bool flush_entries) |
| REQUIRES(!Locks::mutator_lock_, !Locks::thread_list_lock_, !Locks::trace_lock_) |
| // There is an annoying issue with static functions that create a new object and call into |
| // that object that causes them to not be able to tell that we don't currently hold the lock. |
| // This causes the negative annotations to incorrectly have a false positive. TODO: Figure out |
| // how to annotate this. |
| NO_THREAD_SAFETY_ANALYSIS; |
| |
| void ReadClocks(Thread* thread, uint32_t* thread_clock_diff, uint64_t* timestamp_counter); |
| |
| void LogMethodTraceEvent(Thread* thread, |
| ArtMethod* method, |
| TraceAction action, |
| uint32_t thread_clock_diff, |
| uint64_t timestamp_counter) REQUIRES_SHARED(Locks::mutator_lock_); |
| |
| // Singleton instance of the Trace or null when no method tracing is active. |
| static Trace* volatile the_trace_ GUARDED_BY(Locks::trace_lock_); |
| |
| // The default profiler clock source. |
| static TraceClockSource default_clock_source_; |
| |
| // Sampling thread, non-zero when sampling. |
| static pthread_t sampling_pthread_; |
| |
| // Used to remember an unused stack trace to avoid re-allocation during sampling. |
| static std::unique_ptr<std::vector<ArtMethod*>> temp_stack_trace_; |
| |
| // Flags enabling extra tracing of things such as alloc counts. |
| const int flags_; |
| |
| // The tracing method. |
| const TraceMode trace_mode_; |
| |
| const TraceClockSource clock_source_; |
| |
| // Sampling profiler sampling interval. |
| int interval_us_; |
| |
| // A flag to indicate to the sampling thread whether to stop tracing |
| bool stop_tracing_; |
| |
| std::unique_ptr<TraceWriter> trace_writer_; |
| |
| DISALLOW_COPY_AND_ASSIGN(Trace); |
| }; |
| |
| } // namespace art |
| |
| #endif // ART_RUNTIME_TRACE_H_ |