| //===-- xray_profile_collector.h -------------------------------*- C++ -*-===// |
| // |
| // The LLVM Compiler Infrastructure |
| // |
| // This file is distributed under the University of Illinois Open Source |
| // License. See LICENSE.TXT for details. |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // This file is a part of XRay, a dynamic runtime instrumentation system. |
| // |
| // This file defines the interface for a data collection service, for XRay |
| // profiling. What we implement here is an in-process service where |
| // FunctionCallTrie instances can be handed off by threads, to be |
| // consolidated/collected. |
| // |
| //===----------------------------------------------------------------------===// |
| #ifndef XRAY_XRAY_PROFILE_COLLECTOR_H |
| #define XRAY_XRAY_PROFILE_COLLECTOR_H |
| |
| #include "xray_function_call_trie.h" |
| |
| #include "xray/xray_log_interface.h" |
| |
| namespace __xray { |
| |
| /// The ProfileCollectorService implements a centralised mechanism for |
| /// collecting FunctionCallTrie instances, indexed by thread ID. On demand, the |
| /// ProfileCollectorService can be queried for the most recent state of the |
| /// data, in a form that allows traversal. |
| namespace profileCollectorService { |
| |
| /// Posts the FunctionCallTrie associated with a specific Thread ID. This |
| /// will: |
| /// |
| /// - Make a copy of the FunctionCallTrie and store that against the Thread |
| /// ID. This will use the global allocator for the service-managed |
| /// FunctionCallTrie instances. |
| /// - Queue up a pointer to the FunctionCallTrie. |
| /// - If the queue is long enough (longer than some arbitrary threshold) we |
| /// then pre-calculate a single FunctionCallTrie for the whole process. |
| /// |
| /// |
| /// We are making a copy of the FunctionCallTrie because the intent is to have |
| /// this function be called at thread exit, or soon after the profiling |
| /// handler is finalized through the XRay APIs. By letting threads each |
| /// process their own thread-local FunctionCallTrie instances, we're removing |
| /// the need for synchronisation across threads while we're profiling. |
| /// However, once we're done profiling, we can then collect copies of these |
| /// FunctionCallTrie instances and pay the cost of the copy. |
| /// |
| /// NOTE: In the future, if this turns out to be more costly than "moving" the |
| /// FunctionCallTrie instances from the owning thread to the collector |
| /// service, then we can change the implementation to do it this way (moving) |
| /// instead. |
| void post(const FunctionCallTrie &T, tid_t TId); |
| |
| /// The serialize will process all FunctionCallTrie instances in memory, and |
| /// turn those into specifically formatted blocks, each describing the |
| /// function call trie's contents in a compact form. In memory, this looks |
| /// like the following layout: |
| /// |
| /// - block size (32 bits) |
| /// - block number (32 bits) |
| /// - thread id (64 bits) |
| /// - list of records: |
| /// - function ids in leaf to root order, terminated by |
| /// 0 (32 bits per function id) |
| /// - call count (64 bit) |
| /// - cumulative local time (64 bit) |
| /// - record delimiter (64 bit, 0x0) |
| /// |
| void serialize(); |
| |
| /// The reset function will clear out any internal memory held by the |
| /// service. The intent is to have the resetting be done in calls to the |
| /// initialization routine, or explicitly through the flush log API. |
| void reset(); |
| |
| /// This nextBuffer function is meant to implement the iterator functionality, |
| /// provided in the XRay API. |
| XRayBuffer nextBuffer(XRayBuffer B); |
| |
| } // namespace profileCollectorService |
| |
| } // namespace __xray |
| |
| #endif // XRAY_XRAY_PROFILE_COLLECTOR_H |