fuchsia_inspect_contrib/
self_profile.rs1use fuchsia_inspect::{Inspector, Node};
42use fuchsia_sync::Mutex;
43use std::cell::RefCell;
44use std::collections::BTreeMap;
45use std::future::Future;
46use std::panic::Location;
47use std::pin::Pin;
48use std::sync::atomic::{AtomicBool, AtomicI64, AtomicU64, Ordering};
49use std::sync::{Arc, LazyLock};
50use zx::{self as zx, Task as _};
51
52static PROFILING_ENABLED: AtomicBool = AtomicBool::new(false);
53
54static ROOT_PROFILE_DURATION: LazyLock<Arc<ProfileDurationTree>> =
55 LazyLock::new(|| Arc::new(ProfileDurationTree::new(Location::caller())));
56
57thread_local! {
58 static CURRENT_PROFILE_DURATION: RefCell<Arc<ProfileDurationTree>> =
59 RefCell::new(ROOT_PROFILE_DURATION.clone());
60}
61
62#[macro_export]
67macro_rules! profile_duration {
68 ($name:expr) => {
69 let _guard = $crate::ProfileDuration::enter($name);
70 };
71}
72
73pub fn start_self_profiling() {
75 PROFILING_ENABLED.store(true, Ordering::Relaxed);
76}
77
78pub fn stop_self_profiling() {
80 PROFILING_ENABLED.store(false, Ordering::Relaxed);
81}
82
83#[inline]
84fn profiling_enabled() -> bool {
85 PROFILING_ENABLED.load(Ordering::Relaxed)
86}
87
88pub struct ProfileDuration {
90 inner: Option<InnerGuard>,
91}
92
93impl ProfileDuration {
94 pub fn lazy_node_callback(
96 ) -> Pin<Box<dyn Future<Output = Result<Inspector, anyhow::Error>> + Send + 'static>> {
97 Box::pin(async move {
98 let inspector = Inspector::default();
99 ROOT_PROFILE_DURATION.report(inspector.root());
100
101 inspector.root().record_bool("__profile_durations_root", true);
103 Ok(inspector)
104 })
105 }
106
107 #[track_caller]
113 pub fn enter(name: &'static str) -> Self {
114 Self { inner: if profiling_enabled() { Some(InnerGuard::enter(name)) } else { None } }
115 }
116
117 #[track_caller]
120 pub fn pivot(&mut self, name: &'static str) {
121 if profiling_enabled() {
122 drop(self.inner.take());
123 self.inner = Some(InnerGuard::enter(name));
124 }
125 }
126}
127
128struct InnerGuard {
129 start_runtime: zx::TaskRuntimeInfo,
130 start_monotonic_ns: zx::MonotonicInstant,
131 parent_duration: Arc<ProfileDurationTree>,
132}
133
134impl InnerGuard {
135 #[track_caller]
136 fn enter(name: &'static str) -> Self {
137 let start_monotonic_ns = zx::MonotonicInstant::get();
138 let start_runtime = current_thread_runtime();
139
140 let location = Location::caller();
142 let parent_duration = CURRENT_PROFILE_DURATION.with(|current_duration| {
143 let mut current_duration = current_duration.borrow_mut();
144 let child_duration = current_duration.child(name, location);
145 std::mem::replace(&mut *current_duration, child_duration)
146 });
147
148 Self { start_runtime, start_monotonic_ns, parent_duration }
149 }
150}
151
152impl Drop for InnerGuard {
153 fn drop(&mut self) {
154 CURRENT_PROFILE_DURATION.with(|current_duration| {
155 let mut current_duration = current_duration.borrow_mut();
156 let completed_duration =
157 std::mem::replace(&mut *current_duration, self.parent_duration.clone());
158
159 let runtime_delta = current_thread_runtime() - self.start_runtime;
160 let wall_time_delta = zx::MonotonicInstant::get() - self.start_monotonic_ns;
161
162 completed_duration.count.fetch_add(1, Ordering::Relaxed);
163 completed_duration.wall_time.fetch_add(wall_time_delta.into_nanos(), Ordering::Relaxed);
164 completed_duration.cpu_time.fetch_add(runtime_delta.cpu_time, Ordering::Relaxed);
165 completed_duration.queue_time.fetch_add(runtime_delta.queue_time, Ordering::Relaxed);
166 completed_duration
167 .page_fault_time
168 .fetch_add(runtime_delta.page_fault_time, Ordering::Relaxed);
169 completed_duration
170 .lock_contention_time
171 .fetch_add(runtime_delta.lock_contention_time, Ordering::Relaxed);
172 });
173 }
174}
175
176#[derive(Debug)]
177struct ProfileDurationTree {
178 location: &'static Location<'static>,
179 count: AtomicU64,
180 wall_time: AtomicI64,
181 cpu_time: AtomicI64,
182 queue_time: AtomicI64,
183 page_fault_time: AtomicI64,
184 lock_contention_time: AtomicI64,
185 children: Mutex<BTreeMap<&'static str, Arc<Self>>>,
186}
187
188impl ProfileDurationTree {
189 fn new(location: &'static Location<'static>) -> Self {
190 Self {
191 location,
192 count: Default::default(),
193 wall_time: Default::default(),
194 cpu_time: Default::default(),
195 queue_time: Default::default(),
196 page_fault_time: Default::default(),
197 lock_contention_time: Default::default(),
198 children: Default::default(),
199 }
200 }
201
202 fn child(&self, name: &'static str, location: &'static Location<'static>) -> Arc<Self> {
203 self.children.lock().entry(name).or_insert_with(|| Arc::new(Self::new(location))).clone()
204 }
205
206 fn report(&self, node: &Node) {
207 let children = self.children.lock();
208 node.record_string("location", self.location.to_string());
209 node.record_uint("count", self.count.load(Ordering::Relaxed));
210 node.record_int("wall_time", self.wall_time.load(Ordering::Relaxed));
211 node.record_int("cpu_time", self.cpu_time.load(Ordering::Relaxed));
212 node.record_int("queue_time", self.queue_time.load(Ordering::Relaxed));
213 node.record_int("page_fault_time", self.page_fault_time.load(Ordering::Relaxed));
214 node.record_int("lock_contention_time", self.lock_contention_time.load(Ordering::Relaxed));
215 for (name, child) in children.iter() {
216 node.record_child(*name, |n| child.report(n));
217 }
218 }
219}
220
221fn current_thread_runtime() -> zx::TaskRuntimeInfo {
222 fuchsia_runtime::thread_self()
223 .get_runtime_info()
224 .expect("should always be able to read own thread's runtime info")
225}