fuchsia_inspect/
health.rs

1// Copyright 2020 The Fuchsia Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
4
5//! # Health-checking inspect node.
6//!
7//! Health installs a health checking inspect node.  This node reports the current program's health
8//! status in the form of an enumeration string and, in case of an unhealthy status, a free-form
9//! message.
10//!
11//! Possible statuses are as follows:
12//!
13//! - `OK`, the Node is HEALTHY
14//! - `STARTING_UP`, the node is not yet HEALTHY
15//! - `UNHEALTHY`, the node is NOT HEALTHY (the program is required to provide a status message).
16//! - any other value, the node is NOT HEALTHY.
17//!
18//! # Usage
19//!
20//! To use the health checker one must first obtain a `fuchsia_inspect::Node` to add the health
21//! information into. Once that is available, use `fuchsia_inspect::health::Node::new(...)` to
22//! add a standardized health checker.
23//!
24//! # Examples
25//!
26//! ```
27//! use fuchsia_inspect as inspect;
28//! use fuchsia_inspect::health;
29//!
30//! let inspector = /* the inspector of your choice */
31//! let mut root = inspector.root();  // Or perhaps a different Inspect Node of your choice.
32//! let mut health = health::Node::new(root);
33//!
34//! health.set_ok();
35//! // ...
36//! health.set_unhealthy("I am not feeling well."); // Report an error
37//! // ...
38//! health.set_ok(); // The component is healthy again.
39//! ```
40
41use super::{InspectType, Property, StringProperty};
42use injectable_time::TimeSource;
43use std::fmt;
44
45#[cfg(not(target_os = "fuchsia"))]
46use injectable_time::UtcInstant as TimeType;
47
48#[cfg(target_os = "fuchsia")]
49use injectable_time::MonotonicInstant as TimeType;
50
51/// A trait of a standardized health checker.
52///
53/// Contains the methods to set standardized health status.  All standardized health status reporters
54/// must implement this trait.
55pub trait Reporter {
56    /// Sets the health status to `STARTING_UP`.
57    fn set_starting_up(&mut self);
58    /// Sets the health status to `OK`.
59    fn set_ok(&mut self);
60    /// Sets the health status to `UNHEALTHY`.  A `message` that explains why the node is healthy
61    /// MUST be given.
62    fn set_unhealthy(&mut self, message: &str);
63}
64
65// The metric node name, as exposed by the health checker.
66const FUCHSIA_INSPECT_HEALTH: &str = "fuchsia.inspect.Health";
67
68const STATUS_PROPERTY_KEY: &str = "status";
69
70const MESSAGE_PROPERTY_KEY: &str = "message";
71
72/// Predefined statuses, per the Inspect health specification.  Note that the specification
73/// also allows custom string statuses.
74#[derive(Debug, PartialEq, Eq)]
75enum Status {
76    /// The health checker is available, but has not been initialized with program status yet.
77    StartingUp,
78    /// The program reports unhealthy status.  The program MUST provide a status message if reporting
79    /// unhealthy.
80    Unhealthy,
81    /// The program reports healthy operation.  The definition of healthy is up to the program.
82    Ok,
83}
84
85impl fmt::Display for Status {
86    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
87        match self {
88            Status::StartingUp => write!(f, "STARTING_UP"),
89            Status::Unhealthy => write!(f, "UNHEALTHY"),
90            Status::Ok => write!(f, "OK"),
91        }
92    }
93}
94
95/// Contains subsystem health information.  A global instance of Health is used implicitly
96/// if the user calls the functions `init()`, `ok()` and `unhealthy(...)`.
97///
98/// Use as: ```fuchsia_inspect::health::Node``.
99#[derive(Debug)]
100pub struct Node {
101    // The generic inspect node that hosts the health metric.
102    node: super::Node,
103
104    // The health status of the property
105    status: StringProperty,
106
107    // The detailed status message, filled out in case the health status is not OK.
108    message: Option<StringProperty>,
109}
110
111impl InspectType for Node {}
112
113impl Reporter for Node {
114    /// Sets the health status to `STARTING_UP`.
115    fn set_starting_up(&mut self) {
116        self.set_status_enum(Status::StartingUp, None);
117    }
118
119    /// Sets the health status to `OK`.
120    fn set_ok(&mut self) {
121        self.set_status_enum(Status::Ok, None);
122    }
123
124    /// Sets the health status to `UNHEALTHY`.  A `message` that explains why the node is healthy
125    /// MUST be given.
126    fn set_unhealthy(&mut self, message: &str) {
127        self.set_status_enum(Status::Unhealthy, Some(message));
128    }
129}
130
131impl Node {
132    /// Creates a new health checking node as a child of `parent`.  The initial observed state
133    /// is `STARTING_UP`, and remains so until the programs call one of `set_ok` or `set_unhealthy`.
134    pub fn new(parent: &super::Node) -> Self {
135        Self::new_internal(parent, TimeType::new())
136    }
137
138    // Creates a health node using a specified timestamp. Useful for tests.
139    #[cfg(test)]
140    pub fn new_with_timestamp<T: TimeSource>(parent: &super::Node, timestamper: T) -> Self {
141        Self::new_internal(parent, timestamper)
142    }
143
144    fn new_internal<T: TimeSource>(parent: &super::Node, timestamper: T) -> Self {
145        let node = parent.create_child(FUCHSIA_INSPECT_HEALTH);
146        node.record_int("start_timestamp_nanos", timestamper.now());
147        let status = node.create_string(STATUS_PROPERTY_KEY, Status::StartingUp.to_string());
148        let message = None;
149        Node { node, status, message }
150    }
151
152    // Sets the health status from the supplied `status` and `message`.  Panics if setting invalid
153    // status, e.g. setting `UNHEALTHY` without a message.
154    fn set_status_enum(&mut self, status: Status, message: Option<&str>) {
155        assert!(status != Status::Unhealthy || message.is_some(), "UNHEALTHY must have a message.");
156        self.set_status(&status.to_string(), message);
157    }
158
159    // Sets an arbitrary status and an arbitrary (optional) message into the health report.
160    // Prefer setting standard status using one of the predefined API methods.  This one will
161    // allow you to set whatever you want.
162    fn set_status(&mut self, status: &str, message: Option<&str>) {
163        self.status.set(status);
164        match (&self.message, message) {
165            (_, None) => self.message = None,
166            (Some(m), Some(n)) => m.set(n),
167            (None, Some(n)) => {
168                self.message = Some(self.node.create_string(MESSAGE_PROPERTY_KEY, n))
169            }
170        }
171    }
172}
173
174#[cfg(test)]
175mod tests {
176    use super::*;
177    use crate::Inspector;
178    use diagnostics_assertions::assert_data_tree;
179    use injectable_time::FakeTime;
180
181    #[fuchsia::test]
182    fn health_checker_lifecycle() {
183        let inspector = Inspector::default();
184        let root = inspector.root();
185        // In the beginning, the inspector has no stats.
186        assert_data_tree!(inspector, root: contains {});
187
188        let fake_time = FakeTime::new();
189        fake_time.set_ticks(42);
190        let mut health = Node::new_with_timestamp(root, fake_time);
191        assert_data_tree!(inspector,
192        root: contains {
193            "fuchsia.inspect.Health": {
194                status: "STARTING_UP",
195                start_timestamp_nanos: 42i64,
196            }
197        });
198
199        health.set_ok();
200        assert_data_tree!(inspector,
201        root: contains {
202            "fuchsia.inspect.Health": {
203                status: "OK",
204                start_timestamp_nanos: 42i64,
205            }
206        });
207
208        health.set_unhealthy("Bad state");
209        assert_data_tree!(inspector,
210        root: contains {
211            "fuchsia.inspect.Health": {
212                status: "UNHEALTHY",
213                message: "Bad state",
214                start_timestamp_nanos: 42i64,
215            }
216        });
217
218        // Verify that the message changes.
219        health.set_unhealthy("Another bad state");
220        assert_data_tree!(inspector,
221        root: contains {
222            "fuchsia.inspect.Health": {
223                status: "UNHEALTHY",
224                message: "Another bad state",
225                start_timestamp_nanos: 42i64,
226            }
227        });
228
229        // Also verifies that there is no more message.
230        health.set_ok();
231        assert_data_tree!(inspector,
232        root: contains {
233            "fuchsia.inspect.Health": {
234                status: "OK",
235                start_timestamp_nanos: 42i64,
236            }
237        });
238
239        // Revert to STARTING_UP, but only for tests.
240        health.set_starting_up();
241        assert_data_tree!(inspector,
242        root: contains {
243            "fuchsia.inspect.Health": {
244                status: "STARTING_UP",
245                start_timestamp_nanos: 42i64,
246            }
247        });
248    }
249
250    #[fuchsia::test]
251    fn health_is_recordable() {
252        let inspector = Inspector::default();
253        let root = inspector.root();
254
255        let fake_time = FakeTime::new();
256        fake_time.set_ticks(42);
257        {
258            let mut health = Node::new_with_timestamp(root, fake_time);
259            health.set_ok();
260            assert_data_tree!(inspector,
261                root: contains {
262                    "fuchsia.inspect.Health": {
263                        status: "OK",
264                        start_timestamp_nanos: 42i64,
265                    }
266            });
267
268            root.record(health);
269        }
270
271        assert_data_tree!(inspector,
272            root: contains {
273                "fuchsia.inspect.Health": {
274                    status: "OK",
275                    start_timestamp_nanos: 42i64,
276                }
277        });
278    }
279}