use crate::task_metrics::constants::{COMPONENT_CPU_MAX_SAMPLES, CPU_SAMPLE_PERIOD};
use crate::task_metrics::measurement::{Measurement, MeasurementsQueue};
use crate::task_metrics::runtime_stats_source::RuntimeStatsSource;
use fuchsia_async as fasync;
use fuchsia_inspect::{self as inspect, HistogramProperty, UintLinearHistogramProperty};
use futures::future::BoxFuture;
use futures::lock::Mutex;
use futures::FutureExt;
use injectable_time::TimeSource;
use log::debug;
use moniker::ExtendedMoniker;
use std::fmt::Debug;
use std::sync::{Arc, Weak};
use zx::sys::{self as zx_sys, zx_system_get_num_cpus};
pub(crate) fn create_cpu_histogram(
node: &inspect::Node,
moniker: &ExtendedMoniker,
) -> inspect::UintLinearHistogramProperty {
node.create_uint_linear_histogram(
moniker.to_string(),
inspect::LinearHistogramParams { floor: 1, step_size: 1, buckets: 99 },
)
}
fn num_cpus() -> i64 {
(unsafe { zx_system_get_num_cpus() }) as i64
}
#[derive(Debug)]
pub(crate) enum TaskState<T: RuntimeStatsSource + Debug> {
TerminatedAndMeasured,
Terminated(T),
Alive(T),
}
impl<T> From<T> for TaskState<T>
where
T: RuntimeStatsSource + Debug,
{
fn from(task: T) -> TaskState<T> {
TaskState::Alive(task)
}
}
#[derive(Debug)]
pub struct TaskInfo<T: RuntimeStatsSource + Debug> {
koid: zx_sys::zx_koid_t,
pub(crate) task: Arc<Mutex<TaskState<T>>>,
pub(crate) time_source: Arc<dyn TimeSource + Sync + Send>,
pub(crate) has_parent_task: bool,
pub(crate) measurements: MeasurementsQueue,
exited_cpu: Option<Measurement>,
histogram: Option<UintLinearHistogramProperty>,
previous_cpu: zx::MonotonicDuration,
previous_histogram_timestamp: i64,
cpu_cores: i64,
sample_period: std::time::Duration,
children: Vec<Weak<Mutex<TaskInfo<T>>>>,
_terminated_task: fasync::Task<()>,
pub(crate) most_recent_measurement_nanos: Arc<Mutex<Option<i64>>>,
}
impl<T: 'static + RuntimeStatsSource + Debug + Send + Sync> TaskInfo<T> {
pub fn try_from(
task: T,
histogram: Option<UintLinearHistogramProperty>,
time_source: Arc<dyn TimeSource + Sync + Send>,
) -> Result<Self, zx::Status> {
Self::try_from_internal(task, histogram, time_source, CPU_SAMPLE_PERIOD, num_cpus())
}
}
impl<T: 'static + RuntimeStatsSource + Debug + Send + Sync> TaskInfo<T> {
fn try_from_internal(
task: T,
histogram: Option<UintLinearHistogramProperty>,
time_source: Arc<dyn TimeSource + Sync + Send>,
sample_period: std::time::Duration,
cpu_cores: i64,
) -> Result<Self, zx::Status> {
let koid = task.koid()?;
let maybe_handle = task.handle_ref().duplicate(zx::Rights::SAME_RIGHTS).ok();
let task_state = Arc::new(Mutex::new(TaskState::from(task)));
let weak_task_state = Arc::downgrade(&task_state);
let most_recent_measurement_nanos = Arc::new(Mutex::new(None));
let movable_most_recent_measurement_nanos = most_recent_measurement_nanos.clone();
let movable_time_source = time_source.clone();
let _terminated_task = fasync::Task::spawn(async move {
if let Some(handle) = maybe_handle {
fasync::OnSignals::new(&handle, zx::Signals::TASK_TERMINATED)
.await
.map(|_: fidl::Signals| ()) .unwrap_or_else(|error| debug!(error:%; "error creating signal handler"));
}
if let Some(task_state) = weak_task_state.upgrade() {
let mut terminated_at_nanos_guard =
movable_most_recent_measurement_nanos.lock().await;
*terminated_at_nanos_guard = Some(movable_time_source.now());
let mut state = task_state.lock().await;
*state = match std::mem::replace(&mut *state, TaskState::TerminatedAndMeasured) {
s @ TaskState::TerminatedAndMeasured => s,
TaskState::Alive(t) => TaskState::Terminated(t),
s @ TaskState::Terminated(_) => s,
};
}
});
Ok(Self {
koid,
task: task_state,
has_parent_task: false,
measurements: MeasurementsQueue::new(COMPONENT_CPU_MAX_SAMPLES, time_source.clone()),
children: vec![],
cpu_cores,
sample_period,
histogram,
previous_cpu: zx::MonotonicDuration::from_nanos(0),
previous_histogram_timestamp: time_source.now(),
time_source,
_terminated_task,
most_recent_measurement_nanos,
exited_cpu: None,
})
}
pub async fn measure_if_no_parent(&mut self) -> Option<&Measurement> {
if self.has_parent_task {
return None;
}
self.measure_subtree().await
}
pub fn add_child(&mut self, task: Weak<Mutex<TaskInfo<T>>>) {
self.children.push(task);
}
pub async fn most_recent_measurement(&self) -> Option<zx::BootInstant> {
self.most_recent_measurement_nanos.lock().await.map(|t| zx::BootInstant::from_nanos(t))
}
pub async fn take_measurements_queue(&mut self) -> Result<MeasurementsQueue, ()> {
match &*self.task.lock().await {
TaskState::TerminatedAndMeasured | TaskState::Terminated(_) => Ok(std::mem::replace(
&mut self.measurements,
MeasurementsQueue::new(COMPONENT_CPU_MAX_SAMPLES, self.time_source.clone()),
)),
_ => Err(()),
}
}
pub fn record_measurement_with_start_time(&mut self, t: zx::BootInstant) {
self.record_measurement(Measurement::empty(t));
}
fn record_measurement(&mut self, m: Measurement) {
let current_cpu = *m.cpu_time();
self.add_to_histogram(current_cpu - self.previous_cpu, *m.timestamp());
self.previous_cpu = current_cpu;
self.measurements.insert(m);
}
fn measure_subtree<'a>(&'a mut self) -> BoxFuture<'a, Option<&'a Measurement>> {
async move {
let (task_terminated_can_measure, runtime_info_res) = {
let mut guard = self.task.lock().await;
match &*guard {
TaskState::TerminatedAndMeasured => {
self.measurements.insert_post_invalidation();
return None;
}
TaskState::Terminated(task) => {
let result = task.get_runtime_info().await;
*guard = TaskState::TerminatedAndMeasured;
let mut terminated_at_nanos_guard =
self.most_recent_measurement_nanos.lock().await;
*terminated_at_nanos_guard = Some(self.time_source.now());
(true, result)
}
TaskState::Alive(task) => (false, task.get_runtime_info().await),
}
};
if let Ok(runtime_info) = runtime_info_res {
let mut measurement = Measurement::from_runtime_info(
runtime_info,
zx::BootInstant::from_nanos(self.time_source.now()),
);
let mut alive_children = vec![];
while let Some(weak_child) = self.children.pop() {
if let Some(child) = weak_child.upgrade() {
let mut child_guard = child.lock().await;
if let Some(child_measurement) = child_guard.measure_subtree().await {
measurement -= child_measurement;
}
if child_guard.is_alive().await {
alive_children.push(weak_child);
}
}
}
self.children = alive_children;
self.record_measurement(measurement);
if task_terminated_can_measure {
self.exited_cpu = self.measurements.most_recent_measurement().cloned();
return None;
}
return self.measurements.most_recent_measurement();
}
None
}
.boxed()
}
fn add_to_histogram(
&mut self,
cpu_time_delta: zx::MonotonicDuration,
timestamp: zx::BootInstant,
) {
if let Some(histogram) = &self.histogram {
let time_value: i64 = timestamp.into_nanos();
let elapsed_time = time_value - self.previous_histogram_timestamp;
self.previous_histogram_timestamp = time_value;
if elapsed_time < ((self.sample_period.as_nanos() as i64) * 9 / 10) {
return;
}
let available_core_time = elapsed_time * self.cpu_cores;
if available_core_time != 0 {
let cpu_numerator =
(cpu_time_delta.into_nanos() as i64) * 100 + available_core_time - 1;
histogram.insert((cpu_numerator / available_core_time) as u64);
}
}
}
pub async fn is_alive(&self) -> bool {
let task_state_terminated_and_measured =
matches!(*self.task.lock().await, TaskState::TerminatedAndMeasured);
let task_has_real_measurements = !self.measurements.no_true_measurements();
!task_state_terminated_and_measured || task_has_real_measurements
}
pub async fn exited_cpu(&self) -> Option<&Measurement> {
self.exited_cpu.as_ref()
}
pub fn record_to_node(&self, parent: &inspect::Node) {
let node = parent.create_child(self.koid.to_string());
self.measurements.record_to_node(&node);
parent.record(node);
}
pub fn koid(&self) -> zx_sys::zx_koid_t {
self.koid
}
#[cfg(test)]
pub fn total_measurements(&self) -> usize {
self.measurements.true_measurement_count()
}
}
#[cfg(test)]
mod tests {
use super::*;
use crate::task_metrics::testing::FakeTask;
use assert_matches::assert_matches;
use diagnostics_assertions::assert_data_tree;
use diagnostics_hierarchy::{ArrayContent, DiagnosticsHierarchyGetter, LinearHistogram};
use injectable_time::FakeTime;
async fn take_measurement_then_tick_clock<
'a,
T: 'static + RuntimeStatsSource + Debug + Send + Sync,
>(
ti: &'a mut TaskInfo<T>,
clock: &Arc<FakeTime>,
) -> Option<&'a Measurement> {
let m = ti.measure_if_no_parent().await;
clock.add_ticks(CPU_SAMPLE_PERIOD.as_nanos() as i64);
m
}
#[fuchsia::test]
async fn rotates_measurements_per_task() {
let clock = Arc::new(FakeTime::new());
let mut task: TaskInfo<FakeTask> =
TaskInfo::try_from(FakeTask::default(), None , clock.clone()).unwrap();
assert!(task.is_alive().await);
take_measurement_then_tick_clock(&mut task, &clock).await;
assert_eq!(task.measurements.true_measurement_count(), 1);
take_measurement_then_tick_clock(&mut task, &clock).await;
assert_eq!(task.measurements.true_measurement_count(), 2);
take_measurement_then_tick_clock(&mut task, &clock).await;
assert!(task.is_alive().await);
assert_eq!(task.measurements.true_measurement_count(), 3);
task.force_terminate().await;
take_measurement_then_tick_clock(&mut task, &clock).await;
assert_eq!(task.measurements.true_measurement_count(), 4);
assert_matches!(*task.task.lock().await, TaskState::TerminatedAndMeasured);
for _ in 4..COMPONENT_CPU_MAX_SAMPLES {
take_measurement_then_tick_clock(&mut task, &clock).await;
assert_eq!(task.measurements.true_measurement_count(), 4);
}
take_measurement_then_tick_clock(&mut task, &clock).await; assert!(task.is_alive().await);
assert_eq!(task.measurements.true_measurement_count(), 3);
take_measurement_then_tick_clock(&mut task, &clock).await; assert!(task.is_alive().await);
assert_eq!(task.measurements.true_measurement_count(), 2);
take_measurement_then_tick_clock(&mut task, &clock).await; assert!(task.is_alive().await);
assert_eq!(task.measurements.true_measurement_count(), 1);
take_measurement_then_tick_clock(&mut task, &clock).await; assert!(!task.is_alive().await);
assert_eq!(task.measurements.true_measurement_count(), 0);
}
#[fuchsia::test]
async fn write_inspect() {
let time = Arc::new(FakeTime::new());
let mut task = TaskInfo::try_from(
FakeTask::new(
1,
vec![
zx::TaskRuntimeInfo {
cpu_time: 2,
queue_time: 4,
..zx::TaskRuntimeInfo::default()
},
zx::TaskRuntimeInfo {
cpu_time: 6,
queue_time: 8,
..zx::TaskRuntimeInfo::default()
},
],
),
None, time.clone(),
)
.unwrap();
time.set_ticks(1);
task.measure_if_no_parent().await;
time.set_ticks(2);
task.measure_if_no_parent().await;
let inspector = inspect::Inspector::default();
task.record_to_node(inspector.root());
assert_data_tree!(inspector, root: {
"1": {
timestamps: vec![1i64, 2],
cpu_times: vec![2i64, 6],
queue_times: vec![4i64, 8],
}
});
}
#[fuchsia::test]
async fn write_more_than_max_samples() {
let inspector = inspect::Inspector::default();
let clock = Arc::new(FakeTime::new());
let mut task = TaskInfo::try_from(
FakeTask::new(
1,
vec![
zx::TaskRuntimeInfo {
cpu_time: 2,
queue_time: 4,
..zx::TaskRuntimeInfo::default()
},
zx::TaskRuntimeInfo {
cpu_time: 6,
queue_time: 8,
..zx::TaskRuntimeInfo::default()
},
],
),
None, clock.clone(),
)
.unwrap();
for _ in 0..(COMPONENT_CPU_MAX_SAMPLES + 10) {
assert!(take_measurement_then_tick_clock(&mut task, &clock).await.is_some());
}
assert_eq!(task.measurements.true_measurement_count(), COMPONENT_CPU_MAX_SAMPLES);
task.record_to_node(inspector.root());
assert_eq!(60, COMPONENT_CPU_MAX_SAMPLES);
assert_eq!(task.measurements.true_measurement_count(), 60);
let hierarchy = inspector.get_diagnostics_hierarchy();
for top_level in &hierarchy.children {
let child = hierarchy.get_child(&top_level.name).unwrap();
let timestamps = child.get_property("timestamps").unwrap().int_array().unwrap();
assert_eq!(timestamps.len(), COMPONENT_CPU_MAX_SAMPLES);
let cpu_times = child.get_property("cpu_times").unwrap().int_array().unwrap();
assert_eq!(cpu_times.len(), COMPONENT_CPU_MAX_SAMPLES);
let queue_times = child.get_property("queue_times").unwrap().int_array().unwrap();
assert_eq!(queue_times.len(), COMPONENT_CPU_MAX_SAMPLES);
}
}
#[fuchsia::test]
async fn more_than_max_samples_offset_time() {
let inspector = inspect::Inspector::default();
let clock = Arc::new(FakeTime::new());
let mut task = TaskInfo::try_from(
FakeTask::new(
1,
vec![
zx::TaskRuntimeInfo {
cpu_time: 2,
queue_time: 4,
..zx::TaskRuntimeInfo::default()
},
zx::TaskRuntimeInfo {
cpu_time: 6,
queue_time: 8,
..zx::TaskRuntimeInfo::default()
},
],
),
None, clock.clone(),
)
.unwrap();
for _ in 0..COMPONENT_CPU_MAX_SAMPLES {
assert!(take_measurement_then_tick_clock(&mut task, &clock).await.is_some());
}
task.measure_if_no_parent().await;
clock.add_ticks((CPU_SAMPLE_PERIOD - std::time::Duration::from_secs(1)).as_nanos() as i64);
task.measure_if_no_parent().await;
assert_eq!(task.measurements.true_measurement_count(), COMPONENT_CPU_MAX_SAMPLES);
task.record_to_node(inspector.root());
}
#[fuchsia::test]
async fn measure_with_children() {
let clock = Arc::new(FakeTime::new());
let mut task = TaskInfo::try_from(
FakeTask::new(
1,
vec![
zx::TaskRuntimeInfo {
cpu_time: 100,
queue_time: 200,
..zx::TaskRuntimeInfo::default()
},
zx::TaskRuntimeInfo {
cpu_time: 300,
queue_time: 400,
..zx::TaskRuntimeInfo::default()
},
],
),
None, clock.clone(),
)
.unwrap();
let child_1 = Arc::new(Mutex::new(
TaskInfo::try_from(
FakeTask::new(
2,
vec![
zx::TaskRuntimeInfo {
cpu_time: 10,
queue_time: 20,
..zx::TaskRuntimeInfo::default()
},
zx::TaskRuntimeInfo {
cpu_time: 30,
queue_time: 40,
..zx::TaskRuntimeInfo::default()
},
],
),
None, clock.clone(),
)
.unwrap(),
));
let child_2 = Arc::new(Mutex::new(
TaskInfo::try_from(
FakeTask::new(
3,
vec![
zx::TaskRuntimeInfo {
cpu_time: 5,
queue_time: 2,
..zx::TaskRuntimeInfo::default()
},
zx::TaskRuntimeInfo {
cpu_time: 15,
queue_time: 4,
..zx::TaskRuntimeInfo::default()
},
],
),
None, clock.clone(),
)
.unwrap(),
));
task.add_child(Arc::downgrade(&child_1));
task.add_child(Arc::downgrade(&child_2));
{
let measurement = take_measurement_then_tick_clock(&mut task, &clock).await.unwrap();
assert_eq!(measurement.cpu_time().into_nanos(), 100 - 10 - 5);
assert_eq!(measurement.queue_time().into_nanos(), 200 - 20 - 2);
}
assert_eq!(child_1.lock().await.total_measurements(), 1);
assert_eq!(child_2.lock().await.total_measurements(), 1);
{
let mut child_2_guard = child_2.lock().await;
child_2_guard.task = Arc::new(Mutex::new(TaskState::TerminatedAndMeasured));
child_2_guard.measurements =
MeasurementsQueue::new(COMPONENT_CPU_MAX_SAMPLES, clock.clone());
}
assert_eq!(task.children.len(), 2);
{
let measurement = take_measurement_then_tick_clock(&mut task, &clock).await.unwrap();
assert_eq!(measurement.cpu_time().into_nanos(), 300 - 30);
assert_eq!(measurement.queue_time().into_nanos(), 400 - 40);
}
assert_eq!(task.children.len(), 1); assert_eq!(child_1.lock().await.total_measurements(), 2);
}
type BucketPairs = Vec<(i64, i64)>;
use diagnostics_hierarchy::Property;
fn linear_histogram_non_zero_values(inspector: &inspect::Inspector) -> BucketPairs {
let mut output = vec![];
let hierarchy = inspector.get_diagnostics_hierarchy();
let histogram = hierarchy.get_property_by_path(&["foo"]).unwrap();
if let Property::UintArray(_, data) = histogram {
if let ArrayContent::LinearHistogram(LinearHistogram { counts, indexes, .. }) = data {
match indexes {
None => {
for (index, count) in counts.iter().enumerate() {
if *count > 0 && *count <= i64::MAX as u64 {
output.push((index as i64, *count as i64));
}
}
}
Some(indexes) => {
for (index, count) in indexes.iter().zip(counts.iter()) {
if *count > 0
&& *count <= i64::MAX as u64
&& *index <= i64::MAX as usize
{
output.push((*index as i64, *count as i64));
}
}
}
}
}
}
output
}
fn fake_readings(id: u64, cpu_deltas: Vec<u64>) -> FakeTask {
let mut cpu_time = 0i64;
let mut readings = vec![];
for delta in cpu_deltas.iter() {
cpu_time += *delta as i64;
readings.push(zx::TaskRuntimeInfo { cpu_time, ..zx::TaskRuntimeInfo::default() })
}
FakeTask::new(id, readings)
}
#[fuchsia::test]
async fn bucket_cutoffs() {
let readings = fake_readings(1, vec![1, 0, 500, 989, 990, 991, 999, 0]);
let inspector = inspect::Inspector::default();
let clock = FakeTime::new();
let histogram =
create_cpu_histogram(&inspector.root(), &ExtendedMoniker::parse_str("foo").unwrap());
let mut task = TaskInfo::try_from_internal(
readings,
Some(histogram),
Arc::new(clock.clone()),
std::time::Duration::from_nanos(1000),
1, )
.unwrap();
clock.add_ticks(1000);
task.measure_if_no_parent().await; let answer = vec![(1, 1)];
assert_eq!(linear_histogram_non_zero_values(&inspector), answer);
clock.add_ticks(1000);
task.measure_if_no_parent().await; let answer = vec![(0, 1), (1, 1)];
assert_eq!(linear_histogram_non_zero_values(&inspector), answer);
clock.add_ticks(1000);
task.measure_if_no_parent().await; let answer = vec![(0, 1), (1, 1), (50, 1)];
assert_eq!(linear_histogram_non_zero_values(&inspector), answer);
clock.add_ticks(1000);
task.measure_if_no_parent().await; let answer = vec![(0, 1), (1, 1), (50, 1), (99, 1)];
assert_eq!(linear_histogram_non_zero_values(&inspector), answer);
clock.add_ticks(1000);
task.measure_if_no_parent().await; let answer = vec![(0, 1), (1, 1), (50, 1), (99, 2)];
assert_eq!(linear_histogram_non_zero_values(&inspector), answer);
clock.add_ticks(1000);
task.measure_if_no_parent().await; let answer = vec![(0, 1), (1, 1), (50, 1), (99, 2), (100, 1)];
assert_eq!(linear_histogram_non_zero_values(&inspector), answer);
clock.add_ticks(1000);
task.measure_if_no_parent().await; let answer = vec![(0, 1), (1, 1), (50, 1), (99, 2), (100, 2)];
assert_eq!(linear_histogram_non_zero_values(&inspector), answer);
clock.add_ticks(1000);
task.measure_if_no_parent().await; let answer = vec![(0, 2), (1, 1), (50, 1), (99, 2), (100, 2)];
assert_eq!(linear_histogram_non_zero_values(&inspector), answer);
}
#[fuchsia::test]
async fn discard_short_intervals() {
let readings = fake_readings(1, vec![100, 100, 100, 100]);
let inspector = inspect::Inspector::default();
let clock = FakeTime::new();
let histogram =
create_cpu_histogram(&inspector.root(), &ExtendedMoniker::parse_str("foo").unwrap());
let mut task = TaskInfo::try_from_internal(
readings,
Some(histogram),
Arc::new(clock.clone()),
std::time::Duration::from_nanos(1000),
1, )
.unwrap();
assert_eq!(linear_histogram_non_zero_values(&inspector), vec![]);
clock.add_ticks(900);
task.measure_if_no_parent().await;
assert_eq!(linear_histogram_non_zero_values(&inspector), vec![(12, 1)]);
clock.add_ticks(899);
task.measure_if_no_parent().await;
assert_eq!(linear_histogram_non_zero_values(&inspector), vec![(12, 1)]); clock.add_ticks(2000);
task.measure_if_no_parent().await;
assert_eq!(linear_histogram_non_zero_values(&inspector), (vec![(5, 1), (12, 1)]));
clock.add_ticks(1000);
task.measure_if_no_parent().await;
assert_eq!(linear_histogram_non_zero_values(&inspector), (vec![(5, 1), (10, 1), (12, 1)]));
}
#[fuchsia::test]
async fn divide_by_cores() {
let readings = fake_readings(1, vec![400]);
let inspector = inspect::Inspector::default();
let clock = FakeTime::new();
let histogram =
create_cpu_histogram(&inspector.root(), &ExtendedMoniker::parse_str("foo").unwrap());
let mut task = TaskInfo::try_from_internal(
readings,
Some(histogram),
Arc::new(clock.clone()),
std::time::Duration::from_nanos(1000),
4, )
.unwrap();
assert_eq!(linear_histogram_non_zero_values(&inspector), vec![]);
clock.add_ticks(1000);
task.measure_if_no_parent().await;
assert_eq!(linear_histogram_non_zero_values(&inspector), vec![(10, 1)]);
}
}