stats: per-agent /stats page with chart.js trends + breakdowns

new hive-ag3nt::stats module reads turn_stats.sqlite read-only and aggregates over 24h/7d/30d windows (hourly/daily buckets) — turn rate, p50/p95/avg duration, ctx tokens (avg/max), cost token components, top tools, wake mix, result mix. served by the agent itself so per-MCP extensions can register more providers without the host knowing their schemas. /stats route + /api/stats?window=... on the per-agent web ui. chart.js v4.4.4 pulled from jsdelivr (SRI hash deferred). nav links: 📊 chip on the dashboard container row + 📊 stats → on the per-agent header. todo housekeeping: softened damocles-area note at the top, new reverse-proxy + deferred reminder-rollup items, removed the two telemetry-ui items absorbed by this page.
2026-05-19 00:27:01 +02:00 · 2026-05-19 00:27:01 +02:00 · d3f90f4cc0
commit d3f90f4cc0
parent f9f1346eae
8 changed files with 930 additions and 3 deletions
--- a/hive-ag3nt/src/lib.rs
+++ b/hive-ag3nt/src/lib.rs
@ -8,6 +8,7 @@ pub mod login_session;
 pub mod mcp;
 pub mod paths;
 pub mod plugins;
+pub mod stats;
 pub mod turn;
 pub mod turn_stats;
 pub mod web_ui;
--- a/hive-ag3nt/src/stats.rs
+++ b/hive-ag3nt/src/stats.rs
@ -0,0 +1,500 @@
+//! Read-side aggregations over the per-agent `turn_stats.sqlite` for
+//! the agent's `/stats` web page. Owned by the agent (same process
+//! that writes the sink) so per-MCP extensions can register more
+//! providers without the host needing to know their schemas.
+//!
+//! Best-effort: any sqlite error returns an empty snapshot rather than
+//! propagating — the stats page is decorative, not authoritative, and
+//! a missing db on a brand-new agent shouldn't 500 the route.
+
+use std::collections::HashMap;
+use std::path::{Path, PathBuf};
+
+use anyhow::{Context, Result};
+use rusqlite::{Connection, OpenFlags};
+use serde::Serialize;
+
+/// Window param accepted by `/api/stats?window=`. Each maps to a
+/// total span + the bucket width used to roll up trend series.
+#[derive(Debug, Clone, Copy)]
+pub enum Window {
+    Day,
+    Week,
+    Month,
+}
+
+impl Window {
+    pub fn parse(s: &str) -> Self {
+        match s {
+            "7d" => Self::Week,
+            "30d" => Self::Month,
+            _ => Self::Day,
+        }
+    }
+
+    fn label(self) -> &'static str {
+        match self {
+            Self::Day => "24h",
+            Self::Week => "7d",
+            Self::Month => "30d",
+        }
+    }
+
+    fn span_secs(self) -> i64 {
+        match self {
+            Self::Day => 24 * 3600,
+            Self::Week => 7 * 24 * 3600,
+            Self::Month => 30 * 24 * 3600,
+        }
+    }
+
+    fn bucket_secs(self) -> i64 {
+        match self {
+            // hourly for the 24h view, daily for the longer ranges.
+            Self::Day => 3600,
+            Self::Week | Self::Month => 24 * 3600,
+        }
+    }
+}
+
+#[derive(Debug, Serialize)]
+pub struct Snapshot {
+    pub window: &'static str,
+    pub bucket_seconds: i64,
+    pub now: i64,
+    pub from: i64,
+    /// Total turns in the window.
+    pub turn_count: u64,
+    /// Time-bucketed trend series, oldest first. Always covers the
+    /// full window even for empty buckets (so charts paint a stable
+    /// x-axis instead of skipping gaps).
+    pub buckets: Vec<Bucket>,
+    /// Top tools by call count across the window. Capped to 10.
+    pub tool_breakdown: Vec<KeyCount>,
+    pub wake_mix: Vec<KeyCount>,
+    pub result_mix: Vec<KeyCount>,
+    /// Across-window p50 / p95 / avg of `duration_ms`. Same numbers
+    /// as the per-bucket fields but aggregated over the whole window
+    /// for the headline summary chips.
+    pub duration_summary: DurationSummary,
+}
+
+#[derive(Debug, Serialize)]
+pub struct Bucket {
+    /// Unix timestamp of the bucket start.
+    pub ts: i64,
+    pub turn_count: u64,
+    pub avg_duration_ms: f64,
+    pub p50_duration_ms: f64,
+    pub p95_duration_ms: f64,
+    /// Sums across the bucket. JS picks how to combine them
+    /// (input + output for cost, etc.) so we don't bake a policy in.
+    pub input_tokens: u64,
+    pub output_tokens: u64,
+    pub cache_read_input_tokens: u64,
+    pub cache_creation_input_tokens: u64,
+    /// Mean of `last_input_tokens` across the bucket (the context
+    /// size at turn-end — useful for spotting drift toward compaction).
+    pub avg_ctx_tokens: f64,
+    pub max_ctx_tokens: u64,
+}
+
+#[derive(Debug, Serialize)]
+pub struct KeyCount {
+    pub key: String,
+    pub count: u64,
+}
+
+#[derive(Debug, Default, Serialize)]
+pub struct DurationSummary {
+    pub avg_ms: f64,
+    pub p50_ms: f64,
+    pub p95_ms: f64,
+}
+
+#[must_use]
+pub fn snapshot_default(window: Window) -> Snapshot {
+    let path = default_path();
+    match snapshot(&path, window) {
+        Ok(s) => s,
+        Err(e) => {
+            tracing::warn!(error = ?e, path = %path.display(), "stats: snapshot failed");
+            empty_snapshot(window)
+        }
+    }
+}
+
+fn default_path() -> PathBuf {
+    crate::paths::state_dir().join("hyperhive-turn-stats.sqlite")
+}
+
+fn empty_snapshot(window: Window) -> Snapshot {
+    let now = now_secs();
+    let from = now - window.span_secs();
+    let buckets = fill_buckets(from, now, window.bucket_secs(), &HashMap::new());
+    Snapshot {
+        window: window.label(),
+        bucket_seconds: window.bucket_secs(),
+        now,
+        from,
+        turn_count: 0,
+        buckets,
+        tool_breakdown: Vec::new(),
+        wake_mix: Vec::new(),
+        result_mix: Vec::new(),
+        duration_summary: DurationSummary::default(),
+    }
+}
+
+fn snapshot(path: &Path, window: Window) -> Result<Snapshot> {
+    // Read-only open so an in-flight writer (the harness's own
+    // turn_stats sink) never blocks us and we can't corrupt the db
+    // via a query bug.
+    let conn = Connection::open_with_flags(path, OpenFlags::SQLITE_OPEN_READ_ONLY)
+        .with_context(|| format!("open {} read-only", path.display()))?;
+    let now = now_secs();
+    let from = now - window.span_secs();
+    let bucket_secs = window.bucket_secs();
+
+    let mut stmt = conn.prepare(
+        "SELECT started_at, duration_ms,
+                input_tokens, output_tokens,
+                cache_read_input_tokens, cache_creation_input_tokens,
+                last_input_tokens,
+                tool_call_breakdown_json,
+                wake_from, result_kind
+         FROM turn_stats
+         WHERE started_at >= ?1
+         ORDER BY started_at ASC",
+    )?;
+    let rows = stmt.query_map([from], |row| {
+        Ok(Row {
+            started_at: row.get(0)?,
+            duration_ms: row.get::<_, i64>(1)?,
+            input_tokens: u64_from_i64(row.get::<_, i64>(2)?),
+            output_tokens: u64_from_i64(row.get::<_, i64>(3)?),
+            cache_read_input_tokens: u64_from_i64(row.get::<_, i64>(4)?),
+            cache_creation_input_tokens: u64_from_i64(row.get::<_, i64>(5)?),
+            last_input_tokens: u64_from_i64(row.get::<_, i64>(6)?),
+            tool_breakdown_json: row.get::<_, Option<String>>(7)?,
+            wake_from: row.get::<_, String>(8)?,
+            result_kind: row.get::<_, String>(9)?,
+        })
+    })?;
+
+    let mut by_bucket: HashMap<i64, BucketAcc> = HashMap::new();
+    let mut tool_totals: HashMap<String, u64> = HashMap::new();
+    let mut wake_totals: HashMap<String, u64> = HashMap::new();
+    let mut result_totals: HashMap<String, u64> = HashMap::new();
+    let mut all_durations: Vec<i64> = Vec::new();
+    let mut turn_count: u64 = 0;
+
+    for r in rows {
+        let r = r?;
+        turn_count += 1;
+        let bucket_ts = (r.started_at / bucket_secs) * bucket_secs;
+        let acc = by_bucket.entry(bucket_ts).or_default();
+        acc.turn_count += 1;
+        acc.durations.push(r.duration_ms.max(0));
+        acc.input_tokens = acc.input_tokens.saturating_add(r.input_tokens);
+        acc.output_tokens = acc.output_tokens.saturating_add(r.output_tokens);
+        acc.cache_read_input_tokens = acc
+            .cache_read_input_tokens
+            .saturating_add(r.cache_read_input_tokens);
+        acc.cache_creation_input_tokens = acc
+            .cache_creation_input_tokens
+            .saturating_add(r.cache_creation_input_tokens);
+        acc.ctx_sum = acc.ctx_sum.saturating_add(r.last_input_tokens);
+        acc.ctx_max = acc.ctx_max.max(r.last_input_tokens);
+
+        all_durations.push(r.duration_ms.max(0));
+        *wake_totals.entry(r.wake_from).or_insert(0) += 1;
+        *result_totals.entry(r.result_kind).or_insert(0) += 1;
+
+        if let Some(json) = r.tool_breakdown_json
+            && let Ok(map) = serde_json::from_str::<HashMap<String, u64>>(&json)
+        {
+            for (k, v) in map {
+                *tool_totals.entry(k).or_insert(0) += v;
+            }
+        }
+    }
+
+    let buckets = fill_buckets(from, now, bucket_secs, &by_bucket);
+    let duration_summary = summarize_durations(&mut all_durations);
+
+    Ok(Snapshot {
+        window: window.label(),
+        bucket_seconds: bucket_secs,
+        now,
+        from,
+        turn_count,
+        buckets,
+        tool_breakdown: top_n(tool_totals, 10),
+        wake_mix: top_n(wake_totals, 20),
+        result_mix: top_n(result_totals, 20),
+        duration_summary,
+    })
+}
+
+struct Row {
+    started_at: i64,
+    duration_ms: i64,
+    input_tokens: u64,
+    output_tokens: u64,
+    cache_read_input_tokens: u64,
+    cache_creation_input_tokens: u64,
+    last_input_tokens: u64,
+    tool_breakdown_json: Option<String>,
+    wake_from: String,
+    result_kind: String,
+}
+
+#[derive(Default)]
+struct BucketAcc {
+    turn_count: u64,
+    durations: Vec<i64>,
+    input_tokens: u64,
+    output_tokens: u64,
+    cache_read_input_tokens: u64,
+    cache_creation_input_tokens: u64,
+    ctx_sum: u64,
+    ctx_max: u64,
+}
+
+fn fill_buckets(
+    from: i64,
+    now: i64,
+    bucket_secs: i64,
+    by_bucket: &HashMap<i64, BucketAcc>,
+) -> Vec<Bucket> {
+    let start = (from / bucket_secs) * bucket_secs;
+    let mut out = Vec::new();
+    let mut ts = start;
+    while ts <= now {
+        let bucket = if let Some(acc) = by_bucket.get(&ts) {
+            let mut sorted = acc.durations.clone();
+            sorted.sort_unstable();
+            let avg = if sorted.is_empty() {
+                0.0
+            } else {
+                #[allow(clippy::cast_precision_loss)]
+                let sum_f = sorted.iter().sum::<i64>() as f64;
+                #[allow(clippy::cast_precision_loss)]
+                let len_f = sorted.len() as f64;
+                sum_f / len_f
+            };
+            let p50 = percentile(&sorted, 50);
+            let p95 = percentile(&sorted, 95);
+            let avg_ctx = if acc.turn_count == 0 {
+                0.0
+            } else {
+                #[allow(clippy::cast_precision_loss)]
+                let sum_f = acc.ctx_sum as f64;
+                #[allow(clippy::cast_precision_loss)]
+                let cnt_f = acc.turn_count as f64;
+                sum_f / cnt_f
+            };
+            Bucket {
+                ts,
+                turn_count: acc.turn_count,
+                avg_duration_ms: avg,
+                p50_duration_ms: p50,
+                p95_duration_ms: p95,
+                input_tokens: acc.input_tokens,
+                output_tokens: acc.output_tokens,
+                cache_read_input_tokens: acc.cache_read_input_tokens,
+                cache_creation_input_tokens: acc.cache_creation_input_tokens,
+                avg_ctx_tokens: avg_ctx,
+                max_ctx_tokens: acc.ctx_max,
+            }
+        } else {
+            Bucket {
+                ts,
+                turn_count: 0,
+                avg_duration_ms: 0.0,
+                p50_duration_ms: 0.0,
+                p95_duration_ms: 0.0,
+                input_tokens: 0,
+                output_tokens: 0,
+                cache_read_input_tokens: 0,
+                cache_creation_input_tokens: 0,
+                avg_ctx_tokens: 0.0,
+                max_ctx_tokens: 0,
+            }
+        };
+        out.push(bucket);
+        ts += bucket_secs;
+    }
+    out
+}
+
+fn summarize_durations(all: &mut [i64]) -> DurationSummary {
+    if all.is_empty() {
+        return DurationSummary::default();
+    }
+    all.sort_unstable();
+    #[allow(clippy::cast_precision_loss)]
+    let sum_f = all.iter().sum::<i64>() as f64;
+    #[allow(clippy::cast_precision_loss)]
+    let len_f = all.len() as f64;
+    DurationSummary {
+        avg_ms: sum_f / len_f,
+        p50_ms: percentile(all, 50),
+        p95_ms: percentile(all, 95),
+    }
+}
+
+#[allow(clippy::cast_precision_loss, clippy::cast_possible_truncation, clippy::cast_sign_loss)]
+fn percentile(sorted: &[i64], pct: u8) -> f64 {
+    if sorted.is_empty() {
+        return 0.0;
+    }
+    if sorted.len() == 1 {
+        return sorted[0] as f64;
+    }
+    // Nearest-rank, clamped.
+    let rank = ((f64::from(pct) / 100.0) * (sorted.len() as f64 - 1.0)).round() as usize;
+    sorted[rank.min(sorted.len() - 1)] as f64
+}
+
+fn top_n(map: HashMap<String, u64>, n: usize) -> Vec<KeyCount> {
+    let mut v: Vec<KeyCount> = map
+        .into_iter()
+        .map(|(key, count)| KeyCount { key, count })
+        .collect();
+    v.sort_unstable_by(|a, b| b.count.cmp(&a.count).then_with(|| a.key.cmp(&b.key)));
+    v.truncate(n);
+    v
+}
+
+fn u64_from_i64(v: i64) -> u64 {
+    u64::try_from(v).unwrap_or(0)
+}
+
+fn now_secs() -> i64 {
+    std::time::SystemTime::now()
+        .duration_since(std::time::UNIX_EPOCH)
+        .map_or(0, |d| i64::try_from(d.as_secs()).unwrap_or(i64::MAX))
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use rusqlite::params;
+    use std::sync::atomic::{AtomicU32, Ordering};
+
+    static SEQ: AtomicU32 = AtomicU32::new(0);
+
+    fn tmp_db() -> PathBuf {
+        let n = SEQ.fetch_add(1, Ordering::SeqCst);
+        let pid = std::process::id();
+        std::env::temp_dir().join(format!("hyperhive-stats-test-{pid}-{n}.sqlite"))
+    }
+
+    fn seed_db(path: &Path, rows: &[(i64, i64, &str, &str, &str)]) {
+        let conn = Connection::open(path).unwrap();
+        conn.execute_batch(
+            "CREATE TABLE turn_stats (
+                id INTEGER PRIMARY KEY,
+                started_at INTEGER NOT NULL,
+                ended_at INTEGER NOT NULL,
+                duration_ms INTEGER NOT NULL,
+                model TEXT NOT NULL,
+                wake_from TEXT NOT NULL,
+                input_tokens INTEGER NOT NULL DEFAULT 0,
+                output_tokens INTEGER NOT NULL DEFAULT 0,
+                cache_read_input_tokens INTEGER NOT NULL DEFAULT 0,
+                cache_creation_input_tokens INTEGER NOT NULL DEFAULT 0,
+                last_input_tokens INTEGER NOT NULL DEFAULT 0,
+                last_output_tokens INTEGER NOT NULL DEFAULT 0,
+                last_cache_read_input_tokens INTEGER NOT NULL DEFAULT 0,
+                last_cache_creation_input_tokens INTEGER NOT NULL DEFAULT 0,
+                tool_call_count INTEGER NOT NULL DEFAULT 0,
+                tool_call_breakdown_json TEXT,
+                open_threads_count INTEGER,
+                open_reminders_count INTEGER,
+                result_kind TEXT NOT NULL,
+                note TEXT
+            );",
+        )
+        .unwrap();
+        for (started, dur, wake, result, tools_json) in rows {
+            conn.execute(
+                "INSERT INTO turn_stats
+                    (started_at, ended_at, duration_ms, model, wake_from,
+                     last_input_tokens, tool_call_breakdown_json, result_kind)
+                 VALUES (?1, ?2, ?3, 'm', ?4, 1000, ?5, ?6)",
+                params![started, started + dur / 1000, dur, wake, tools_json, result],
+            )
+            .unwrap();
+        }
+    }
+
+    #[test]
+    fn snapshot_aggregates_rows() {
+        let db = tmp_db();
+        let _ = std::fs::remove_file(&db);
+        let now = now_secs();
+        seed_db(
+            &db,
+            &[
+                (now - 600, 5_000, "recv", "ok", r#"{"Read":2,"Bash":1}"#),
+                (now - 300, 10_000, "recv", "ok", r#"{"Read":3}"#),
+                (now - 100, 20_000, "operator", "failed", "{}"),
+            ],
+        );
+        let s = snapshot(&db, Window::Day).unwrap();
+        assert_eq!(s.turn_count, 3);
+        assert_eq!(s.window, "24h");
+        assert_eq!(s.bucket_seconds, 3600);
+        let tool_map: HashMap<_, _> = s
+            .tool_breakdown
+            .iter()
+            .map(|kc| (kc.key.clone(), kc.count))
+            .collect();
+        assert_eq!(tool_map.get("Read").copied(), Some(5));
+        assert_eq!(tool_map.get("Bash").copied(), Some(1));
+        let wake_map: HashMap<_, _> = s
+            .wake_mix
+            .iter()
+            .map(|kc| (kc.key.clone(), kc.count))
+            .collect();
+        assert_eq!(wake_map.get("recv").copied(), Some(2));
+        assert_eq!(wake_map.get("operator").copied(), Some(1));
+        let result_map: HashMap<_, _> = s
+            .result_mix
+            .iter()
+            .map(|kc| (kc.key.clone(), kc.count))
+            .collect();
+        assert_eq!(result_map.get("ok").copied(), Some(2));
+        assert_eq!(result_map.get("failed").copied(), Some(1));
+        // Durations: [5000, 10000, 20000] → avg ≈ 11666.67, p50 = 10000, p95 ~ 20000
+        assert!((s.duration_summary.avg_ms - 11_666.666_666_666_666).abs() < 1.0);
+        assert!((s.duration_summary.p50_ms - 10_000.0).abs() < 1.0);
+        assert!((s.duration_summary.p95_ms - 20_000.0).abs() < 1.0);
+    }
+
+    #[test]
+    fn empty_window_still_paints_buckets() {
+        let db = tmp_db();
+        let _ = std::fs::remove_file(&db);
+        seed_db(&db, &[]);
+        let s = snapshot(&db, Window::Day).unwrap();
+        assert_eq!(s.turn_count, 0);
+        // 24h / 1h buckets = ~24-25 buckets covering the window.
+        assert!(s.buckets.len() >= 24);
+        assert!(s.buckets.iter().all(|b| b.turn_count == 0));
+    }
+
+    #[test]
+    fn week_uses_daily_buckets() {
+        let db = tmp_db();
+        let _ = std::fs::remove_file(&db);
+        seed_db(&db, &[]);
+        let s = snapshot(&db, Window::Week).unwrap();
+        assert_eq!(s.window, "7d");
+        assert_eq!(s.bucket_seconds, 86_400);
+        assert!(s.buckets.len() >= 7);
+    }
+}
--- a/hive-ag3nt/src/web_ui.rs
+++ b/hive-ag3nt/src/web_ui.rs
@ -107,6 +107,9 @@ pub async fn serve(
        .route("/api/model", post(post_set_model))
        .route("/api/new-session", post(post_new_session))
        .route("/api/loose-ends", get(api_loose_ends))
+        .route("/stats", get(serve_stats))
+        .route("/static/stats.js", get(serve_stats_js))
+        .route("/api/stats", get(api_stats))
        .with_state(state);
    let addr = SocketAddr::from(([0, 0, 0, 0], port));
    let listener = bind_with_retry(addr, "web UI").await?;
@ -198,6 +201,33 @@ async fn serve_marked_js() -> impl IntoResponse {
    )
 }

+async fn serve_stats() -> impl IntoResponse {
+    (
+        [("content-type", "text/html; charset=utf-8")],
+        include_str!("../assets/stats.html"),
+    )
+}
+
+async fn serve_stats_js() -> impl IntoResponse {
+    (
+        [("content-type", "application/javascript")],
+        include_str!("../assets/stats.js"),
+    )
+}
+
+#[derive(Deserialize)]
+struct StatsQuery {
+    window: Option<String>,
+}
+
+async fn api_stats(
+    State(_state): State<AppState>,
+    axum::extract::Query(q): axum::extract::Query<StatsQuery>,
+) -> axum::Json<crate::stats::Snapshot> {
+    let window = crate::stats::Window::parse(q.window.as_deref().unwrap_or("24h"));
+    axum::Json(crate::stats::snapshot_default(window))
+}
+
 #[derive(Serialize)]
 struct StateSnapshot {
    /// Bus seq at the moment this snapshot was assembled. Clients dedupe