feat(hooks): emit per-run token usage and duration on run.end

The stats layer reads usage/duration only from run.end, but neither framework populated them, so tokens/cost/avg-duration were always 0.

- hermes: accumulate token usage across each run's api-result calls in session state and attach the summed usage plus a computed duration_ms (from a stored runStartedAt) onto run.end. metric.snapshot emission is unchanged, so there is no double counting.
- claude-code: store runStartedAt and use it as a duration_ms fallback at all run.end sites. Usage is unavailable from CC hook inputs.

Live verification: a real hermes run now reports duration_ms and total_tokens on run.end; dashboard tokens_today/avg_duration_ms, both previously 0, now populate. cost_today stays 0 (no provider emits cost through the hooks).

Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
2026-06-23 11:16:23 -07:00
parent 5014d89258
commit 478c7529a7
4 changed files with 130 additions and 29 deletions
@@ -23,9 +23,41 @@ const { enqueue, flush } = createTransport(INGEST_URL);
 interface SessionState {
  sessionStarted?: boolean;
  runId?: string;
+  runStartedAt?: number; // Date.now() stored by handleRunStart; reset to undefined by handleRunEnd
+  runUsage?: Dict; // per-run totals summed by accumulateUsage in handleAPIResult; reset to {} on run start/end
  spans: { [key: string]: string };
 }

+// Usage fields (token counts plus total_cost) are reported per LLM call
+// (api-result). A single run (user turn) can span several calls, so we sum them
+// into a per-run total that rides along on run.end — the location the stats layer reads usage from.
+const USAGE_TOKEN_FIELDS = [
+  'input_tokens',
+  'output_tokens',
+  'total_tokens',
+  'cache_read_tokens',
+  'cache_write_tokens',
+  'reasoning_tokens',
+  'total_cost',
+];
+
+// Folds one api-result's usage into the running totals: mutates and returns `into`.
+function accumulateUsage(into: Dict, usage: Dict | undefined): Dict {
+  if (usage) {
+    for (const field of USAGE_TOKEN_FIELDS) {
+      const delta = pickNumber(usage[field]);
+      // Fields for which pickNumber yields undefined are skipped, not zeroed.
+      if (delta === undefined) continue;
+      into[field] = (pickNumber(into[field]) ?? 0) + delta;
+    }
+  }
+  return into;
+}
+
+function runUsagePayload(state: SessionState): Dict | undefined {
+  return !state.runUsage || Object.keys(state.runUsage).length === 0 ? undefined : state.runUsage; // undefined when no totals were accumulated
+}
+
 const STATE_DIR = join(homedir(), '.agentmon-state', 'hermes');

 function ensureStateDir() {
@@ -179,12 +211,18 @@ async function handleRunStart(input: Dict) {
  if (state.runId) {
    enqueue(buildEnvelope(FRAMEWORK, HOST, 'run.end', sessionKey, {
      runId: state.runId,
-      payload: { status: 'success' },
+      payload: {
+        status: 'success',
+        duration_ms: state.runStartedAt ? Date.now() - state.runStartedAt : undefined,
+        ...(runUsagePayload(state) && { usage: runUsagePayload(state) }),
+      },
    }));
  }

  const runId = randomUUID();
  state.runId = runId;
+  state.runStartedAt = Date.now();
+  state.runUsage = {};
  saveState(sessionKey, state);

  const extra = getExtra(input);
@@ -217,12 +255,15 @@ async function handleRunEnd(input: Dict) {
      runId: state.runId,
      payload: {
        status: 'success',
-        duration_ms: getDuration(input),
+        duration_ms: getDuration(input) ?? (state.runStartedAt ? Date.now() - state.runStartedAt : undefined),
        model: getModel(input),
        response_preview: truncate(getExtra(input).assistant_response, 500),
+        ...(runUsagePayload(state) && { usage: runUsagePayload(state) }),
      },
    }));
    state.runId = undefined;
+    state.runStartedAt = undefined;
+    state.runUsage = {};
    saveState(sessionKey, state);
  }
  await flush();
@@ -296,6 +337,11 @@ async function handleAPIResult(input: Dict) {
    return;
  }

+  if (sessionKey) {
+    state.runUsage = accumulateUsage(state.runUsage || {}, usage);
+    saveState(sessionKey, state);
+  }
+
  enqueue(buildEnvelope(FRAMEWORK, HOST, 'metric.snapshot', sessionKey, {
    runId: state.runId,
    payload: {
@@ -318,7 +364,9 @@ async function handleSessionEnd(input: Dict) {
      runId: state.runId,
      payload: {
        status: input.interrupted || getExtra(input).interrupted ? 'interrupted' : 'success',
+        duration_ms: state.runStartedAt ? Date.now() - state.runStartedAt : undefined,
        model: getModel(input),
+        ...(runUsagePayload(state) && { usage: runUsagePayload(state) }),
      },
    }));
  }