From fe78e3aa49a90e9f72fd5d23455762ff29bbe4a3 Mon Sep 17 00:00:00 2001
From: Dinah Gao <xiaomgao@microsoft.com>
Date: Fri, 12 Jun 2026 16:43:45 +0800
Subject: [PATCH 1/3] cost calculation module

---
 src/tools/cost-module/.gitignore              |   9 +
 src/tools/cost-module/README.md               | 349 ++++++++
 src/tools/cost-module/examples/analyze-run.ts |  52 ++
 src/tools/cost-module/package-lock.json       |  48 ++
 src/tools/cost-module/package.json            |  25 +
 src/tools/cost-module/src/copilot-cost.ts     | 748 ++++++++++++++++++
 src/tools/cost-module/src/index.ts            |   1 +
 src/tools/cost-module/tsconfig.json           |  17 +
 8 files changed, 1249 insertions(+)
 create mode 100644 src/tools/cost-module/.gitignore
 create mode 100644 src/tools/cost-module/README.md
 create mode 100644 src/tools/cost-module/examples/analyze-run.ts
 create mode 100644 src/tools/cost-module/package-lock.json
 create mode 100644 src/tools/cost-module/package.json
 create mode 100644 src/tools/cost-module/src/copilot-cost.ts
 create mode 100644 src/tools/cost-module/src/index.ts
 create mode 100644 src/tools/cost-module/tsconfig.json

diff --git a/src/tools/cost-module/.gitignore b/src/tools/cost-module/.gitignore
new file mode 100644
index 0000000..c94af7e
--- /dev/null
+++ b/src/tools/cost-module/.gitignore
@@ -0,0 +1,9 @@
+# Build output (generated by `tsc`; shipped via npm "files", never committed)
+dist/
+*.tsbuildinfo
+
+# Dependencies
+node_modules/
+
+*.log
+devtest.md
\ No newline at end of file
diff --git a/src/tools/cost-module/README.md b/src/tools/cost-module/README.md
new file mode 100644
index 0000000..6133dd2
--- /dev/null
+++ b/src/tools/cost-module/README.md
@@ -0,0 +1,349 @@
+# copilot-cost
+
+A tiny, **zero-dependency TypeScript module** that computes the token usage and
+**AI-credit (AIU) cost** of a GitHub Copilot CLI / Copilot SDK session, split
+between the **main agent** and any **sub-agents**.
+
+For each scope (main, each sub-agent, and total) it reports:
+
+| Field | Meaning |
+|-------|---------|
+| `inputTokens` | Fresh, **uncached** prompt tokens (billed at the base input rate) |
+| `cachedTokens` | Prompt tokens served from cache (`cache_read`, billed cheaply) |
+| `cacheWriteTokens` | Prompt tokens written to cache (`cache_write`, billed at a premium) |
+| `outputTokens` | Generated tokens (includes reasoning tokens) |
+| `grossInputTokens` | `inputTokens + cachedTokens + cacheWriteTokens` (total prompt) |
+| `aiCreditCost` | **AI credit cost in AIU** (the headline number — exact, billed by the CLI) |
+| `nanoAiu` | Raw billed cost in nano-AIU (1e-9 AIU), straight from the logs |
+
+> The CLI denominates cost only in **AIU** (nano-AIU). There are **no dollar
+> amounts in the logs**, so this module does not invent a currency conversion —
+> it reports AIU, which is exact. Apply your own AIU→USD rate downstream if you
+> need one.
+
+It works in **any TypeScript/JavaScript runtime** (the pure functions have no
+imports). Optional `analyze*File` / `analyze*Dir` helpers use Node's `fs`.
+
+---
+
+## Quick start
+
+```ts
+import { analyzeCopilotSession, formatReport } from "copilot-cost";
+
+// Point at a recorded session/trial directory (auto-discovers the logs):
+const report = await analyzeCopilotSession("path/to/session-logs-dir");
+
+console.log(formatReport(report));
+
+report.main.aiCreditCost;     // main agent AI credits (AIU)
+report.subAgents[0].cachedTokens;
+report.total.nanoAiu;         // whole-session raw cost (nano-AIU)
+```
+
+Pure (no filesystem — pass events you already have):
+
+```ts
+import { parseJsonl, analyzeEvents } from "copilot-cost";
+
+const events = parseJsonl(jsonlText);   // string with one JSON object per line
+const report = analyzeEvents(events);
+```
+
+Run the bundled example against the checked-in sample trial:
+
+```bash
+node examples/analyze-run.ts        # Node >= 22 (native TS), or: npx tsx examples/analyze-run.ts
+```
+
+---
+
+## Where the data comes from (read this)
+
+A Copilot CLI session writes **two complementary JSONL logs**. This module reads
+both for full accuracy; it is safe to feed both to `analyzeEvents` (credits are
+taken from the per-call events; the session summary only adds `premiumRequests`
+and a cross-check, so nothing is double-counted).
+
+### 1. The SDK event stream (e.g. an exported `*-events.jsonl`)
+
+The Copilot SDK emits this stream; a harness may export it to a file. It is the
+**only** source with **per-API-call** usage events, and the **only** way to
+reliably separate the main agent from inline sub-agents.
+
+Look for events with `type: "assistant.usage"`:
+
+```jsonc
+{
+  "type": "assistant.usage",
+  "data": {
+    "model": "claude-opus-4.6",
+    "inputTokens": 18631,          // GROSS prompt tokens (already includes cache)
+    "outputTokens": 554,
+    "cacheReadTokens": 0,
+    "cacheWriteTokens": 18628,
+    "reasoningTokens": 213,
+    "parentToolCallId": "toolu_…",  // PRESENT => this call belongs to a SUB-AGENT
+                                    // ABSENT  => this call is the MAIN agent
+    "copilotUsage": {
+      "tokenDetails": [
+        { "tokenType": "input",       "tokenCount": 3,     "batchSize": 1000000, "costPerBatch": 500000000000 },
+        { "tokenType": "cache_read",  "tokenCount": 0,     "batchSize": 1000000, "costPerBatch": 50000000000 },
+        { "tokenType": "cache_write", "tokenCount": 18628, "batchSize": 1000000, "costPerBatch": 625000000000 },
+        { "tokenType": "output",      "tokenCount": 554,   "batchSize": 1000000, "costPerBatch": 2500000000000 }
+      ],
+      "totalNanoAiu": 13029000000   // EXACT billed cost of THIS call (nano-AIU)
+    }
+  }
+}
+```
+
+Sub-agent **names / models** come from the same file:
+
+- `tool.execution_start` where `data.toolName === "task"` →
+  `data.toolCallId` maps to `data.arguments.{name, description, agent_type}`
+- `subagent.completed` / `subagent.failed` →
+  `data.{toolCallId, agentName, agentDisplayName, model, totalTokens, durationMs}`
+
+### 2. The canonical session log — `~/.copilot/session-state/<sessionId>/events.jsonl`
+
+The **only** file with the session-end summary. Look for
+`type: "session.shutdown"` with `data.shutdownType === "routine"`:
+
+```jsonc
+{
+  "type": "session.shutdown",
+  "data": {
+    "shutdownType": "routine",
+    "totalPremiumRequests": 3,
+    "totalNanoAiu": 156131000000,   // whole-session billed cost
+    "tokenDetails": {               // session totals (fresh input / cache / output)
+      "input": { "tokenCount": 125607 },
+      "cache_read": { "tokenCount": 814464 },
+      "cache_write": { "tokenCount": 67884 },
+      "output": { "tokenCount": 31435 }
+    },
+    "modelMetrics": {
+      "claude-opus-4.6": {
+        "usage": { "inputTokens": 470721, "outputTokens": 4712,
+                   "cacheReadTokens": 402816, "cacheWriteTokens": 67884 },
+        "totalNanoAiu": 74358800000   // <-- note: usage.inputTokens here is GROSS
+      }
+    }
+  }
+}
+```
+
+> A sub-agent that runs as its **own session** appears here as a
+> `session.shutdown` **without** a `shutdownType` field.
+
+The module uses this file for `premiumRequests` and as a cross-check against the
+summed per-call cost.
+
+---
+
+## How the cost is computed (read straight from the logs — no price table)
+
+The CLI denominates every cost in **nano-AIU** (1e-9 AI Units), so that is the
+only cost unit the data contains. This module applies **no price table and no
+currency conversion**.
+
+**Per call** the cost in nano-AIU is
+
+```
+nanoAiu = Σ_type ( tokenCount / batchSize × costPerBatch )
+```
+
+which is exactly the value the CLI already reports as
+`copilotUsage.totalNanoAiu`. The module sums `totalNanoAiu` directly (and falls
+back to the formula above only if that field is missing).
+
+**AI credits (AIU) — exact.** AIU is just nano-AIU unscaled (the field is
+literally named `totalNanoAiu`, and "nano" = 1e-9), so this is not derived or
+estimated:
+
+```
+1 AIU = 1e9 nano-AIU      →  aiCreditCost = nanoAiu / 1e9
+```
+
+**No USD.** The logs contain **no dollar amounts** — every cost field is in
+nano-AIU. Converting to USD would require an AIU→USD rate that is **not in the
+data**, so this module deliberately does not do it. If you need a currency,
+multiply `aiCreditCost` by your own contract rate downstream.
+
+### Main vs. sub-agent split
+
+The robust split is per-call, from the SDK event stream:
+
+- `assistant.usage` **without** `parentToolCallId` → **main agent**
+- `assistant.usage` **with** `parentToolCallId` → **sub-agent**; grouped by
+  `parentToolCallId` so each sub-agent invocation gets its own line
+
+This works for **inline** sub-agents (spawned via the `task` tool, which share
+the parent session) — the common case. If only the canonical log is available,
+the module falls back to `session.shutdown.modelMetrics` and emits a warning,
+because inline sub-agents there roll up by **model**, not by scope.
+
+### Token categories
+
+The five categories are **non-overlapping** and map directly to the provider's
+billing tiers, so `inputTokens + cachedTokens + cacheWriteTokens = grossInputTokens`.
+
+> Note: the raw `assistant.usage.data.inputTokens` field is **gross** (it already
+> includes cached + cache-write). This module exposes both the non-overlapping
+> `inputTokens` (fresh only) **and** `grossInputTokens`, so you can use whichever
+> your report needs.
+
+---
+
+## Validation
+
+Running against the checked-in sample trial
+(`agent-benchmark/results/run1/calc_subagent-cost-test_o46_i1/session-logs-dir`):
+
+```
+MAIN agent  in 21      cache(r) 402.8k  cache(w) 67.9k  out 4.7k    74.36 AIU
+SUB (gpt-5.4) in 125.6k cache(r) 411.6k  cache(w) 0      out 26.7k   81.77 AIU
+TOTAL       in 125.6k  cache(r) 814.5k  cache(w) 67.9k  out 31.4k  156.13 AIU
+premium requests: 3
+```
+
+Every number ties out to the canonical `session.shutdown`:
+
+- `total.aiCreditCost` 156.13 AIU == `totalNanoAiu` `156131000000`
+- `main` 74.36 AIU == `modelMetrics["claude-opus-4.6"].totalNanoAiu` `74358800000`
+- token totals (125607 / 814464 / 67884 / 31435) == the shutdown `tokenDetails`
+- `premiumRequests` 3 == `totalPremiumRequests`
+
+---
+
+## API
+
+### Pure (any runtime)
+
+| Function | Description |
+|----------|-------------|
+| `parseJsonl(text): CopilotEvent[]` | Parse JSONL, skipping blank/malformed lines |
+| `analyzeEvents(events, options?): SessionCostReport` | Core analysis; accepts events from either or both logs |
+| `nanoAiuFromTokenDetails(tokenDetails): number` | Cost of a `tokenDetails` array (fallback) |
+| `formatReport(report): string` | Human-readable table |
+
+### Node (require `node:fs`)
+
+| Function | Description |
+|----------|-------------|
+| `analyzeJsonlFile(path, options?)` | Analyze a single `.jsonl` file |
+| `analyzeCopilotSession(pathOrDir, options?)` | Auto-discover `*-events.jsonl` + `.copilot/session-state/**/events.jsonl` under a dir (or analyze a single file), de-duplicate by event id, and report |
+
+### Options
+
+```ts
+interface CostOptions {
+  reconcileTolerance?: number; // sanity-check tolerance vs session.shutdown total (default 0.01 = 1%)
+}
+```
+
+### Result shape
+
+```ts
+interface SessionCostReport {
+  main: CostBreakdown;            // main agent
+  subAgents: SubAgentCost[];      // per-call AIU split (SDK stream only; sorted by cost desc)
+  subAgentsTotal: CostBreakdown;  // aggregate of all sub-agents
+  total: CostBreakdown;           // main + all sub-agents (== session billed total)
+  models: Record<string, CostBreakdown>;  // per-model rollup (exact per-model AIU)
+  subAgentRuns: SubAgentRun[];    // from subagent.completed; available for plain CLI logs too
+  subAgentCount: number;          // best available sub-agent count
+  premiumRequests?: number;       // from session.shutdown
+  sessionIds: string[];
+  warnings: string[];             // e.g. cross-check mismatch, missing per-call data
+}
+
+interface CostBreakdown {
+  inputTokens: number; cachedTokens: number; cacheWriteTokens: number;
+  outputTokens: number; reasoningTokens: number; grossInputTokens: number;
+  nanoAiu: number; aiCreditCost: number; apiCalls: number;
+}
+
+interface SubAgentCost extends CostBreakdown {
+  toolCallId: string; agentName?: string; model?: string; durationMs?: number;
+}
+
+// From subagent.completed / subagent.failed events. Combined token count only
+// (no input/output/cache breakdown, no per-sub AIU). Present in BOTH the SDK
+// stream and a plain CLI session's on-disk events.jsonl.
+interface SubAgentRun {
+  toolCallId?: string; name?: string; model?: string;
+  totalTokens: number; durationMs?: number; status: "completed" | "failed";
+}
+```
+
+---
+
+## Using it with a plain Copilot CLI session (no harness)
+
+You can capture a log the module reads from a bare `copilot` command. **Run the
+session to completion**, then point the module at the session-state folder.
+
+Where the cost data lands for a plain CLI session:
+
+| Source | Has what | Good for |
+|--------|----------|----------|
+| `~/.copilot/session-state/<sessionId>/events.jsonl` (written automatically) | `session.shutdown` (exact **token totals + AIU + premium** + per-model `modelMetrics`) **and** `subagent.completed` (sub-agent **count + per-sub total tokens + model + duration**) | Exact session totals, sub-agent count/tokens, and per-**model** AIU |
+| `copilot --output-format json` (stdout you redirect) | leaner stream: `result` (premium, durations) + `assistant.message` (output tokens) + `subagent.completed` | sub-agent count + output tokens only |
+
+> **Important fidelity note.** A plain CLI session's logs do **not** contain the
+> per-call `assistant.usage` events, so the module cannot produce a per-**scope**
+> (main-vs-sub) **AIU** split from them. You still get: exact **session totals**,
+> the **sub-agent count + per-sub total tokens** (`subAgentRuns`), and the exact
+> **per-model** AIU (`models`) — which separates main from sub whenever they run
+> on different models. A precise per-scope AIU split requires the SDK event
+> stream (per-call `assistant.usage`), e.g. captured via `@github/copilot-sdk`.
+
+### Make a multi-sub-agent session, then analyze it
+
+```powershell
+# 1. fresh working dir + a known session id
+$work = Join-Path $env:TEMP "cc-test-$(Get-Random)"; New-Item -ItemType Directory $work | Out-Null; Set-Location $work
+$sid  = [guid]::NewGuid().ToString()
+
+# 2. run non-interactively; force 3 parallel sub-agents via the task tool
+$prompt = "You MUST use the 'task' tool to launch exactly 3 sub-agents in parallel in a single turn. " +
+          "Give each one this exact instruction: 'Reply with one line: WORKER OK'. " +
+          "Do not do the work yourself. After all three return, print: ALL DONE."
+copilot -p $prompt --allow-all-tools --output-format json --session-id $sid > stdout.jsonl
+
+# 3. analyze the on-disk session log (richest plain-CLI source)
+$events = Join-Path $env:USERPROFILE ".copilot/session-state/$sid/events.jsonl"
+node -e "import('copilot-cost').then(async m => console.log(m.formatReport(await m.analyzeJsonlFile(process.argv[1]))))" $events
+```
+
+Key flags: `-p` (non-interactive), `--allow-all-tools` (required for `-p`, else
+it blocks on permission prompts), `--output-format json` (JSONL stream),
+`--session-id` (so you know which folder to read).
+
+---
+
+---
+
+## Design notes
+
+- **No price table.** Cost is read from the CLI's own `totalNanoAiu`, so it
+  stays correct even as model prices change — there is nothing to maintain, and
+  no fabricated rates.
+- **Per-call main-vs-sub split.** Sub-agents are separated by `parentToolCallId`
+  on each `assistant.usage` event, so **inline** `task`-tool sub-agents (which
+  share the parent session) are attributed correctly — not folded into the main
+  agent.
+- **Premium requests from the summary.** `data.cost` on a usage event is a
+  per-request multiplier, not an additive counter, so premium requests are read
+  from `session.shutdown.totalPremiumRequests`.
+- **Built-in sanity-check.** The summed per-call cost is reconciled against the
+  session's `totalNanoAiu`; drift beyond `reconcileTolerance` adds a warning
+  (it never changes the reported numbers).
+
+---
+
+## License
+
+MIT
diff --git a/src/tools/cost-module/examples/analyze-run.ts b/src/tools/cost-module/examples/analyze-run.ts
new file mode 100644
index 0000000..019720b
--- /dev/null
+++ b/src/tools/cost-module/examples/analyze-run.ts
@@ -0,0 +1,52 @@
+/**
+ * Example: analyze the cost of a recorded Copilot session and print a report.
+ *
+ * Run (Node >= 22):  node --experimental-strip-types examples/analyze-run.ts
+ * Or with tsx:       npx tsx examples/analyze-run.ts
+ *
+ * It points at a checked-in sample session (here, a benchmark trial):
+ *   agent-benchmark/results/run1/calc_subagent-cost-test_o46_i1/session-logs-dir
+ */
+import { analyzeCopilotSession, formatReport } from "../src/copilot-cost.ts";
+import { fileURLToPath } from "node:url";
+import { dirname, resolve } from "node:path";
+
+const here = dirname(fileURLToPath(import.meta.url));
+const trialDir = resolve(
+  here,
+  "../../results/run1/calc_subagent-cost-test_o46_i1/session-logs-dir",
+);
+
+const report = await analyzeCopilotSession(trialDir);
+
+console.log(formatReport(report));
+console.log("\n--- machine-readable ---\n");
+console.log(
+  JSON.stringify(
+    {
+      main: {
+        inputTokens: report.main.inputTokens,
+        outputTokens: report.main.outputTokens,
+        cachedTokens: report.main.cachedTokens,
+        aiCreditCost: report.main.aiCreditCost,
+      },
+      subAgents: report.subAgents.map((s) => ({
+        agentName: s.agentName,
+        model: s.model,
+        inputTokens: s.inputTokens,
+        outputTokens: s.outputTokens,
+        cachedTokens: s.cachedTokens,
+        aiCreditCost: s.aiCreditCost,
+      })),
+      total: {
+        inputTokens: report.total.inputTokens,
+        outputTokens: report.total.outputTokens,
+        cachedTokens: report.total.cachedTokens,
+        aiCreditCost: report.total.aiCreditCost,
+      },
+      premiumRequests: report.premiumRequests,
+    },
+    null,
+    2,
+  ),
+);
diff --git a/src/tools/cost-module/package-lock.json b/src/tools/cost-module/package-lock.json
new file mode 100644
index 0000000..ffd29bb
--- /dev/null
+++ b/src/tools/cost-module/package-lock.json
@@ -0,0 +1,48 @@
+{
+  "name": "copilot-cost",
+  "version": "1.0.0",
+  "lockfileVersion": 3,
+  "requires": true,
+  "packages": {
+    "": {
+      "name": "copilot-cost",
+      "version": "1.0.0",
+      "license": "MIT",
+      "devDependencies": {
+        "@types/node": "^20.0.0",
+        "typescript": "^5.4.0"
+      }
+    },
+    "node_modules/@types/node": {
+      "version": "20.19.43",
+      "resolved": "https://registry.npmjs.org/@types/node/-/node-20.19.43.tgz",
+      "integrity": "sha512-6oYBAi5ikg4Pl+kGsoYtawUMBT2zZMCvPNF7pVLnHZfd1zf38DRiWn/gT01RYCdUqkv7Fhr+C9ot4/tb+2sVvA==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "undici-types": "~6.21.0"
+      }
+    },
+    "node_modules/typescript": {
+      "version": "5.9.3",
+      "resolved": "https://registry.npmjs.org/typescript/-/typescript-5.9.3.tgz",
+      "integrity": "sha512-jl1vZzPDinLr9eUt3J/t7V6FgNEw9QjvBPdysz9KfQDD41fQrC2Y4vKQdiaUpFT4bXlb1RHhLpp8wtm6M5TgSw==",
+      "dev": true,
+      "license": "Apache-2.0",
+      "bin": {
+        "tsc": "bin/tsc",
+        "tsserver": "bin/tsserver"
+      },
+      "engines": {
+        "node": ">=14.17"
+      }
+    },
+    "node_modules/undici-types": {
+      "version": "6.21.0",
+      "resolved": "https://registry.npmjs.org/undici-types/-/undici-types-6.21.0.tgz",
+      "integrity": "sha512-iwDZqg0QAGrg9Rav5H4n0M64c3mkR59cJ6wQp+7C4nI0gsmExaedaYLNO44eT4AtBBwjbTiGPMlt2Md0T9H9JQ==",
+      "dev": true,
+      "license": "MIT"
+    }
+  }
+}
diff --git a/src/tools/cost-module/package.json b/src/tools/cost-module/package.json
new file mode 100644
index 0000000..b5eba44
--- /dev/null
+++ b/src/tools/cost-module/package.json
@@ -0,0 +1,25 @@
+{
+  "name": "copilot-cost",
+  "version": "1.0.0",
+  "description": "Compute the token usage and AI-credit (AIU) cost of a GitHub Copilot CLI/SDK session, split between the main agent and its sub-agents.",
+  "type": "module",
+  "main": "./dist/index.js",
+  "types": "./dist/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/index.d.ts",
+      "import": "./dist/index.js"
+    }
+  },
+  "files": ["dist", "src", "README.md"],
+  "scripts": {
+    "build": "tsc -p tsconfig.json",
+    "example": "node --experimental-strip-types examples/analyze-run.ts"
+  },
+  "keywords": ["github-copilot", "copilot-cli", "tokens", "cost", "aiu", "credits", "subagent"],
+  "license": "MIT",
+  "devDependencies": {
+    "@types/node": "^20.0.0",
+    "typescript": "^5.4.0"
+  }
+}
diff --git a/src/tools/cost-module/src/copilot-cost.ts b/src/tools/cost-module/src/copilot-cost.ts
new file mode 100644
index 0000000..7f1e539
--- /dev/null
+++ b/src/tools/cost-module/src/copilot-cost.ts
@@ -0,0 +1,748 @@
+/**
+ * copilot-cost — Compute the token usage and AI-credit cost of a GitHub Copilot
+ * CLI / Copilot SDK session, split between the MAIN agent and any SUB-agents.
+ *
+ * Zero runtime dependencies. The pure functions (`parseJsonl`, `analyzeEvents`,
+ * `formatReport`) run in any JS/TS runtime (Node, Deno, Bun, browser). The
+ * `analyze*File` / `analyze*Dir` helpers additionally require Node's `fs`.
+ *
+ * ===========================================================================
+ *  WHERE THE DATA LIVES  (read this first)
+ * ===========================================================================
+ * A Copilot CLI session writes two complementary event logs. Both are JSONL
+ * (one JSON object per line). For full accuracy this module reads BOTH:
+ *
+ *  1. The SDK event stream (the Copilot SDK emits this; a harness may export it
+ *     to a `*-events.jsonl` file). This is the ONLY source that contains
+ *     per-API-call usage events:
+ *
+ *         { "type": "assistant.usage",
+ *           "data": {
+ *             "model": "claude-opus-4.6",
+ *             "inputTokens": 18631,        // GROSS prompt tokens (incl. cache)
+ *             "outputTokens": 554,
+ *             "cacheReadTokens": 0,
+ *             "cacheWriteTokens": 18628,
+ *             "reasoningTokens": 213,
+ *             "parentToolCallId": "toolu_…",   // PRESENT => this call belongs
+ *                                              //   to a sub-agent. ABSENT =>
+ *                                              //   it is the main agent.
+ *             "copilotUsage": {
+ *               "tokenDetails": [
+ *                 { "tokenType": "input",       "tokenCount": 3,     "batchSize": 1e6, "costPerBatch": 5.0e11 },
+ *                 { "tokenType": "cache_read",  "tokenCount": 0,     "batchSize": 1e6, "costPerBatch": 5.0e10 },
+ *                 { "tokenType": "cache_write", "tokenCount": 18628, "batchSize": 1e6, "costPerBatch": 6.25e11 },
+ *                 { "tokenType": "output",      "tokenCount": 554,   "batchSize": 1e6, "costPerBatch": 2.5e12 }
+ *               ],
+ *               "totalNanoAiu": 13029000000   // EXACT billed cost of this call
+ *             }
+ *           } }
+ *
+ *     This file is what makes a reliable main-vs-sub split possible, because
+ *     inline sub-agents (spawned via the `task` tool) share the parent session
+ *     and are only distinguishable by `parentToolCallId`.
+ *
+ *     It also carries sub-agent metadata:
+ *       - `tool.execution_start` with `data.toolName === "task"`:
+ *             data.toolCallId -> data.arguments.{name, description, agent_type}
+ *       - `subagent.completed` / `subagent.failed`:
+ *             data.{toolCallId, agentName, agentDisplayName, model, totalTokens, durationMs}
+ *
+ *  2. The canonical session log —
+ *     `~/.copilot/session-state/<sessionId>/events.jsonl`. This is the ONLY
+ *     source with the session-end summary:
+ *
+ *         { "type": "session.shutdown",
+ *           "data": {
+ *             "shutdownType": "routine",      // the main session's shutdown
+ *             "totalPremiumRequests": 3,
+ *             "totalNanoAiu": 156131000000,   // whole-session billed cost
+ *             "tokenDetails": { "input": { "tokenCount": … }, "cache_read": {…}, "cache_write": {…}, "output": {…} },
+ *             "modelMetrics": {
+ *               "claude-opus-4.6": {
+ *                 "usage": { "inputTokens": 470721, "outputTokens": 4712,   // inputTokens is GROSS
+ *                            "cacheReadTokens": 402816, "cacheWriteTokens": 67884, "reasoningTokens": 415 },
+ *                 "totalNanoAiu": 74358800000,
+ *                 "tokenDetails": { "input": {…}, "cache_read": {…}, "cache_write": {…}, "output": {…} }
+ *               }
+ *             } } }
+ *
+ *     This module uses it for `premiumRequests` and as a cross-check against
+ *     the per-call total. (A sub-agent that runs as its OWN session shows up
+ *     here as a `session.shutdown` WITHOUT a `shutdownType` field.)
+ *
+ * It is safe to concatenate the events of both files and pass them to
+ * `analyzeEvents` — credits/tokens are taken from the per-call `assistant.usage`
+ * events when present, and the `session.shutdown` summary only contributes
+ * `premiumRequests` + a validation cross-check, so nothing is double-counted.
+ *
+ * ===========================================================================
+ *  HOW THE COST IS COMPUTED  (read straight from the logs — no price table)
+ * ===========================================================================
+ *  The CLI denominates every cost in *nano-AIU* (1e-9 AI Units), so that is the
+ *  only cost unit the data actually contains. This module does NOT apply any
+ *  price table or currency conversion.
+ *
+ *  - Per call, cost in nano-AIU:
+ *        nanoAiu = Σ_type ( tokenCount / batchSize * costPerBatch )
+ *    which is exactly the value the CLI reports as `copilotUsage.totalNanoAiu`.
+ *    The module sums `totalNanoAiu` directly and only falls back to the formula
+ *    above if that field is missing.
+ *  - AIU is just nano-AIU unscaled (the field is literally named `totalNanoAiu`
+ *    and "nano" = 1e-9), so it is exact, not an estimate:
+ *        aiCreditCost (AIU) = nanoAiu / 1e9
+ *    There is no dollar amount anywhere in the logs; converting AIU→USD would
+ *    require an external rate that is not part of the data, so this module does
+ *    not do it. Apply your own rate downstream if you need a currency.
+ *
+ *  Token categories (non-overlapping; the relative `costPerBatch` values in the
+ *  logs confirm the cost ordering noted below):
+ *        inputTokens       = "input"       — fresh, uncached prompt tokens
+ *        cachedTokens      = "cache_read"  — prompt tokens served from cache (cheapest)
+ *        cacheWriteTokens  = "cache_write" — prompt tokens written to cache (priciest prompt tier)
+ *        outputTokens      = "output"      — generated tokens (includes reasoning)
+ *        grossInputTokens  = input + cachedTokens + cacheWriteTokens  (total prompt)
+ *
+ *  NOTE on "input tokens": the raw `assistant.usage.data.inputTokens` field is
+ *  GROSS (it already includes cached + cache-write). This module exposes both
+ *  the non-overlapping `inputTokens` (fresh only) AND `grossInputTokens` so you
+ *  can use whichever your report needs.
+ */
+
+// ─────────────────────────────────────────────────────────────────────────────
+// Types
+// ─────────────────────────────────────────────────────────────────────────────
+
+/** Raw Copilot event (loosely typed — only the fields we read are described). */
+export interface CopilotEvent {
+  type?: string;
+  data?: any;
+  id?: string;
+  timestamp?: string;
+  agentId?: string;
+  ephemeral?: boolean;
+  [k: string]: unknown;
+}
+
+export type TokenType = "input" | "cache_read" | "cache_write" | "output";
+
+/** Non-overlapping token counts plus a convenience gross-input total. */
+export interface TokenBreakdown {
+  /** Fresh, uncached prompt tokens (billed at the base input rate). */
+  inputTokens: number;
+  /** Prompt tokens served from cache (cache hits, billed cheaply). */
+  cachedTokens: number;
+  /** Prompt tokens written to the cache (cache creation, billed at a premium). */
+  cacheWriteTokens: number;
+  /** Generated output tokens (includes reasoning tokens). */
+  outputTokens: number;
+  /** Reasoning tokens — informational subset already counted in outputTokens. */
+  reasoningTokens: number;
+  /** input + cachedTokens + cacheWriteTokens — the total prompt size. */
+  grossInputTokens: number;
+}
+
+/** A token breakdown plus the billed cost and call/request counts. */
+export interface CostBreakdown extends TokenBreakdown {
+  /** Raw billed cost in nano-AIU (1e-9 AIU) — taken straight from the logs. */
+  nanoAiu: number;
+  /** AI credit cost in AIU (= nanoAiu / 1e9). Exact — this is what the CLI bills. */
+  aiCreditCost: number;
+  /** Number of API calls (`assistant.usage` events) attributed to this scope. */
+  apiCalls: number;
+}
+
+/** Per sub-agent invocation cost (one entry per distinct parentToolCallId). */
+export interface SubAgentCost extends CostBreakdown {
+  /** The `parentToolCallId` that identifies this sub-agent invocation. */
+  toolCallId: string;
+  /** Friendly name from the `task` tool call or `subagent.completed`, if known. */
+  agentName?: string;
+  /** Model the sub-agent ran on, if known. */
+  model?: string;
+  /** Wall-clock duration in ms, from `subagent.completed`, if known. */
+  durationMs?: number;
+}
+
+/**
+ * A sub-agent run as reported by a `subagent.completed` / `subagent.failed`
+ * event. These events appear in BOTH the SDK stream and a plain CLI session's
+ * on-disk `events.jsonl`, so this is the universally-available view of
+ * sub-agents. It carries a single combined `totalTokens` (no input/output/cache
+ * breakdown, and no per-sub AIU) — for a precise per-sub token/AIU split you
+ * need the per-call `assistant.usage` events (the `subAgents` field).
+ */
+export interface SubAgentRun {
+  /** The sub-agent's tool-call id (`task` tool call), if known. */
+  toolCallId?: string;
+  /** Friendly name from the `task` tool call args, or the agent display name. */
+  name?: string;
+  /** Model the sub-agent ran on. */
+  model?: string;
+  /** Combined token count the CLI reported for this sub-agent run. */
+  totalTokens: number;
+  /** Wall-clock duration in ms. */
+  durationMs?: number;
+  /** Whether the sub-agent completed or failed. */
+  status: "completed" | "failed";
+}
+
+export interface SessionCostReport {
+  /** Main agent: all `assistant.usage` events WITHOUT a parentToolCallId. */
+  main: CostBreakdown;
+  /** One entry per sub-agent invocation (grouped by parentToolCallId). */
+  subAgents: SubAgentCost[];
+  /** Aggregate of every sub-agent invocation. */
+  subAgentsTotal: CostBreakdown;
+  /** main + subAgentsTotal — equals the session's billed total. */
+  total: CostBreakdown;
+  /** Per-model rollup across both scopes (model name -> cost). */
+  models: Record<string, CostBreakdown>;
+  /**
+   * Sub-agent runs from `subagent.completed` / `subagent.failed` events.
+   * Available for plain CLI logs too (where `subAgents` is empty because there
+   * are no per-call usage events). Total tokens only — no per-sub AIU.
+   */
+  subAgentRuns: SubAgentRun[];
+  /** Best available sub-agent count (max of per-call groups and completed events). */
+  subAgentCount: number;
+  /** Session-level premium requests (from `session.shutdown`, if available). */
+  premiumRequests?: number;
+  /** Session ids seen (from `session.start` / `session.shutdown`). */
+  sessionIds: string[];
+  /** Non-fatal diagnostics (e.g. cross-check mismatches, missing data). */
+  warnings: string[];
+}
+
+export interface CostOptions {
+  /**
+   * Tolerance (fraction) for the internal sanity-check that compares the summed
+   * per-call cost against `session.shutdown.totalNanoAiu`. A mismatch beyond
+   * this only adds a warning; it never changes the numbers. Default 0.01 (1%).
+   */
+  reconcileTolerance?: number;
+}
+
+// ─────────────────────────────────────────────────────────────────────────────
+// Constants
+// ─────────────────────────────────────────────────────────────────────────────
+
+/** 1 AIU = 1e9 nano-AIU. The CLI denominates cost in nano-AIU (`totalNanoAiu`);
+ *  "nano" = 1e-9, so AIU is that same value unscaled — exact, not an estimate. */
+export const NANO_AIU_PER_AIU = 1e9;
+
+// ─────────────────────────────────────────────────────────────────────────────
+// Pure core — works in any runtime
+// ─────────────────────────────────────────────────────────────────────────────
+
+/** Parse a JSONL string into events, skipping blank/malformed lines. */
+export function parseJsonl(text: string): CopilotEvent[] {
+  const out: CopilotEvent[] = [];
+  for (const line of text.split("\n")) {
+    const t = line.trim();
+    if (!t) continue;
+    try {
+      out.push(JSON.parse(t));
+    } catch {
+      /* skip malformed line */
+    }
+  }
+  return out;
+}
+
+function emptyTokens(): TokenBreakdown {
+  return {
+    inputTokens: 0,
+    cachedTokens: 0,
+    cacheWriteTokens: 0,
+    outputTokens: 0,
+    reasoningTokens: 0,
+    grossInputTokens: 0,
+  };
+}
+
+interface MutableCost extends CostBreakdown {}
+
+function emptyCost(): MutableCost {
+  return { ...emptyTokens(), nanoAiu: 0, aiCreditCost: 0, apiCalls: 0 };
+}
+
+/** Compute nano-AIU from a `copilotUsage.tokenDetails` array (fallback when
+ *  `totalNanoAiu` is absent). cost = Σ tokenCount / batchSize * costPerBatch. */
+export function nanoAiuFromTokenDetails(
+  tokenDetails: Array<{ tokenCount?: number; batchSize?: number; costPerBatch?: number }> | undefined,
+): number {
+  if (!Array.isArray(tokenDetails)) return 0;
+  let n = 0;
+  for (const d of tokenDetails) {
+    const count = Number(d?.tokenCount) || 0;
+    const batch = Number(d?.batchSize) || 0;
+    const per = Number(d?.costPerBatch) || 0;
+    if (count > 0 && batch > 0 && per > 0) n += (count / batch) * per;
+  }
+  return n;
+}
+
+/** Read the per-type token counts from one `assistant.usage` event's data. */
+function tokensFromUsageEvent(data: any): { input: number; cacheRead: number; cacheWrite: number; output: number; reasoning: number } {
+  const details: any[] = Array.isArray(data?.copilotUsage?.tokenDetails)
+    ? data.copilotUsage.tokenDetails
+    : [];
+  const byType: Record<string, number> = {};
+  for (const d of details) {
+    if (d && typeof d.tokenType === "string") byType[d.tokenType] = (byType[d.tokenType] || 0) + (Number(d.tokenCount) || 0);
+  }
+
+  // Prefer the authoritative tokenDetails array; fall back to the flat fields.
+  const cacheRead = "cache_read" in byType ? byType["cache_read"] : Number(data?.cacheReadTokens) || 0;
+  const cacheWrite = "cache_write" in byType ? byType["cache_write"] : Number(data?.cacheWriteTokens) || 0;
+  // tokenDetails "input" is the fresh/uncached input. The flat `data.inputTokens`
+  // is GROSS (incl. cache) so derive fresh input from it when details are absent.
+  const input = "input" in byType
+    ? byType["input"]
+    : Math.max(0, (Number(data?.inputTokens) || 0) - cacheRead - cacheWrite);
+  const output = "output" in byType ? byType["output"] : Number(data?.outputTokens) || 0;
+  const reasoning = Number(data?.reasoningTokens) || 0;
+  return { input, cacheRead, cacheWrite, output, reasoning };
+}
+
+function addUsageEventToCost(cost: MutableCost, data: any): void {
+  const t = tokensFromUsageEvent(data);
+  cost.inputTokens += t.input;
+  cost.cachedTokens += t.cacheRead;
+  cost.cacheWriteTokens += t.cacheWrite;
+  cost.outputTokens += t.output;
+  cost.reasoningTokens += t.reasoning;
+  cost.grossInputTokens += t.input + t.cacheRead + t.cacheWrite;
+
+  const total = Number(data?.copilotUsage?.totalNanoAiu);
+  cost.nanoAiu += Number.isFinite(total) && total > 0
+    ? total
+    : nanoAiuFromTokenDetails(data?.copilotUsage?.tokenDetails);
+  cost.apiCalls += 1;
+}
+
+function finalizeCost(cost: MutableCost): void {
+  // AIU is nano-AIU unscaled (1 AIU = 1e9 nano-AIU). Exact — straight from logs.
+  cost.aiCreditCost = round(cost.nanoAiu / NANO_AIU_PER_AIU, 4);
+  // Round token fields to integers (they are integer counts already).
+  cost.inputTokens = Math.round(cost.inputTokens);
+  cost.cachedTokens = Math.round(cost.cachedTokens);
+  cost.cacheWriteTokens = Math.round(cost.cacheWriteTokens);
+  cost.outputTokens = Math.round(cost.outputTokens);
+  cost.reasoningTokens = Math.round(cost.reasoningTokens);
+  cost.grossInputTokens = Math.round(cost.grossInputTokens);
+  cost.nanoAiu = Math.round(cost.nanoAiu);
+}
+
+function round(n: number, dp: number): number {
+  const f = Math.pow(10, dp);
+  return Math.round(n * f) / f;
+}
+
+/**
+ * Analyze a flat list of Copilot events into a main-vs-sub cost report.
+ *
+ * Accepts events from the SDK event stream (per-call `assistant.usage`), from
+ * the canonical `session-state/<id>/events.jsonl` (the `session.shutdown`
+ * summary), or both concatenated together.
+ */
+export function analyzeEvents(events: CopilotEvent[], options: CostOptions = {}): SessionCostReport {
+  const tolerance = options.reconcileTolerance ?? 0.01;
+  const warnings: string[] = [];
+
+  const main = emptyCost();
+  const subByTool = new Map<string, MutableCost>();
+  const modelTotals = new Map<string, MutableCost>();
+  const sessionIds = new Set<string>();
+
+  // Sub-agent metadata maps.
+  const taskName = new Map<string, string>(); // toolCallId -> friendly name
+  const subMeta = new Map<string, { agentName?: string; model?: string; durationMs?: number }>();
+  const subRuns: SubAgentRun[] = []; // from subagent.completed/.failed (universal)
+
+  let usageEventCount = 0;
+  let shutdownPremium: number | undefined;
+  let shutdownNanoAiu = 0;
+  let sawRoutineShutdown = false;
+
+  // Pass 1: collect sub-agent metadata + session ids.
+  for (const ev of events) {
+    const type = ev?.type || "";
+    const d: any = ev?.data;
+    if (!d) {
+      if (type === "session.start" && (ev as any)?.data?.sessionId) sessionIds.add((ev as any).data.sessionId);
+      continue;
+    }
+    if (type === "session.start" && d.sessionId) sessionIds.add(d.sessionId);
+    if (type === "tool.execution_start" && d.toolName === "task" && d.toolCallId) {
+      taskName.set(d.toolCallId, d.arguments?.description || d.arguments?.name || d.arguments?.agent_type || "");
+    }
+    if ((type === "subagent.completed" || type === "subagent.failed") && d.toolCallId) {
+      subMeta.set(d.toolCallId, {
+        agentName: d.agentDisplayName || d.agentName,
+        model: d.model,
+        durationMs: d.durationMs,
+      });
+      subRuns.push({
+        toolCallId: d.toolCallId,
+        model: d.model,
+        totalTokens: Number(d.totalTokens) || 0,
+        durationMs: d.durationMs,
+        status: type === "subagent.completed" ? "completed" : "failed",
+      });
+    }
+  }
+
+  // Pass 2: accumulate cost from per-call usage events + read shutdown summary.
+  for (const ev of events) {
+    const type = ev?.type || "";
+    const d: any = ev?.data;
+    if (!d) continue;
+
+    if (type === "assistant.usage") {
+      usageEventCount++;
+      const model: string = d.model || "unknown";
+      if (!modelTotals.has(model)) modelTotals.set(model, emptyCost());
+      addUsageEventToCost(modelTotals.get(model)!, d);
+
+      const parentToolCallId: string | undefined = d.parentToolCallId;
+      if (parentToolCallId) {
+        if (!subByTool.has(parentToolCallId)) subByTool.set(parentToolCallId, emptyCost());
+        addUsageEventToCost(subByTool.get(parentToolCallId)!, d);
+      } else {
+        addUsageEventToCost(main, d);
+      }
+    } else if (type === "session.shutdown") {
+      const isRoutine = d.shutdownType === "routine";
+      if (isRoutine && !sawRoutineShutdown) {
+        sawRoutineShutdown = true;
+        shutdownPremium = Number(d.totalPremiumRequests) || 0;
+        shutdownNanoAiu = Number(d.totalNanoAiu) || 0;
+      }
+    }
+  }
+
+  // Fallback: no per-call usage events (e.g. only the canonical events.jsonl was
+  // provided). Reconstruct from session.shutdown.modelMetrics. This cannot split
+  // inline sub-agents (they roll up by model), so attribute by model into MAIN
+  // and warn.
+  if (usageEventCount === 0) {
+    warnings.push(
+      "No per-call `assistant.usage` events found — falling back to `session.shutdown.modelMetrics`. " +
+        "Per-scope main-vs-sub AIU split is unavailable from this source (inline sub-agents roll up by " +
+        "model). See `subAgentRuns` for sub-agent count + per-sub total tokens, and `models` for the " +
+        "exact per-model AIU (which separates main from sub when they run on different models). " +
+        "Capture the SDK event stream (per-call `assistant.usage`) for a per-scope split.",
+    );
+    reconstructFromShutdowns(events, main, subByTool, subMeta, modelTotals);
+  }
+
+  // Finalize per-model.
+  const models: Record<string, CostBreakdown> = {};
+  for (const [model, c] of modelTotals) {
+    finalizeCost(c);
+    models[model] = c;
+  }
+
+  // Finalize main + subs.
+  finalizeCost(main);
+  const subAgents: SubAgentCost[] = [];
+  const subAgentsTotal = emptyCost();
+  for (const [toolCallId, c] of subByTool) {
+    // Aggregate into total BEFORE finalizing c (still raw).
+    subAgentsTotal.inputTokens += c.inputTokens;
+    subAgentsTotal.cachedTokens += c.cachedTokens;
+    subAgentsTotal.cacheWriteTokens += c.cacheWriteTokens;
+    subAgentsTotal.outputTokens += c.outputTokens;
+    subAgentsTotal.reasoningTokens += c.reasoningTokens;
+    subAgentsTotal.grossInputTokens += c.grossInputTokens;
+    subAgentsTotal.nanoAiu += c.nanoAiu;
+    subAgentsTotal.apiCalls += c.apiCalls;
+
+    finalizeCost(c);
+    const meta = subMeta.get(toolCallId);
+    subAgents.push({
+      ...c,
+      toolCallId,
+      agentName: meta?.agentName || taskName.get(toolCallId) || undefined,
+      model: meta?.model || dominantModel(toolCallId, events),
+      durationMs: meta?.durationMs,
+    });
+  }
+  finalizeCost(subAgentsTotal);
+
+  // total = main + subAgentsTotal.
+  const total = emptyCost();
+  for (const c of [main, subAgentsTotal]) {
+    total.inputTokens += c.inputTokens;
+    total.cachedTokens += c.cachedTokens;
+    total.cacheWriteTokens += c.cacheWriteTokens;
+    total.outputTokens += c.outputTokens;
+    total.reasoningTokens += c.reasoningTokens;
+    total.grossInputTokens += c.grossInputTokens;
+    total.nanoAiu += c.nanoAiu;
+    total.apiCalls += c.apiCalls;
+  }
+  finalizeCost(total);
+
+  // Cross-check against the canonical session total.
+  if (shutdownNanoAiu > 0 && total.nanoAiu > 0) {
+    const diff = Math.abs(total.nanoAiu - shutdownNanoAiu) / shutdownNanoAiu;
+    if (diff > tolerance) {
+      warnings.push(
+        `Per-call cost (${total.nanoAiu} nAIU) differs from session.shutdown.totalNanoAiu ` +
+          `(${shutdownNanoAiu} nAIU) by ${(diff * 100).toFixed(1)}%.`,
+      );
+    }
+  }
+
+  // Sort sub-agents by cost descending for stable, useful output.
+  subAgents.sort((a, b) => b.nanoAiu - a.nanoAiu);
+
+  // Resolve friendly names for the subagent.completed runs (prefer the user's
+  // own `task` label over the generic agent display name).
+  for (const run of subRuns) {
+    if (run.toolCallId) {
+      run.name = taskName.get(run.toolCallId) || subMeta.get(run.toolCallId)?.agentName || undefined;
+    }
+  }
+
+  return {
+    main,
+    subAgents,
+    subAgentsTotal,
+    total,
+    models,
+    subAgentRuns: subRuns,
+    subAgentCount: Math.max(subAgents.length, subRuns.length),
+    premiumRequests: shutdownPremium,
+    sessionIds: [...sessionIds],
+    warnings,
+  };
+}
+
+/** Best-effort model for a sub-agent: the model of its usage events. */
+function dominantModel(parentToolCallId: string, events: CopilotEvent[]): string | undefined {
+  const counts = new Map<string, number>();
+  for (const ev of events) {
+    if (ev?.type === "assistant.usage" && ev.data?.parentToolCallId === parentToolCallId && ev.data?.model) {
+      counts.set(ev.data.model, (counts.get(ev.data.model) || 0) + 1);
+    }
+  }
+  let best: string | undefined;
+  let bestN = 0;
+  for (const [m, n] of counts) if (n > bestN) ((best = m), (bestN = n));
+  return best;
+}
+
+/** Fallback reconstruction from `session.shutdown` events (no per-call data). */
+function reconstructFromShutdowns(
+  events: CopilotEvent[],
+  main: MutableCost,
+  subByTool: Map<string, MutableCost>,
+  subMeta: Map<string, { agentName?: string; model?: string; durationMs?: number }>,
+  modelTotals: Map<string, MutableCost>,
+): void {
+  let routineSeen = false;
+  let subIndex = 0;
+  for (const ev of events) {
+    if (ev?.type !== "session.shutdown" || !ev.data) continue;
+    const d: any = ev.data;
+    const isRoutine = d.shutdownType === "routine";
+    const target = isRoutine
+      ? main
+      : (() => {
+          const key = `separate-session-${subIndex++}`;
+          const c = emptyCost();
+          subByTool.set(key, c);
+          subMeta.set(key, { agentName: "separate-session sub-agent" });
+          return c;
+        })();
+
+    if (isRoutine) {
+      // Count the main session once; skip any extra routine shutdowns (e.g. a
+      // --resume continuation) so they don't double-count.
+      if (routineSeen) continue;
+      routineSeen = true;
+    }
+
+    const mm = d.modelMetrics || {};
+    for (const [model, metricsRaw] of Object.entries(mm)) {
+      const m: any = metricsRaw;
+      const usage = m?.usage || {};
+      const gross = Number(usage.inputTokens) || 0; // GROSS in modelMetrics
+      const cacheRead = Number(usage.cacheReadTokens) || 0;
+      const cacheWrite = Number(usage.cacheWriteTokens) || 0;
+      const freshInput = Math.max(0, gross - cacheRead - cacheWrite);
+      const output = Number(usage.outputTokens) || 0;
+      const reasoning = Number(usage.reasoningTokens) || 0;
+      const nano = Number(m?.totalNanoAiu) || 0;
+
+      target.inputTokens += freshInput;
+      target.cachedTokens += cacheRead;
+      target.cacheWriteTokens += cacheWrite;
+      target.outputTokens += output;
+      target.reasoningTokens += reasoning;
+      target.grossInputTokens += gross;
+      target.nanoAiu += nano;
+      target.apiCalls += Number(m?.requests?.count) || 0;
+
+      if (!modelTotals.has(model)) modelTotals.set(model, emptyCost());
+      const mt = modelTotals.get(model)!;
+      mt.inputTokens += freshInput;
+      mt.cachedTokens += cacheRead;
+      mt.cacheWriteTokens += cacheWrite;
+      mt.outputTokens += output;
+      mt.reasoningTokens += reasoning;
+      mt.grossInputTokens += gross;
+      mt.nanoAiu += nano;
+      mt.apiCalls += Number(m?.requests?.count) || 0;
+    }
+  }
+}
+
+// ─────────────────────────────────────────────────────────────────────────────
+// Formatting
+// ─────────────────────────────────────────────────────────────────────────────
+
+function fmtTokens(n: number): string {
+  if (n >= 1_000_000) return `${(n / 1_000_000).toFixed(2)}m`;
+  if (n >= 1_000) return `${(n / 1_000).toFixed(1)}k`;
+  return String(n);
+}
+
+function costLine(label: string, c: CostBreakdown): string {
+  return (
+    `${label.padEnd(16)} ` +
+    `in ${fmtTokens(c.inputTokens).padStart(8)}  ` +
+    `cache(r) ${fmtTokens(c.cachedTokens).padStart(8)}  ` +
+    `cache(w) ${fmtTokens(c.cacheWriteTokens).padStart(8)}  ` +
+    `out ${fmtTokens(c.outputTokens).padStart(8)}  ` +
+    `${c.aiCreditCost.toFixed(2).padStart(10)} AIU`
+  );
+}
+
+/** Render a human-readable report (handy for CLIs / logs). */
+export function formatReport(report: SessionCostReport): string {
+  const lines: string[] = [];
+  lines.push("Copilot session cost — tokens + AI credits (AIU), straight from the logs");
+  lines.push("".padEnd(96, "─"));
+  lines.push(costLine("MAIN agent", report.main));
+  for (const s of report.subAgents) {
+    const name = s.agentName ? ` ${s.agentName}` : "";
+    const model = s.model ? ` (${s.model})` : "";
+    lines.push(costLine(`SUB${name}${model}`.slice(0, 16), s));
+  }
+  if (report.subAgents.length > 1) lines.push(costLine("SUB total", report.subAgentsTotal));
+  lines.push("".padEnd(96, "─"));
+  lines.push(costLine("TOTAL", report.total));
+  if (report.premiumRequests != null) lines.push(`premium requests: ${report.premiumRequests}`);
+  // Sub-agent runs (always available from subagent.completed; the only sub view
+  // for plain CLI logs). Shown when the per-call split didn't already cover them.
+  if (report.subAgentRuns.length > 0 && report.subAgents.length === 0) {
+    lines.push(`sub-agents: ${report.subAgentCount} (total tokens only — per-sub AIU needs the SDK stream)`);
+    for (const r of report.subAgentRuns) {
+      const flag = r.status === "failed" ? "  [FAILED]" : "";
+      lines.push(
+        `  • ${(r.name || "sub").slice(0, 24).padEnd(24)} ${(r.model || "?").padEnd(18)} ` +
+          `${fmtTokens(r.totalTokens).padStart(8)} tok  ${r.durationMs ?? "?"}ms${flag}`,
+      );
+    }
+  }
+  if (report.sessionIds.length) lines.push(`sessions: ${report.sessionIds.join(", ")}`);
+  for (const w of report.warnings) lines.push(`⚠ ${w}`);
+  return lines.join("\n");
+}
+
+// ─────────────────────────────────────────────────────────────────────────────
+// Node helpers (require node:fs / node:path)
+// ─────────────────────────────────────────────────────────────────────────────
+
+/** Analyze a single `.jsonl` file path. (Node only.) */
+export async function analyzeJsonlFile(filePath: string, options?: CostOptions): Promise<SessionCostReport> {
+  const { readFileSync } = await import("node:fs");
+  return analyzeEvents(parseJsonl(readFileSync(filePath, "utf-8")), options);
+}
+
+/**
+ * Analyze a session directory, auto-discovering the relevant logs. (Node only.)
+ * Reads, when present and de-duplicated:
+ *   - any `*-events.jsonl` / `events.jsonl` at the top level (an exported SDK stream)
+ *   - `<dir>/**\/.copilot/session-state/<id>/events.jsonl` (the canonical logs)
+ *   - a directly-passed `.jsonl` file
+ * It concatenates their events and calls `analyzeEvents` once (safe — see the
+ * module header: shutdown summaries don't double-count per-call credits).
+ */
+export async function analyzeCopilotSession(pathOrDir: string, options?: CostOptions): Promise<SessionCostReport> {
+  const fs = await import("node:fs");
+  const path = await import("node:path");
+
+  const stat = fs.statSync(pathOrDir);
+  const files: string[] = [];
+
+  if (stat.isFile()) {
+    files.push(pathOrDir);
+  } else {
+    // Collect any exported SDK stream(s) + a top-level canonical events.jsonl.
+    for (const entry of fs.readdirSync(pathOrDir)) {
+      if (entry.endsWith("-events.jsonl") || entry === "events.jsonl") files.push(path.join(pathOrDir, entry));
+    }
+    // Walk for canonical session-state events.jsonl.
+    walkForSessionState(fs, path, pathOrDir, files);
+  }
+
+  // De-duplicate file paths.
+  const unique = [...new Set(files.map((f) => path.resolve(f)))];
+  const allEvents: CopilotEvent[] = [];
+  const seenEventIds = new Set<string>();
+  for (const f of unique) {
+    let text: string;
+    try {
+      text = fs.readFileSync(f, "utf-8");
+    } catch {
+      continue;
+    }
+    for (const ev of parseJsonl(text)) {
+      // Guard against the same event appearing in two copied files.
+      const id = typeof ev.id === "string" ? ev.id : "";
+      if (id && seenEventIds.has(id)) continue;
+      if (id) seenEventIds.add(id);
+      allEvents.push(ev);
+    }
+  }
+  const report = analyzeEvents(allEvents, options);
+  if (unique.length === 0) report.warnings.push(`No event logs found under ${pathOrDir}.`);
+  return report;
+}
+
+function walkForSessionState(
+  fs: typeof import("node:fs"),
+  path: typeof import("node:path"),
+  dir: string,
+  out: string[],
+  depth = 0,
+): void {
+  if (depth > 8) return;
+  let entries: import("node:fs").Dirent[];
+  try {
+    entries = fs.readdirSync(dir, { withFileTypes: true });
+  } catch {
+    return;
+  }
+  for (const e of entries) {
+    if (!e.isDirectory()) continue;
+    const full = path.join(dir, e.name);
+    if (e.name === "session-state") {
+      // session-state/<sessionId>/events.jsonl
+      for (const sub of fs.readdirSync(full, { withFileTypes: true })) {
+        if (sub.isDirectory()) {
+          const ev = path.join(full, sub.name, "events.jsonl");
+          if (fs.existsSync(ev)) out.push(ev);
+        }
+      }
+    } else if (e.name !== "node_modules" && e.name !== ".git") {
+      walkForSessionState(fs, path, full, out, depth + 1);
+    }
+  }
+}
diff --git a/src/tools/cost-module/src/index.ts b/src/tools/cost-module/src/index.ts
new file mode 100644
index 0000000..f1cc6ee
--- /dev/null
+++ b/src/tools/cost-module/src/index.ts
@@ -0,0 +1 @@
+export * from "./copilot-cost.js";
diff --git a/src/tools/cost-module/tsconfig.json b/src/tools/cost-module/tsconfig.json
new file mode 100644
index 0000000..e4b219a
--- /dev/null
+++ b/src/tools/cost-module/tsconfig.json
@@ -0,0 +1,17 @@
+{
+  "compilerOptions": {
+    "target": "ES2022",
+    "module": "NodeNext",
+    "moduleResolution": "NodeNext",
+    "lib": ["ES2022"],
+    "declaration": true,
+    "outDir": "./dist",
+    "rootDir": "./src",
+    "strict": true,
+    "esModuleInterop": true,
+    "skipLibCheck": true,
+    "forceConsistentCasingInFileNames": true
+  },
+  "include": ["src/**/*.ts"],
+  "exclude": ["node_modules", "dist", "examples"]
+}

From c3b69779abb375e122eefd2d8cf3bff841f8b786 Mon Sep 17 00:00:00 2001
From: Dinah Gao <xiaomgao@microsoft.com>
Date: Fri, 12 Jun 2026 16:52:44 +0800
Subject: [PATCH 2/3] sharpen

---
 src/tools/cost-module/examples/analyze-run.ts | 76 ++++++++-----------
 1 file changed, 33 insertions(+), 43 deletions(-)

diff --git a/src/tools/cost-module/examples/analyze-run.ts b/src/tools/cost-module/examples/analyze-run.ts
index 019720b..57d6443 100644
--- a/src/tools/cost-module/examples/analyze-run.ts
+++ b/src/tools/cost-module/examples/analyze-run.ts
@@ -1,52 +1,42 @@
 /**
- * Example: analyze the cost of a recorded Copilot session and print a report.
+ * Example: analyze your most recent Copilot CLI session and print a report.
  *
- * Run (Node >= 22):  node --experimental-strip-types examples/analyze-run.ts
+ * Run (Node >= 22):  node examples/analyze-run.ts
  * Or with tsx:       npx tsx examples/analyze-run.ts
  *
- * It points at a checked-in sample session (here, a benchmark trial):
- *   agent-benchmark/results/run1/calc_subagent-cost-test_o46_i1/session-logs-dir
+ * It auto-discovers the newest ~/.copilot/session-state/<id>/events.jsonl on
+ * this machine. Run any `copilot` session first (and exit it cleanly), then
+ * run this. To analyze a specific log instead, pass its path as an argument.
  */
-import { analyzeCopilotSession, formatReport } from "../src/copilot-cost.ts";
-import { fileURLToPath } from "node:url";
-import { dirname, resolve } from "node:path";
+import { analyzeJsonlFile, formatReport } from "../src/copilot-cost.ts";
+import { existsSync, readdirSync, statSync } from "node:fs";
+import { homedir } from "node:os";
+import { join } from "node:path";
 
-const here = dirname(fileURLToPath(import.meta.url));
-const trialDir = resolve(
-  here,
-  "../../results/run1/calc_subagent-cost-test_o46_i1/session-logs-dir",
-);
+function findLatestSessionLog(): string | undefined {
+  const root = join(homedir(), ".copilot", "session-state");
+  if (!existsSync(root)) return undefined;
+  let newest: { path: string; mtime: number } | undefined;
+  for (const id of readdirSync(root)) {
+    const events = join(root, id, "events.jsonl");
+    if (!existsSync(events)) continue;
+    const mtime = statSync(events).mtimeMs;
+    if (!newest || mtime > newest.mtime) newest = { path: events, mtime };
+  }
+  return newest?.path;
+}
 
-const report = await analyzeCopilotSession(trialDir);
+const target = process.argv[2] || findLatestSessionLog();
 
+if (!target) {
+  console.error(
+    "No Copilot session log found.\n" +
+      "Run a `copilot` session first (exit it cleanly with /exit), then re-run this.\n" +
+      "Or pass a path:  node examples/analyze-run.ts <path-to-events.jsonl>",
+  );
+  process.exit(1);
+}
+
+console.log(`Analyzing: ${target}\n`);
+const report = await analyzeJsonlFile(target);
 console.log(formatReport(report));
-console.log("\n--- machine-readable ---\n");
-console.log(
-  JSON.stringify(
-    {
-      main: {
-        inputTokens: report.main.inputTokens,
-        outputTokens: report.main.outputTokens,
-        cachedTokens: report.main.cachedTokens,
-        aiCreditCost: report.main.aiCreditCost,
-      },
-      subAgents: report.subAgents.map((s) => ({
-        agentName: s.agentName,
-        model: s.model,
-        inputTokens: s.inputTokens,
-        outputTokens: s.outputTokens,
-        cachedTokens: s.cachedTokens,
-        aiCreditCost: s.aiCreditCost,
-      })),
-      total: {
-        inputTokens: report.total.inputTokens,
-        outputTokens: report.total.outputTokens,
-        cachedTokens: report.total.cachedTokens,
-        aiCreditCost: report.total.aiCreditCost,
-      },
-      premiumRequests: report.premiumRequests,
-    },
-    null,
-    2,
-  ),
-);

From 05d94a8a9d06c2d9154ebec40ea9a9c948d4a431 Mon Sep 17 00:00:00 2001
From: Dinah Gao <xiaomgao@microsoft.com>
Date: Fri, 12 Jun 2026 16:55:53 +0800
Subject: [PATCH 3/3] update readme

---
 src/tools/cost-module/README.md | 396 +++++++++-----------------------
 1 file changed, 106 insertions(+), 290 deletions(-)

diff --git a/src/tools/cost-module/README.md b/src/tools/cost-module/README.md
index 6133dd2..f64df0f 100644
--- a/src/tools/cost-module/README.md
+++ b/src/tools/cost-module/README.md
@@ -1,349 +1,165 @@
 # copilot-cost
 
-A tiny, **zero-dependency TypeScript module** that computes the token usage and
-**AI-credit (AIU) cost** of a GitHub Copilot CLI / Copilot SDK session, split
-between the **main agent** and any **sub-agents**.
+Work out how many **tokens** and **AI credits (AIU)** a GitHub Copilot session
+used — split between the **main agent** and its **sub-agents**. Tiny,
+zero-dependency TypeScript. Reads the JSONL logs Copilot already writes.
 
-For each scope (main, each sub-agent, and total) it reports:
+It reports, for the main agent / each sub-agent / the total:
 
 | Field | Meaning |
 |-------|---------|
-| `inputTokens` | Fresh, **uncached** prompt tokens (billed at the base input rate) |
-| `cachedTokens` | Prompt tokens served from cache (`cache_read`, billed cheaply) |
-| `cacheWriteTokens` | Prompt tokens written to cache (`cache_write`, billed at a premium) |
-| `outputTokens` | Generated tokens (includes reasoning tokens) |
-| `grossInputTokens` | `inputTokens + cachedTokens + cacheWriteTokens` (total prompt) |
-| `aiCreditCost` | **AI credit cost in AIU** (the headline number — exact, billed by the CLI) |
-| `nanoAiu` | Raw billed cost in nano-AIU (1e-9 AIU), straight from the logs |
-
-> The CLI denominates cost only in **AIU** (nano-AIU). There are **no dollar
-> amounts in the logs**, so this module does not invent a currency conversion —
-> it reports AIU, which is exact. Apply your own AIU→USD rate downstream if you
-> need one.
-
-It works in **any TypeScript/JavaScript runtime** (the pure functions have no
-imports). Optional `analyze*File` / `analyze*Dir` helpers use Node's `fs`.
+| `inputTokens` | Fresh, uncached prompt tokens |
+| `cachedTokens` | Prompt tokens read from cache (cheap) |
+| `cacheWriteTokens` | Prompt tokens written to cache (priciest prompt tier) |
+| `outputTokens` | Generated tokens |
+| `aiCreditCost` | **AI credits (AIU)** — the headline cost, taken straight from the logs |
 
----
-
-## Quick start
-
-```ts
-import { analyzeCopilotSession, formatReport } from "copilot-cost";
-
-// Point at a recorded session/trial directory (auto-discovers the logs):
-const report = await analyzeCopilotSession("path/to/session-logs-dir");
-
-console.log(formatReport(report));
-
-report.main.aiCreditCost;     // main agent AI credits (AIU)
-report.subAgents[0].cachedTokens;
-report.total.nanoAiu;         // whole-session raw cost (nano-AIU)
-```
-
-Pure (no filesystem — pass events you already have):
-
-```ts
-import { parseJsonl, analyzeEvents } from "copilot-cost";
+> **Why no $?** The logs only contain AIU (the CLI's billing unit), never
+> dollars. The module reports AIU exactly and does not invent an exchange rate.
 
-const events = parseJsonl(jsonlText);   // string with one JSON object per line
-const report = analyzeEvents(events);
-```
+---
 
-Run the bundled example against the checked-in sample trial:
+## Quick start (2 minutes)
 
-```bash
-node examples/analyze-run.ts        # Node >= 22 (native TS), or: npx tsx examples/analyze-run.ts
+```powershell
+cd C:\ado\win-dev-skills\src\tools\cost-module
+npm install                      # one-time
+node examples/analyze-run.ts     # analyzes your most recent Copilot session
 ```
 
----
+You'll see a table like:
 
-## Where the data comes from (read this)
-
-A Copilot CLI session writes **two complementary JSONL logs**. This module reads
-both for full accuracy; it is safe to feed both to `analyzeEvents` (credits are
-taken from the per-call events; the session summary only adds `premiumRequests`
-and a cross-check, so nothing is double-counted).
-
-### 1. The SDK event stream (e.g. an exported `*-events.jsonl`)
-
-The Copilot SDK emits this stream; a harness may export it to a file. It is the
-**only** source with **per-API-call** usage events, and the **only** way to
-reliably separate the main agent from inline sub-agents.
-
-Look for events with `type: "assistant.usage"`:
-
-```jsonc
-{
-  "type": "assistant.usage",
-  "data": {
-    "model": "claude-opus-4.6",
-    "inputTokens": 18631,          // GROSS prompt tokens (already includes cache)
-    "outputTokens": 554,
-    "cacheReadTokens": 0,
-    "cacheWriteTokens": 18628,
-    "reasoningTokens": 213,
-    "parentToolCallId": "toolu_…",  // PRESENT => this call belongs to a SUB-AGENT
-                                    // ABSENT  => this call is the MAIN agent
-    "copilotUsage": {
-      "tokenDetails": [
-        { "tokenType": "input",       "tokenCount": 3,     "batchSize": 1000000, "costPerBatch": 500000000000 },
-        { "tokenType": "cache_read",  "tokenCount": 0,     "batchSize": 1000000, "costPerBatch": 50000000000 },
-        { "tokenType": "cache_write", "tokenCount": 18628, "batchSize": 1000000, "costPerBatch": 625000000000 },
-        { "tokenType": "output",      "tokenCount": 554,   "batchSize": 1000000, "costPerBatch": 2500000000000 }
-      ],
-      "totalNanoAiu": 13029000000   // EXACT billed cost of THIS call (nano-AIU)
-    }
-  }
-}
 ```
-
-Sub-agent **names / models** come from the same file:
-
-- `tool.execution_start` where `data.toolName === "task"` →
-  `data.toolCallId` maps to `data.arguments.{name, description, agent_type}`
-- `subagent.completed` / `subagent.failed` →
-  `data.{toolCallId, agentName, agentDisplayName, model, totalTokens, durationMs}`
-
-### 2. The canonical session log — `~/.copilot/session-state/<sessionId>/events.jsonl`
-
-The **only** file with the session-end summary. Look for
-`type: "session.shutdown"` with `data.shutdownType === "routine"`:
-
-```jsonc
-{
-  "type": "session.shutdown",
-  "data": {
-    "shutdownType": "routine",
-    "totalPremiumRequests": 3,
-    "totalNanoAiu": 156131000000,   // whole-session billed cost
-    "tokenDetails": {               // session totals (fresh input / cache / output)
-      "input": { "tokenCount": 125607 },
-      "cache_read": { "tokenCount": 814464 },
-      "cache_write": { "tokenCount": 67884 },
-      "output": { "tokenCount": 31435 }
-    },
-    "modelMetrics": {
-      "claude-opus-4.6": {
-        "usage": { "inputTokens": 470721, "outputTokens": 4712,
-                   "cacheReadTokens": 402816, "cacheWriteTokens": 67884 },
-        "totalNanoAiu": 74358800000   // <-- note: usage.inputTokens here is GROSS
-      }
-    }
-  }
-}
+MAIN agent   in 38   cache(r) 74.5k  cache(w) 77.0k  out 811     20.97 AIU
+TOTAL        in 38   cache(r) 74.5k  cache(w) 77.0k  out 811     20.97 AIU
+premium requests: 3
+sub-agents: 3 (total tokens only — per-sub AIU needs the SDK stream)
+  • Worker 2   claude-haiku-4.5   20.4k tok  6471ms
+  • Worker 1   claude-haiku-4.5   20.4k tok  7022ms
+  • Worker 3   claude-haiku-4.5   24.6k tok  7406ms
 ```
 
-> A sub-agent that runs as its **own session** appears here as a
-> `session.shutdown` **without** a `shutdownType` field.
-
-The module uses this file for `premiumRequests` and as a cross-check against the
-summed per-call cost.
+Requires Node ≥ 22 (runs TypeScript natively). No build step needed.
 
 ---
 
-## How the cost is computed (read straight from the logs — no price table)
-
-The CLI denominates every cost in **nano-AIU** (1e-9 AI Units), so that is the
-only cost unit the data contains. This module applies **no price table and no
-currency conversion**.
-
-**Per call** the cost in nano-AIU is
-
-```
-nanoAiu = Σ_type ( tokenCount / batchSize × costPerBatch )
-```
-
-which is exactly the value the CLI already reports as
-`copilotUsage.totalNanoAiu`. The module sums `totalNanoAiu` directly (and falls
-back to the formula above only if that field is missing).
+## Where do the logs come from?
 
-**AI credits (AIU) — exact.** AIU is just nano-AIU unscaled (the field is
-literally named `totalNanoAiu`, and "nano" = 1e-9), so this is not derived or
-estimated:
+Every Copilot CLI session writes a log here automatically when it **finishes**:
 
 ```
-1 AIU = 1e9 nano-AIU      →  aiCreditCost = nanoAiu / 1e9
+~/.copilot/session-state/<sessionId>/events.jsonl
 ```
 
-**No USD.** The logs contain **no dollar amounts** — every cost field is in
-nano-AIU. Converting to USD would require an AIU→USD rate that is **not in the
-data**, so this module deliberately does not do it. If you need a currency,
-multiply `aiCreditCost` by your own contract rate downstream.
-
-### Main vs. sub-agent split
+So the normal workflow is: **chat as usual → exit cleanly with `/exit` → analyze
+the log.** (⚠️ If you just close the terminal, the log may not be written.)
 
-The robust split is per-call, from the SDK event stream:
+### Make a test session with 3 sub-agents, then analyze it
 
-- `assistant.usage` **without** `parentToolCallId` → **main agent**
-- `assistant.usage` **with** `parentToolCallId` → **sub-agent**; grouped by
-  `parentToolCallId` so each sub-agent invocation gets its own line
+This is the exact recipe we use to test the module end-to-end:
 
-This works for **inline** sub-agents (spawned via the `task` tool, which share
-the parent session) — the common case. If only the canonical log is available,
-the module falls back to `session.shutdown.modelMetrics` and emits a warning,
-because inline sub-agents there roll up by **model**, not by scope.
+```powershell
+# 1. a throwaway working dir + a known session id
+$work = Join-Path $env:TEMP "cc-test-$(Get-Random)"; New-Item -ItemType Directory $work | Out-Null; Set-Location $work
+$sid  = [guid]::NewGuid().ToString()
 
-### Token categories
+# 2. run non-interactively and force 3 parallel sub-agents
+$prompt = "You MUST use the 'task' tool to launch exactly 3 sub-agents in parallel in a single turn. " +
+          "Give each one this instruction: 'Reply with one line: WORKER OK'. " +
+          "Do not do the work yourself. After all three return, print: ALL DONE."
+copilot -p $prompt --allow-all-tools --output-format json --session-id $sid > stdout.jsonl
 
-The five categories are **non-overlapping** and map directly to the provider's
-billing tiers, so `inputTokens + cachedTokens + cacheWriteTokens = grossInputTokens`.
+# 3. analyze that session's log
+$events = Join-Path $env:USERPROFILE ".copilot/session-state/$sid/events.jsonl"
+cd C:\ado\win-dev-skills\src\tools\cost-module
+node examples/analyze-run.ts $events
+```
 
-> Note: the raw `assistant.usage.data.inputTokens` field is **gross** (it already
-> includes cached + cache-write). This module exposes both the non-overlapping
-> `inputTokens` (fresh only) **and** `grossInputTokens`, so you can use whichever
-> your report needs.
+Flags used: `-p` = non-interactive (exits when done), `--allow-all-tools` =
+required for `-p` (otherwise it waits for permission prompts), `--session-id` =
+so you know which folder to read.
 
 ---
 
-## Validation
+## Use it in your own code
 
-Running against the checked-in sample trial
-(`agent-benchmark/results/run1/calc_subagent-cost-test_o46_i1/session-logs-dir`):
+```ts
+import { analyzeJsonlFile, formatReport } from "copilot-cost"; // or "../src/copilot-cost.ts" in-repo
 
-```
-MAIN agent  in 21      cache(r) 402.8k  cache(w) 67.9k  out 4.7k    74.36 AIU
-SUB (gpt-5.4) in 125.6k cache(r) 411.6k  cache(w) 0      out 26.7k   81.77 AIU
-TOTAL       in 125.6k  cache(r) 814.5k  cache(w) 67.9k  out 31.4k  156.13 AIU
-premium requests: 3
+const report = await analyzeJsonlFile("path/to/events.jsonl");
+
+console.log(formatReport(report));      // pretty table
+report.total.aiCreditCost;              // total AI credits (AIU)
+report.main.inputTokens;                // main agent's fresh input tokens
+report.subAgentCount;                   // how many sub-agents ran
+report.models["claude-haiku-4.5"]?.aiCreditCost;  // exact AIU per model
 ```
 
-Every number ties out to the canonical `session.shutdown`:
+No file handy? Pass events you already have in memory:
 
-- `total.aiCreditCost` 156.13 AIU == `totalNanoAiu` `156131000000`
-- `main` 74.36 AIU == `modelMetrics["claude-opus-4.6"].totalNanoAiu` `74358800000`
-- token totals (125607 / 814464 / 67884 / 31435) == the shutdown `tokenDetails`
-- `premiumRequests` 3 == `totalPremiumRequests`
+```ts
+import { parseJsonl, analyzeEvents } from "copilot-cost";
+const report = analyzeEvents(parseJsonl(jsonlText));
+```
 
 ---
 
-## API
-
-### Pure (any runtime)
+## Good to know
 
-| Function | Description |
-|----------|-------------|
-| `parseJsonl(text): CopilotEvent[]` | Parse JSONL, skipping blank/malformed lines |
-| `analyzeEvents(events, options?): SessionCostReport` | Core analysis; accepts events from either or both logs |
-| `nanoAiuFromTokenDetails(tokenDetails): number` | Cost of a `tokenDetails` array (fallback) |
-| `formatReport(report): string` | Human-readable table |
+- **AIU is exact.** It comes from the CLI's own `totalNanoAiu` (`AIU = nanoAiu / 1e9`).
+  No price table, nothing to keep up to date.
+- **Per-agent AIU split needs the richer "SDK stream".** A plain CLI log can't
+  attribute AIU to individual sub-agents, so the module gives you the next best
+  things from it: exact **session totals**, **sub-agent count + per-sub tokens**
+  (`subAgentRuns`), and **per-model** AIU (`models`) — which already separates
+  main from subs when they run on different models (the common case). For a true
+  per-sub-agent AIU split, capture the SDK event stream (per-call
+  `assistant.usage` events, e.g. via `@github/copilot-sdk`).
+- **`input` is only the *new* tokens.** The full prompt is
+  `input + cache(r) + cache(w)` — also available as `report.main.grossInputTokens`.
 
-### Node (require `node:fs`)
-
-| Function | Description |
-|----------|-------------|
-| `analyzeJsonlFile(path, options?)` | Analyze a single `.jsonl` file |
-| `analyzeCopilotSession(pathOrDir, options?)` | Auto-discover `*-events.jsonl` + `.copilot/session-state/**/events.jsonl` under a dir (or analyze a single file), de-duplicate by event id, and report |
+---
 
-### Options
+## API
 
-```ts
-interface CostOptions {
-  reconcileTolerance?: number; // sanity-check tolerance vs session.shutdown total (default 0.01 = 1%)
-}
-```
+| Function | Use |
+|----------|-----|
+| `analyzeJsonlFile(path)` | Analyze one `.jsonl` log file (Node) |
+| `analyzeCopilotSession(dir)` | Auto-discover logs under a folder and analyze (Node) |
+| `parseJsonl(text)` → `analyzeEvents(events)` | Pure, runtime-agnostic (no filesystem) |
+| `formatReport(report)` | Render the report as a text table |
 
-### Result shape
+`SessionCostReport` shape:
 
 ```ts
 interface SessionCostReport {
-  main: CostBreakdown;            // main agent
-  subAgents: SubAgentCost[];      // per-call AIU split (SDK stream only; sorted by cost desc)
-  subAgentsTotal: CostBreakdown;  // aggregate of all sub-agents
-  total: CostBreakdown;           // main + all sub-agents (== session billed total)
-  models: Record<string, CostBreakdown>;  // per-model rollup (exact per-model AIU)
-  subAgentRuns: SubAgentRun[];    // from subagent.completed; available for plain CLI logs too
-  subAgentCount: number;          // best available sub-agent count
-  premiumRequests?: number;       // from session.shutdown
+  main: CostBreakdown;                     // main agent
+  subAgents: SubAgentCost[];               // per-sub AIU split (SDK stream only)
+  subAgentsTotal: CostBreakdown;           // all sub-agents combined
+  total: CostBreakdown;                    // main + subs (== session total)
+  models: Record<string, CostBreakdown>;   // exact AIU per model
+  subAgentRuns: SubAgentRun[];             // sub-agent count + per-sub tokens (works on plain CLI logs)
+  subAgentCount: number;
+  premiumRequests?: number;
   sessionIds: string[];
-  warnings: string[];             // e.g. cross-check mismatch, missing per-call data
+  warnings: string[];                      // e.g. "no per-call data, using fallback"
 }
 
 interface CostBreakdown {
-  inputTokens: number; cachedTokens: number; cacheWriteTokens: number;
-  outputTokens: number; reasoningTokens: number; grossInputTokens: number;
-  nanoAiu: number; aiCreditCost: number; apiCalls: number;
-}
-
-interface SubAgentCost extends CostBreakdown {
-  toolCallId: string; agentName?: string; model?: string; durationMs?: number;
-}
-
-// From subagent.completed / subagent.failed events. Combined token count only
-// (no input/output/cache breakdown, no per-sub AIU). Present in BOTH the SDK
-// stream and a plain CLI session's on-disk events.jsonl.
-interface SubAgentRun {
-  toolCallId?: string; name?: string; model?: string;
-  totalTokens: number; durationMs?: number; status: "completed" | "failed";
+  inputTokens; cachedTokens; cacheWriteTokens; outputTokens;
+  reasoningTokens; grossInputTokens;       // token counts
+  nanoAiu; aiCreditCost; apiCalls;         // cost
 }
 ```
 
 ---
 
-## Using it with a plain Copilot CLI session (no harness)
-
-You can capture a log the module reads from a bare `copilot` command. **Run the
-session to completion**, then point the module at the session-state folder.
-
-Where the cost data lands for a plain CLI session:
-
-| Source | Has what | Good for |
-|--------|----------|----------|
-| `~/.copilot/session-state/<sessionId>/events.jsonl` (written automatically) | `session.shutdown` (exact **token totals + AIU + premium** + per-model `modelMetrics`) **and** `subagent.completed` (sub-agent **count + per-sub total tokens + model + duration**) | Exact session totals, sub-agent count/tokens, and per-**model** AIU |
-| `copilot --output-format json` (stdout you redirect) | leaner stream: `result` (premium, durations) + `assistant.message` (output tokens) + `subagent.completed` | sub-agent count + output tokens only |
-
-> **Important fidelity note.** A plain CLI session's logs do **not** contain the
-> per-call `assistant.usage` events, so the module cannot produce a per-**scope**
-> (main-vs-sub) **AIU** split from them. You still get: exact **session totals**,
-> the **sub-agent count + per-sub total tokens** (`subAgentRuns`), and the exact
-> **per-model** AIU (`models`) — which separates main from sub whenever they run
-> on different models. A precise per-scope AIU split requires the SDK event
-> stream (per-call `assistant.usage`), e.g. captured via `@github/copilot-sdk`.
-
-### Make a multi-sub-agent session, then analyze it
-
-```powershell
-# 1. fresh working dir + a known session id
-$work = Join-Path $env:TEMP "cc-test-$(Get-Random)"; New-Item -ItemType Directory $work | Out-Null; Set-Location $work
-$sid  = [guid]::NewGuid().ToString()
-
-# 2. run non-interactively; force 3 parallel sub-agents via the task tool
-$prompt = "You MUST use the 'task' tool to launch exactly 3 sub-agents in parallel in a single turn. " +
-          "Give each one this exact instruction: 'Reply with one line: WORKER OK'. " +
-          "Do not do the work yourself. After all three return, print: ALL DONE."
-copilot -p $prompt --allow-all-tools --output-format json --session-id $sid > stdout.jsonl
-
-# 3. analyze the on-disk session log (richest plain-CLI source)
-$events = Join-Path $env:USERPROFILE ".copilot/session-state/$sid/events.jsonl"
-node -e "import('copilot-cost').then(async m => console.log(m.formatReport(await m.analyzeJsonlFile(process.argv[1]))))" $events
-```
-
-Key flags: `-p` (non-interactive), `--allow-all-tools` (required for `-p`, else
-it blocks on permission prompts), `--output-format json` (JSONL stream),
-`--session-id` (so you know which folder to read).
-
----
-
----
-
-## Design notes
-
-- **No price table.** Cost is read from the CLI's own `totalNanoAiu`, so it
-  stays correct even as model prices change — there is nothing to maintain, and
-  no fabricated rates.
-- **Per-call main-vs-sub split.** Sub-agents are separated by `parentToolCallId`
-  on each `assistant.usage` event, so **inline** `task`-tool sub-agents (which
-  share the parent session) are attributed correctly — not folded into the main
-  agent.
-- **Premium requests from the summary.** `data.cost` on a usage event is a
-  per-request multiplier, not an additive counter, so premium requests are read
-  from `session.shutdown.totalPremiumRequests`.
-- **Built-in sanity-check.** The summed per-call cost is reconciled against the
-  session's `totalNanoAiu`; drift beyond `reconcileTolerance` adds a warning
-  (it never changes the reported numbers).
-
----
-
-## License
+## How it works (one paragraph)
 
-MIT
+The CLI records each call's cost in **nano-AIU** inside the event log. The
+module sums the `totalNanoAiu` the CLI already reports (so it's exact), divides
+by 1e9 to get AIU, and tallies tokens by type. It splits main vs. sub-agents
+per call via `parentToolCallId` when the detailed SDK stream is present; with a
+plain CLI log it falls back to the end-of-session summary (`session.shutdown`)
+plus `subagent.completed` events. As a safety net it cross-checks the summed
+cost against the session total and warns on any mismatch.