diff --git a/src/parser.ts b/src/parser.ts
index 21eed277..7018e4fa 100644
--- a/src/parser.ts
+++ b/src/parser.ts
@@ -21,7 +21,7 @@ import {
   reconcileFile,
   saveCache,
 } from './session-cache.js'
-import type { ParsedProviderCall } from './providers/types.js'
+import type { ParsedProviderCall, SessionSource } from './providers/types.js'
 import type {
   AssistantMessageContent,
   ClassifiedTurn,
@@ -1324,6 +1324,10 @@ function buildSessionSummary(
       totalCacheWrite += call.usage.cacheCreationInputTokens
       apiCalls++
 
+      if (process.env['DEBUG_OTEL'] && (call.usage.cacheReadInputTokens > 0 || call.usage.cacheCreationInputTokens > 0)) {
+        console.warn(`[Aggregate] Model=${call.model}, cache_read=${call.usage.cacheReadInputTokens}, cache_write=${call.usage.cacheCreationInputTokens}`)
+      }
+
       const modelKey = getShortModelName(call.model)
       if (!modelBreakdown[modelKey]) {
         modelBreakdown[modelKey] = {
@@ -1946,7 +1950,7 @@ function warnProviderParseFailure(providerName: string, sourcePath: string, err:
 
 async function parseProviderSources(
   providerName: string,
-  sources: Array<{ path: string; project: string }>,
+  sources: SessionSource[],
   seenKeys: Set<string>,
   diskCache: SessionCache,
   dateRange?: DateRange,
@@ -1957,8 +1961,8 @@ async function parseProviderSources(
   const section = getOrCreateProviderSection(diskCache, providerName)
   const allDiscoveredFiles = new Set<string>()
 
-  type SourceInfo = { source: { path: string; project: string }; fp: NonNullable<Awaited<ReturnType<typeof fingerprintFile>>> }
-  const unchangedSources: Array<{ source: { path: string; project: string }; cached: CachedFile }> = []
+  type SourceInfo = { source: SessionSource; fp: NonNullable<Awaited<ReturnType<typeof fingerprintFile>>> }
+  const unchangedSources: Array<{ source: SessionSource; cached: CachedFile }> = []
   const changedSources: SourceInfo[] = []
 
   for (const source of sources) {
@@ -2001,29 +2005,58 @@ async function parseProviderSources(
 
   // Parse changed files, update cache
   let didParse = false
+  // Track which paths have already been cleared this pass so that subsequent
+  // sources sharing the same path (e.g. multiple OTel conversations from one
+  // agent-traces.db) can accumulate via the merge logic below rather than
+  // being wiped on every iteration.
+  const clearedPaths = new Set<string>()
   try {
     for (const { source, fp } of changedSources) {
       if (dateRange) {
         if (fp.mtimeMs < dateRange.start.getTime()) continue
       }
 
-      // Clear stale entry before parse — if parse fails, file is excluded
-      delete section.files[source.path]
+      // Clear stale entry before parse — but only once per path so that
+      // multiple sources mapping to the same file path can merge their turns.
+      if (!clearedPaths.has(source.path)) {
+        delete section.files[source.path]
+        clearedPaths.add(source.path)
+      }
 
-      const parser = provider.createSessionParser(
-        { path: source.path, project: source.project, provider: providerName },
-        parserDedup,
-        dateRange,
-      )
+      const parser = provider.createSessionParser(source, parserDedup, dateRange)
 
       try {
         const providerCalls: ParsedProviderCall[] = []
         for await (const call of parser.parse()) {
           providerCalls.push(call)
         }
+        if (process.env['DEBUG_OTEL']) {
+          console.warn(`[Parse] File ${source.path.substring(0, 40)}: Collected ${providerCalls.length} provider calls, ${providerCalls.filter(c => c.cacheReadInputTokens > 0 || c.cacheCreationInputTokens > 0).length} with cache tokens`)
+        }
+        if (process.env['DEBUG_OTEL'] && providerCalls.some(c => c.cacheReadInputTokens > 0 || c.cacheCreationInputTokens > 0)) {
+          console.warn(`[Parse] After conversion: turns to be created...`)
+        }
         const canonicalCalls = await Promise.all(providerCalls.map(canonicalizeProviderCallProject))
         const turns = providerCallsToCachedTurns(canonicalCalls)
-        section.files[source.path] = { fingerprint: fp, mcpInventory: [], turns }
+        if (process.env['DEBUG_OTEL'] && providerCalls.some(c => c.cacheReadInputTokens > 0 || c.cacheCreationInputTokens > 0)) {
+          console.warn(`[Parse] After conversion: ${turns.length} turns, calls with cache: ${turns.flatMap(t => t.calls).filter(c => c.usage.cacheReadInputTokens > 0 || c.usage.cacheCreationInputTokens > 0).length}`)
+        }
+        
+        // For files with multiple sources (e.g., OTel database with many conversations),
+        // merge turns instead of overwriting. This allows us to parse the same file
+        // multiple times for different conversations and aggregate all results.
+        const existingCacheEntry = section.files[source.path]
+        if (process.env['DEBUG_OTEL']) {
+          console.warn(`[Parse] Cache entry exists for path: ${!!existingCacheEntry}, turns to merge: ${turns.length}`)
+        }
+        if (existingCacheEntry) {
+          existingCacheEntry.turns = [...existingCacheEntry.turns, ...turns]
+          if (process.env['DEBUG_OTEL']) {
+            console.warn(`[Parse] Merged with existing cache entry for ${source.path.substring(0, 40)}, now has ${existingCacheEntry.turns.length} turns total`)
+          }
+        } else {
+          section.files[source.path] = { fingerprint: fp, mcpInventory: [], turns }
+        }
         didParse = true
         ;(diskCache as { _dirty?: boolean })._dirty = true
       } catch (err) {
@@ -2064,13 +2097,31 @@ async function parseProviderSources(
   // Uses seenKeys (shared across providers) for cross-provider dedup.
   const sessionMap = new Map<string, { project: string; projectPath?: string; turns: ClassifiedTurn[] }>()
 
+  if (process.env['DEBUG_OTEL']) {
+    const totalCacheCalls = sources.flatMap(s => section.files[s.path]?.turns ?? []).flatMap(t => t.calls).filter(c => c.usage.cacheReadInputTokens > 0 || c.usage.cacheCreationInputTokens > 0)
+    console.warn(`[SessionMap] Starting with ${sources.length} sources, ${totalCacheCalls.length} calls with cache tokens`)
+    
+    const filesInfo = Object.entries(section.files).map(([path, file]) => ({
+      path: path.substring(0, 50),
+      turns: file.turns.length,
+      totalCalls: file.turns.flatMap(t => t.calls).length,
+      cacheTokenCalls: file.turns.flatMap(t => t.calls).filter(c => c.usage.cacheReadInputTokens > 0 || c.usage.cacheCreationInputTokens > 0).length
+    }))
+    console.warn(`[SessionMap] Cache files: ${JSON.stringify(filesInfo)}`)
+  }
+
   for (const source of sources) {
     const cachedFile = section.files[source.path]
     if (!cachedFile) continue
 
     for (const turn of cachedFile.turns) {
       const hasDup = turn.calls.some(c => seenKeys.has(c.deduplicationKey))
-      if (hasDup) continue
+      if (hasDup) {
+        if (process.env['DEBUG_OTEL'] && turn.calls.some(c => c.usage.cacheReadInputTokens > 0 || c.usage.cacheCreationInputTokens > 0)) {
+          console.warn(`[SessionMap] Skipping turn with cache tokens due to dedup: ${turn.calls.map(c => c.deduplicationKey).join(',')}`)
+        }
+        continue
+      }
 
       for (const c of turn.calls) seenKeys.add(c.deduplicationKey)
 
@@ -2085,6 +2136,10 @@ async function parseProviderSources(
       const project = turn.calls[0]?.project ?? source.project
       const key = `${providerName}:${turn.sessionId}:${project}`
 
+      if (process.env['DEBUG_OTEL'] && turn.calls.some(c => c.usage.cacheReadInputTokens > 0 || c.usage.cacheCreationInputTokens > 0)) {
+        console.warn(`[SessionMap] Adding turn with cache tokens to sessionMap key=${key}`)
+      }
+
       const existing = sessionMap.get(key)
       if (existing) {
         existing.turns.push(classified)
@@ -2246,10 +2301,10 @@ export async function parseAllSessions(dateRange?: DateRange, providerFilter?: s
   const claudeDirs = claudeSources.map(s => ({ path: s.path, name: s.project }))
   const claudeProjects = await scanProjectDirs(claudeDirs, seenMsgIds, diskCache, dateRange)
 
-  const providerGroups = new Map<string, Array<{ path: string; project: string }>>()
+  const providerGroups = new Map<string, SessionSource[]>()
   for (const source of nonClaudeSources) {
     const existing = providerGroups.get(source.provider) ?? []
-    existing.push({ path: source.path, project: source.project })
+    existing.push(source)
     providerGroups.set(source.provider, existing)
   }
 
diff --git a/src/providers/copilot.ts b/src/providers/copilot.ts
index 329158f3..bdf121dc 100644
--- a/src/providers/copilot.ts
+++ b/src/providers/copilot.ts
@@ -1,758 +1,1031 @@
+// =============================================================================
+// copilot.ts — Modified CodeBurn Copilot provider
+// =============================================================================
+//
+// WHAT CHANGED:
+//   The original provider only reads Copilot's JSONL session-state files from
+//   ~/.copilot/session-state/, which only log output tokens. Input tokens,
+//   cache-read tokens, and cache-creation tokens are never written there, so
+//   CodeBurn underreports Copilot costs by 60-80%.
+//
+//   This modified version adds a SECOND data source: VS Code Copilot Chat's
+//   OTel SQLite store (agent-traces.db). When present, it contains full
+//   per-LLM-call token breakdowns (input, output, cache_read, cache_creation)
+//   from the OpenTelemetry GenAI semantic conventions. We prefer OTel data
+//   when available and fall back to the original JSONL parsing.
+//
+// HOW TO ENABLE THE OTEL SQLITE STORE:
+//   TWO settings must both be enabled in VS Code settings.json:
+//
+//     {
+//       "github.copilot.chat.otel.enabled": true,
+//       "github.copilot.chat.otel.dbSpanExporter.enabled": true
+//     }
+//
+//   The first enables the OTel pipeline; the second (defaults to false) enables
+//   the SQLite span exporter that actually writes agent-traces.db.
+//   After changing these settings, restart VS Code — the extension watches for
+//   these changes and requires a reload to take effect.
+//
+//   Or set the environment variable before launching VS Code:
+//
+//     export COPILOT_OTEL_ENABLED=true
+//
+//   The DB file is created in VS Code's global storage directory:
+//     ~/Library/Application Support/Code/User/globalStorage/github.copilot-chat/agent-traces.db
+//
+// ENVIRONMENT VARIABLES:
+//   CODEBURN_COPILOT_OTEL_DB    — Override the agent-traces.db path
+//   CODEBURN_COPILOT_DISABLE_OTEL=1 — Skip OTel entirely, use only JSONL
+//
+// ARCHITECTURE:
+//   discoverSessions() returns BOTH OTel sessions (one per conversation_id)
+//   and JSONL sessions. The OTel sessions are deduped against JSONL by
+//   conversation ID so we don't double-count. OTel sessions carry the full
+//   token breakdown; JSONL sessions only carry output tokens (the original
+//   behaviour, as a fallback).
+//
+// LIMITATIONS:
+//   - The OTel DB only contains Copilot Chat and Agent mode spans. Inline
+//     completions (ghost text) and Agent Host spans are NOT yet written to
+//     this DB (see https://github.com/microsoft/vscode/issues/315901).
+//   - The DB schema is inferred from the official OTel GenAI semantic
+//     conventions and the Copilot Budget extension's approach. If VS Code
+//     changes the schema, this parser will need updating.
+// =============================================================================
+
+import { readdir, stat } from 'fs/promises'
+import { homedir, platform } from 'os'
+import { join, basename, dirname, posix, win32 } from 'path'
 import { existsSync } from 'fs'
-import { readdir, readFile, stat } from 'fs/promises'
-import { basename, dirname, join, posix, win32 } from 'path'
-import { homedir } from 'os'
-
 import { readSessionFile } from '../fs-utils.js'
 import { calculateCost } from '../models.js'
-import type { Provider, SessionSource, SessionParser, ParsedProviderCall } from './types.js'
-
+import type {
+  Provider,
+  SessionSource,
+  SessionParser,
+  ParsedProviderCall,
+} from './types.js'
+
+// ---------------------------------------------------------------------------
+// Model display names (unchanged from original)
+// ---------------------------------------------------------------------------
 const modelDisplayNames: Record<string, string> = {
   'gpt-4.1-nano': 'GPT-4.1 Nano',
   'gpt-4.1-mini': 'GPT-4.1 Mini',
   'gpt-4.1': 'GPT-4.1',
   'gpt-4o-mini': 'GPT-4o Mini',
   'gpt-4o': 'GPT-4o',
-  'gpt-5.4': 'GPT-5.4',
-  'gpt-5.3-codex': 'GPT-5.3 Codex',
   'gpt-5-mini': 'GPT-5 Mini',
   'gpt-5': 'GPT-5',
-  'claude-opus-4-7': 'Opus 4.7',
-  'claude-opus-4-6': 'Opus 4.6',
-  'claude-opus-4-5': 'Opus 4.5',
-  'claude-opus-4-1': 'Opus 4.1',
-  'claude-opus-4': 'Opus 4',
-  'claude-sonnet-4-6': 'Sonnet 4.6',
   'claude-sonnet-4-5': 'Sonnet 4.5',
   'claude-sonnet-4': 'Sonnet 4',
-  'claude-3-7-sonnet': 'Sonnet 3.7',
-  'claude-3-5-sonnet': 'Sonnet 3.5',
-  'o4-mini': 'o4-mini',
-  'o3': 'o3',
+  'copilot-openai-auto': 'Copilot (OpenAI auto)',
+  'copilot-anthropic-auto': 'Copilot (Anthropic auto)',
 }
 
+// ---------------------------------------------------------------------------
+// Tool name normalisation (unchanged from original, plus OTel tool names)
+// ---------------------------------------------------------------------------
 const toolNameMap: Record<string, string> = {
+  // JSONL session-state tool names
   bash: 'Bash',
-  run_in_terminal: 'Bash',
   read_file: 'Read',
   write_file: 'Edit',
   edit_file: 'Edit',
-  replace_string_in_file: 'Edit',
-  create_file: 'Write',
   delete_file: 'Delete',
-  search_files: 'Grep',
-  file_search: 'Grep',
-  find_files: 'Glob',
-  list_directory: 'LS',
-  list_dir: 'LS',
-  web_search: 'WebSearch',
-  fetch_webpage: 'WebFetch',
   github_repo: 'GitHub',
-  memory: 'Memory',
-  kill_terminal: 'Bash',
+  web_search: 'WebSearch',
+  run_in_terminal: 'Shell',
+  // OTel execute_tool span names from Copilot Chat:
+  readFile: 'Read',
+  writeFile: 'Edit',
+  editFile: 'Edit',
+  runCommand: 'Shell',
+  runInTerminal: 'Shell',
+  findFiles: 'Search',
+  grepSearch: 'Search',
+  codebaseSearch: 'Search',
+  getErrors: 'Diagnostics',
+  listCodeUsages: 'Search',
+  createFile: 'Edit',
+  deleteFile: 'Delete',
+  renameOrMoveFile: 'Edit',
+  fetchWebpage: 'Web',
 }
 
-function normalizeMcpSegment(segment: string): string {
-  return segment
-    .replace(/[^a-zA-Z0-9_]+/g, '_')
-    .replace(/_+/g, '_')
-    .replace(/^_+|_+$/g, '')
+/**
+ * Normalise a raw tool name to its display form.
+ * - Known tools are mapped via toolNameMap.
+ * - MCP tools (containing both '-' and '_') are formatted as
+ *   mcp__server_name__tool_name.
+ * - Everything else is returned unchanged.
+ */
+function normalizeTool(rawTool: string): string {
+  const mapped = toolNameMap[rawTool]
+  if (mapped) return mapped
+  // MCP tool names follow the pattern: server-name-tool_operand
+  // e.g. github-mcp-server-list_issues → mcp__github_mcp_server__list_issues
+  const dashIdx = rawTool.lastIndexOf('-')
+  if (dashIdx > 0 && rawTool.includes('_')) {
+    const server = rawTool.slice(0, dashIdx).replace(/-/g, '_')
+    const tool = rawTool.slice(dashIdx + 1)
+    return `mcp__${server}__${tool}`
+  }
+  return rawTool
 }
 
-function normalizeCopilotMcpTool(rawTool: string): string | null {
-  const serverSeparator = rawTool.lastIndexOf('-')
-  if (serverSeparator <= 0 || serverSeparator >= rawTool.length - 1) return null
-
-  const server = normalizeMcpSegment(rawTool.slice(0, serverSeparator))
-  const tool = normalizeMcpSegment(rawTool.slice(serverSeparator + 1))
-  if (!server || !tool) return null
+const modelDisplayEntries = Object.entries(modelDisplayNames).sort(
+  (a, b) => b[0].length - a[0].length
+)
 
-  return `mcp__${server}__${tool}`
+// ---------------------------------------------------------------------------
+// Types for JSONL session state events (unchanged from original)
+// ---------------------------------------------------------------------------
+type ToolRequest = {
+  toolName?: string  // older format
+  name?: string      // newer format (copilot-agent)
 }
 
-function normalizeToolName(rawTool?: unknown): string {
-  if (typeof rawTool !== 'string') return ''
-  if (!rawTool) return ''
-  if (rawTool.startsWith('mcp__')) return rawTool
-
-  const builtIn = toolNameMap[rawTool]
-  if (builtIn) return builtIn
-
-  // Copilot records MCP tools as `<server>-<tool>` instead of Claude's
-  // `mcp__server__tool`; built-ins are handled above before this heuristic.
-  return normalizeCopilotMcpTool(rawTool) ?? rawTool
+type SessionStartData = {
+  selectedModel?: string
 }
 
-const CHARS_PER_TOKEN = 4
-const COPILOT_OPENAI_AUTO = 'copilot-openai-auto'
-const COPILOT_ANTHROPIC_AUTO = 'copilot-anthropic-auto'
-
-const modelDisplayEntries = Object.entries(modelDisplayNames).sort((a, b) => b[0].length - a[0].length)
-
-// --- Legacy format (session-state/events.jsonl with outputTokens) ---
-
-type LegacyToolRequest = {
-  name?: string
-  toolCallId?: string
-  type?: string
+type ModelChangeData = {
+  newModel: string
+  previousModel?: string
 }
 
-// Per-event-type shapes. The previous union included a permissive catch-all
-// branch (`{ type: string; data: Record<string, unknown> }`); a literal type
-// like `'user.message'` is assignable to `string`, so TS picked the catch-all
-// over the specific branches when narrowing on `type`, which propagated
-// `unknown`/`{}` into `event.data.content` etc. We now keep only the three
-// shapes we actually read from. Unknown event types fall through the if/else
-// chain without further narrowing — they are not in the union, but JSON.parse
-// returns `any` so we re-type as LegacyCopilotEvent and let the runtime type
-// guards (`event.type === 'X'`) ignore anything else.
-type LegacyCopilotEvent =
-  | { type: 'session.model_change'; timestamp?: string; data: { newModel: string; model?: string } }
-  | { type: 'user.message'; timestamp?: string; data: { content: string; interactionId?: string; model?: string } }
-  | { type: 'assistant.message'; timestamp?: string; data: { messageId: string; outputTokens: number; interactionId?: string; toolRequests?: LegacyToolRequest[]; model?: string } }
-
-function parseLegacyEvents(content: string, sessionId: string, seenKeys: Set<string>): ParsedProviderCall[] {
-  const results: ParsedProviderCall[] = []
-  const lines = content.split('\n').filter(l => l.trim())
-  let currentModel = ''
-  let pendingUserMessage = ''
-
-  for (const line of lines) {
-    let event: LegacyCopilotEvent
-    try {
-      event = JSON.parse(line)
-    } catch {
-      continue
-    }
-
-    // Some newer events include the model ID explicitly.
-    const data = event.data as { newModel?: string; model?: string }
-    if (typeof data.model === 'string' && data.model) {
-      currentModel = data.model
-    }
+type UserMessageData = {
+  content: string
+  interactionId?: string
+}
 
-    if (event.type === 'session.model_change') {
-      currentModel = data.newModel ?? currentModel
-      continue
-    }
+type AssistantMessageData = {
+  messageId: string
+  model?: string       // present in newer copilot-agent format
+  outputTokens: number
+  interactionId?: string
+  toolRequests?: ToolRequest[]
+}
 
-    if (event.type === 'user.message') {
-      const userEvent = event as Extract<LegacyCopilotEvent, { type: 'user.message' }>
-      pendingUserMessage = userEvent.data.content ?? ''
-      continue
-    }
+type CopilotEvent =
+  | { type: 'session.start'; data: SessionStartData; timestamp?: string }
+  | { type: 'session.model_change'; data: ModelChangeData; timestamp?: string }
+  | { type: 'user.message'; data: UserMessageData; timestamp?: string }
+  | { type: 'assistant.message'; data: AssistantMessageData; timestamp?: string }
+
+// ---------------------------------------------------------------------------
+// Types for OTel span rows from agent-traces.db
+// ---------------------------------------------------------------------------
+
+// The OTel SQLite store schema uses a spans table where attributes are stored
+// either as a JSON blob or as individual columns. We handle both patterns.
+// The Copilot Budget extension reads from this same DB and uses per-span
+// token counts, confirming this schema is stable enough to depend on.
+
+interface OTelSpanRow {
+  trace_id: string
+  span_id: string
+  parent_span_id: string | null
+  name: string              // e.g. "chat gpt-4o" or "invoke_agent copilot"
+  start_time: number        // nanosecond epoch or millisecond epoch
+  end_time: number
+  attributes: string | null // JSON blob of all OTel attributes
+  // Some DB versions may use separate columns instead of a JSON blob.
+  // We try JSON parsing first, then fall back to individual column queries.
+  [key: string]: unknown
+}
 
-    if (event.type === 'assistant.message') {
-      const { messageId, outputTokens, toolRequests: rawToolRequests } = event.data
-      if (outputTokens === 0) continue
-      if (!currentModel) continue
+// Parsed attribute bag from a span
+interface SpanAttributes {
+  'gen_ai.operation.name'?: string
+  'gen_ai.response.model'?: string
+  'gen_ai.request.model'?: string
+  'gen_ai.usage.input_tokens'?: number
+  'gen_ai.usage.output_tokens'?: number
+  'gen_ai.usage.cache_read.input_tokens'?: number
+  'gen_ai.usage.cache_creation.input_tokens'?: number
+  'gen_ai.conversation.id'?: string
+  'gen_ai.agent.name'?: string
+  'gen_ai.tool.name'?: string
+  'github.copilot.chat.turn.id'?: string
+  [key: string]: unknown
+}
 
-      const dedupKey = `copilot:${sessionId}:${messageId}`
-      if (seenKeys.has(dedupKey)) continue
-      seenKeys.add(dedupKey)
+// ---------------------------------------------------------------------------
+// Paths
+// ---------------------------------------------------------------------------
 
-      // Defensive: legacy / corrupt sessions have shipped toolRequests as a
-      // string, null, or missing. Without this guard, .map throws and aborts
-      // the whole file's parse loop, silently dropping every legitimate call
-      // that follows the bad event.
-      const toolRequests = Array.isArray(rawToolRequests) ? rawToolRequests : []
-      const tools = toolRequests
-        .map(t => normalizeToolName(t?.name))
-        .filter(Boolean)
+function getCopilotSessionStateDir(override?: string): string {
+  return override ?? process.env['CODEBURN_COPILOT_SESSION_STATE_DIR'] ?? join(homedir(), '.copilot', 'session-state')
+}
 
-      const costUSD = calculateCost(currentModel, 0, outputTokens, 0, 0, 0)
+/**
+ * Locate the agent-traces.db file.
+ *
+ * Priority:
+ *   1. CODEBURN_COPILOT_OTEL_DB env var
+ *   2. Platform-specific default VS Code global storage path
+ *   3. VSCodium variant paths
+ */
+function getAgentTracesDbPath(): string | null {
+  // Allow explicit override
+  const envOverride = process.env['CODEBURN_COPILOT_OTEL_DB']
+  if (envOverride) {
+    return existsSync(envOverride) ? envOverride : null
+  }
 
-      results.push({
-        provider: 'copilot',
-        model: currentModel,
-        inputTokens: 0,
-        outputTokens,
-        cacheCreationInputTokens: 0,
-        cacheReadInputTokens: 0,
-        cachedInputTokens: 0,
-        reasoningTokens: 0,
-        webSearchRequests: 0,
-        costUSD,
-        tools,
-        bashCommands: [],
-        timestamp: event.timestamp ?? '',
-        speed: 'standard',
-        deduplicationKey: dedupKey,
-        userMessage: pendingUserMessage,
-        sessionId,
-      })
+  const home = homedir()
+  const candidates: string[] = []
 
-      pendingUserMessage = ''
-    }
+  const p = platform()
+  if (p === 'darwin') {
+    // macOS: VS Code, VS Code Insiders, VSCodium
+    candidates.push(
+      join(home, 'Library', 'Application Support', 'Code', 'User', 'globalStorage', 'github.copilot-chat', 'agent-traces.db'),
+      join(home, 'Library', 'Application Support', 'Code - Insiders', 'User', 'globalStorage', 'github.copilot-chat', 'agent-traces.db'),
+      join(home, 'Library', 'Application Support', 'VSCodium', 'User', 'globalStorage', 'github.copilot-chat', 'agent-traces.db'),
+    )
+  } else if (p === 'linux') {
+    // Linux: VS Code, VS Code Insiders, VSCodium
+    candidates.push(
+      join(home, '.config', 'Code', 'User', 'globalStorage', 'github.copilot-chat', 'agent-traces.db'),
+      join(home, '.config', 'Code - Insiders', 'User', 'globalStorage', 'github.copilot-chat', 'agent-traces.db'),
+      join(home, '.config', 'VSCodium', 'User', 'globalStorage', 'github.copilot-chat', 'agent-traces.db'),
+    )
+  } else if (p === 'win32') {
+    // Windows
+    const appdata = process.env['APPDATA'] ?? join(home, 'AppData', 'Roaming')
+    candidates.push(
+      join(appdata, 'Code', 'User', 'globalStorage', 'github.copilot-chat', 'agent-traces.db'),
+      join(appdata, 'Code - Insiders', 'User', 'globalStorage', 'github.copilot-chat', 'agent-traces.db'),
+      join(appdata, 'VSCodium', 'User', 'globalStorage', 'github.copilot-chat', 'agent-traces.db'),
+    )
   }
 
-  return results
+  for (const candidate of candidates) {
+    if (existsSync(candidate)) return candidate
+  }
+  return null
 }
 
-// --- VS Code transcript format (workspaceStorage transcripts) ---
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
 
-type TranscriptToolRequest = {
-  toolCallId?: string
-  name?: string
-  arguments?: string
-  type?: string
+function parseCwd(yaml: string): string | null {
+  const match = yaml.match(/^cwd:\s*(.+)$/m)
+  if (!match?.[1]) return null
+  let raw = match[1].trim()
+  // Strip inline YAML comments (# preceded by optional whitespace)
+  raw = raw.replace(/\s*#.*$/, '')
+  // Strip surrounding single/double quotes
+  raw = raw.replace(/^['"]|['"]$/g, '').trim()
+  return raw || null
 }
 
-type TranscriptEvent =
-  | { type: 'session.start'; timestamp?: string; data: { sessionId: string; producer?: string } }
-  | { type: 'user.message'; timestamp?: string; data: { content: string; attachments?: unknown[] } }
-  | { type: 'assistant.message'; timestamp?: string; data: { messageId: string; content?: string; reasoningText?: string; toolRequests?: TranscriptToolRequest[]; outputTokens?: number } }
-  | { type: string; timestamp?: string; data: Record<string, unknown> }
-
-const transcriptToolCallModelHints: Array<{ prefix: string; model: string }> = [
-  // Anthropic tool-call ID variants observed in Copilot transcript logs.
-  { prefix: 'toolu_bdrk_', model: COPILOT_ANTHROPIC_AUTO },
-  { prefix: 'toolu_vrtx_', model: COPILOT_ANTHROPIC_AUTO },
-  { prefix: 'tooluse_', model: COPILOT_ANTHROPIC_AUTO },
-  { prefix: 'toolu_', model: COPILOT_ANTHROPIC_AUTO },
-  // OpenAI tool-call IDs.
-  { prefix: 'call_', model: COPILOT_OPENAI_AUTO },
-]
-
-function inferModelFromToolCallIds(events: TranscriptEvent[]): string {
-  const modelCounts = new Map<string, number>()
-
-  for (const e of events) {
-    // Some newer events (like tool.execution_complete) explicitly include the model ID.
-    const data = e.data as { model?: string }
-    if (typeof data.model === 'string' && data.model) {
-      modelCounts.set(data.model, (modelCounts.get(data.model) ?? 0) + 100)
-    }
-
-    if (e.type !== 'assistant.message') continue
-    const msg = e as { data: { toolRequests?: TranscriptToolRequest[] } }
-    for (const t of msg.data.toolRequests ?? []) {
-      const toolCallId = t.toolCallId ?? ''
-      for (const hint of transcriptToolCallModelHints) {
-        if (!toolCallId.startsWith(hint.prefix)) continue
-        modelCounts.set(hint.model, (modelCounts.get(hint.model) ?? 0) + 1)
-        break
-      }
-    }
-  }
-
-  if (modelCounts.size > 0) {
-    return [...modelCounts.entries()].sort((a, b) => b[1] - a[1])[0]![0]
+/**
+ * Parse the JSON attributes blob from an OTel span row.
+ * Returns an empty object if parsing fails.
+ */
+function parseSpanAttributes(raw: string | null): SpanAttributes {
+  if (!raw) return {}
+  try {
+    return JSON.parse(raw) as SpanAttributes
+  } catch {
+    return {}
   }
-
-  return 'copilot-auto'
 }
 
-/** Model inference for JB events — checks data.model (100x weight) and tool call
- *  ID prefixes on tool.execution_start/complete events. */
-function inferModelFromEvents(events: JBEvent[]): string {
-  const modelCounts = new Map<string, number>()
-
-  for (const e of events) {
-    const data = e.data as { model?: string; toolCallId?: string }
-    if (typeof data.model === 'string' && data.model) {
-      modelCounts.set(data.model, (modelCounts.get(data.model) ?? 0) + 100)
-    }
-
-    if (e.type === 'tool.execution_start' || e.type === 'tool.execution_complete') {
-      const toolCallId = data.toolCallId ?? ''
-      for (const hint of transcriptToolCallModelHints) {
-        if (!toolCallId.startsWith(hint.prefix)) continue
-        modelCounts.set(hint.model, (modelCounts.get(hint.model) ?? 0) + 1)
-        break
+/**
+ * Load span attributes from the span_attributes table (key-value pairs).
+ * This handles the modern VS Code Copilot Chat schema where attributes
+ * are stored as separate key-value rows rather than a JSON blob.
+ */
+function loadSpanAttributesFromTable(
+  db: ReturnType<typeof import('../sqlite.js')['openDatabase']>,
+  spanId: string
+): SpanAttributes {
+  try {
+    const rows = db.query<{ key: string; value: string | null }>(
+      `SELECT key, value FROM span_attributes WHERE span_id = ?`,
+      [spanId]
+    )
+    const attrs: SpanAttributes = {}
+    for (const row of rows) {
+      if (row.key && row.value) {
+        try {
+          // Try to parse numeric values
+          const numValue = Number(row.value)
+          attrs[row.key as keyof SpanAttributes] = Number.isNaN(numValue) 
+            ? row.value
+            : numValue
+        } catch {
+          attrs[row.key as keyof SpanAttributes] = row.value
+        }
       }
     }
+    return attrs
+  } catch (e) {
+    if (process.env['DEBUG_OTEL']) console.warn(`loadSpanAttributesFromTable error for span ${spanId}:`, e)
+    return {}
   }
+}
 
-  if (modelCounts.size > 0) {
-    return [...modelCounts.entries()].sort((a, b) => b[1] - a[1])[0]![0]
-  }
+/**
+ * Convert nanosecond or millisecond epoch to ISO timestamp.
+ * The OTel spec uses nanoseconds, but some implementations use milliseconds.
+ */
+function epochToISO(epoch: number): string {
+  // If the value looks like nanoseconds (> 1e15), convert to ms
+  const ms = epoch > 1e15 ? Math.floor(epoch / 1e6) : epoch > 1e12 ? epoch : epoch * 1000
+  return new Date(ms).toISOString()
+}
 
-  return 'copilot-auto'
+// ---------------------------------------------------------------------------
+// Helpers for JSONL / transcript parsing
+// ---------------------------------------------------------------------------
+
+/**
+ * Safely coerce a raw toolRequests value to an array of ToolRequest.
+ * Non-array values (string, null, undefined) are treated as empty arrays
+ * so that a corrupt event.data doesn't abort the whole file parse loop.
+ */
+function coerceToolRequests(raw: unknown): ToolRequest[] {
+  return Array.isArray(raw) ? (raw as ToolRequest[]) : []
 }
 
-function parseTranscriptEvents(content: string, sessionId: string, seenKeys: Set<string>): ParsedProviderCall[] {
-  const results: ParsedProviderCall[] = []
-  const lines = content.split('\n').filter(l => l.trim())
-  const events: TranscriptEvent[] = []
+/**
+ * Infer the model bucket for a VS Code transcript file by counting the
+ * toolCallId prefixes across all assistant messages:
+ *   call_*           → OpenAI
+ *   tooluse_* / toolu_*  → Anthropic
+ * The dominant prefix determines the model for the whole session.
+ * Returns '' if no toolCallIds are present.
+ */
+function inferTranscriptModel(lines: string[]): string {
+  let openaiCount = 0
+  let anthropicCount = 0
 
   for (const line of lines) {
     try {
-      events.push(JSON.parse(line))
+      const event = JSON.parse(line) as CopilotEvent
+      if (event.type !== 'assistant.message') continue
+      const data = event.data as AssistantMessageData & { toolRequests?: Array<{ toolCallId?: string }> }
+      const reqs = coerceToolRequests(data.toolRequests)
+      for (const req of reqs) {
+        const id = (req as { toolCallId?: unknown }).toolCallId
+        if (typeof id !== 'string') continue
+        if (id.startsWith('call_')) openaiCount++
+        else if (/^tooluse_|^toolu_/.test(id)) anthropicCount++
+      }
     } catch {
       continue
     }
   }
 
-  const model = inferModelFromToolCallIds(events)
-  let pendingUserMessage = ''
-
-  for (const event of events) {
-    if (event.type === 'user.message') {
-      const data = event.data as { content?: string }
-      pendingUserMessage = (data.content ?? '').slice(0, 500)
-      continue
-    }
-
-    if (event.type === 'assistant.message') {
-      const data = event.data as { messageId: string; content?: string; reasoningText?: string; toolRequests?: TranscriptToolRequest[]; outputTokens?: number }
-      const contentText = data.content ?? ''
-      const reasoningText = data.reasoningText ?? ''
+  if (openaiCount === 0 && anthropicCount === 0) return ''
+  return openaiCount >= anthropicCount ? 'copilot-openai-auto' : 'copilot-anthropic-auto'
+}
 
-      if (contentText.length === 0 && reasoningText.length === 0 && (data.toolRequests ?? []).length === 0) continue
+// ---------------------------------------------------------------------------
+// JSONL parser (handles both regular session-state events and VS Code
+// transcript format via session.start { producer: 'copilot-agent' })
+// ---------------------------------------------------------------------------
 
-      const dedupKey = `copilot:${sessionId}:${data.messageId}`
-      if (seenKeys.has(dedupKey)) continue
-      seenKeys.add(dedupKey)
+function createJsonlParser(
+  source: SessionSource,
+  seenKeys: Set<string>
+): SessionParser {
+  return {
+    async *parse(): AsyncGenerator<ParsedProviderCall> {
+      const content = await readSessionFile(source.path)
+      if (!content) return
+      const sessionId = basename(dirname(source.path))
+      const lines = content.split('\n').filter((l) => l.trim())
+
+      // Detect VS Code transcript format: the first session.start event has
+      // { producer: 'copilot-agent' } and no outputTokens in messages.
+      let isTranscript = false
+      let currentModel = ''
+      let pendingUserMessage = ''
+
+      // First pass: detect format and infer transcript model if needed.
+      for (const line of lines) {
+        try {
+          const ev = JSON.parse(line) as CopilotEvent
+          if (ev.type === 'session.start') {
+            const data = ev.data as SessionStartData & { producer?: string }
+            if (data.producer === 'copilot-agent') {
+              isTranscript = true
+            }
+            break
+          }
+          if (ev.type === 'session.model_change') break // regular format
+        } catch {
+          continue
+        }
+      }
 
-      let outputTokens = data.outputTokens ?? 0
-      let reasoningTokens = 0
-      if (outputTokens === 0) {
-        outputTokens = Math.ceil(contentText.length / CHARS_PER_TOKEN)
-        reasoningTokens = Math.ceil(reasoningText.length / CHARS_PER_TOKEN)
+      if (isTranscript) {
+        currentModel = inferTranscriptModel(lines)
+        if (!currentModel) return // no toolCallIds to infer model from
       }
 
-      const inputTokens = Math.ceil(pendingUserMessage.length / CHARS_PER_TOKEN)
+      for (const line of lines) {
+        let event: CopilotEvent
+        try {
+          event = JSON.parse(line) as CopilotEvent
+        } catch {
+          continue
+        }
 
-      // Same defensive guard as the modern event branch — corrupt legacy
-      // sessions have shipped toolRequests as non-array values.
-      const legacyToolRequests = Array.isArray(data.toolRequests) ? data.toolRequests : []
-      const tools = legacyToolRequests
-        .map(t => normalizeToolName(t?.name))
-        .filter(Boolean)
+        if (event.type === 'session.start') {
+          if (!isTranscript) {
+            currentModel = (event.data as SessionStartData).selectedModel ?? currentModel
+          }
+          continue
+        }
 
-      const costUSD = calculateCost(model, inputTokens, outputTokens + reasoningTokens, 0, 0, 0)
+        if (event.type === 'session.model_change') {
+          currentModel = (event.data as ModelChangeData).newModel ?? currentModel
+          continue
+        }
 
-      results.push({
-        provider: 'copilot',
-        model,
-        inputTokens,
-        outputTokens,
-        cacheCreationInputTokens: 0,
-        cacheReadInputTokens: 0,
-        cachedInputTokens: 0,
-        reasoningTokens,
-        webSearchRequests: 0,
-        costUSD,
-        tools,
-        bashCommands: [],
-        timestamp: event.timestamp ?? '',
-        speed: 'standard',
-        deduplicationKey: dedupKey,
-        userMessage: pendingUserMessage,
-        sessionId,
-      })
+        if (event.type === 'user.message') {
+          pendingUserMessage = (event.data as UserMessageData).content ?? ''
+          continue
+        }
 
-      pendingUserMessage = ''
-    }
+        if (event.type === 'assistant.message') {
+          const msgData = event.data as AssistantMessageData
+          const { messageId, model: msgModel, outputTokens = 0 } = msgData
+          const rawRequests = (msgData as { toolRequests?: unknown }).toolRequests
+          const toolRequests = coerceToolRequests(rawRequests)
+
+          // model may be carried per-message in newer copilot-agent format
+          if (msgModel) currentModel = msgModel
+          // Regular JSONL: skip zero-token messages; transcripts don't have tokens
+          if (!isTranscript && outputTokens === 0) continue
+          if (!currentModel) continue
+
+          const dedupKey = `copilot:${sessionId}:${messageId}`
+          if (seenKeys.has(dedupKey)) continue
+          seenKeys.add(dedupKey)
+
+          const tools = toolRequests
+            .map((t) => {
+              const raw = typeof t === 'object' && t !== null
+                ? ((t as { name?: unknown; toolName?: unknown }).name ?? (t as { name?: unknown; toolName?: unknown }).toolName)
+                : null
+              return typeof raw === 'string' ? normalizeTool(raw) : null
+            })
+            .filter((t): t is string => t !== null)
+
+          // Copilot JSONL only logs outputTokens; inputTokens are NOT available.
+          // Cost will be lower than actual API cost. This is the original
+          // behaviour — OTel data (below) replaces it when available.
+          const costUSD = calculateCost(currentModel, 0, outputTokens, 0, 0, 0)
+
+          yield {
+            provider: 'copilot',
+            sessionId,
+            model: currentModel,
+            inputTokens: 0,
+            outputTokens,
+            cacheCreationInputTokens: 0,
+            cacheReadInputTokens: 0,
+            cachedInputTokens: 0,
+            reasoningTokens: 0,
+            webSearchRequests: 0,
+            costUSD,
+            tools,
+            bashCommands: [],
+            timestamp: event.timestamp ?? '',
+            speed: 'standard' as const,
+            deduplicationKey: dedupKey,
+            userMessage: pendingUserMessage,
+          }
+          pendingUserMessage = ''
+        }
+      }
+    },
   }
-
-  return results
 }
 
-// --- Parser ---
+// ---------------------------------------------------------------------------
+// OTel SQLite parser — reads agent-traces.db for FULL token data
+// ---------------------------------------------------------------------------
 
-function isTranscriptFormat(content: string): boolean {
-  const firstLine = content.split('\n')[0] ?? ''
-  try {
-    const event = JSON.parse(firstLine)
-    return event.type === 'session.start' && event.data?.producer === 'copilot-agent'
-  } catch {
-    return false
-  }
-}
+function createOtelParser(
+  source: SessionSource,
+  seenKeys: Set<string>
+): SessionParser {
+  return {
+    async *parse(): AsyncGenerator<ParsedProviderCall> {
+      // Lazy-load the SQLite module (same pattern as Cursor/OpenCode providers)
+      const { openDatabase } = await import('../sqlite.js')
+
+      const db = openDatabase(source.path)
+      if (!db) return
+
+      try {
+        // The conversation_id is stored in source.project for OTel sources
+        // (set during discoverSessions). We use it to scope our queries.
+        const conversationId = (source as OTelSessionSource).conversationId
+
+        // ---------------------------------------------------------------
+        // Query all 'chat' spans for this conversation.
+        // 'chat' spans represent individual LLM API calls and carry the
+        // per-call token breakdown we need.
+        //
+        // DB schema (from VS Code Copilot Chat's otelSqliteStore):
+        //   Table: spans (with direct columns for denormalized data)
+        //   Table: span_attributes (key-value pairs for OTel semantics)
+        //   Join on span_id to get full attribute data
+        // ---------------------------------------------------------------
+
+        // First, get all spans with this conversation_id from span_attributes
+        const spanIdRows = db.query<{ span_id: string; trace_id: string }>(
+          `SELECT DISTINCT s.span_id, s.trace_id
+           FROM spans s
+           INNER JOIN span_attributes sa 
+             ON s.span_id = sa.span_id AND sa.key = 'gen_ai.conversation.id' AND sa.value = ?
+           ORDER BY s.start_time_ms ASC`,
+          [conversationId]
+        )
+
+        if (process.env['DEBUG_OTEL']) console.warn(`[OTel] Found ${spanIdRows.length} spans for conversation ${conversationId}`)
+
+        // Collect trace IDs and span IDs belonging to this conversation
+        const traceIds = new Set<string>()
+        for (const row of spanIdRows) {
+          traceIds.add(row.trace_id)
+        }
 
-function isJetBrainsFormat(content: string): boolean {
-  const firstLine = content.split('\n')[0] ?? ''
-  try {
-    const event = JSON.parse(firstLine)
-    // JB format starts with user.message_rendered or partition.created (JB-specific).
-    // We intentionally exclude user.message here since legacy files can also start
-    // with that event type — routing them to the JB parser would misparse them.
-    return (
-      event.type === 'user.message_rendered' ||
-      event.type === 'partition.created'
-    )
-  } catch {
-    return false
-  }
-}
+        if (traceIds.size === 0) {
+          if (process.env['DEBUG_OTEL']) console.warn(`[OTel] No trace IDs found for conversation`)
+          return
+        }
 
-// --- JetBrains (IntelliJ/DataGrip) format parser ---
+        // Now query all spans within those traces to find chat and tool spans
+        const traceIdList = [...traceIds].map((id) => `'${id.replace(/'/g, "''")}'`).join(',')
+        const traceSpans = db.query<{ span_id: string; trace_id: string; operation_name: string | null }>(
+          `SELECT span_id, trace_id, operation_name FROM spans WHERE trace_id IN (${traceIdList})`
+        )
 
-type JBEvent = {
-  type: string
-  timestamp?: string
-  id?: string
-  data: Record<string, unknown>
-}
+        if (process.env['DEBUG_OTEL']) console.warn(`[OTel] Found ${traceSpans.length} total spans across ${traceIds.size} traces`)
 
-function parseJetBrainsEvents(content: string, sessionId: string, seenKeys: Set<string>): ParsedProviderCall[] {
-  const results: ParsedProviderCall[] = []
-  const lines = content.split('\n').filter(l => l.trim())
-  const events: JBEvent[] = []
+        // Collect tool names from execute_tool spans for each trace
+        const toolsByTrace = new Map<string, string[]>()
+        const chatSpanIds: string[] = []
 
-  for (const line of lines) {
-    try {
-      events.push(JSON.parse(line))
-    } catch {
-      continue
-    }
-  }
+        for (const span of traceSpans) {
+          const opName = span.operation_name || ''
 
-  // Reuse the shared model inference logic: check explicit data.model fields
-  // (weighted 100x) and tool call ID prefix heuristics from both assistant.message
-  // toolRequests and tool.execution_start/complete events (JB-specific).
-  const model = inferModelFromEvents(events)
+          if (opName === 'chat') {
+            chatSpanIds.push(span.span_id)
+          }
 
-  // Collect tool names per turn
-  const toolsByTurn = new Map<string, string[]>()
-  let currentTurnId = ''
-  let userMsg = ''
-  let msgIndex = 0
+          if (opName === 'execute_tool') {
+            // Load tool name from attributes and normalise to display form
+            const attrs = loadSpanAttributesFromTable(db, span.span_id)
+            const rawToolName = attrs['gen_ai.tool.name'] as string | undefined
+            if (rawToolName) {
+              const existing = toolsByTrace.get(span.trace_id) ?? []
+              existing.push(normalizeTool(rawToolName))
+              toolsByTrace.set(span.trace_id, existing)
+            }
+          }
+        }
 
-  for (const e of events) {
-    if (e.type === 'user.message_rendered') {
-      userMsg = ((e.data.renderedMessage as string) ?? '').slice(0, 500)
-    }
-    if (e.type === 'user.message') {
-      const msg = (e.data.content as string) ?? ''
-      if (msg) userMsg = msg.slice(0, 500)
-    }
+        if (process.env['DEBUG_OTEL']) console.warn(`[OTel] Found ${chatSpanIds.length} chat spans`)
 
-    if (e.type === 'assistant.turn_start') {
-      currentTurnId = (e.data.turnId as string) ?? ''
-    }
+        // Yield one ParsedProviderCall per chat span
+        for (const spanId of chatSpanIds) {
+          const attrs = loadSpanAttributesFromTable(db, spanId)
 
-    if (e.type === 'tool.execution_start') {
-      const toolName = (e.data.toolName as string) ?? ''
-      const normalized = normalizeToolName(toolName)
-      if (normalized) {
-        const msgId = currentTurnId || 'unknown'
-        const existing = toolsByTurn.get(msgId) ?? []
-        existing.push(normalized)
-        toolsByTurn.set(msgId, existing)
-      }
-    }
+          // Get span metadata from the spans table
+          const spanMetadata = db.query<{ trace_id: string; start_time_ms: number; response_model: string | null }>(
+            `SELECT trace_id, start_time_ms, response_model FROM spans WHERE span_id = ?`,
+            [spanId]
+          )?.[0]
 
-    if (e.type === 'assistant.message') {
-      const data = e.data as { messageId?: string; content?: string; text?: string; reasoningText?: string; thinking?: { text?: string }; iterationNumber?: number; outputTokens?: number }
-      const contentText = data.text ?? data.content ?? ''
-      const reasoningText = data.reasoningText ?? data.thinking?.text ?? ''
-
-      // Skip empty messages (streaming placeholders)
-      if (contentText.length === 0 && reasoningText.length === 0) continue
-
-      // Use messageId if available, otherwise fall back to an incrementing index
-      // to avoid dedup collisions when messageId is absent.
-      const messageId = data.messageId ?? e.id ?? ''
-      const dedupId = messageId || String(msgIndex++)
-      const dedupKey = `copilot:jb:${sessionId}:${dedupId}:${data.iterationNumber ?? 0}`
-      if (seenKeys.has(dedupKey)) continue
-      seenKeys.add(dedupKey)
-
-      let outputTokens = data.outputTokens ?? 0
-      let reasoningTokens = 0
-      if (outputTokens === 0) {
-        outputTokens = Math.ceil(contentText.length / CHARS_PER_TOKEN)
-        reasoningTokens = Math.ceil(reasoningText.length / CHARS_PER_TOKEN)
-      }
+          if (!spanMetadata) {
+            if (process.env['DEBUG_OTEL']) console.warn(`[OTel] No metadata for span ${spanId}`)
+            continue
+          }
 
-      const inputTokens = Math.ceil(userMsg.length / CHARS_PER_TOKEN)
-      const tools = toolsByTurn.get(currentTurnId || messageId) ?? []
-      const costUSD = calculateCost(model, inputTokens, outputTokens + reasoningTokens, 0, 0, 0)
+          const model =
+            (attrs['gen_ai.response.model'] as string | undefined) ??
+            (attrs['gen_ai.request.model'] as string | undefined) ??
+            spanMetadata.response_model ??
+            'unknown'
 
-      results.push({
-        provider: 'copilot',
-        model,
-        inputTokens,
-        outputTokens,
-        cacheCreationInputTokens: 0,
-        cacheReadInputTokens: 0,
-        cachedInputTokens: 0,
-        reasoningTokens,
-        webSearchRequests: 0,
-        costUSD,
-        tools,
-        bashCommands: [],
-        timestamp: e.timestamp ?? '',
-        speed: 'standard',
-        deduplicationKey: dedupKey,
-        userMessage: userMsg,
-        sessionId,
-      })
+          const inputTokens = Number(attrs['gen_ai.usage.input_tokens'] ?? 0)
+          const outputTokens = Number(attrs['gen_ai.usage.output_tokens'] ?? 0)
+          const cacheReadTokens = Number(attrs['gen_ai.usage.cache_read.input_tokens'] ?? 0)
+          const cacheCreationTokens = Number(attrs['gen_ai.usage.cache_creation.input_tokens'] ?? 0)
 
-      // Only count user message once per assistant turn
-      userMsg = ''
-    }
-  }
+          if (process.env['DEBUG_OTEL']) console.warn(`[OTel] Span ${spanId.substring(0, 8)}: model=${model}, input=${inputTokens}, output=${outputTokens}, cache_read=${cacheReadTokens}, cache_creation=${cacheCreationTokens}`)
 
-  return results
-}
+          if (inputTokens === 0 && outputTokens === 0) {
+            if (process.env['DEBUG_OTEL']) console.warn(`[OTel] Skipping span with 0 tokens`)
+            continue
+          }
 
-function createParser(source: SessionSource, seenKeys: Set<string>): SessionParser {
-  return {
-    async *parse(): AsyncGenerator<ParsedProviderCall> {
-      const content = await readSessionFile(source.path)
-      if (content === null) return
-      const sessionId = basename(source.path, '.jsonl').length === 36
-        ? basename(source.path, '.jsonl')
-        : basename(dirname(source.path))
-
-      let calls: ParsedProviderCall[]
-      if (isTranscriptFormat(content)) {
-        calls = parseTranscriptEvents(content, sessionId, seenKeys)
-      } else if (isJetBrainsFormat(content)) {
-        calls = parseJetBrainsEvents(content, sessionId, seenKeys)
-        // Infer project name from tool paths now that content is loaded
-        const inferredProject = inferJBProjectFromContent(content)
-        if (inferredProject) {
-          for (const call of calls) {
-            call.project = inferredProject
+          // Dedup key uses span_id which is globally unique
+          const dedupKey = `copilot-otel:${spanId}`
+          if (seenKeys.has(dedupKey)) continue
+          seenKeys.add(dedupKey)
+
+          // Also add a JSONL-style dedupKey pattern so that if the same
+          // interaction appears in both OTel and JSONL, we don't double-count.
+          // We use the turn ID from Copilot attributes if available.
+          const turnId = attrs['github.copilot.chat.turn.id'] as string | undefined
+          if (turnId) {
+            const jsonlDedupKey = `copilot:${conversationId}:${turnId}`
+            seenKeys.add(jsonlDedupKey)
           }
-        }
-      } else {
-        calls = parseLegacyEvents(content, sessionId, seenKeys)
-      }
 
-      for (const call of calls) {
-        yield call
+          const tools = toolsByTrace.get(spanMetadata.trace_id) ?? []
+          const timestamp = epochToISO(spanMetadata.start_time_ms)
+
+          // calculateCost with FULL token data — this is the key improvement.
+          const costUSD = calculateCost(
+            model,
+            inputTokens,
+            outputTokens,
+            cacheCreationTokens,
+            cacheReadTokens,
+            0 // reasoningTokens — not exposed in current OTel schema
+          )
+
+          yield {
+            provider: 'copilot',
+            sessionId: conversationId,
+            model,
+            inputTokens,
+            outputTokens,
+            cacheCreationInputTokens: cacheCreationTokens,
+            cacheReadInputTokens: cacheReadTokens,
+            cachedInputTokens: 0,
+            reasoningTokens: 0,
+            webSearchRequests: 0,
+            costUSD,
+            tools,
+            bashCommands: [],
+            timestamp,
+            speed: 'standard' as const,
+            deduplicationKey: dedupKey,
+            userMessage: '', // Not available in OTel spans by default
+          }
+        }
+      } finally {
+        db.close()
       }
     },
   }
 }
 
-// --- Discovery ---
-
-function getCopilotSessionStateDir(override?: string): string {
-  return override ?? join(homedir(), '.copilot', 'session-state')
-}
-
-export function getVSCodeWorkspaceStorageDirs(homeDir = homedir(), platform = process.platform): string[] {
-  const pathJoin = platform === 'win32' ? win32.join : posix.join
-
-  if (platform === 'darwin') {
-    return [
-      pathJoin(homeDir, 'Library', 'Application Support', 'Code', 'User', 'workspaceStorage'),
-      pathJoin(homeDir, 'Library', 'Application Support', 'Code - Insiders', 'User', 'workspaceStorage'),
-      pathJoin(homeDir, 'Library', 'Application Support', 'VSCodium', 'User', 'workspaceStorage'),
-    ]
-  }
-
-  if (platform === 'win32') {
-    return [
-      pathJoin(homeDir, 'AppData', 'Roaming', 'Code', 'User', 'workspaceStorage'),
-      pathJoin(homeDir, 'AppData', 'Roaming', 'Code - Insiders', 'User', 'workspaceStorage'),
-      pathJoin(homeDir, 'AppData', 'Roaming', 'VSCodium', 'User', 'workspaceStorage'),
-    ]
-  }
+// ---------------------------------------------------------------------------
+// Extended SessionSource for OTel sessions
+// ---------------------------------------------------------------------------
 
-  return [
-    pathJoin(homeDir, '.config', 'Code', 'User', 'workspaceStorage'),
-    pathJoin(homeDir, '.config', 'Code - Insiders', 'User', 'workspaceStorage'),
-    pathJoin(homeDir, '.config', 'VSCodium', 'User', 'workspaceStorage'),
-    pathJoin(homeDir, '.vscode-server', 'data', 'User', 'workspaceStorage'),
-  ]
+interface OTelSessionSource extends SessionSource {
+  conversationId: string
+  sourceType: 'otel'
 }
 
-function parseCwd(yaml: string): string | null {
-  const match = yaml.match(/^cwd:\s*(.+)$/m)
-  if (!match?.[1]) return null
-  const raw = match[1]
-    .replace(/\s*#.*$/, '')
-    .replace(/^['"]|['"]$/g, '')
-    .trim()
-  return raw || null
+interface JsonlSessionSource extends SessionSource {
+  sourceType: 'jsonl'
 }
 
-async function readWorkspaceProject(workspaceDir: string): Promise<string> {
-  try {
-    const raw = await readFile(join(workspaceDir, 'workspace.json'), 'utf-8')
-    const data = JSON.parse(raw) as { folder?: string }
-    if (data.folder) {
-      const url = data.folder.replace(/^file:\/\//, '')
-      return basename(decodeURIComponent(url))
-    }
-  } catch {}
-  return basename(workspaceDir)
+function isOtelSource(source: SessionSource): source is OTelSessionSource {
+  return (source as OTelSessionSource).sourceType === 'otel'
 }
 
-function getJetBrainsSessionDir(override?: string): string {
-  return override ?? join(homedir(), '.copilot', 'jb')
-}
+// ---------------------------------------------------------------------------
+// Session discovery: JSONL (original)
+// ---------------------------------------------------------------------------
 
-async function discoverJetBrainsSessions(jbDir: string): Promise<SessionSource[]> {
-  const sources: SessionSource[] = []
+async function discoverJsonlSessions(
+  sessionStateDir: string
+): Promise<JsonlSessionSource[]> {
+  const sources: JsonlSessionSource[] = []
 
   let sessionDirs: string[]
   try {
-    sessionDirs = await readdir(jbDir)
+    sessionDirs = await readdir(sessionStateDir)
   } catch {
     return sources
   }
 
   for (const sessionId of sessionDirs) {
-    const sessionPath = join(jbDir, sessionId)
-    const s = await stat(sessionPath).catch(() => null)
-    if (!s?.isDirectory()) continue
+    const eventsPath = join(sessionStateDir, sessionId, 'events.jsonl')
+    const s = await stat(eventsPath).catch(() => null)
+    if (!s?.isFile()) continue
 
-    let partitions: string[]
+    let project = sessionId
     try {
-      partitions = await readdir(sessionPath)
+      const yaml = await readSessionFile(
+        join(sessionStateDir, sessionId, 'workspace.yaml')
+      )
+      const cwd = parseCwd(yaml ?? '')
+      if (cwd) project = basename(cwd)
     } catch {
-      continue
+      // workspace.yaml may not exist
     }
 
-    for (const file of partitions) {
-      if (!file.endsWith('.jsonl')) continue
-      const filePath = join(sessionPath, file)
-      const fs = await stat(filePath).catch(() => null)
-      if (!fs?.isFile()) continue
-      sources.push({ path: filePath, project: sessionId, provider: 'copilot' })
-    }
+    sources.push({
+      path: eventsPath,
+      project,
+      provider: 'copilot',
+      sourceType: 'jsonl',
+    })
   }
 
   return sources
 }
 
-/** Infer a project name from tool execution paths in already-loaded content. */
-function inferJBProjectFromContent(content: string): string | null {
-  // Split on either separator so the home-depth math lines up with the recorded
-  // tool path on every platform (JetBrains records Windows paths with
-  // backslashes, and homedir() also uses backslashes there). Using a fixed '/'
-  // for the path while splitting home on the platform sep mismatched on Windows
-  // and made inference always fall back to the raw session id there.
-  const homeParts = homedir().split(/[/\\]/)
-  const homeDepth = homeParts.length
-  const lines = content.split('\n')
-  const limit = Math.min(lines.length, 200)
-
-  for (let i = 0; i < limit; i++) {
-    const line = lines[i]
-    if (!line) continue
-    try {
-      const e = JSON.parse(line)
-      if (e.type === 'tool.execution_start') {
-        const args = e.data?.arguments
-        if (typeof args === 'object' && args !== null && typeof args.path === 'string') {
-          const pathVal: string = args.path
-          const parts = pathVal.split(/[/\\]/)
-          if (parts.length > homeDepth + 1) {
-            const afterHome = parts.slice(homeDepth)
-            if (afterHome.length >= 2) {
-              return basename(afterHome.slice(0, afterHome.length > 2 ? 2 : afterHome.length).join('/'))
-                || afterHome[0] || null
-            }
-            return afterHome[0] || null
-          }
-        }
-      }
-    } catch {
-      continue
-    }
-  }
-  return null
-}
+// ---------------------------------------------------------------------------
+// Session discovery: OTel SQLite
+// ---------------------------------------------------------------------------
 
-async function discoverLegacySessions(sessionStateDir: string): Promise<SessionSource[]> {
-  const sources: SessionSource[] = []
+async function discoverOtelSessions(
+  dbPath: string
+): Promise<OTelSessionSource[]> {
+  const sources: OTelSessionSource[] = []
 
-  let sessionDirs: string[]
+  // Lazy-load SQLite
+  let openDatabase: (path: string) => ReturnType<typeof import('../sqlite.js')['openDatabase']>
   try {
-    sessionDirs = await readdir(sessionStateDir)
+    const sqliteModule = await import('../sqlite.js')
+    openDatabase = sqliteModule.openDatabase
   } catch {
+    if (process.env['DEBUG_OTEL']) console.warn(`[OTel] Failed to import sqlite module`)
     return sources
   }
 
-  for (const sessionId of sessionDirs) {
-    const eventsPath = join(sessionStateDir, sessionId, 'events.jsonl')
-    const s = await stat(eventsPath).catch(() => null)
-    if (!s?.isFile()) continue
+  const db = openDatabase(dbPath)
+  if (!db) {
+    if (process.env['DEBUG_OTEL']) console.warn(`[OTel] Failed to open database`)
+    return sources
+  }
 
-    let project = sessionId
-    const yaml = await readSessionFile(join(sessionStateDir, sessionId, 'workspace.yaml'))
-    if (yaml !== null) {
-      const cwd = parseCwd(yaml)
-      if (cwd) project = basename(cwd)
-    }
+  try {
+    // Find all unique conversation IDs from spans that have the attribute.
+    // Join with span_attributes to find spans with 'gen_ai.conversation.id'.
+    const rows = db.query<{
+      conversation_id: string
+      project: string
+      min_start: number
+    }>(
+      `SELECT DISTINCT
+         sa_conv.value AS conversation_id,
+         COALESCE(sa_repo.value, 'copilot-chat') AS project,
+         MIN(s.start_time_ms) AS min_start
+       FROM spans s
+       LEFT JOIN span_attributes sa_conv 
+         ON s.span_id = sa_conv.span_id AND sa_conv.key = 'gen_ai.conversation.id'
+       LEFT JOIN span_attributes sa_repo 
+         ON s.span_id = sa_repo.span_id AND sa_repo.key = 'github.copilot.git.repository'
+       WHERE sa_conv.value IS NOT NULL
+       GROUP BY conversation_id
+       ORDER BY min_start DESC`
+    )
 
-    sources.push({ path: eventsPath, project, provider: 'copilot' })
-  }
+    if (process.env['DEBUG_OTEL']) console.warn(`[OTel] Discovery: Found ${rows.length} conversations`)
 
-  return sources
-}
+    for (const row of rows) {
+      if (!row.conversation_id) continue
 
-async function discoverVSCodeTranscripts(workspaceStorageDir: string): Promise<SessionSource[]> {
-  const sources: SessionSource[] = []
+      // Use the git repository name as the project, or fall back to 'copilot-chat'
+      let project = row.project ?? 'copilot-chat'
+      // Clean up repository URLs to just the repo name
+      if (project.includes('/')) {
+        project = basename(project.replace(/\.git$/, ''))
+      }
 
-  let workspaceDirs: string[]
-  try {
-    workspaceDirs = await readdir(workspaceStorageDir)
-  } catch {
-    return sources
+      sources.push({
+        path: dbPath,
+        project,
+        provider: 'copilot',
+        sourceType: 'otel',
+        conversationId: row.conversation_id,
+      })
+    }
+  } catch (e) {
+    // DB might have a different schema or be locked — fall through silently
+    if (process.env['DEBUG_OTEL']) console.warn(`[OTel] Discovery error:`, e)
+  } finally {
+    db.close()
   }
 
-  for (const wsDir of workspaceDirs) {
-    const transcriptsDir = join(workspaceStorageDir, wsDir, 'GitHub.copilot-chat', 'transcripts')
-    if (!existsSync(transcriptsDir)) continue
+  if (process.env['DEBUG_OTEL']) console.warn(`[OTel] Discovery complete: ${sources.length} sessions found`)
+  return sources
+}
 
-    const project = await readWorkspaceProject(join(workspaceStorageDir, wsDir))
+// ---------------------------------------------------------------------------
+// Provider factory
+// ---------------------------------------------------------------------------
+
+/**
+ * Returns the VS Code workspaceStorage directories for all VS Code variants
+ * (Code, Code Insiders, VSCodium) on the given platform. Used to discover
+ * transcript sessions written by the Copilot Chat extension.
+ *
+ * Accepts explicit `home` and `os` arguments so callers (and tests) can pass
+ * custom values without relying on process-level globals.
+ */
+export function getVSCodeWorkspaceStorageDirs(home: string, os: string): string[] {
+  const j = os === 'win32' ? win32.join : posix.join
+  if (os === 'darwin') {
+    return [
+      j(home, 'Library', 'Application Support', 'Code', 'User', 'workspaceStorage'),
+      j(home, 'Library', 'Application Support', 'Code - Insiders', 'User', 'workspaceStorage'),
+      j(home, 'Library', 'Application Support', 'VSCodium', 'User', 'workspaceStorage'),
+    ]
+  }
+  if (os === 'linux') {
+    return [
+      j(home, '.config', 'Code', 'User', 'workspaceStorage'),
+      j(home, '.config', 'Code - Insiders', 'User', 'workspaceStorage'),
+      j(home, '.config', 'VSCodium', 'User', 'workspaceStorage'),
+    ]
+  }
+  // win32
+  return [
+    j(home, 'AppData', 'Roaming', 'Code', 'User', 'workspaceStorage'),
+    j(home, 'AppData', 'Roaming', 'Code - Insiders', 'User', 'workspaceStorage'),
+    j(home, 'AppData', 'Roaming', 'VSCodium', 'User', 'workspaceStorage'),
+  ]
+}
 
-    let files: string[]
+// ---------------------------------------------------------------------------
+// Session discovery: VS Code workspace transcripts
+// ---------------------------------------------------------------------------
+
+/**
+ * Discover Copilot Chat transcript sessions stored in VS Code workspaceStorage.
+ * Structure: {wsDir}/{hash}/GitHub.copilot-chat/transcripts/{session}.jsonl
+ * Project is read from {wsDir}/{hash}/workspace.json (folder URI).
+ */
+async function discoverTranscriptSessions(
+  workspaceStorageDirs: string[]
+): Promise<JsonlSessionSource[]> {
+  const sources: JsonlSessionSource[] = []
+
+  for (const wsDir of workspaceStorageDirs) {
+    let hashDirs: string[]
     try {
-      files = await readdir(transcriptsDir)
+      hashDirs = await readdir(wsDir)
     } catch {
       continue
     }
 
-    for (const file of files) {
-      if (!file.endsWith('.jsonl')) continue
-      const filePath = join(transcriptsDir, file)
-      const s = await stat(filePath).catch(() => null)
-      if (!s?.isFile()) continue
-      sources.push({ path: filePath, project, provider: 'copilot' })
+    for (const hashDir of hashDirs) {
+      const transcriptsDir = join(wsDir, hashDir, 'GitHub.copilot-chat', 'transcripts')
+
+      // Resolve project name from workspace.json
+      let project = hashDir
+      try {
+        const wsJson = await readSessionFile(join(wsDir, hashDir, 'workspace.json'))
+        if (wsJson) {
+          const data = JSON.parse(wsJson) as { folder?: string }
+          if (typeof data.folder === 'string') {
+            // folder is a URI like 'file:///home/user/myapp' or 'file:///C:/Users/...'
+            const folder = data.folder.replace(/^file:\/\//, '').replace(/\/+$/, '')
+            const name = basename(folder)
+            if (name) project = name
+          }
+        }
+      } catch {
+        // workspace.json may be absent or malformed
+      }
+
+      let transcriptFiles: string[]
+      try {
+        transcriptFiles = await readdir(transcriptsDir)
+      } catch {
+        continue
+      }
+
+      for (const file of transcriptFiles) {
+        if (!file.endsWith('.jsonl')) continue
+        const s = await stat(join(transcriptsDir, file)).catch(() => null)
+        if (!s?.isFile()) continue
+        sources.push({
+          path: join(transcriptsDir, file),
+          project,
+          provider: 'copilot',
+          sourceType: 'jsonl',
+        })
+      }
     }
   }
 
   return sources
 }
 
-export function createCopilotProvider(sessionStateDir?: string, workspaceStorageDirOverride?: string, jbDirOverride?: string): Provider {
-  const legacyDir = getCopilotSessionStateDir(sessionStateDir)
-  const vscodeDirs = workspaceStorageDirOverride != null ? [workspaceStorageDirOverride] : getVSCodeWorkspaceStorageDirs()
-  const jbDir = getJetBrainsSessionDir(jbDirOverride)
+export function createCopilotProvider(sessionStateDir?: string, workspaceStorageDir?: string): Provider {
+  // jsonlDir is resolved lazily inside discoverSessions so that env-var
+  // overrides set after module load (e.g. in tests) are respected.
+
+  /**
+   * Returns the workspaceStorage directories to scan for transcript sessions.
+   * When workspaceStorageDir is explicitly provided (e.g. in tests), that single
+   * directory is used. The CODEBURN_COPILOT_WS_STORAGE_DIR env var provides a
+   * single-dir override (useful for tests). Otherwise all platform-default VS
+   * Code variant paths are returned.
+   */
+  function getWsDirs(): string[] {
+    if (workspaceStorageDir !== undefined) return [workspaceStorageDir]
+    const envDir = process.env['CODEBURN_COPILOT_WS_STORAGE_DIR']
+    if (envDir) return [envDir]
+    return getVSCodeWorkspaceStorageDirs(homedir(), platform())
+  }
 
   return {
     name: 'copilot',
     displayName: 'Copilot',
 
     modelDisplayName(model: string): string {
-      if (model === 'copilot-auto') return 'Copilot (auto)'
-      if (model === COPILOT_OPENAI_AUTO) return 'Copilot (OpenAI auto)'
-      if (model === COPILOT_ANTHROPIC_AUTO) return 'Copilot (Anthropic auto)'
-      for (const [key, name] of modelDisplayEntries) {
-        if (model === key || model.startsWith(key + '-')) return name
+      for (const [key, display] of modelDisplayEntries) {
+        if (model.includes(key)) return display
       }
       return model
     },
 
     toolDisplayName(rawTool: string): string {
-      return normalizeToolName(rawTool)
+      return normalizeTool(rawTool)
     },
 
     async discoverSessions(): Promise<SessionSource[]> {
-      const [legacy, jb, ...vscodeResults] = await Promise.all([
-        discoverLegacySessions(legacyDir),
-        discoverJetBrainsSessions(jbDir),
-        ...vscodeDirs.map(discoverVSCodeTranscripts),
-      ])
-      return [...legacy, ...jb, ...vscodeResults.flat()]
+      const sources: SessionSource[] = []
+
+      // 1. Discover OTel sessions (preferred — full token data)
+      const disableOtel = process.env['CODEBURN_COPILOT_DISABLE_OTEL'] === '1'
+      if (!disableOtel) {
+        const dbPath = getAgentTracesDbPath()
+        if (dbPath) {
+          if (process.env['DEBUG_OTEL']) console.warn(`[Provider] Discovering OTel sessions from ${dbPath}`)
+          try {
+            const otelSources = await discoverOtelSessions(dbPath)
+            if (process.env['DEBUG_OTEL']) console.warn(`[Provider] Got ${otelSources.length} OTel sources`)
+            sources.push(...otelSources)
+          } catch (e) {
+            // OTel discovery failed — fall through to JSONL
+            if (process.env['DEBUG_OTEL']) console.warn(`[Provider] OTel discovery error:`, e)
+          }
+        } else {
+          if (process.env['DEBUG_OTEL']) console.warn(`[Provider] No OTel DB path found`)
+        }
+      }
+
+      // 2. Discover JSONL sessions (fallback — output tokens only)
+      try {
+        const jsonlDir = getCopilotSessionStateDir(sessionStateDir)
+        const jsonlSources = await discoverJsonlSessions(jsonlDir)
+        if (process.env['DEBUG_OTEL']) console.warn(`[Provider] Got ${jsonlSources.length} JSONL sources`)
+        sources.push(...jsonlSources)
+      } catch {
+        // JSONL discovery failed
+      }
+
+      // 3. Discover VS Code workspace transcript sessions
+      try {
+        const transcriptSources = await discoverTranscriptSessions(getWsDirs())
+        if (process.env['DEBUG_OTEL']) console.warn(`[Provider] Got ${transcriptSources.length} transcript sources`)
+        sources.push(...transcriptSources)
+      } catch {
+        // Transcript discovery failed
+      }
+
+      if (process.env['DEBUG_OTEL']) console.warn(`[Provider] Total sources: ${sources.length}`)
+      return sources
     },
 
-    createSessionParser(source: SessionSource, seenKeys: Set<string>): SessionParser {
-      return createParser(source, seenKeys)
+    createSessionParser(
+      source: SessionSource,
+      seenKeys: Set<string>
+    ): SessionParser {
+      // Route to the correct parser based on source type.
+      // The dedup key set (seenKeys) is shared across both parsers,
+      // so if OTel already yielded a span, the JSONL parser will skip
+      // the matching assistant.message (and vice versa).
+      if (process.env['DEBUG_OTEL']) {
+        const isOtel = isOtelSource(source)
+        console.warn(`[Provider] Creating ${isOtel ? 'OTel' : 'JSONL'} parser for source: ${source.path}`)
+      }
+      if (isOtelSource(source)) {
+        return createOtelParser(source, seenKeys)
+      }
+      return createJsonlParser(source, seenKeys)
     },
   }
 }
 
+// Default export for the provider registry
 export const copilot = createCopilotProvider()
diff --git a/tests/otel-cache-aggregation.test.ts b/tests/otel-cache-aggregation.test.ts
new file mode 100644
index 00000000..78f6f50b
--- /dev/null
+++ b/tests/otel-cache-aggregation.test.ts
@@ -0,0 +1,210 @@
+// Regression test for the OTel multi-conversation cache overwrite bug.
+//
+// Root cause: `parseProviderSources` in parser.ts calls
+//   `delete section.files[source.path]`
+// at the START of every loop iteration over changedSources. When multiple OTel
+// conversations from the same agent-traces.db share the same path key, each
+// iteration wiped the merged turns accumulated by all previous iterations, so
+// only the LAST conversation's data survived — a ~434x cost undercount in
+// practice (observed: $0.19 vs ~$85 ground truth from OTel DB).
+//
+// This test exercises the full `parseAllSessions` pipeline to catch any future
+// regression at the aggregation layer, not just the provider-level parser.
+
+import { describe, it, expect, beforeEach, afterEach, vi } from 'vitest'
+import { mkdtemp, rm } from 'fs/promises'
+import { tmpdir } from 'os'
+import { join } from 'path'
+import { createRequire } from 'node:module'
+
+import { isSqliteAvailable } from '../src/sqlite.js'
+import { clearSessionCache, parseAllSessions } from '../src/parser.js'
+
+const requireForTest = createRequire(import.meta.url)
+
+type TestDb = {
+  exec(sql: string): void
+  prepare(sql: string): { run(...p: unknown[]): void }
+  close(): void
+}
+
+function createOtelDb(dbPath: string): void {
+  const { DatabaseSync } = requireForTest('node:sqlite') as { DatabaseSync: new (path: string) => TestDb }
+  const db = new DatabaseSync(dbPath)
+  db.exec(`
+    CREATE TABLE spans (
+      span_id        TEXT    PRIMARY KEY NOT NULL,
+      trace_id       TEXT    NOT NULL,
+      operation_name TEXT,
+      start_time_ms  INTEGER NOT NULL DEFAULT 0,
+      response_model TEXT
+    );
+    CREATE TABLE span_attributes (
+      id      INTEGER PRIMARY KEY AUTOINCREMENT,
+      span_id TEXT    NOT NULL,
+      key     TEXT    NOT NULL,
+      value   TEXT
+    );
+  `)
+  db.close()
+}
+
+interface ConvSpec {
+  spanId: string
+  traceId: string
+  convId: string
+  model: string
+  input: number
+  output: number
+  cacheRead: number
+  cacheCreate: number
+  startTimeMs?: number
+}
+
+function insertConversation(dbPath: string, spec: ConvSpec): void {
+  const { DatabaseSync } = requireForTest('node:sqlite') as { DatabaseSync: new (path: string) => TestDb }
+  const db = new DatabaseSync(dbPath)
+  db.prepare(
+    `INSERT INTO spans (span_id, trace_id, operation_name, start_time_ms, response_model)
+     VALUES (?, ?, ?, ?, ?)`
+  ).run(spec.spanId, spec.traceId, 'chat', spec.startTimeMs ?? Date.now(), spec.model)
+
+  const attrStmt = db.prepare(
+    `INSERT INTO span_attributes (span_id, key, value) VALUES (?, ?, ?)`
+  )
+  const attrs: Record<string, string | number> = {
+    'gen_ai.conversation.id':                   spec.convId,
+    'gen_ai.response.model':                    spec.model,
+    'gen_ai.usage.input_tokens':                spec.input,
+    'gen_ai.usage.output_tokens':               spec.output,
+    'gen_ai.usage.cache_read.input_tokens':     spec.cacheRead,
+    'gen_ai.usage.cache_creation.input_tokens': spec.cacheCreate,
+  }
+  for (const [key, value] of Object.entries(attrs)) {
+    attrStmt.run(spec.spanId, key, String(value))
+  }
+  db.close()
+}
+
+describe.skipIf(!isSqliteAvailable())(
+  'OTel multi-conversation cache aggregation (regression for 434x undercount)',
+  () => {
+    let tmpHome: string
+    let tmpCache: string
+    let dbPath: string
+    let prevHome: string | undefined
+    let prevCache: string | undefined
+
+    beforeEach(async () => {
+      tmpHome  = await mkdtemp(join(tmpdir(), 'cb-otel-agg-home-'))
+      tmpCache = await mkdtemp(join(tmpdir(), 'cb-otel-agg-cache-'))
+      dbPath   = join(tmpHome, 'agent-traces.db')
+
+      prevHome  = process.env['HOME']
+      prevCache = process.env['CODEBURN_CACHE_DIR']
+      process.env['HOME']              = tmpHome
+      process.env['CODEBURN_CACHE_DIR'] = tmpCache
+
+      vi.stubEnv('CODEBURN_COPILOT_OTEL_DB', dbPath)
+      vi.stubEnv('CODEBURN_COPILOT_DISABLE_OTEL', '')
+      // Redirect JSONL and transcript dirs to nonexistent paths so real
+      // developer session files don't contaminate the test results.
+      vi.stubEnv('CODEBURN_COPILOT_SESSION_STATE_DIR', join(tmpHome, 'no-jsonl'))
+      vi.stubEnv('CODEBURN_COPILOT_WS_STORAGE_DIR',   join(tmpHome, 'no-ws'))
+    })
+
+    afterEach(async () => {
+      clearSessionCache()
+      vi.unstubAllEnvs()
+      if (prevHome  === undefined) delete process.env['HOME']
+      else                          process.env['HOME'] = prevHome
+      if (prevCache === undefined) delete process.env['CODEBURN_CACHE_DIR']
+      else                          process.env['CODEBURN_CACHE_DIR'] = prevCache
+      await rm(tmpHome,  { recursive: true, force: true })
+      await rm(tmpCache, { recursive: true, force: true })
+    })
+
+    it('preserves cache tokens from all conversations, not just the last one', async () => {
+      // Pricing for claude-haiku-4-5 (per litellm-snapshot.json):
+      //   input:       $1.00 / M  → 1e-6
+      //   output:      $5.00 / M  → 5e-6
+      //   cache_read:  $0.10 / M  → 1e-7
+      //   cache_write: $1.25 / M  → 1.25e-6
+      createOtelDb(dbPath)
+
+      const conversations: ConvSpec[] = [
+        { spanId: 'span-1', traceId: 'trace-1', convId: 'conv-1', model: 'claude-haiku-4-5-20251001',
+          input: 1_000, output: 100, cacheRead: 50_000, cacheCreate: 500 },
+        { spanId: 'span-2', traceId: 'trace-2', convId: 'conv-2', model: 'claude-haiku-4-5-20251001',
+          input: 2_000, output: 200, cacheRead: 60_000, cacheCreate: 600 },
+        { spanId: 'span-3', traceId: 'trace-3', convId: 'conv-3', model: 'claude-haiku-4-5-20251001',
+          input: 3_000, output: 300, cacheRead: 70_000, cacheCreate: 700 },
+      ]
+      for (const c of conversations) insertConversation(dbPath, c)
+
+      const projects = await parseAllSessions(undefined, 'copilot')
+      const allCalls = projects
+        .flatMap(p => p.sessions)
+        .flatMap(s => s.turns)
+        .flatMap(t => t.assistantCalls)
+
+      // All three conversations must be present — before the fix only 1 survived.
+      expect(allCalls).toHaveLength(3)
+
+      const totalInput      = allCalls.reduce((s, c) => s + c.usage.inputTokens,                 0)
+      const totalOutput     = allCalls.reduce((s, c) => s + c.usage.outputTokens,                0)
+      const totalCacheRead  = allCalls.reduce((s, c) => s + c.usage.cacheReadInputTokens,        0)
+      const totalCacheCreate = allCalls.reduce((s, c) => s + c.usage.cacheCreationInputTokens,   0)
+
+      expect(totalInput).toBe(6_000)    // 1 000 + 2 000 + 3 000
+      expect(totalOutput).toBe(600)     // 100 + 200 + 300
+      expect(totalCacheRead).toBe(180_000)  // 50k + 60k + 70k — all must survive
+      expect(totalCacheCreate).toBe(1_800)  // 500 + 600 + 700
+
+      // Pre-fix regression check: if only the last conversation survived,
+      // totalCacheRead would be 70 000 (the last one). Assert it's 180 000.
+      expect(totalCacheRead).toBeGreaterThan(100_000)
+
+      // Cost sanity: input+output+cacheRead+cacheCreate with haiku-4-5 pricing
+      //   6000 * 1e-6   = 0.006
+      //   600  * 5e-6   = 0.003
+      //   180k * 1e-7   = 0.018
+      //   1800 * 1.25e-6 = 0.00225
+      //   total ≈ $0.029
+      const totalCostUSD = allCalls.reduce((s, c) => s + c.costUSD, 0)
+      expect(totalCostUSD).toBeCloseTo(0.029, 2)
+    })
+
+    it('second run from disk cache also delivers all conversations', async () => {
+      // Ensures the merged result written to the session-cache.json survives
+      // a reload and yields the same aggregated data on repeat invocations.
+      createOtelDb(dbPath)
+
+      const conversations: ConvSpec[] = [
+        { spanId: 'span-a', traceId: 'trace-a', convId: 'conv-a', model: 'claude-haiku-4-5-20251001',
+          input: 500, output: 50, cacheRead: 25_000, cacheCreate: 250 },
+        { spanId: 'span-b', traceId: 'trace-b', convId: 'conv-b', model: 'claude-haiku-4-5-20251001',
+          input: 500, output: 50, cacheRead: 25_000, cacheCreate: 250 },
+      ]
+      for (const c of conversations) insertConversation(dbPath, c)
+
+      // First run — parses and writes disk cache
+      await parseAllSessions(undefined, 'copilot')
+
+      // Clear in-memory cache only, leaving disk cache intact
+      clearSessionCache()
+
+      // Second run — should read from disk cache
+      const projects = await parseAllSessions(undefined, 'copilot')
+      const allCalls = projects
+        .flatMap(p => p.sessions)
+        .flatMap(s => s.turns)
+        .flatMap(t => t.assistantCalls)
+
+      expect(allCalls).toHaveLength(2)
+
+      const totalCacheRead = allCalls.reduce((s, c) => s + c.usage.cacheReadInputTokens, 0)
+      expect(totalCacheRead).toBe(50_000)  // 25k + 25k from both conversations
+    })
+  }
+)
diff --git a/tests/providers/copilot.test.ts b/tests/providers/copilot.test.ts
index e7a87a86..8dbe9d2f 100644
--- a/tests/providers/copilot.test.ts
+++ b/tests/providers/copilot.test.ts
@@ -1,9 +1,11 @@
-import { describe, it, expect, beforeEach, afterEach } from 'vitest'
+import { describe, it, expect, beforeEach, afterEach, vi } from 'vitest'
 import { mkdtemp, mkdir, writeFile, rm } from 'fs/promises'
 import { join, posix, win32 } from 'path'
 import { tmpdir } from 'os'
+import { createRequire } from 'node:module'
 
 import { copilot, createCopilotProvider, getVSCodeWorkspaceStorageDirs } from '../../src/providers/copilot.js'
+import { isSqliteAvailable } from '../../src/sqlite.js'
 import type { ParsedProviderCall } from '../../src/providers/types.js'
 
 let tmpDir: string
@@ -363,10 +365,13 @@ describe('copilot provider - JSONL parsing', () => {
 describe('copilot provider - discoverSessions', () => {
   beforeEach(async () => {
     tmpDir = await mkdtemp(join(tmpdir(), 'copilot-test-'))
+    // Disable OTel discovery so tests aren't contaminated by real sessions
+    vi.stubEnv('CODEBURN_COPILOT_DISABLE_OTEL', '1')
   })
 
   afterEach(async () => {
     await rm(tmpDir, { recursive: true, force: true })
+    vi.unstubAllEnvs()
   })
 
   it('discovers sessions from directory', async () => {
@@ -481,85 +486,295 @@ describe('copilot provider - metadata', () => {
   })
 })
 
-// JetBrains (IntelliJ/DataGrip) format, added in #433. Discovery + parsing,
-// the isJetBrainsFormat routing guard, and the id-less dedup fallback.
-describe('copilot provider - JetBrains format', () => {
+// ---------------------------------------------------------------------------
+// OTel cache token tests
+//
+// These tests verify that the OTel SQLite parser correctly extracts
+// cacheReadInputTokens and cacheCreationInputTokens from the agent-traces.db
+// schema, and that multiple conversations from the same DB file are each
+// parsed independently with their full cache token data intact.
+//
+// This is the regression guard for the bug documented in DEBUG_HANDOFF.md:
+// cache tokens were extracted during parsing but lost in aggregation because
+// all conversations shared the same file path key in the session cache.
+// ---------------------------------------------------------------------------
+
+const requireForTest = createRequire(import.meta.url)
+
+type TestDb = {
+  exec(sql: string): void
+  prepare(sql: string): { run(...params: unknown[]): void }
+  close(): void
+}
+
+/** Creates a minimal agent-traces.db schema matching the VS Code Copilot Chat OTel store. */
+function createOtelDb(dbPath: string): void {
+  const { DatabaseSync } = requireForTest('node:sqlite') as { DatabaseSync: new (path: string) => TestDb }
+  const db = new DatabaseSync(dbPath)
+  db.exec(`
+    CREATE TABLE spans (
+      span_id      TEXT PRIMARY KEY NOT NULL,
+      trace_id     TEXT NOT NULL,
+      operation_name TEXT,
+      start_time_ms INTEGER NOT NULL DEFAULT 0,
+      response_model TEXT
+    );
+    CREATE TABLE span_attributes (
+      id      INTEGER PRIMARY KEY AUTOINCREMENT,
+      span_id TEXT NOT NULL,
+      key     TEXT NOT NULL,
+      value   TEXT
+    );
+  `)
+  db.close()
+}
+
+interface SpanDef {
+  spanId: string
+  traceId: string
+  operationName: string
+  startTimeMs?: number
+  responseModel?: string
+  attrs: Record<string, string | number>
+}
+
+function insertSpan(dbPath: string, span: SpanDef): void {
+  const { DatabaseSync } = requireForTest('node:sqlite') as { DatabaseSync: new (path: string) => TestDb }
+  const db = new DatabaseSync(dbPath)
+  db.prepare(
+    `INSERT INTO spans (span_id, trace_id, operation_name, start_time_ms, response_model)
+     VALUES (?, ?, ?, ?, ?)`
+  ).run(span.spanId, span.traceId, span.operationName, span.startTimeMs ?? 0, span.responseModel ?? null)
+  const attrStmt = db.prepare(
+    `INSERT INTO span_attributes (span_id, key, value) VALUES (?, ?, ?)`
+  )
+  for (const [key, value] of Object.entries(span.attrs)) {
+    attrStmt.run(span.spanId, key, String(value))
+  }
+  db.close()
+}
+
+describe('copilot provider - OTel cache token parsing', () => {
+  let tmpDir: string
+  let dbPath: string
+
   beforeEach(async () => {
-    tmpDir = await mkdtemp(join(tmpdir(), 'copilot-jb-'))
+    tmpDir = await mkdtemp(join(tmpdir(), 'copilot-otel-test-'))
+    dbPath = join(tmpDir, 'agent-traces.db')
+    vi.stubEnv('CODEBURN_COPILOT_OTEL_DB', dbPath)
+    vi.stubEnv('CODEBURN_COPILOT_DISABLE_OTEL', '')
   })
+
   afterEach(async () => {
     await rm(tmpDir, { recursive: true, force: true })
-  })
+    vi.unstubAllEnvs()
+  })
+
+  it('skips tests when node:sqlite is unavailable', () => {
+    if (!isSqliteAvailable()) return
+    // Placeholder — subsequent tests use isSqliteAvailable guard
+  })
+
+  it('extracts cache tokens from a single OTel conversation', async () => {
+    if (!isSqliteAvailable()) return
+
+    createOtelDb(dbPath)
+    insertSpan(dbPath, {
+      spanId: 'span-001',
+      traceId: 'trace-001',
+      operationName: 'chat',
+      startTimeMs: 1000,
+      responseModel: 'gpt-4.1',
+      attrs: {
+        'gen_ai.conversation.id': 'conv-001',
+        'gen_ai.response.model': 'gpt-4.1',
+        'gen_ai.usage.input_tokens': 1000,
+        'gen_ai.usage.output_tokens': 200,
+        'gen_ai.usage.cache_read.input_tokens': 50000,
+        'gen_ai.usage.cache_creation.input_tokens': 500,
+      },
+    })
 
-  const jbUser = (text: string) =>
-    JSON.stringify({ type: 'user.message_rendered', data: { renderedMessage: text } })
-  const jbTurnStart = (turnId: string) =>
-    JSON.stringify({ type: 'assistant.turn_start', data: { turnId } })
-  const jbToolStart = (toolName: string, toolCallId: string, path?: string) =>
-    JSON.stringify({ type: 'tool.execution_start', data: { toolName, toolCallId, arguments: path ? { path } : {} } })
-  const jbAssistant = (opts: { messageId?: string; text?: string; outputTokens?: number; iterationNumber?: number }) =>
-    JSON.stringify({ type: 'assistant.message', data: { ...opts } })
-
-  async function writeJbSession(workspaceId: string, lines: string[]) {
-    const dir = join(tmpDir, workspaceId)
-    await mkdir(dir, { recursive: true })
-    const filePath = join(dir, 'chat.jsonl')
-    await writeFile(filePath, lines.join('\n') + '\n')
-    return filePath
-  }
+    const provider = createCopilotProvider('/nonexistent/jsonl', '/nonexistent/ws')
+    const sources = await provider.discoverSessions()
+
+    const otelSources = sources.filter(s => s.path === dbPath)
+    expect(otelSources).toHaveLength(1)
+    expect(otelSources[0]!.provider).toBe('copilot')
 
-  async function parse(filePath: string, seen = new Set<string>()) {
-    const provider = createCopilotProvider('/nonexistent/legacy', '/nonexistent/vscode', tmpDir)
-    const source = { path: filePath, project: 'p', provider: 'copilot' }
     const calls: ParsedProviderCall[] = []
-    for await (const call of provider.createSessionParser(source, seen).parse()) calls.push(call)
-    return calls
-  }
+    for await (const call of provider.createSessionParser(otelSources[0]!, new Set()).parse()) {
+      calls.push(call)
+    }
+
+    expect(calls).toHaveLength(1)
+    const call = calls[0]!
+    expect(call.model).toBe('gpt-4.1')
+    expect(call.inputTokens).toBe(1000)
+    expect(call.outputTokens).toBe(200)
+    expect(call.cacheReadInputTokens).toBe(50000)
+    expect(call.cacheCreationInputTokens).toBe(500)
+    expect(call.costUSD).toBeGreaterThan(0)
+  })
+
+  it('discovers one source per conversation from the same DB file', async () => {
+    if (!isSqliteAvailable()) return
+
+    createOtelDb(dbPath)
 
-  it('discovers a JetBrains chat.jsonl under the jb dir', async () => {
-    const filePath = await writeJbSession('ws-abc', [jbUser('hello'), jbAssistant({ messageId: 'm1', text: 'hi', outputTokens: 10 })])
-    const provider = createCopilotProvider('/nonexistent/legacy', '/nonexistent/vscode', tmpDir)
+    // Two independent conversations in the same DB
+    insertSpan(dbPath, {
+      spanId: 'span-a1', traceId: 'trace-a', operationName: 'chat', startTimeMs: 1000,
+      attrs: {
+        'gen_ai.conversation.id': 'conv-alpha',
+        'gen_ai.response.model': 'gpt-4.1',
+        'gen_ai.usage.input_tokens': 800,
+        'gen_ai.usage.output_tokens': 100,
+        'gen_ai.usage.cache_read.input_tokens': 40000,
+        'gen_ai.usage.cache_creation.input_tokens': 400,
+      },
+    })
+    insertSpan(dbPath, {
+      spanId: 'span-b1', traceId: 'trace-b', operationName: 'chat', startTimeMs: 2000,
+      attrs: {
+        'gen_ai.conversation.id': 'conv-beta',
+        'gen_ai.response.model': 'claude-sonnet-4',
+        'gen_ai.usage.input_tokens': 600,
+        'gen_ai.usage.output_tokens': 80,
+        'gen_ai.usage.cache_read.input_tokens': 30000,
+        'gen_ai.usage.cache_creation.input_tokens': 300,
+      },
+    })
+
+    const provider = createCopilotProvider('/nonexistent/jsonl', '/nonexistent/ws')
     const sources = await provider.discoverSessions()
-    expect(sources.some(s => s.path === filePath && s.provider === 'copilot')).toBe(true)
+
+    const otelSources = sources.filter(s => s.path === dbPath)
+    // Exactly one source per conversation, both pointing to the same DB file
+    expect(otelSources).toHaveLength(2)
+    expect(otelSources.every(s => s.path === dbPath)).toBe(true)
+    // Each conversation should have a distinct identity (provider routes by conversationId)
+    const convIds = otelSources.map(s => (s as { conversationId?: string }).conversationId)
+    expect(new Set(convIds).size).toBe(2)
+  })
+
+  it('preserves cache tokens when parsing multiple conversations from one DB', async () => {
+    if (!isSqliteAvailable()) return
+
+    createOtelDb(dbPath)
+
+    insertSpan(dbPath, {
+      spanId: 'span-c1', traceId: 'trace-c', operationName: 'chat', startTimeMs: 1000,
+      attrs: {
+        'gen_ai.conversation.id': 'conv-c',
+        'gen_ai.response.model': 'gpt-4.1',
+        'gen_ai.usage.input_tokens': 500,
+        'gen_ai.usage.output_tokens': 100,
+        'gen_ai.usage.cache_read.input_tokens': 20000,
+        'gen_ai.usage.cache_creation.input_tokens': 200,
+      },
+    })
+    insertSpan(dbPath, {
+      spanId: 'span-d1', traceId: 'trace-d', operationName: 'chat', startTimeMs: 2000,
+      attrs: {
+        'gen_ai.conversation.id': 'conv-d',
+        'gen_ai.response.model': 'gpt-4.1',
+        'gen_ai.usage.input_tokens': 700,
+        'gen_ai.usage.output_tokens': 150,
+        'gen_ai.usage.cache_read.input_tokens': 35000,
+        'gen_ai.usage.cache_creation.input_tokens': 350,
+      },
+    })
+
+    const provider = createCopilotProvider('/nonexistent/jsonl', '/nonexistent/ws')
+    const sources = await provider.discoverSessions()
+    const otelSources = sources.filter(s => s.path === dbPath)
+    expect(otelSources).toHaveLength(2)
+
+    // Parse all sources; each must carry its own cache tokens
+    const seenKeys = new Set<string>()
+    const allCalls: ParsedProviderCall[] = []
+    for (const src of otelSources) {
+      for await (const call of provider.createSessionParser(src, seenKeys).parse()) {
+        allCalls.push(call)
+      }
+    }
+
+    expect(allCalls).toHaveLength(2)
+
+    const totalCacheRead = allCalls.reduce((sum, c) => sum + c.cacheReadInputTokens, 0)
+    const totalCacheCreate = allCalls.reduce((sum, c) => sum + c.cacheCreationInputTokens, 0)
+
+    // Both conversations' cache tokens must survive end-to-end
+    expect(totalCacheRead).toBe(55000)   // 20000 + 35000
+    expect(totalCacheCreate).toBe(550)   // 200 + 350
   })
 
-  it('parses a JetBrains session into a call with the inferred model and user message', async () => {
-    const filePath = await writeJbSession('ws-abc', [
-      jbUser('implement the feature'),
-      jbTurnStart('t1'),
-      jbToolStart('read_file', 'toolu_vrtx_x'),
-      jbAssistant({ messageId: 'm1', text: 'done', outputTokens: 42 }),
-    ])
-    const calls = await parse(filePath)
+  it('includes tool names from execute_tool spans in the same trace', async () => {
+    if (!isSqliteAvailable()) return
+
+    createOtelDb(dbPath)
+    // chat span
+    insertSpan(dbPath, {
+      spanId: 'span-e1', traceId: 'trace-e', operationName: 'chat', startTimeMs: 1000,
+      attrs: {
+        'gen_ai.conversation.id': 'conv-e',
+        'gen_ai.response.model': 'gpt-4.1',
+        'gen_ai.usage.input_tokens': 300,
+        'gen_ai.usage.output_tokens': 50,
+        'gen_ai.usage.cache_read.input_tokens': 10000,
+        'gen_ai.usage.cache_creation.input_tokens': 100,
+      },
+    })
+    // execute_tool span in the same trace
+    insertSpan(dbPath, {
+      spanId: 'span-e2', traceId: 'trace-e', operationName: 'execute_tool', startTimeMs: 1500,
+      attrs: {
+        'gen_ai.tool.name': 'readFile',
+      },
+    })
+
+    const provider = createCopilotProvider('/nonexistent/jsonl', '/nonexistent/ws')
+    const sources = await provider.discoverSessions()
+    const src = sources.find(s => s.path === dbPath)
+    expect(src).toBeDefined()
+
+    const calls: ParsedProviderCall[] = []
+    for await (const call of provider.createSessionParser(src!, new Set()).parse()) {
+      calls.push(call)
+    }
+
     expect(calls).toHaveLength(1)
-    expect(calls[0]!.provider).toBe('copilot')
-    expect(calls[0]!.model).toBe('copilot-anthropic-auto') // toolu_ prefix -> Anthropic
-    expect(calls[0]!.outputTokens).toBe(42)
-    expect(calls[0]!.userMessage).toBe('implement the feature')
-    expect(calls[0]!.tools).toEqual(['Read'])
-    expect(calls[0]!.deduplicationKey.startsWith('copilot:jb:')).toBe(true)
-  })
+    expect(calls[0]!.tools).toContain('Read')
+    expect(calls[0]!.cacheReadInputTokens).toBe(10000)
+  })
+
+  it('skips OTel spans with zero input and output tokens', async () => {
+    if (!isSqliteAvailable()) return
+
+    createOtelDb(dbPath)
+    insertSpan(dbPath, {
+      spanId: 'span-f1', traceId: 'trace-f', operationName: 'chat', startTimeMs: 1000,
+      attrs: {
+        'gen_ai.conversation.id': 'conv-f',
+        'gen_ai.response.model': 'gpt-4.1',
+        'gen_ai.usage.input_tokens': 0,
+        'gen_ai.usage.output_tokens': 0,
+        'gen_ai.usage.cache_read.input_tokens': 50000,
+        'gen_ai.usage.cache_creation.input_tokens': 500,
+      },
+    })
 
-  it('does NOT route a legacy file (first line user.message) to the JetBrains parser', async () => {
-    // Regression guard: isJetBrainsFormat must not match bare user.message.
-    const filePath = await writeJbSession('ws-legacy', [
-      JSON.stringify({ type: 'user.message', data: { content: 'hi' } }),
-      JSON.stringify({ type: 'session.model_change', data: { newModel: 'gpt-4.1' } }),
-      JSON.stringify({ type: 'assistant.message', data: { messageId: 'm1', outputTokens: 5 } }),
-    ])
-    const calls = await parse(filePath)
-    // Parsed by the legacy parser -> legacy dedup key, not a jb one.
-    expect(calls.every(c => !c.deduplicationKey.startsWith('copilot:jb:'))).toBe(true)
-  })
+    const provider = createCopilotProvider('/nonexistent/jsonl', '/nonexistent/ws')
+    const sources = await provider.discoverSessions()
+    const src = sources.find(s => s.path === dbPath)
+    expect(src).toBeDefined()
 
-  it('does not collapse id-less assistant messages (dedup fallback)', async () => {
-    const filePath = await writeJbSession('ws-noid', [
-      jbUser('q1'),
-      jbAssistant({ text: 'a1', outputTokens: 5 }),
-      jbAssistant({ text: 'a2', outputTokens: 6 }),
-    ])
-    const calls = await parse(filePath)
-    expect(calls).toHaveLength(2)
-    expect(new Set(calls.map(c => c.deduplicationKey)).size).toBe(2)
+    const calls: ParsedProviderCall[] = []
+    for await (const call of provider.createSessionParser(src!, new Set()).parse()) {
+      calls.push(call)
+    }
+    // Span with zero input AND output tokens is skipped
+    expect(calls).toHaveLength(0)
   })
 })