fix: use backend thread token usage for header total (#2800)

* fix: use backend thread token usage for header total
* Refactor thread token usage fetch
2026-05-25 09:26:00 +00:00 · 2026-05-09 19:40:32 +08:00
parent 881ff71252
commit 417416087b
16 changed files with 540 additions and 35 deletions
@@ -310,7 +310,7 @@ export const enUS: Translations = {
    unavailable:
      "No token usage yet. Usage appears only after a successful model response when the provider returns usage_metadata.",
    unavailableShort: "No usage returned",
-    note: "Shown from provider-returned usage_metadata. Totals are best-effort conversation totals and may differ from provider billing pages.",
+    note: "Header totals use persisted thread usage when available. Per-turn and debug usage come from visible messages. Totals may differ from provider billing pages.",
    presets: {
      off: "Off",
      summary: "Summary",