fix(cost): make cost telemetry survive non-Anthropic models

leifericf · claude · leifericf · commit 8ea8da1c9064 · 2026-05-03T13:34:19.000+02:00
llm-cost-by-model and llm-cost-total returned empty against a fully
analyzed db with 358 analyze txes. Three compounding bugs:

1. model-pricing keyed by date-stamped ids
   Provider responses now carry undated model names ("claude-sonnet-4-6"
   from the LevelInfinite/Tencent gateway, "glm-4.6" from Z.ai). The
   pricing table only had "claude-sonnet-4-6-20250514" etc., so lookup
   missed every response and estimate-cost returned 0.0. Switched to
   prefix-match against undated keys so both bare and date-stamped
   ids hit. Also added claude-opus-4-7.

2. :tx/cost-usd asserted only when (pos? cost)
   With cost=0 for GLM-quota and now-misnamed Claude responses, the
   attribute was never written. Drop the guard — write 0.0 explicitly
   so the schema is uniform across txes.

3. cost queries used bare datalog clauses
   [?tx :tx/cost-usd ?cost] silently excludes any tx without the attr,
   which (after the bugs above) was every tx. Switch to get-else with
   0.0 default. llm-cost-total also gains a :tx/op anchor (analyze or
   synthesize) so it doesn't pull in import/enrich/seed rows that
   never had token attributes.

Probed both providers directly: neither GLM nor Tencent returns a cost
field in usage — they relay Anthropic-format JSON unchanged. The fix is
local pricing and local query hygiene, nothing provider-side.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
diff --git a/resources/queries/llm-cost-by-model.edn b/resources/queries/llm-cost-by-model.edn
@@ -3,6 +3,6 @@
  :query [:find ?model (sum ?in) (sum ?out) (sum ?cost)
          :where
          [?tx :tx/model ?model]
-         [?tx :tx/input-tokens ?in]
-         [?tx :tx/output-tokens ?out]
-         [?tx :tx/cost-usd ?cost]]}
+         [(get-else $ ?tx :tx/input-tokens 0) ?in]
+         [(get-else $ ?tx :tx/output-tokens 0) ?out]
+         [(get-else $ ?tx :tx/cost-usd 0.0) ?cost]]}
diff --git a/resources/queries/llm-cost-total.edn b/resources/queries/llm-cost-total.edn
@@ -2,6 +2,8 @@
  :description "Total LLM token usage and estimated cost"
  :query [:find (sum ?in) (sum ?out) (sum ?cost)
          :where
-         [?tx :tx/input-tokens ?in]
-         [?tx :tx/output-tokens ?out]
-         [?tx :tx/cost-usd ?cost]]}
+         [?tx :tx/op ?op]
+         [(contains? #{:analyze :synthesize} ?op)]
+         [(get-else $ ?tx :tx/input-tokens 0) ?in]
+         [(get-else $ ?tx :tx/output-tokens 0) ?out]
+         [(get-else $ ?tx :tx/cost-usd 0.0) ?cost]]}
diff --git a/src/noumenon/analyze.clj b/src/noumenon/analyze.clj
@@ -315,10 +315,10 @@
              :tx/analyzer        (or analyzer "noumenon.analyze/0.1.0")
              :prov/model-version (or model-version "unknown")
              :prov/prompt-hash   (or prompt-hash-val "")
-             :prov/analyzed-at   (Date.)}
+             :prov/analyzed-at   (Date.)
+             :tx/cost-usd        cost}
       (:input-tokens usage)  (assoc :tx/input-tokens (:input-tokens usage))
-      (:output-tokens usage) (assoc :tx/output-tokens (:output-tokens usage))
-      (pos? cost)            (assoc :tx/cost-usd cost))))
+      (:output-tokens usage) (assoc :tx/output-tokens (:output-tokens usage)))))
 
 (defn analysis->tx-data
   "Convert a parsed analysis map into Datomic tx-data for a file.
diff --git a/src/noumenon/llm.clj b/src/noumenon/llm.clj
@@ -85,16 +85,22 @@
 ;; --- Pricing ---
 
 (def model-pricing
-  "Per-token pricing in $/1M tokens. Only for direct Anthropic API models.
-   GLM uses quota-based pricing so is not listed here."
-  {"claude-sonnet-4-6-20250514" {:input 3.0  :output 15.0}
-   "claude-haiku-4-5-20251001"  {:input 0.80 :output 4.0}
-   "claude-opus-4-6-20250514"   {:input 15.0 :output 75.0}})
+  "Per-token pricing in $/1M tokens for direct Anthropic API models.
+   Keys are matched as prefixes against the model id returned by the
+   provider, so both bare names (claude-sonnet-4-6) and date-stamped
+   ids (claude-sonnet-4-6-20250514) hit the same entry. GLM and other
+   quota-priced providers return 0."
+  {"claude-sonnet-4-6" {:input 3.0  :output 15.0}
+   "claude-haiku-4-5"  {:input 0.80 :output 4.0}
+   "claude-opus-4-6"   {:input 15.0 :output 75.0}
+   "claude-opus-4-7"   {:input 15.0 :output 75.0}})
 
 (defn estimate-cost
   "Estimate USD cost for given model and token counts. Returns 0.0 for unknown models."
   [model-id input-tokens output-tokens]
-  (if-let [{:keys [input output]} (model-pricing model-id)]
+  (if-let [{:keys [input output]} (some (fn [[k v]]
+                                          (when (and model-id (str/starts-with? model-id k)) v))
+                                        model-pricing)]
     (+ (* input-tokens (/ input 1e6))
        (* output-tokens (/ output 1e6)))
     0.0))
diff --git a/src/noumenon/synthesize.clj b/src/noumenon/synthesize.clj
@@ -547,11 +547,11 @@
              :tx/provider (or provider "unknown")
              :tx/model-source model-source
              :tx/model (or resolved-model model-id "unknown")
+             :tx/cost-usd cost
              :prov/prompt-hash prompt-hash
              :prov/analyzed-at (Date.)}
       (:input-tokens usage)  (assoc :tx/input-tokens (:input-tokens usage))
-      (:output-tokens usage) (assoc :tx/output-tokens (:output-tokens usage))
-      (pos? cost)            (assoc :tx/cost-usd cost))))
+      (:output-tokens usage) (assoc :tx/output-tokens (:output-tokens usage)))))
 
 (defn- transact-and-finalize!
   "Retract old synthesis, transact new components, derive deps. Returns result map."