Fix AI span Tools tab, LLM total-token accounting, pricing-tier selection, and admin model form errors

ericallam · ericallam · commit 622bee1997e8 · 2026-03-13T15:21:43.000Z
diff --git a/apps/webapp/app/components/runs/v3/ai/AISpanDetails.tsx b/apps/webapp/app/components/runs/v3/ai/AISpanDetails.tsx
@@ -16,8 +16,7 @@ export function AISpanDetails({
   rawProperties?: string;
 }) {
   const [tab, setTab] = useState<AITab>("overview");
-  const hasTools =
-    (aiData.toolDefinitions && aiData.toolDefinitions.length > 0) || aiData.toolCount != null;
+  const toolCount = aiData.toolCount ?? aiData.toolDefinitions?.length ?? 0;
 
   return (
     <div className="flex h-full flex-col overflow-hidden">
@@ -40,16 +39,14 @@ export function AISpanDetails({
           >
             Messages
           </TabButton>
-          {hasTools && (
-            <TabButton
-              isActive={tab === "tools"}
-              layoutId="ai-span"
-              onClick={() => setTab("tools")}
-              shortcut={{ key: "t" }}
-            >
-              Tools{aiData.toolCount != null ? ` (${aiData.toolCount})` : ""}
-            </TabButton>
-          )}
+          <TabButton
+            isActive={tab === "tools"}
+            layoutId="ai-span"
+            onClick={() => setTab("tools")}
+            shortcut={{ key: "t" }}
+          >
+            Tools{toolCount > 0 ? ` (${toolCount})` : ""}
+          </TabButton>
         </TabContainer>
       </div>
 
diff --git a/apps/webapp/app/routes/admin.llm-models.$modelId.tsx b/apps/webapp/app/routes/admin.llm-models.$modelId.tsx
@@ -1,4 +1,4 @@
-import { Form, useNavigate } from "@remix-run/react";
+import { Form, useActionData, useNavigate } from "@remix-run/react";
 import type { ActionFunctionArgs, LoaderFunctionArgs } from "@remix-run/server-runtime";
 import { redirect } from "@remix-run/server-runtime";
 import { typedjson, useTypedLoaderData } from "remix-typedjson";
@@ -130,6 +130,7 @@ export async function action({ request, params }: ActionFunctionArgs) {
 
 export default function AdminLlmModelDetailRoute() {
   const { model } = useTypedLoaderData<typeof loader>();
+  const actionData = useActionData<{ success?: boolean; error?: string; details?: unknown[] }>();
   const navigate = useNavigate();
 
   const [modelName, setModelName] = useState(model.modelName);
@@ -273,6 +274,17 @@ export default function AdminLlmModelDetailRoute() {
               ))}
             </div>
 
+            {actionData?.error && (
+              <div className="rounded-md bg-red-500/10 border border-red-500/30 p-3 text-sm text-red-400">
+                {actionData.error}
+                {actionData.details && (
+                  <pre className="mt-1 text-xs text-red-300/70 overflow-auto">
+                    {JSON.stringify(actionData.details, null, 2)}
+                  </pre>
+                )}
+              </div>
+            )}
+
             {/* Actions */}
             <div className="flex items-center gap-2 border-t border-grid-dimmed pt-4">
               <Button type="submit" variant="primary/medium">
diff --git a/apps/webapp/app/v3/querySchemas.ts b/apps/webapp/app/v3/querySchemas.ts
@@ -746,7 +746,6 @@ export const llmUsageSchema: TableSchema = {
         description:
           "Key-value metadata from run tags (key:value format) and AI SDK telemetry metadata. Access keys with dot notation (metadata.userId) or bracket syntax (metadata['userId']).",
         example: "{'userId':'user_123','org':'acme'}",
-        coreColumn: true,
       }),
     },
   },
diff --git a/apps/webapp/app/v3/utils/enrichCreatableEvents.server.ts b/apps/webapp/app/v3/utils/enrichCreatableEvents.server.ts
@@ -79,7 +79,7 @@ function enrichLlmCost(event: CreateEventInput): void {
   // Add style accessories for model and tokens (even without cost data)
   const inputTokens = usageDetails["input"] ?? 0;
   const outputTokens = usageDetails["output"] ?? 0;
-  const totalTokens = inputTokens + outputTokens;
+  const totalTokens = usageDetails["total"] ?? inputTokens + outputTokens;
 
   const pillItems: Array<{ text: string; icon: string }> = [
     { text: responseModel, icon: "tabler-cube" },
@@ -165,7 +165,7 @@ function enrichLlmCost(event: CreateEventInput): void {
     pricingTierName: cost?.pricingTierName ?? (providerCost ? `${providerCost.source} reported` : ""),
     inputTokens: usageDetails["input"] ?? 0,
     outputTokens: usageDetails["output"] ?? 0,
-    totalTokens: Object.values(usageDetails).reduce((sum, v) => sum + v, 0),
+    totalTokens: usageDetails["total"] ?? (usageDetails["input"] ?? 0) + (usageDetails["output"] ?? 0),
     usageDetails,
     inputCost: cost?.inputCost ?? 0,
     outputCost: cost?.outputCost ?? 0,
diff --git a/apps/webapp/test/otlpExporter.test.ts b/apps/webapp/test/otlpExporter.test.ts
@@ -638,5 +638,69 @@ describe("OTLPExporter", () => {
       expect($events[0]._llmUsage.inputTokens).toBe(500);
       expect($events[0]._llmUsage.outputTokens).toBe(100);
     });
+
+    it("should prefer gen_ai.usage.total_tokens over input+output sum", () => {
+      const events = [
+        makeGenAiEvent({
+          "gen_ai.usage.input_tokens": 100,
+          "gen_ai.usage.output_tokens": 50,
+          "gen_ai.usage.total_tokens": 200, // higher than 100+50 (e.g. includes cached/reasoning)
+        }),
+      ];
+
+      // @ts-expect-error
+      const $events = enrichCreatableEvents(events);
+      const event = $events[0];
+
+      // Pills should show the explicit total, not input+output
+      expect(event.style.accessory.items[1]).toEqual({
+        text: "200",
+        icon: "tabler-hash",
+      });
+
+      // LLM usage should also use the explicit total
+      expect(event._llmUsage.totalTokens).toBe(200);
+      expect(event._llmUsage.inputTokens).toBe(100);
+      expect(event._llmUsage.outputTokens).toBe(50);
+    });
+
+    it("should fall back to input+output when total_tokens is absent", () => {
+      const events = [
+        makeGenAiEvent({
+          "gen_ai.usage.input_tokens": 300,
+          "gen_ai.usage.output_tokens": 75,
+        }),
+      ];
+
+      // @ts-expect-error
+      const $events = enrichCreatableEvents(events);
+      const event = $events[0];
+
+      expect(event.style.accessory.items[1]).toEqual({
+        text: "375",
+        icon: "tabler-hash",
+      });
+      expect(event._llmUsage.totalTokens).toBe(375);
+    });
+
+    it("should use total_tokens when only total is present without input/output breakdown", () => {
+      const events = [
+        makeGenAiEvent({
+          "gen_ai.usage.input_tokens": undefined,
+          "gen_ai.usage.output_tokens": undefined,
+          "gen_ai.usage.total_tokens": 500,
+        }),
+      ];
+
+      // @ts-expect-error
+      const $events = enrichCreatableEvents(events);
+      const event = $events[0];
+
+      // Pills should show 500, not 0
+      expect(event.style.accessory.items[1]).toEqual({
+        text: "500",
+        icon: "tabler-hash",
+      });
+    });
   });
 });
diff --git a/internal-packages/llm-pricing/src/registry.test.ts b/internal-packages/llm-pricing/src/registry.test.ts
@@ -174,6 +174,165 @@ describe("ModelPricingRegistry", () => {
     });
   });
 
+  describe("prefix stripping", () => {
+    it("should match gateway-prefixed model names", () => {
+      const result = registry.match("openai/gpt-4o");
+      expect(result).not.toBeNull();
+      expect(result!.modelName).toBe("gpt-4o");
+    });
+
+    it("should match openrouter-prefixed model names with date suffix", () => {
+      const result = registry.match("openai/gpt-4o-2024-08-06");
+      expect(result).not.toBeNull();
+      expect(result!.modelName).toBe("gpt-4o");
+    });
+
+    it("should return null for prefixed unknown model", () => {
+      const result = registry.match("xai/unknown-model");
+      expect(result).toBeNull();
+    });
+  });
+
+  describe("tier matching", () => {
+    const multiTierModel: LlmModelWithPricing = {
+      id: "model-gemini-pro",
+      friendlyId: "llm_model_gemini_pro",
+      modelName: "gemini-2.5-pro",
+      matchPattern: "^gemini-2\\.5-pro$",
+      startDate: null,
+      pricingTiers: [
+        {
+          id: "tier-large-context",
+          name: "Large Context",
+          isDefault: false,
+          priority: 0,
+          conditions: [
+            { usageDetailPattern: "input", operator: "gt" as const, value: 200000 },
+          ],
+          prices: [
+            { usageType: "input", price: 0.0000025 },
+            { usageType: "output", price: 0.00001 },
+          ],
+        },
+        {
+          id: "tier-standard",
+          name: "Standard",
+          isDefault: true,
+          priority: 1,
+          conditions: [],
+          prices: [
+            { usageType: "input", price: 0.00000125 },
+            { usageType: "output", price: 0.000005 },
+          ],
+        },
+      ],
+    };
+
+    it("should use conditional tier when conditions match", () => {
+      const tieredRegistry = new TestableRegistry(null as any);
+      tieredRegistry.loadPatterns([multiTierModel]);
+
+      const result = tieredRegistry.calculateCost("gemini-2.5-pro", {
+        input: 250000,
+        output: 1000,
+      });
+
+      expect(result).not.toBeNull();
+      expect(result!.pricingTierName).toBe("Large Context");
+      expect(result!.inputCost).toBeCloseTo(0.625); // 250000 * 0.0000025
+    });
+
+    it("should fall back to default tier when conditions do not match", () => {
+      const tieredRegistry = new TestableRegistry(null as any);
+      tieredRegistry.loadPatterns([multiTierModel]);
+
+      const result = tieredRegistry.calculateCost("gemini-2.5-pro", {
+        input: 1000,
+        output: 100,
+      });
+
+      expect(result).not.toBeNull();
+      expect(result!.pricingTierName).toBe("Standard");
+      expect(result!.inputCost).toBeCloseTo(0.00125); // 1000 * 0.00000125
+    });
+
+    it("should not let unconditional tier win over conditional match", () => {
+      // Model where the unconditional tier sorts before the conditional one (priority 0 vs 1)
+      const model: LlmModelWithPricing = {
+        ...multiTierModel,
+        pricingTiers: [
+          {
+            id: "tier-unconditional",
+            name: "Unconditional",
+            isDefault: false,
+            priority: 0,
+            conditions: [],
+            prices: [{ usageType: "input", price: 0.001 }],
+          },
+          {
+            id: "tier-conditional",
+            name: "Conditional",
+            isDefault: false,
+            priority: 1,
+            conditions: [
+              { usageDetailPattern: "input", operator: "gt" as const, value: 100 },
+            ],
+            prices: [{ usageType: "input", price: 0.0001 }],
+          },
+          {
+            id: "tier-default",
+            name: "Default",
+            isDefault: true,
+            priority: 2,
+            conditions: [],
+            prices: [{ usageType: "input", price: 0.01 }],
+          },
+        ],
+      };
+
+      const tieredRegistry = new TestableRegistry(null as any);
+      tieredRegistry.loadPatterns([model]);
+
+      // Condition matches — conditional tier should win, not the unconditional one
+      const result = tieredRegistry.calculateCost("gemini-2.5-pro", { input: 500 });
+      expect(result).not.toBeNull();
+      expect(result!.pricingTierName).toBe("Conditional");
+    });
+
+    it("should fall back to isDefault tier when no conditions match", () => {
+      const model: LlmModelWithPricing = {
+        ...multiTierModel,
+        pricingTiers: [
+          {
+            id: "tier-conditional",
+            name: "Conditional",
+            isDefault: false,
+            priority: 0,
+            conditions: [
+              { usageDetailPattern: "input", operator: "gt" as const, value: 999999 },
+            ],
+            prices: [{ usageType: "input", price: 0.001 }],
+          },
+          {
+            id: "tier-default",
+            name: "Default",
+            isDefault: true,
+            priority: 1,
+            conditions: [],
+            prices: [{ usageType: "input", price: 0.0001 }],
+          },
+        ],
+      };
+
+      const tieredRegistry = new TestableRegistry(null as any);
+      tieredRegistry.loadPatterns([model]);
+
+      const result = tieredRegistry.calculateCost("gemini-2.5-pro", { input: 100 });
+      expect(result).not.toBeNull();
+      expect(result!.pricingTierName).toBe("Default");
+    });
+  });
+
   describe("defaultModelPrices (Langfuse JSON)", () => {
     it("should load all models from the JSON file", () => {
       expect(defaultModelPrices.length).toBeGreaterThan(100);
diff --git a/internal-packages/llm-pricing/src/registry.ts b/internal-packages/llm-pricing/src/registry.ts
@@ -162,22 +162,20 @@ export class ModelPricingRegistry {
   ): LlmPricingTierWithPrices | null {
     if (tiers.length === 0) return null;
 
-    // Tiers are sorted by priority ascending (lowest first)
-    // Evaluate conditions — first tier whose conditions match wins
+    // Tiers are sorted by priority ascending (lowest first).
+    // First pass: evaluate tiers that have conditions — first match wins.
     for (const tier of tiers) {
-      if (tier.conditions.length === 0) {
-        // No conditions = default tier
-        return tier;
-      }
-
-      if (this._evaluateConditions(tier.conditions, usageDetails)) {
+      if (tier.conditions.length > 0 && this._evaluateConditions(tier.conditions, usageDetails)) {
         return tier;
       }
     }
 
-    // Fallback to default tier
+    // Second pass: fall back to the default tier, or first tier with no conditions
     const defaultTier = tiers.find((t) => t.isDefault);
-    return defaultTier ?? tiers[0] ?? null;
+    if (defaultTier) return defaultTier;
+
+    const unconditional = tiers.find((t) => t.conditions.length === 0);
+    return unconditional ?? tiers[0] ?? null;
   }
 
   private _evaluateConditions(