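wip: fail fast when model pricing is missing; simplify pricing lookup candidates for Vercel AI Gateway model IDs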

khromov · khromov · commit 093996143dc2 · 2025-12-10T23:58:07.000+01:00
diff --git a/index.ts b/index.ts
@@ -242,7 +242,8 @@ function calculateTotalCost(
 
 /**
  * Resolve pricing lookup for a model
- * Returns the pricing lookup result or null if not found or disabled
+ * Returns the pricing lookup result or null if disabled
+ * Exits the process (code 1) if pricing cannot be found and cost calculation is not disabled
  */
 function resolvePricingLookup(modelString: string): ModelPricingLookup | null {
   const costDisabled = process.env.MODEL_COST_DISABLED === "true";
@@ -255,30 +256,50 @@ function resolvePricingLookup(modelString: string): ModelPricingLookup | null {
 
   // Check if pricing data file exists
   if (!isPricingAvailable()) {
-    console.warn(
-      `⚠️  Model pricing file not found. Run 'bun run update-model-pricing' to download it.`,
+    console.error(
+      `\n✗ Model pricing file not found. Run 'bun run update-model-pricing' to download it.`,
     );
-    console.warn(`   Cost calculation will be skipped.`);
-    return null;
+    console.error(
+      `  Or set MODEL_COST_DISABLED=true to skip cost calculation.\n`,
+    );
+    process.exit(1);
   }
 
   // If explicit cost name is provided, use that
   if (explicitCostName) {
     const lookup = lookupModelPricingByKey(explicitCostName);
     if (!lookup) {
-      console.warn(
-        `⚠️  Could not find pricing for MODEL_COST_NAME="${explicitCostName}"`,
+      console.error(
+        `\n✗ Could not find pricing for MODEL_COST_NAME="${explicitCostName}" in model-pricing.json`,
       );
-      return null;
+      console.error(
+        `  Check that the key exists in data/model-pricing.json.\n`,
+      );
+      process.exit(1);
     }
     return lookup;
   }
 
   // Try automatic lookup
   const lookup = lookupModelPricing(modelString);
   if (!lookup) {
-    console.warn(`⚠️  Could not find pricing for model "${modelString}"`);
-    return null;
+    console.error(
+      `\n✗ Could not find pricing for model "${modelString}" in model-pricing.json`,
+    );
+    console.error(`\n  Options:`);
+    console.error(
+      `    1. Set MODEL_COST_NAME=<key> to explicitly specify the pricing key`,
+    );
+    console.error(
+      `       Example: MODEL_COST_NAME=vercel_ai_gateway/anthropic/claude-sonnet-4`,
+    );
+    console.error(
+      `    2. Set MODEL_COST_DISABLED=true to skip cost calculation`,
+    );
+    console.error(
+      `\n  Browse data/model-pricing.json to find the correct key for your model.\n`,
+    );
+    process.exit(1);
   }
 
   return lookup;
@@ -435,10 +456,15 @@ async function main() {
   const isHttpTransport = mcpServerUrl && isHttpUrl(mcpServerUrl);
   const mcpTransportType = isHttpTransport ? "HTTP" : "StdIO";
 
+  const costDisabled = process.env.MODEL_COST_DISABLED === "true";
+
   console.log("╔════════════════════════════════════════════════════╗");
   console.log("║            SvelteBench 2.0 - Multi-Test            ║");
   console.log("╚════════════════════════════════════════════════════╝");
   console.log(`Model(s): ${models.join(", ")}`);
+  if (costDisabled) {
+    console.log(`Pricing: Disabled (MODEL_COST_DISABLED=true)`);
+  }
   console.log(`MCP Integration: ${mcpEnabled ? "Enabled" : "Disabled"}`);
   if (mcpEnabled) {
     console.log(`MCP Transport: ${mcpTransportType}`);
@@ -464,6 +490,14 @@ async function main() {
     process.exit(1);
   }
 
+  // Pre-validate pricing for all models before starting any benchmarks
+  // This ensures we fail fast if any model's pricing is missing
+  const pricingLookups = new Map<string, ModelPricingLookup | null>();
+  for (const modelId of models) {
+    const pricingLookup = resolvePricingLookup(modelId);
+    pricingLookups.set(modelId, pricingLookup);
+  }
+
   // Set up outputs directory
   setupOutputsDirectory();
 
@@ -497,8 +531,8 @@ async function main() {
     console.log(`🤖 Running benchmark for model: ${modelId}`);
     console.log("═".repeat(50));
 
-    // Resolve pricing for this model
-    const pricingLookup = resolvePricingLookup(modelId);
+    // Get pre-validated pricing for this model
+    const pricingLookup = pricingLookups.get(modelId) ?? null;
     if (pricingLookup) {
       console.log(`💰 Pricing mapped: ${pricingLookup.matchedKey}`);
     }
diff --git a/lib/pricing.test.ts b/lib/pricing.test.ts
@@ -9,107 +9,74 @@ import {
 } from "./pricing.ts";
 
 describe("generateLookupCandidates", () => {
-  describe("openrouter provider (slash format)", () => {
-    it("should generate candidates for openrouter/anthropic/model", () => {
-      const candidates = generateLookupCandidates(
-        "openrouter/anthropic/claude-sonnet-4",
-      );
-      expect(candidates).toContain("openrouter/anthropic/claude-sonnet-4");
-      expect(candidates).toContain("anthropic/claude-sonnet-4");
-      expect(candidates).toContain("claude-sonnet-4");
-    });
-
-    it("should generate candidates for openrouter/openai/model", () => {
-      const candidates = generateLookupCandidates("openrouter/openai/gpt-4o");
-      expect(candidates).toContain("openrouter/openai/gpt-4o");
-      expect(candidates).toContain("openai/gpt-4o");
-      expect(candidates).toContain("gpt-4o");
-    });
-
-    it("should handle openrouter with simple model name", () => {
-      const candidates = generateLookupCandidates("openrouter/some-model");
-      expect(candidates).toContain("openrouter/some-model");
-      expect(candidates).toContain("some-model");
-    });
-  });
-
-  describe("anthropic provider (slash format)", () => {
-    it("should generate candidates for anthropic/model", () => {
-      const candidates = generateLookupCandidates("anthropic/claude-haiku-4-5");
-      expect(candidates).toContain("anthropic/claude-haiku-4-5");
-      expect(candidates).toContain("claude-haiku-4-5");
-    });
-  });
-
-  describe("Vercel AI Gateway format (colon separator)", () => {
-    it("should generate candidates for anthropic:model", () => {
-      const candidates = generateLookupCandidates("anthropic:claude-sonnet-4");
-      expect(candidates).toContain("anthropic:claude-sonnet-4");
-      expect(candidates).toContain("anthropic/claude-sonnet-4");
-      expect(candidates).toContain("claude-sonnet-4");
+  describe("Vercel AI Gateway format (provider/model)", () => {
+    it("should generate candidates for alibaba/qwen-3-14b", () => {
+      const candidates = generateLookupCandidates("alibaba/qwen-3-14b");
+      expect(candidates).toEqual([
+        "vercel_ai_gateway/alibaba/qwen-3-14b",
+        "alibaba/qwen-3-14b",
+        "qwen-3-14b",
+      ]);
     });
 
-    it("should generate candidates for openai:model", () => {
-      const candidates = generateLookupCandidates("openai:gpt-4o");
-      expect(candidates).toContain("openai:gpt-4o");
-      expect(candidates).toContain("openai/gpt-4o");
-      expect(candidates).toContain("gpt-4o");
+    it("should generate candidates for anthropic/claude-sonnet-4", () => {
+      const candidates = generateLookupCandidates("anthropic/claude-sonnet-4");
+      expect(candidates).toEqual([
+        "vercel_ai_gateway/anthropic/claude-sonnet-4",
+        "anthropic/claude-sonnet-4",
+        "claude-sonnet-4",
+      ]);
     });
 
-    it("should generate candidates for google:model", () => {
-      const candidates = generateLookupCandidates("google:gemini-2.0-flash");
-      expect(candidates).toContain("google:gemini-2.0-flash");
-      expect(candidates).toContain("google/gemini-2.0-flash");
-      expect(candidates).toContain("gemini-2.0-flash");
-    });
-
-    it("should generate candidates for x-ai:model", () => {
-      const candidates = generateLookupCandidates("x-ai:grok-2");
-      expect(candidates).toContain("x-ai:grok-2");
-      expect(candidates).toContain("x-ai/grok-2");
-      expect(candidates).toContain("grok-2");
-    });
-  });
-
-  describe("openai provider (slash format)", () => {
-    it("should generate candidates for openai/model", () => {
+    it("should generate candidates for openai/gpt-4o", () => {
       const candidates = generateLookupCandidates("openai/gpt-4o");
-      expect(candidates).toContain("openai/gpt-4o");
-      expect(candidates).toContain("gpt-4o");
+      expect(candidates).toEqual([
+        "vercel_ai_gateway/openai/gpt-4o",
+        "openai/gpt-4o",
+        "gpt-4o",
+      ]);
     });
 
-    it("should handle openai/gpt-4o-mini", () => {
-      const candidates = generateLookupCandidates("openai/gpt-4o-mini");
-      expect(candidates).toContain("openai/gpt-4o-mini");
-      expect(candidates).toContain("gpt-4o-mini");
+    it("should generate candidates for google/gemini-2.0-flash", () => {
+      const candidates = generateLookupCandidates("google/gemini-2.0-flash");
+      expect(candidates).toEqual([
+        "vercel_ai_gateway/google/gemini-2.0-flash",
+        "google/gemini-2.0-flash",
+        "gemini-2.0-flash",
+      ]);
     });
-  });
 
-  describe("lmstudio provider", () => {
-    it("should generate candidates for lmstudio/model", () => {
-      const candidates = generateLookupCandidates("lmstudio/llama-3-8b");
-      expect(candidates).toContain("lmstudio/llama-3-8b");
-      expect(candidates).toContain("llama-3-8b");
+    it("should generate candidates for x-ai/grok-2", () => {
+      const candidates = generateLookupCandidates("x-ai/grok-2");
+      expect(candidates).toEqual([
+        "vercel_ai_gateway/x-ai/grok-2",
+        "x-ai/grok-2",
+        "grok-2",
+      ]);
     });
   });
 
-  describe("unknown provider", () => {
-    it("should return only the original string for unknown provider", () => {
-      const candidates = generateLookupCandidates("unknown/some-model");
-      expect(candidates).toEqual(["unknown/some-model"]);
-    });
-
-    it("should handle unknown provider with colon format", () => {
-      const candidates = generateLookupCandidates("unknown:some-model");
-      expect(candidates).toContain("unknown:some-model");
-      expect(candidates).toContain("unknown/some-model");
+  describe("nested paths (openrouter style)", () => {
+    it("should handle openrouter/anthropic/claude-sonnet-4", () => {
+      const candidates = generateLookupCandidates(
+        "openrouter/anthropic/claude-sonnet-4",
+      );
+      expect(candidates).toEqual([
+        "vercel_ai_gateway/openrouter/anthropic/claude-sonnet-4",
+        "openrouter/anthropic/claude-sonnet-4",
+        "anthropic/claude-sonnet-4",
+        "claude-sonnet-4",
+      ]);
     });
   });
 
   describe("no provider prefix", () => {
-    it("should return only the original string when no separator", () => {
+    it("should return only the original string with gateway prefix when no separator", () => {
       const candidates = generateLookupCandidates("claude-sonnet-4");
-      expect(candidates).toEqual(["claude-sonnet-4"]);
+      expect(candidates).toEqual([
+        "vercel_ai_gateway/claude-sonnet-4",
+        "claude-sonnet-4",
+      ]);
     });
   });
 });
diff --git a/lib/pricing.ts b/lib/pricing.ts
@@ -46,29 +46,6 @@ export interface ModelPricingLookup {
   matchedKey: string;
 }
 
-/**
- * Provider normalization configuration
- * - strip: Remove the provider prefix when generating candidates
- * - keepNested: For nested paths like "openrouter/anthropic/model", also try "anthropic/model"
- */
-interface ProviderConfig {
-  strip: boolean;
-  keepNested: boolean;
-}
-
-const PROVIDER_CONFIGS: Record<string, ProviderConfig> = {
-  openrouter: { strip: true, keepNested: true },
-  anthropic: { strip: true, keepNested: false },
-  openai: { strip: true, keepNested: false },
-  lmstudio: { strip: true, keepNested: false },
-  google: { strip: true, keepNested: false },
-  meta: { strip: true, keepNested: false },
-  mistral: { strip: true, keepNested: false },
-  cohere: { strip: true, keepNested: false },
-  "x-ai": { strip: true, keepNested: false },
-  deepseek: { strip: true, keepNested: false },
-};
-
 // Cache the loaded pricing data
 let pricingData: Record<string, unknown> | null = null;
 
@@ -98,74 +75,38 @@ function loadPricingData(): Record<string, unknown> {
 }
 
 /**
- * Normalize a model string by converting different separator formats
- * Vercel AI Gateway uses "provider:model" format
- * Old multi-provider setup used "provider/model" format
- * LiteLLM pricing data uses various formats
- */
-function normalizeModelString(modelString: string): string {
-  // Convert colon separator to slash for unified processing
-  // e.g., "anthropic:claude-sonnet-4" -> "anthropic/claude-sonnet-4"
-  return modelString.replace(":", "/");
-}
-
-/**
- * Generate lookup candidates for a model string using provider configuration
+ * Generate lookup candidates for a model string
  * Returns candidates in priority order (most specific first)
  * 
- * Supports both formats:
- * - Vercel AI Gateway: "anthropic:claude-sonnet-4"
- * - Multi-provider: "anthropic/claude-sonnet-4"
+ * Vercel AI Gateway model IDs are in the format "provider/model-name"
+ * LiteLLM pricing data stores them as "vercel_ai_gateway/provider/model-name"
+ * 
+ * Examples:
+ * - "alibaba/qwen-3-14b" -> tries "vercel_ai_gateway/alibaba/qwen-3-14b", "alibaba/qwen-3-14b", "qwen-3-14b"
+ * - "anthropic/claude-sonnet-4" -> tries "vercel_ai_gateway/anthropic/claude-sonnet-4", "anthropic/claude-sonnet-4", "claude-sonnet-4"
  */
 function generateLookupCandidates(modelString: string): string[] {
   const candidates: string[] = [];
   
-  // Normalize the model string (convert : to /)
-  const normalizedString = normalizeModelString(modelString);
-
-  // Find matching provider config
-  const slashIndex = normalizedString.indexOf("/");
-  if (slashIndex === -1) {
-    // No provider prefix, just use as-is
-    return [modelString, normalizedString].filter((v, i, a) => a.indexOf(v) === i);
-  }
-
-  const provider = normalizedString.slice(0, slashIndex);
-  const config = PROVIDER_CONFIGS[provider];
-  const remainder = normalizedString.slice(slashIndex + 1);
-
-  // Always try the original string first
+  // Primary: Try with vercel_ai_gateway prefix (how LiteLLM stores gateway models)
+  candidates.push(`vercel_ai_gateway/${modelString}`);
+  
+  // Secondary: Try the model string as-is
   candidates.push(modelString);
   
-  // Also try the normalized version (with / instead of :)
-  if (normalizedString !== modelString) {
-    candidates.push(normalizedString);
-  }
-
-  if (!config) {
-    // Unknown provider, try original strings only
-    return candidates.filter((v, i, a) => a.indexOf(v) === i);
-  }
-
-  if (config.strip) {
-    // Try without our provider prefix (just the model name)
-    candidates.push(remainder);
-  }
-
-  if (config.keepNested) {
-    // For nested paths like "anthropic/claude-model", also try just "claude-model"
-    const nestedSlashIndex = remainder.indexOf("/");
+  // Tertiary: If there's a provider prefix, strip it and try the remainder
+  const slashIndex = modelString.indexOf("/");
+  if (slashIndex !== -1) {
+    const modelName = modelString.slice(slashIndex + 1);
+    candidates.push(modelName);
+    
+    // Also try nested paths (e.g., "openrouter/anthropic/claude" -> "anthropic/claude", "claude")
+    const nestedSlashIndex = modelName.indexOf("/");
     if (nestedSlashIndex !== -1) {
-      candidates.push(remainder.slice(nestedSlashIndex + 1));
+      candidates.push(modelName.slice(nestedSlashIndex + 1));
     }
   }
 
-  // Also try with common LiteLLM prefixes
-  // LiteLLM often uses "provider/model" format
-  if (!normalizedString.startsWith(provider + "/")) {
-    candidates.push(`${provider}/${remainder}`);
-  }
-
   // Remove duplicates while preserving order
   return candidates.filter((v, i, a) => a.indexOf(v) === i);
 }