feat(usage): implement cost tracking backend and pricing configuration

- Add pricing constants with default rates for all providers - Update localDb to support pricing configuration schema - Add cost calculation logic to usageDb - Add pricing management API endpoints - Fix provider alias mapping for accurate cost lookups 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
2026-01-06 23:59:49 +02:00 · 2026-01-06 23:59:49 +02:00 · a36afaa85e
commit a36afaa85e
parent 3ad2f8dc58
4 changed files with 960 additions and 3 deletions
--- a/src/shared/constants/pricing.js
+++ b/src/shared/constants/pricing.js
@ -0,0 +1,598 @@
+// Default pricing rates for AI models
+// All rates are in dollars per million tokens ($/1M tokens)
+// Based on user-provided pricing for Antigravity models and industry standards for others
+
+export const DEFAULT_PRICING = {
+  // OAuth Providers (using aliases)
+
+  // Claude Code (cc)
+  cc: {
+    "claude-opus-4-5-20251101": {
+      input: 15.00,
+      output: 75.00,
+      cached: 7.50,
+      reasoning: 75.00,
+      cache_creation: 15.00
+    },
+    "claude-sonnet-4-5-20250929": {
+      input: 3.00,
+      output: 15.00,
+      cached: 1.50,
+      reasoning: 15.00,
+      cache_creation: 3.00
+    },
+    "claude-haiku-4-5-20251001": {
+      input: 0.50,
+      output: 2.50,
+      cached: 0.25,
+      reasoning: 2.50,
+      cache_creation: 0.50
+    }
+  },
+
+  // OpenAI Codex (cx)
+  cx: {
+    "gpt-5.2-codex": {
+      input: 5.00,
+      output: 20.00,
+      cached: 2.50,
+      reasoning: 30.00,
+      cache_creation: 5.00
+    },
+    "gpt-5.2": {
+      input: 5.00,
+      output: 20.00,
+      cached: 2.50,
+      reasoning: 30.00,
+      cache_creation: 5.00
+    },
+    "gpt-5.1-codex-max": {
+      input: 8.00,
+      output: 32.00,
+      cached: 4.00,
+      reasoning: 48.00,
+      cache_creation: 8.00
+    },
+    "gpt-5.1-codex": {
+      input: 4.00,
+      output: 16.00,
+      cached: 2.00,
+      reasoning: 24.00,
+      cache_creation: 4.00
+    },
+    "gpt-5.1-codex-mini": {
+      input: 1.50,
+      output: 6.00,
+      cached: 0.75,
+      reasoning: 9.00,
+      cache_creation: 1.50
+    },
+    "gpt-5.1": {
+      input: 4.00,
+      output: 16.00,
+      cached: 2.00,
+      reasoning: 24.00,
+      cache_creation: 4.00
+    },
+    "gpt-5-codex": {
+      input: 3.00,
+      output: 12.00,
+      cached: 1.50,
+      reasoning: 18.00,
+      cache_creation: 3.00
+    },
+    "gpt-5-codex-mini": {
+      input: 1.00,
+      output: 4.00,
+      cached: 0.50,
+      reasoning: 6.00,
+      cache_creation: 1.00
+    }
+  },
+
+  // Gemini CLI (gc)
+  gc: {
+    "gemini-3-flash-preview": {
+      input: 0.50,
+      output: 3.00,
+      cached: 0.03,
+      reasoning: 4.50,
+      cache_creation: 0.50
+    },
+    "gemini-3-pro-preview": {
+      input: 2.00,
+      output: 12.00,
+      cached: 0.25,
+      reasoning: 18.00,
+      cache_creation: 2.00
+    },
+    "gemini-2.5-pro": {
+      input: 2.00,
+      output: 12.00,
+      cached: 0.25,
+      reasoning: 18.00,
+      cache_creation: 2.00
+    },
+    "gemini-2.5-flash": {
+      input: 0.30,
+      output: 2.50,
+      cached: 0.03,
+      reasoning: 3.75,
+      cache_creation: 0.30
+    },
+    "gemini-2.5-flash-lite": {
+      input: 0.15,
+      output: 1.25,
+      cached: 0.015,
+      reasoning: 1.875,
+      cache_creation: 0.15
+    }
+  },
+
+  // Qwen Code (qw)
+  qw: {
+    "qwen3-coder-plus": {
+      input: 1.00,
+      output: 4.00,
+      cached: 0.50,
+      reasoning: 6.00,
+      cache_creation: 1.00
+    },
+    "qwen3-coder-flash": {
+      input: 0.50,
+      output: 2.00,
+      cached: 0.25,
+      reasoning: 3.00,
+      cache_creation: 0.50
+    },
+    "vision-model": {
+      input: 1.50,
+      output: 6.00,
+      cached: 0.75,
+      reasoning: 9.00,
+      cache_creation: 1.50
+    }
+  },
+
+  // iFlow AI (if)
+  if: {
+    "qwen3-coder-plus": {
+      input: 1.00,
+      output: 4.00,
+      cached: 0.50,
+      reasoning: 6.00,
+      cache_creation: 1.00
+    },
+    "kimi-k2": {
+      input: 1.00,
+      output: 4.00,
+      cached: 0.50,
+      reasoning: 6.00,
+      cache_creation: 1.00
+    },
+    "kimi-k2-thinking": {
+      input: 1.50,
+      output: 6.00,
+      cached: 0.75,
+      reasoning: 9.00,
+      cache_creation: 1.50
+    },
+    "deepseek-r1": {
+      input: 0.75,
+      output: 3.00,
+      cached: 0.375,
+      reasoning: 4.50,
+      cache_creation: 0.75
+    },
+    "deepseek-v3.2-chat": {
+      input: 0.50,
+      output: 2.00,
+      cached: 0.25,
+      reasoning: 3.00,
+      cache_creation: 0.50
+    },
+    "deepseek-v3.2-reasoner": {
+      input: 0.75,
+      output: 3.00,
+      cached: 0.375,
+      reasoning: 4.50,
+      cache_creation: 0.75
+    },
+    "minimax-m2": {
+      input: 0.50,
+      output: 2.00,
+      cached: 0.25,
+      reasoning: 3.00,
+      cache_creation: 0.50
+    },
+    "glm-4.6": {
+      input: 0.50,
+      output: 2.00,
+      cached: 0.25,
+      reasoning: 3.00,
+      cache_creation: 0.50
+    },
+    "glm-4.7": {
+      input: 0.75,
+      output: 3.00,
+      cached: 0.375,
+      reasoning: 4.50,
+      cache_creation: 0.75
+    }
+  },
+
+  // Antigravity (ag) - User-provided pricing
+  ag: {
+    "gemini-3-pro-low": {
+      input: 2.00,
+      output: 12.00,
+      cached: 0.25,
+      reasoning: 18.00,
+      cache_creation: 2.00
+    },
+    "gemini-3-pro-high": {
+      input: 4.00,
+      output: 18.00,
+      cached: 0.50,
+      reasoning: 27.00,
+      cache_creation: 4.00
+    },
+    "gemini-3-flash": {
+      input: 0.50,
+      output: 3.00,
+      cached: 0.03,
+      reasoning: 4.50,
+      cache_creation: 0.50
+    },
+    "gemini-2.5-flash": {
+      input: 0.30,
+      output: 2.50,
+      cached: 0.03,
+      reasoning: 3.75,
+      cache_creation: 0.30
+    },
+    "claude-sonnet-4-5": {
+      input: 3.00,
+      output: 15.00,
+      cached: 0.30,
+      reasoning: 22.50,
+      cache_creation: 3.00
+    },
+    "claude-sonnet-4-5-thinking": {
+      input: 3.00,
+      output: 15.00,
+      cached: 0.30,
+      reasoning: 22.50,
+      cache_creation: 3.00
+    },
+    "claude-opus-4-5-thinking": {
+      input: 5.00,
+      output: 25.00,
+      cached: 0.50,
+      reasoning: 37.50,
+      cache_creation: 5.00
+    }
+  },
+
+  // GitHub Copilot (gh)
+  gh: {
+    "gpt-5": {
+      input: 3.00,
+      output: 12.00,
+      cached: 1.50,
+      reasoning: 18.00,
+      cache_creation: 3.00
+    },
+    "gpt-5-mini": {
+      input: 0.75,
+      output: 3.00,
+      cached: 0.375,
+      reasoning: 4.50,
+      cache_creation: 0.75
+    },
+    "gpt-5.1-codex": {
+      input: 4.00,
+      output: 16.00,
+      cached: 2.00,
+      reasoning: 24.00,
+      cache_creation: 4.00
+    },
+    "gpt-5.1-codex-max": {
+      input: 8.00,
+      output: 32.00,
+      cached: 4.00,
+      reasoning: 48.00,
+      cache_creation: 8.00
+    },
+    "gpt-4.1": {
+      input: 2.50,
+      output: 10.00,
+      cached: 1.25,
+      reasoning: 15.00,
+      cache_creation: 2.50
+    },
+    "claude-4.5-sonnet": {
+      input: 3.00,
+      output: 15.00,
+      cached: 0.30,
+      reasoning: 22.50,
+      cache_creation: 3.00
+    },
+    "claude-4.5-opus": {
+      input: 5.00,
+      output: 25.00,
+      cached: 0.50,
+      reasoning: 37.50,
+      cache_creation: 5.00
+    },
+    "claude-4.5-haiku": {
+      input: 0.50,
+      output: 2.50,
+      cached: 0.05,
+      reasoning: 3.75,
+      cache_creation: 0.50
+    },
+    "gemini-3-pro": {
+      input: 2.00,
+      output: 12.00,
+      cached: 0.25,
+      reasoning: 18.00,
+      cache_creation: 2.00
+    },
+    "gemini-3-flash": {
+      input: 0.50,
+      output: 3.00,
+      cached: 0.03,
+      reasoning: 4.50,
+      cache_creation: 0.50
+    },
+    "gemini-2.5-pro": {
+      input: 2.00,
+      output: 12.00,
+      cached: 0.25,
+      reasoning: 18.00,
+      cache_creation: 2.00
+    },
+    "grok-code-fast-1": {
+      input: 0.50,
+      output: 2.00,
+      cached: 0.25,
+      reasoning: 3.00,
+      cache_creation: 0.50
+    }
+  },
+
+  // API Key Providers (alias = id)
+
+  // OpenAI
+  openai: {
+    "gpt-4o": {
+      input: 2.50,
+      output: 10.00,
+      cached: 1.25,
+      reasoning: 15.00,
+      cache_creation: 2.50
+    },
+    "gpt-4o-mini": {
+      input: 0.15,
+      output: 0.60,
+      cached: 0.075,
+      reasoning: 0.90,
+      cache_creation: 0.15
+    },
+    "gpt-4-turbo": {
+      input: 10.00,
+      output: 30.00,
+      cached: 5.00,
+      reasoning: 45.00,
+      cache_creation: 10.00
+    },
+    "o1": {
+      input: 15.00,
+      output: 60.00,
+      cached: 7.50,
+      reasoning: 90.00,
+      cache_creation: 15.00
+    },
+    "o1-mini": {
+      input: 3.00,
+      output: 12.00,
+      cached: 1.50,
+      reasoning: 18.00,
+      cache_creation: 3.00
+    }
+  },
+
+  // Anthropic
+  anthropic: {
+    "claude-sonnet-4-20250514": {
+      input: 3.00,
+      output: 15.00,
+      cached: 1.50,
+      reasoning: 15.00,
+      cache_creation: 3.00
+    },
+    "claude-opus-4-20250514": {
+      input: 15.00,
+      output: 75.00,
+      cached: 7.50,
+      reasoning: 112.50,
+      cache_creation: 15.00
+    },
+    "claude-3-5-sonnet-20241022": {
+      input: 3.00,
+      output: 15.00,
+      cached: 1.50,
+      reasoning: 15.00,
+      cache_creation: 3.00
+    }
+  },
+
+  // Gemini
+  gemini: {
+    "gemini-3-pro-preview": {
+      input: 2.00,
+      output: 12.00,
+      cached: 0.25,
+      reasoning: 18.00,
+      cache_creation: 2.00
+    },
+    "gemini-2.5-pro": {
+      input: 2.00,
+      output: 12.00,
+      cached: 0.25,
+      reasoning: 18.00,
+      cache_creation: 2.00
+    },
+    "gemini-2.5-flash": {
+      input: 0.30,
+      output: 2.50,
+      cached: 0.03,
+      reasoning: 3.75,
+      cache_creation: 0.30
+    },
+    "gemini-2.5-flash-lite": {
+      input: 0.15,
+      output: 1.25,
+      cached: 0.015,
+      reasoning: 1.875,
+      cache_creation: 0.15
+    }
+  },
+
+  // OpenRouter
+  openrouter: {
+    "auto": {
+      input: 2.00,
+      output: 8.00,
+      cached: 1.00,
+      reasoning: 12.00,
+      cache_creation: 2.00
+    }
+  },
+
+  // GLM
+  glm: {
+    "glm-4.7": {
+      input: 0.75,
+      output: 3.00,
+      cached: 0.375,
+      reasoning: 4.50,
+      cache_creation: 0.75
+    },
+    "glm-4.6": {
+      input: 0.50,
+      output: 2.00,
+      cached: 0.25,
+      reasoning: 3.00,
+      cache_creation: 0.50
+    },
+    "glm-4.6v": {
+      input: 0.75,
+      output: 3.00,
+      cached: 0.375,
+      reasoning: 4.50,
+      cache_creation: 0.75
+    }
+  },
+
+  // Kimi
+  kimi: {
+    "kimi-latest": {
+      input: 1.00,
+      output: 4.00,
+      cached: 0.50,
+      reasoning: 6.00,
+      cache_creation: 1.00
+    }
+  },
+
+  // MiniMax
+  minimax: {
+    "MiniMax-M2.1": {
+      input: 0.50,
+      output: 2.00,
+      cached: 0.25,
+      reasoning: 3.00,
+      cache_creation: 0.50
+    }
+  }
+};
+
+/**
+ * Get pricing for a specific provider and model
+ * @param {string} provider - Provider ID (e.g., "openai", "cc", "gc")
+ * @param {string} model - Model ID
+ * @returns {object|null} Pricing object or null if not found
+ */
+export function getPricingForModel(provider, model) {
+  if (!provider || !model) return null;
+
+  const providerPricing = DEFAULT_PRICING[provider];
+  if (!providerPricing) return null;
+
+  return providerPricing[model] || null;
+}
+
+/**
+ * Get all pricing data
+ * @returns {object} All default pricing
+ */
+export function getDefaultPricing() {
+  return DEFAULT_PRICING;
+}
+
+/**
+ * Format cost for display
+ * @param {number} cost - Cost in dollars
+ * @returns {string} Formatted cost string
+ */
+export function formatCost(cost) {
+  if (cost === null || cost === undefined || isNaN(cost)) return "$0.00";
+  return `$${cost.toFixed(2)}`;
+}
+
+/**
+ * Calculate cost from tokens and pricing
+ * @param {object} tokens - Token counts
+ * @param {object} pricing - Pricing object
+ * @returns {number} Cost in dollars
+ */
+export function calculateCostFromTokens(tokens, pricing) {
+  if (!tokens || !pricing) return 0;
+
+  let cost = 0;
+
+  // Input tokens (non-cached)
+  const inputTokens = tokens.prompt_tokens || tokens.input_tokens || 0;
+  const cachedTokens = tokens.cached_tokens || tokens.cache_read_input_tokens || 0;
+  const nonCachedInput = Math.max(0, inputTokens - cachedTokens);
+
+  cost += (nonCachedInput * (pricing.input / 1000000));
+
+  // Cached tokens
+  if (cachedTokens > 0) {
+    const cachedRate = pricing.cached || pricing.input; // Fallback to input rate
+    cost += (cachedTokens * (cachedRate / 1000000));
+  }
+
+  // Output tokens
+  const outputTokens = tokens.completion_tokens || tokens.output_tokens || 0;
+  cost += (outputTokens * (pricing.output / 1000000));
+
+  // Reasoning tokens
+  const reasoningTokens = tokens.reasoning_tokens || 0;
+  if (reasoningTokens > 0) {
+    const reasoningRate = pricing.reasoning || pricing.output; // Fallback to output rate
+    cost += (reasoningTokens * (reasoningRate / 1000000));
+  }
+
+  // Cache creation tokens
+  const cacheCreationTokens = tokens.cache_creation_input_tokens || 0;
+  if (cacheCreationTokens > 0) {
+    const cacheCreationRate = pricing.cache_creation || pricing.input; // Fallback to input rate
+    cost += (cacheCreationTokens * (cacheCreationRate / 1000000));
+  }
+
+  return cost;
+}