9router/open-sse/config/ttsModels.js
decolua d4bc42e1f5 feat: add STT support, Gemini TTS, and expand usage tracking
- Speech-to-Text: full pipeline with sttCore handler, /v1/audio/transcriptions
  endpoint, sttConfig for OpenAI, Gemini, Groq, Deepgram, AssemblyAI,
  HuggingFace, NVIDIA Parakeet; new 9router-stt skill
- Gemini TTS: add gemini provider with 30 prebuilt voices and TTS_PROVIDER_CONFIG
- Usage: implement GLM (intl/cn) and MiniMax (intl/cn) quota fetchers; refactor
  Gemini CLI usage to use retrieveUserQuota with per-model buckets
- Disabled models: lowdb-backed disabledModelsDb + /api/models/disabled route
- Header search: reusable Zustand store (headerSearchStore) wired into Header
- CLI tools: add Claude Cowork tool card and cowork-settings API
- Providers: introduce mediaPriority sorting in getProvidersByKind, add
  Kimi K2.6, reorder hermes, drop qwen STT kind
- UI: expand media-providers/[kind]/[id] page (+314), enhance OAuthModal,
  ModelSelectModal, ProviderTopology, ProxyPools, ProviderLimits
- Assets: refresh provider PNGs (alicode, byteplus, cloudflare-ai, nvidia,
  ollama, vertex, volcengine-ark) and add aws-polly, fal-ai, jina-ai, recraft,
  runwayml, stability-ai, topaz, black-forest-labs
2026-05-05 10:32:59 +07:00

129 lines
5.5 KiB
JavaScript

import { GOOGLE_TTS_LANGUAGES } from "./googleTtsLanguages.js";
// ── Voice definitions (DRY — reused across providers) ──────────────────────
const VOICES = {
alloy: { id: "alloy", name: "Alloy" },
ash: { id: "ash", name: "Ash" },
ballad: { id: "ballad", name: "Ballad" },
cedar: { id: "cedar", name: "Cedar" },
coral: { id: "coral", name: "Coral" },
echo: { id: "echo", name: "Echo" },
fable: { id: "fable", name: "Fable" },
marin: { id: "marin", name: "Marin" },
nova: { id: "nova", name: "Nova" },
onyx: { id: "onyx", name: "Onyx" },
sage: { id: "sage", name: "Sage" },
shimmer: { id: "shimmer", name: "Shimmer" },
verse: { id: "verse", name: "Verse" },
};
const v = (...keys) => keys.map((k) => ({ ...VOICES[k], type: "tts" }));
// 9 voices for tts-1 / tts-1-hd
const VOICES_STANDARD = v("alloy", "ash", "coral", "echo", "fable", "nova", "onyx", "sage", "shimmer");
// 13 voices for gpt-4o-mini-tts
const VOICES_FULL = v("alloy", "ash", "ballad", "cedar", "coral", "echo", "fable", "marin", "nova", "onyx", "sage", "shimmer", "verse");
// Gemini prebuilt voices (30 voices, multi-language auto-detect)
const GEMINI_VOICES = [
"Zephyr", "Puck", "Charon", "Kore", "Fenrir", "Leda", "Orus", "Aoede",
"Callirrhoe", "Autonoe", "Enceladus", "Iapetus", "Umbriel", "Algieba",
"Despina", "Erinome", "Algenib", "Rasalgethi", "Laomedeia", "Achernar",
"Alnilam", "Schedar", "Gacrux", "Pulcherrima", "Achird", "Zubenelgenubi",
"Vindemiatrix", "Sadachbia", "Sadaltager", "Sulafat",
].map((id) => ({ id, name: id, type: "tts" }));
// ── TTS Config (config-driven, single source of truth) ─────────────────────
export const TTS_MODELS_CONFIG = {
openai: {
models: [
{ id: "gpt-4o-mini-tts", name: "GPT-4o Mini TTS", type: "tts" },
{ id: "tts-1-hd", name: "TTS-1 HD", type: "tts" },
{ id: "tts-1", name: "TTS-1", type: "tts" },
],
voices: {
"gpt-4o-mini-tts": VOICES_FULL,
"tts-1": VOICES_STANDARD,
"tts-1-hd": VOICES_STANDARD,
},
// Flat voice list (all unique voices) for backward compat
allVoices: VOICES_FULL,
},
openrouter: {
models: [
{ id: "openai/gpt-4o-mini-tts", name: "GPT-4o Mini TTS", type: "tts" },
{ id: "openai/tts-1-hd", name: "TTS-1 HD", type: "tts" },
{ id: "openai/tts-1", name: "TTS-1", type: "tts" },
],
voices: {
"openai/gpt-4o-mini-tts": VOICES_FULL,
"openai/tts-1": VOICES_STANDARD,
"openai/tts-1-hd": VOICES_STANDARD,
},
allVoices: VOICES_FULL,
},
elevenlabs: {
models: [
{ id: "eleven_flash_v2_5", name: "Flash v2.5 (Fastest)", type: "tts" },
{ id: "eleven_turbo_v2_5", name: "Turbo v2.5 (Fast)", type: "tts" },
{ id: "eleven_multilingual_v2", name: "Multilingual v2 (Quality)", type: "tts" },
{ id: "eleven_monolingual_v1", name: "Monolingual v1 (English)", type: "tts" },
],
// voices come from API, not hardcoded
},
"edge-tts": {
defaults: [
{ id: "en-US-AriaNeural", name: "Aria (en-US)", type: "tts" },
{ id: "en-US-GuyNeural", name: "Guy (en-US)", type: "tts" },
{ id: "en-GB-SoniaNeural", name: "Sonia (en-GB)", type: "tts" },
{ id: "vi-VN-HoaiMyNeural", name: "Hoai My (vi-VN)", type: "tts" },
{ id: "vi-VN-NamMinhNeural", name: "Nam Minh (vi-VN)", type: "tts" },
{ id: "zh-CN-XiaoxiaoNeural", name: "Xiaoxiao (zh-CN)", type: "tts" },
{ id: "zh-CN-YunxiNeural", name: "Yunxi (zh-CN)", type: "tts" },
{ id: "fr-FR-DeniseNeural", name: "Denise (fr-FR)", type: "tts" },
{ id: "de-DE-KatjaNeural", name: "Katja (de-DE)", type: "tts" },
{ id: "ja-JP-NanamiNeural", name: "Nanami (ja-JP)", type: "tts" },
{ id: "ko-KR-SunHiNeural", name: "SunHi (ko-KR)", type: "tts" },
],
},
"local-device": {
defaults: [
{ id: "default", name: "System Default Voice", type: "tts" },
],
},
"google-tts": {
defaults: GOOGLE_TTS_LANGUAGES,
},
gemini: {
models: [
{ id: "gemini-2.5-flash-preview-tts", name: "Gemini 2.5 Flash TTS", type: "tts" },
{ id: "gemini-2.5-pro-preview-tts", name: "Gemini 2.5 Pro TTS", type: "tts" },
],
voices: {
"gemini-2.5-flash-preview-tts": GEMINI_VOICES,
"gemini-2.5-pro-preview-tts": GEMINI_VOICES,
},
allVoices: GEMINI_VOICES,
},
};
// ── Helper: get voices for a specific model ────────────────────────────────
export function getTtsVoicesForModel(provider, modelId) {
const cfg = TTS_MODELS_CONFIG[provider];
if (!cfg?.voices) return null;
return cfg.voices[modelId] || cfg.allVoices || null;
}
// ── Build flat entries for PROVIDER_MODELS backward compat ─────────────────
export function buildTtsProviderModels() {
const entries = {};
for (const [provider, cfg] of Object.entries(TTS_MODELS_CONFIG)) {
if (cfg.models) entries[`${provider}-tts-models`] = cfg.models;
if (cfg.allVoices) entries[`${provider}-tts-voices`] = cfg.allVoices;
if (cfg.defaults) entries[provider] = cfg.defaults;
}
// Keep openai-tts-voices key pointing to full voice list for backward compat
entries["openai-tts-voices"] = TTS_MODELS_CONFIG.openai.allVoices;
entries["openrouter-tts-voices"] = TTS_MODELS_CONFIG.openrouter.allVoices;
return entries;
}