From 97e3236e760afb5863efb9ce3f047a02206a03f2 Mon Sep 17 00:00:00 2001
From: Xin Wang <wx44wx@XindeMac-mini.local>
Date: Sun, 8 Feb 2026 23:16:21 +0800
Subject: [PATCH] Update voice library key form

---
 api/app/models.py          |  13 +-
 api/app/routers/voices.py  | 114 +----
 api/app/schemas.py         |  24 +-
 api/tests/test_voices.py   |  25 +-
 web/pages/VoiceLibrary.tsx | 987 +++++++++++++++++--------------------
 web/services/backendApi.ts |  33 +-
 web/types.ts               |   9 +-
 7 files changed, 503 insertions(+), 702 deletions(-)

diff --git a/api/app/models.py b/api/app/models.py
index 6cd5134..4e4c21a 100644
--- a/api/app/models.py
+++ b/api/app/models.py
@@ -28,6 +28,8 @@ class Voice(Base):
     description: Mapped[str] = mapped_column(String(255), nullable=False)
     model: Mapped[Optional[str]] = mapped_column(String(128), nullable=True)  # 厂商语音模型标识
     voice_key: Mapped[Optional[str]] = mapped_column(String(128), nullable=True)  # 厂商voice_key
+    api_key: Mapped[Optional[str]] = mapped_column(String(512), nullable=True)  # 每个声音独立 API key
+    base_url: Mapped[Optional[str]] = mapped_column(String(512), nullable=True)  # 每个声音独立 OpenAI-compatible base_url
     speed: Mapped[float] = mapped_column(Float, default=1.0)
     gain: Mapped[int] = mapped_column(Integer, default=0)
     pitch: Mapped[int] = mapped_column(Integer, default=0)
@@ -38,17 +40,6 @@ class Voice(Base):
     user = relationship("User", foreign_keys=[user_id])
 
 
-class VendorCredential(Base):
-    __tablename__ = "vendor_credentials"
-
-    vendor_key: Mapped[str] = mapped_column(String(64), primary_key=True)
-    vendor_name: Mapped[str] = mapped_column(String(128), nullable=False)
-    api_key: Mapped[str] = mapped_column(String(512), nullable=False)
-    base_url: Mapped[Optional[str]] = mapped_column(String(512), nullable=True)
-    created_at: Mapped[datetime] = mapped_column(DateTime, default=datetime.utcnow)
-    updated_at: Mapped[datetime] = mapped_column(DateTime, default=datetime.utcnow)
-
-
 # ============ LLM Model ============
 class LLMModel(Base):
     __tablename__ = "llm_models"
diff --git a/api/app/routers/voices.py b/api/app/routers/voices.py
index f7b078a..eab2298 100644
--- a/api/app/routers/voices.py
+++ b/api/app/routers/voices.py
@@ -1,7 +1,6 @@
 import base64
 import os
 import uuid
-from datetime import datetime
 from typing import Optional
 
 import httpx
@@ -9,16 +8,8 @@ from fastapi import APIRouter, Depends, HTTPException
 from sqlalchemy.orm import Session
 
 from ..db import get_db
-from ..models import VendorCredential, Voice
-from ..schemas import (
-    VendorCredentialOut,
-    VendorCredentialUpsert,
-    VoiceCreate,
-    VoiceOut,
-    VoicePreviewRequest,
-    VoicePreviewResponse,
-    VoiceUpdate,
-)
+from ..models import Voice
+from ..schemas import VoiceCreate, VoiceOut, VoicePreviewRequest, VoicePreviewResponse, VoiceUpdate
 
 router = APIRouter(prefix="/voices", tags=["Voices"])
 
@@ -29,28 +20,10 @@ def _is_siliconflow_vendor(vendor: str) -> bool:
     return vendor.strip().lower() in {"siliconflow", "硅基流动"}
 
 
-def _canonical_vendor_key(vendor: str) -> str:
-    normalized = vendor.strip().lower()
-    alias_map = {
-        "硅基流动": "siliconflow",
-        "siliconflow": "siliconflow",
-        "ali": "ali",
-        "volcano": "volcano",
-        "minimax": "minimax",
-    }
-    return alias_map.get(normalized, normalized)
-
-
-def _default_tts_base_url(vendor_key: str) -> Optional[str]:
-    defaults = {
-        "siliconflow": "https://api.siliconflow.cn/v1",
-    }
-    return defaults.get(vendor_key)
-
-
-def _resolve_vendor_credential(db: Session, vendor: str) -> Optional[VendorCredential]:
-    vendor_key = _canonical_vendor_key(vendor)
-    return db.query(VendorCredential).filter(VendorCredential.vendor_key == vendor_key).first()
+def _default_base_url(vendor: str) -> Optional[str]:
+    if _is_siliconflow_vendor(vendor):
+        return "https://api.siliconflow.cn/v1"
+    return None
 
 
 def _build_siliconflow_voice_key(voice: Voice, model: str) -> str:
@@ -108,6 +81,8 @@ def create_voice(data: VoiceCreate, db: Session = Depends(get_db)):
         description=data.description,
         model=model,
         voice_key=voice_key,
+        api_key=data.api_key,
+        base_url=data.base_url,
         speed=data.speed,
         gain=data.gain,
         pitch=data.pitch,
@@ -165,56 +140,6 @@ def delete_voice(id: str, db: Session = Depends(get_db)):
     return {"message": "Deleted successfully"}
 
 
-@router.get("/vendors/credentials")
-def list_vendor_credentials(db: Session = Depends(get_db)):
-    items = db.query(VendorCredential).order_by(VendorCredential.updated_at.desc()).all()
-    return {"list": items, "total": len(items)}
-
-
-@router.get("/vendors/credentials/{vendor_key}", response_model=VendorCredentialOut)
-def get_vendor_credential(vendor_key: str, db: Session = Depends(get_db)):
-    key = _canonical_vendor_key(vendor_key)
-    item = db.query(VendorCredential).filter(VendorCredential.vendor_key == key).first()
-    if not item:
-        raise HTTPException(status_code=404, detail="Vendor credential not found")
-    return item
-
-
-@router.put("/vendors/credentials/{vendor_key}", response_model=VendorCredentialOut)
-def upsert_vendor_credential(vendor_key: str, data: VendorCredentialUpsert, db: Session = Depends(get_db)):
-    key = _canonical_vendor_key(vendor_key)
-    item = db.query(VendorCredential).filter(VendorCredential.vendor_key == key).first()
-
-    if item:
-        item.vendor_name = data.vendor_name or item.vendor_name
-        item.api_key = data.api_key
-        item.base_url = data.base_url
-        item.updated_at = datetime.utcnow()
-    else:
-        item = VendorCredential(
-            vendor_key=key,
-            vendor_name=data.vendor_name or vendor_key,
-            api_key=data.api_key,
-            base_url=data.base_url,
-        )
-        db.add(item)
-
-    db.commit()
-    db.refresh(item)
-    return item
-
-
-@router.delete("/vendors/credentials/{vendor_key}")
-def delete_vendor_credential(vendor_key: str, db: Session = Depends(get_db)):
-    key = _canonical_vendor_key(vendor_key)
-    item = db.query(VendorCredential).filter(VendorCredential.vendor_key == key).first()
-    if not item:
-        raise HTTPException(status_code=404, detail="Vendor credential not found")
-    db.delete(item)
-    db.commit()
-    return {"message": "Deleted successfully"}
-
-
 @router.post("/{id}/preview", response_model=VoicePreviewResponse)
 def preview_voice(id: str, data: VoicePreviewRequest, db: Session = Depends(get_db)):
     """试听指定声音，基于 OpenAI-compatible /audio/speech 接口。"""
@@ -226,22 +151,17 @@ def preview_voice(id: str, data: VoicePreviewRequest, db: Session = Depends(get_
     if not text:
         raise HTTPException(status_code=400, detail="Preview text cannot be empty")
 
-    credential = _resolve_vendor_credential(db, voice.vendor)
-    api_key = (data.api_key or "").strip()
-    if not api_key and credential:
-        api_key = credential.api_key
+    api_key = (data.api_key or "").strip() or (voice.api_key or "").strip()
+    if not api_key and _is_siliconflow_vendor(voice.vendor):
+        api_key = os.getenv("SILICONFLOW_API_KEY", "").strip()
     if not api_key:
-        api_key = os.getenv("SILICONFLOW_API_KEY") if _is_siliconflow_vendor(voice.vendor) else ""
-    if not api_key:
-        raise HTTPException(status_code=400, detail=f"Vendor API key is required for {voice.vendor}")
+        raise HTTPException(status_code=400, detail=f"API key is required for voice: {voice.name}")
+
+    base_url = (voice.base_url or "").strip() or (_default_base_url(voice.vendor) or "")
+    if not base_url:
+        raise HTTPException(status_code=400, detail=f"Base URL is required for voice: {voice.name}")
 
     model = voice.model or SILICONFLOW_DEFAULT_MODEL
-    vendor_key = _canonical_vendor_key(voice.vendor)
-    base_url = (credential.base_url.strip() if credential and credential.base_url else "") or _default_tts_base_url(vendor_key)
-    if not base_url:
-        raise HTTPException(status_code=400, detail=f"Vendor base_url is required for {voice.vendor}")
-    tts_api_url = f"{base_url.rstrip('/')}/audio/speech"
-
     payload = {
         "model": model,
         "input": text,
@@ -253,7 +173,7 @@ def preview_voice(id: str, data: VoicePreviewRequest, db: Session = Depends(get_
     try:
         with httpx.Client(timeout=45.0) as client:
             response = client.post(
-                tts_api_url,
+                f"{base_url.rstrip('/')}/audio/speech",
                 headers={"Authorization": f"Bearer {api_key}", "Content-Type": "application/json"},
                 json=payload,
             )
diff --git a/api/app/schemas.py b/api/app/schemas.py
index 9fd7567..5f718da 100644
--- a/api/app/schemas.py
+++ b/api/app/schemas.py
@@ -53,6 +53,8 @@ class VoiceCreate(VoiceBase):
     id: Optional[str] = None
     model: Optional[str] = None  # 厂商语音模型标识
     voice_key: Optional[str] = None  # 厂商voice_key
+    api_key: Optional[str] = None
+    base_url: Optional[str] = None
     speed: float = 1.0
     gain: int = 0
     pitch: int = 0
@@ -67,6 +69,8 @@ class VoiceUpdate(BaseModel):
     description: Optional[str] = None
     model: Optional[str] = None
     voice_key: Optional[str] = None
+    api_key: Optional[str] = None
+    base_url: Optional[str] = None
     speed: Optional[float] = None
     gain: Optional[int] = None
     pitch: Optional[int] = None
@@ -78,6 +82,8 @@ class VoiceOut(VoiceBase):
     user_id: Optional[int] = None
     model: Optional[str] = None
     voice_key: Optional[str] = None
+    api_key: Optional[str] = None
+    base_url: Optional[str] = None
     speed: float = 1.0
     gain: int = 0
     pitch: int = 0
@@ -104,24 +110,6 @@ class VoicePreviewResponse(BaseModel):
     error: Optional[str] = None
 
 
-class VendorCredentialUpsert(BaseModel):
-    vendor_name: Optional[str] = None
-    api_key: str
-    base_url: Optional[str] = None
-
-
-class VendorCredentialOut(BaseModel):
-    vendor_key: str
-    vendor_name: str
-    api_key: str
-    base_url: Optional[str] = None
-    created_at: Optional[datetime] = None
-    updated_at: Optional[datetime] = None
-
-    class Config:
-        from_attributes = True
-
-
 # ============ LLM Model ============
 class LLMModelBase(BaseModel):
     name: str
diff --git a/api/tests/test_voices.py b/api/tests/test_voices.py
index c77653e..73ed371 100644
--- a/api/tests/test_voices.py
+++ b/api/tests/test_voices.py
@@ -180,11 +180,12 @@ class TestVoiceAPI:
         encoded = payload["audio_url"].split(",", 1)[1]
         assert base64.b64decode(encoded) == b"fake-mp3-bytes"
 
-    def test_vendor_credential_persist_and_preview_use_db_key(self, client, monkeypatch):
-        """Test vendor credential persisted in DB and used by preview endpoint"""
+    def test_voice_credential_persist_and_preview_use_voice_key(self, client, monkeypatch):
+        """Test per-voice api_key/base_url persisted and used by preview endpoint"""
         from app.routers import voices as voice_router
 
         captured_auth = {"value": ""}
+        captured_url = {"value": ""}
 
         class DummyResponse:
             status_code = 200
@@ -207,22 +208,13 @@ class TestVoiceAPI:
             def post(self, *args, **kwargs):
                 headers = kwargs.get("headers", {})
                 captured_auth["value"] = headers.get("Authorization", "")
+                if args:
+                    captured_url["value"] = args[0]
                 return DummyResponse()
 
         monkeypatch.delenv("SILICONFLOW_API_KEY", raising=False)
         monkeypatch.setattr(voice_router.httpx, "Client", DummyClient)
 
-        save_cred = client.put(
-            "/api/voices/vendors/credentials/siliconflow",
-            json={
-                "vendor_name": "SiliconFlow",
-                "api_key": "db-key-123",
-                "base_url": "https://api.siliconflow.cn/v1"
-            },
-        )
-        assert save_cred.status_code == 200
-        assert save_cred.json()["vendor_key"] == "siliconflow"
-
         create_resp = client.post("/api/voices", json={
             "id": "anna2",
             "name": "Anna 2",
@@ -231,10 +223,13 @@ class TestVoiceAPI:
             "language": "zh",
             "description": "voice",
             "model": "FunAudioLLM/CosyVoice2-0.5B",
-            "voice_key": "FunAudioLLM/CosyVoice2-0.5B:anna"
+            "voice_key": "FunAudioLLM/CosyVoice2-0.5B:anna",
+            "api_key": "voice-key-123",
+            "base_url": "https://api.siliconflow.cn/v1"
         })
         assert create_resp.status_code == 200
 
         preview_resp = client.post("/api/voices/anna2/preview", json={"text": "hello"})
         assert preview_resp.status_code == 200
-        assert captured_auth["value"] == "Bearer db-key-123"
+        assert captured_auth["value"] == "Bearer voice-key-123"
+        assert captured_url["value"] == "https://api.siliconflow.cn/v1/audio/speech"
diff --git a/web/pages/VoiceLibrary.tsx b/web/pages/VoiceLibrary.tsx
index 5453a14..93a13a1 100644
--- a/web/pages/VoiceLibrary.tsx
+++ b/web/pages/VoiceLibrary.tsx
@@ -1,16 +1,8 @@
-
 import React, { useEffect, useState, useRef } from 'react';
-import { Search, Mic2, Play, Pause, Upload, X, Filter, Plus, Volume2, Sparkles, Wand2, ChevronDown, Pencil, Trash2 } from 'lucide-react';
+import { Search, Mic2, Play, Pause, Upload, Filter, Plus, Volume2, Sparkles, ChevronDown, Pencil, Trash2 } from 'lucide-react';
 import { Button, Input, TableHeader, TableRow, TableHead, TableCell, Dialog, Badge } from '../components/UI';
-import { VendorCredential, Voice } from '../types';
-import { createVoice, deleteVoice, fetchVendorCredentials, fetchVoices, previewVoice, saveVendorCredential, updateVoice } from '../services/backendApi';
-
-const VENDOR_OPTIONS = [
-  { key: 'siliconflow', label: '硅基流动 (SiliconFlow)' },
-  { key: 'ali', label: 'Ali' },
-  { key: 'volcano', label: 'Volcano' },
-  { key: 'minimax', label: 'Minimax' },
-];
+import { Voice } from '../types';
+import { createVoice, deleteVoice, fetchVoices, previewVoice, updateVoice } from '../services/backendApi';
 
 export const VoiceLibraryPage: React.FC = () => {
   const [voices, setVoices] = useState<Voice[]>([]);
@@ -18,31 +10,20 @@ export const VoiceLibraryPage: React.FC = () => {
   const [vendorFilter, setVendorFilter] = useState<'all' | 'Ali' | 'Volcano' | 'Minimax' | '硅基流动' | 'SiliconFlow'>('all');
   const [genderFilter, setGenderFilter] = useState<'all' | 'Male' | 'Female'>('all');
   const [langFilter, setLangFilter] = useState<'all' | 'zh' | 'en'>('all');
-  
+
   const [playingVoiceId, setPlayingVoiceId] = useState<string | null>(null);
   const [isCloneModalOpen, setIsCloneModalOpen] = useState(false);
   const [isAddModalOpen, setIsAddModalOpen] = useState(false);
   const [editingVoice, setEditingVoice] = useState<Voice | null>(null);
   const [isLoading, setIsLoading] = useState(true);
   const [playLoadingId, setPlayLoadingId] = useState<string | null>(null);
-  const [vendorCredentials, setVendorCredentials] = useState<Record<string, VendorCredential>>({});
-  const [credentialVendorKey, setCredentialVendorKey] = useState('siliconflow');
-  const [credentialApiKey, setCredentialApiKey] = useState('');
-  const [credentialBaseUrl, setCredentialBaseUrl] = useState('');
-  const [isSavingCredential, setIsSavingCredential] = useState(false);
   const audioRef = useRef<HTMLAudioElement | null>(null);
 
   useEffect(() => {
-    const loadVoicesAndCredentials = async () => {
+    const loadVoices = async () => {
       setIsLoading(true);
       try {
-        const [list, credentials] = await Promise.all([fetchVoices(), fetchVendorCredentials()]);
-        setVoices(list);
-        const mapped = credentials.reduce((acc, item) => {
-          acc[item.vendorKey] = item;
-          return acc;
-        }, {} as Record<string, VendorCredential>);
-        setVendorCredentials(mapped);
+        setVoices(await fetchVoices());
       } catch (error) {
         console.error(error);
         setVoices([]);
@@ -50,17 +31,10 @@ export const VoiceLibraryPage: React.FC = () => {
         setIsLoading(false);
       }
     };
-
-    loadVoicesAndCredentials();
+    loadVoices();
   }, []);
 
-  useEffect(() => {
-    const selected = vendorCredentials[credentialVendorKey];
-    setCredentialApiKey(selected?.apiKey || '');
-    setCredentialBaseUrl(selected?.baseUrl || '');
-  }, [credentialVendorKey, vendorCredentials]);
-
-  const filteredVoices = voices.filter(voice => {
+  const filteredVoices = voices.filter((voice) => {
     const matchesSearch = voice.name.toLowerCase().includes(searchTerm.toLowerCase());
     const matchesVendor = vendorFilter === 'all' || voice.vendor === vendorFilter;
     const matchesGender = genderFilter === 'all' || voice.gender === genderFilter;
@@ -75,6 +49,7 @@ export const VoiceLibraryPage: React.FC = () => {
       setPlayingVoiceId(null);
       return;
     }
+
     try {
       setPlayLoadingId(voice.id);
       const audioUrl = await previewVoice(
@@ -82,15 +57,18 @@ export const VoiceLibraryPage: React.FC = () => {
         voice.language === 'en' ? 'Hello, this is a voice preview.' : '你好，这是一段语音试听。',
         voice.speed
       );
+
       if (audioRef.current) {
         audioRef.current.pause();
       }
+
       const audio = new Audio(audioUrl);
       audio.onended = () => setPlayingVoiceId(null);
       audio.onerror = () => {
         setPlayingVoiceId(null);
-        alert('试听失败，请检查 SiliconFlow 配置。');
+        alert('试听失败，请检查该声音的 API Key / Base URL。');
       };
+
       audioRef.current = audio;
       setPlayingVoiceId(voice.id);
       await audio.play();
@@ -103,43 +81,22 @@ export const VoiceLibraryPage: React.FC = () => {
   };
 
   const handleAddSuccess = async (newVoice: Voice) => {
-      const created = await createVoice(newVoice);
-      setVoices((prev) => [created, ...prev]);
-      setIsAddModalOpen(false);
-      setIsCloneModalOpen(false);
+    const created = await createVoice(newVoice);
+    setVoices((prev) => [created, ...prev]);
+    setIsAddModalOpen(false);
+    setIsCloneModalOpen(false);
   };
 
   const handleUpdateSuccess = async (id: string, data: Voice) => {
-      const updated = await updateVoice(id, data);
-      setVoices((prev) => prev.map((voice) => (voice.id === id ? updated : voice)));
-      setEditingVoice(null);
+    const updated = await updateVoice(id, data);
+    setVoices((prev) => prev.map((voice) => (voice.id === id ? updated : voice)));
+    setEditingVoice(null);
   };
 
   const handleDelete = async (id: string) => {
-      if (!confirm('确认删除这个声音吗？')) return;
-      await deleteVoice(id);
-      setVoices((prev) => prev.filter((voice) => voice.id !== id));
-  };
-
-  const handleSaveVendorCredential = async () => {
-      if (!credentialApiKey.trim()) {
-        alert('请填写 API Key');
-        return;
-      }
-      try {
-        setIsSavingCredential(true);
-        const option = VENDOR_OPTIONS.find((item) => item.key === credentialVendorKey);
-        const saved = await saveVendorCredential(credentialVendorKey, {
-          vendorName: option?.label || credentialVendorKey,
-          apiKey: credentialApiKey.trim(),
-          baseUrl: credentialBaseUrl.trim(),
-        });
-        setVendorCredentials((prev) => ({ ...prev, [saved.vendorKey]: saved }));
-      } catch (error: any) {
-        alert(error?.message || '保存厂商配置失败');
-      } finally {
-        setIsSavingCredential(false);
-      }
+    if (!confirm('确认删除这个声音吗？')) return;
+    await deleteVoice(id);
+    setVoices((prev) => prev.filter((voice) => voice.id !== id));
   };
 
   return (
@@ -147,91 +104,62 @@ export const VoiceLibraryPage: React.FC = () => {
       <div className="flex items-center justify-between">
         <h1 className="text-2xl font-bold tracking-tight text-white">声音资源</h1>
         <div className="flex space-x-3">
-            <Button variant="primary" onClick={() => setIsAddModalOpen(true)} className="shadow-[0_0_15px_rgba(6,182,212,0.4)]">
-                <Plus className="mr-2 h-4 w-4" /> 添加声音
-            </Button>
-            <Button variant="primary" onClick={() => setIsCloneModalOpen(true)} className="shadow-[0_0_15px_rgba(6,182,212,0.4)]">
-                <Mic2 className="mr-2 h-4 w-4" /> 克隆声音
-            </Button>
+          <Button variant="primary" onClick={() => setIsAddModalOpen(true)} className="shadow-[0_0_15px_rgba(6,182,212,0.4)]">
+            <Plus className="mr-2 h-4 w-4" /> 添加声音
+          </Button>
+          <Button variant="primary" onClick={() => setIsCloneModalOpen(true)} className="shadow-[0_0_15px_rgba(6,182,212,0.4)]">
+            <Mic2 className="mr-2 h-4 w-4" /> 克隆声音
+          </Button>
         </div>
       </div>
 
-      {/* Filter Bar */}
       <div className="grid grid-cols-1 md:grid-cols-4 gap-4 bg-card/50 p-4 rounded-lg border border-white/5 shadow-sm">
-         <div className="relative">
-             <Search className="absolute left-2.5 top-2.5 h-4 w-4 text-muted-foreground" />
-             <Input 
-                placeholder="搜索声音名称..." 
-                className="pl-9 border-0 bg-white/5" 
-                value={searchTerm} 
-                onChange={e => setSearchTerm(e.target.value)}
-             />
-         </div>
-         <div className="flex items-center space-x-2">
-            <Filter className="h-4 w-4 text-muted-foreground" />
-            <select 
-                className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 [&>option]:bg-card text-foreground"
-                value={vendorFilter}
-                onChange={(e) => setVendorFilter(e.target.value as any)}
-            >
-                <option value="all">所有厂商</option>
-                <option value="硅基流动">硅基流动 (SiliconFlow)</option>
-                <option value="SiliconFlow">SiliconFlow</option>
-                <option value="Ali">阿里 (Ali)</option>
-                <option value="Volcano">火山 (Volcano)</option>
-                <option value="Minimax">Minimax</option>
-            </select>
-         </div>
-         <div className="flex items-center space-x-2">
-            <select 
-                className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 [&>option]:bg-card text-foreground"
-                value={genderFilter}
-                onChange={(e) => setGenderFilter(e.target.value as any)}
-            >
-                <option value="all">所有性别</option>
-                <option value="Male">男 (Male)</option>
-                <option value="Female">女 (Female)</option>
-            </select>
-         </div>
-         <div className="flex items-center space-x-2">
-             <select 
-                className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 [&>option]:bg-card text-foreground"
-                value={langFilter}
-                onChange={(e) => setLangFilter(e.target.value as any)}
-            >
-                <option value="all">所有语言</option>
-                <option value="zh">中文 (Chinese)</option>
-                <option value="en">英文 (English)</option>
-            </select>
-         </div>
-      </div>
-
-      <div className="grid grid-cols-1 md:grid-cols-4 gap-3 bg-card/50 p-4 rounded-lg border border-white/5 shadow-sm">
-         <select
+        <div className="relative">
+          <Search className="absolute left-2.5 top-2.5 h-4 w-4 text-muted-foreground" />
+          <Input
+            placeholder="搜索声音名称..."
+            className="pl-9 border-0 bg-white/5"
+            value={searchTerm}
+            onChange={(e) => setSearchTerm(e.target.value)}
+          />
+        </div>
+        <div className="flex items-center space-x-2">
+          <Filter className="h-4 w-4 text-muted-foreground" />
+          <select
             className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 [&>option]:bg-card text-foreground"
-            value={credentialVendorKey}
-            onChange={(e) => setCredentialVendorKey(e.target.value)}
-         >
-            {VENDOR_OPTIONS.map((item) => (
-              <option key={item.key} value={item.key}>{item.label}</option>
-            ))}
-         </select>
-         <Input
-            type="password"
-            placeholder="Vendor API Key (持久化到后端)"
-            className="border-0 bg-white/5"
-            value={credentialApiKey}
-            onChange={e => setCredentialApiKey(e.target.value)}
-         />
-         <Input
-            placeholder="Base URL (OpenAI compatible, 选填)"
-            className="border-0 bg-white/5"
-            value={credentialBaseUrl}
-            onChange={e => setCredentialBaseUrl(e.target.value)}
-         />
-         <Button onClick={handleSaveVendorCredential} disabled={isSavingCredential}>
-            {isSavingCredential ? '保存中...' : '保存厂商配置'}
-         </Button>
+            value={vendorFilter}
+            onChange={(e) => setVendorFilter(e.target.value as any)}
+          >
+            <option value="all">所有厂商</option>
+            <option value="硅基流动">硅基流动 (SiliconFlow)</option>
+            <option value="SiliconFlow">SiliconFlow</option>
+            <option value="Ali">阿里 (Ali)</option>
+            <option value="Volcano">火山 (Volcano)</option>
+            <option value="Minimax">Minimax</option>
+          </select>
+        </div>
+        <div className="flex items-center space-x-2">
+          <select
+            className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 [&>option]:bg-card text-foreground"
+            value={genderFilter}
+            onChange={(e) => setGenderFilter(e.target.value as any)}
+          >
+            <option value="all">所有性别</option>
+            <option value="Male">男 (Male)</option>
+            <option value="Female">女 (Female)</option>
+          </select>
+        </div>
+        <div className="flex items-center space-x-2">
+          <select
+            className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 [&>option]:bg-card text-foreground"
+            value={langFilter}
+            onChange={(e) => setLangFilter(e.target.value as any)}
+          >
+            <option value="all">所有语言</option>
+            <option value="zh">中文 (Chinese)</option>
+            <option value="en">英文 (English)</option>
+          </select>
+        </div>
       </div>
 
       <div className="rounded-md border border-white/5 bg-card/40 backdrop-blur-md overflow-hidden">
@@ -247,62 +175,58 @@ export const VoiceLibraryPage: React.FC = () => {
             </TableRow>
           </TableHeader>
           <tbody>
-            {!isLoading && filteredVoices.map(voice => (
+            {!isLoading && filteredVoices.map((voice) => (
               <TableRow key={voice.id}>
                 <TableCell className="font-medium">
-                    <div className="flex flex-col">
-                        <span className="flex items-center text-white">
-                            {voice.vendor === '硅基流动' && <Sparkles className="w-3 h-3 text-primary mr-1.5" />}
-                            {voice.name}
-                        </span>
-                        {voice.description && <span className="text-xs text-muted-foreground">{voice.description}</span>}
-                    </div>
+                  <div className="flex flex-col">
+                    <span className="flex items-center text-white">
+                      {voice.vendor === '硅基流动' && <Sparkles className="w-3 h-3 text-primary mr-1.5" />}
+                      {voice.name}
+                    </span>
+                    {voice.description && <span className="text-xs text-muted-foreground">{voice.description}</span>}
+                  </div>
                 </TableCell>
                 <TableCell>
-                    <Badge variant={voice.vendor === '硅基流动' ? 'default' : 'outline'}>{voice.vendor}</Badge>
+                  <Badge variant={voice.vendor === '硅基流动' ? 'default' : 'outline'}>{voice.vendor}</Badge>
                 </TableCell>
                 <TableCell className="text-muted-foreground">{voice.gender === 'Male' ? '男' : '女'}</TableCell>
                 <TableCell className="text-muted-foreground">{voice.language === 'zh' ? '中文' : 'English'}</TableCell>
                 <TableCell className="text-right">
-                    <Button 
-                        variant="ghost" 
-                        size="icon" 
-                        onClick={() => handlePlayToggle(voice)}
-                        disabled={playLoadingId === voice.id}
-                        className={playingVoiceId === voice.id ? "text-primary animate-pulse" : ""}
-                    >
-                        {playingVoiceId === voice.id ? <Pause className="h-4 w-4" /> : <Play className="h-4 w-4" />}
-                    </Button>
+                  <Button
+                    variant="ghost"
+                    size="icon"
+                    onClick={() => handlePlayToggle(voice)}
+                    disabled={playLoadingId === voice.id}
+                    className={playingVoiceId === voice.id ? 'text-primary animate-pulse' : ''}
+                  >
+                    {playingVoiceId === voice.id ? <Pause className="h-4 w-4" /> : <Play className="h-4 w-4" />}
+                  </Button>
                 </TableCell>
                 <TableCell className="text-right">
-                    <Button variant="ghost" size="icon" onClick={() => setEditingVoice(voice)}>
-                        <Pencil className="h-4 w-4" />
-                    </Button>
-                    <Button variant="ghost" size="icon" onClick={() => handleDelete(voice.id)} className="text-red-400">
-                        <Trash2 className="h-4 w-4" />
-                    </Button>
+                  <Button variant="ghost" size="icon" onClick={() => setEditingVoice(voice)}>
+                    <Pencil className="h-4 w-4" />
+                  </Button>
+                  <Button variant="ghost" size="icon" onClick={() => handleDelete(voice.id)} className="text-red-400">
+                    <Trash2 className="h-4 w-4" />
+                  </Button>
                 </TableCell>
               </TableRow>
             ))}
-             {!isLoading && filteredVoices.length === 0 && (
-                 <TableRow>
-                     <TableCell colSpan={6} className="text-center py-6 text-muted-foreground">暂无声音数据</TableCell>
-                 </TableRow>
-             )}
-             {isLoading && (
-                 <TableRow>
-                     <TableCell colSpan={6} className="text-center py-6 text-muted-foreground">加载中...</TableCell>
-                 </TableRow>
-             )}
+            {!isLoading && filteredVoices.length === 0 && (
+              <TableRow>
+                <TableCell colSpan={6} className="text-center py-6 text-muted-foreground">暂无声音数据</TableCell>
+              </TableRow>
+            )}
+            {isLoading && (
+              <TableRow>
+                <TableCell colSpan={6} className="text-center py-6 text-muted-foreground">加载中...</TableCell>
+              </TableRow>
+            )}
           </tbody>
         </table>
       </div>
 
-      <AddVoiceModal 
-        isOpen={isAddModalOpen}
-        onClose={() => setIsAddModalOpen(false)}
-        onSuccess={handleAddSuccess}
-      />
+      <AddVoiceModal isOpen={isAddModalOpen} onClose={() => setIsAddModalOpen(false)} onSuccess={handleAddSuccess} />
 
       <AddVoiceModal
         isOpen={!!editingVoice}
@@ -311,372 +235,379 @@ export const VoiceLibraryPage: React.FC = () => {
         initialVoice={editingVoice || undefined}
       />
 
-      <CloneVoiceModal 
-        isOpen={isCloneModalOpen} 
-        onClose={() => setIsCloneModalOpen(false)} 
-        onSuccess={handleAddSuccess} 
-      />
+      <CloneVoiceModal isOpen={isCloneModalOpen} onClose={() => setIsCloneModalOpen(false)} onSuccess={handleAddSuccess} />
     </div>
   );
 };
 
-// --- Unified Add Voice Modal ---
 const AddVoiceModal: React.FC<{
-    isOpen: boolean;
-    onClose: () => void;
-    onSuccess: (voice: Voice) => Promise<void>;
-    initialVoice?: Voice;
+  isOpen: boolean;
+  onClose: () => void;
+  onSuccess: (voice: Voice) => Promise<void>;
+  initialVoice?: Voice;
 }> = ({ isOpen, onClose, onSuccess, initialVoice }) => {
-    const [vendor, setVendor] = useState<'硅基流动' | 'Ali' | 'Volcano' | 'Minimax'>('硅基流动');
-    const [name, setName] = useState('');
-    
-    const [sfModel, setSfModel] = useState('FunAudioLLM/CosyVoice2-0.5B');
-    const [sfVoiceId, setSfVoiceId] = useState('FunAudioLLM/CosyVoice2-0.5B:anna');
-    const [sfSpeed, setSfSpeed] = useState(1);
-    const [sfGain, setSfGain] = useState(0);
-    const [sfPitch, setSfPitch] = useState(0);
+  const [vendor, setVendor] = useState<'硅基流动' | 'Ali' | 'Volcano' | 'Minimax'>('硅基流动');
+  const [name, setName] = useState('');
 
-    const [model, setModel] = useState('');
-    const [voiceKey, setVoiceKey] = useState('');
-    const [gender, setGender] = useState('Female');
-    const [language, setLanguage] = useState('zh');
-    const [description, setDescription] = useState('');
-    
-    const [testInput, setTestInput] = useState('你好，正在测试语音合成效果。');
-    const [isAuditioning, setIsAuditioning] = useState(false);
-    const [isSaving, setIsSaving] = useState(false);
-    const testAudioRef = useRef<HTMLAudioElement | null>(null);
+  const [sfModel, setSfModel] = useState('FunAudioLLM/CosyVoice2-0.5B');
+  const [sfVoiceId, setSfVoiceId] = useState('FunAudioLLM/CosyVoice2-0.5B:anna');
+  const [sfSpeed, setSfSpeed] = useState(1);
+  const [sfGain, setSfGain] = useState(0);
+  const [sfPitch, setSfPitch] = useState(0);
 
-    useEffect(() => {
-        if (!initialVoice) return;
-        const nextVendor = initialVoice.vendor === 'SiliconFlow' ? '硅基流动' : initialVoice.vendor;
-        setVendor((nextVendor as any) || '硅基流动');
-        setName(initialVoice.name || '');
-        setGender(initialVoice.gender || 'Female');
-        setLanguage(initialVoice.language || 'zh');
-        setDescription(initialVoice.description || '');
-        setModel(initialVoice.model || '');
-        setVoiceKey(initialVoice.voiceKey || '');
-        setSfModel(initialVoice.model || 'FunAudioLLM/CosyVoice2-0.5B');
-        setSfVoiceId(initialVoice.voiceKey || 'FunAudioLLM/CosyVoice2-0.5B:anna');
-        setSfSpeed(initialVoice.speed ?? 1);
-        setSfGain(initialVoice.gain ?? 0);
-        setSfPitch(initialVoice.pitch ?? 0);
-    }, [initialVoice, isOpen]);
+  const [model, setModel] = useState('');
+  const [voiceKey, setVoiceKey] = useState('');
+  const [gender, setGender] = useState('Female');
+  const [language, setLanguage] = useState('zh');
+  const [description, setDescription] = useState('');
+  const [apiKey, setApiKey] = useState('');
+  const [baseUrl, setBaseUrl] = useState('');
 
-    const handleAudition = async () => {
-        if (!testInput.trim()) return;
-        if (!initialVoice?.id) {
-            alert('请先创建声音，再进行试听。');
-            return;
-        }
-        try {
-            setIsAuditioning(true);
-            const audioUrl = await previewVoice(initialVoice.id, testInput, sfSpeed);
-            if (testAudioRef.current) {
-                testAudioRef.current.pause();
-            }
-            const audio = new Audio(audioUrl);
-            testAudioRef.current = audio;
-            await audio.play();
-        } catch (error: any) {
-            alert(error?.message || '试听失败');
-        } finally {
-            setIsAuditioning(false);
-        }
+  const [testInput, setTestInput] = useState('你好，正在测试语音合成效果。');
+  const [isAuditioning, setIsAuditioning] = useState(false);
+  const [isSaving, setIsSaving] = useState(false);
+  const testAudioRef = useRef<HTMLAudioElement | null>(null);
+
+  useEffect(() => {
+    if (!initialVoice) return;
+    const nextVendor = initialVoice.vendor === 'SiliconFlow' ? '硅基流动' : initialVoice.vendor;
+    setVendor((nextVendor as any) || '硅基流动');
+    setName(initialVoice.name || '');
+    setGender(initialVoice.gender || 'Female');
+    setLanguage(initialVoice.language || 'zh');
+    setDescription(initialVoice.description || '');
+    setModel(initialVoice.model || '');
+    setVoiceKey(initialVoice.voiceKey || '');
+    setSfModel(initialVoice.model || 'FunAudioLLM/CosyVoice2-0.5B');
+    setSfVoiceId(initialVoice.voiceKey || 'FunAudioLLM/CosyVoice2-0.5B:anna');
+    setSfSpeed(initialVoice.speed ?? 1);
+    setSfGain(initialVoice.gain ?? 0);
+    setSfPitch(initialVoice.pitch ?? 0);
+    setApiKey(initialVoice.apiKey || '');
+    setBaseUrl(initialVoice.baseUrl || '');
+  }, [initialVoice, isOpen]);
+
+  const handleAudition = async () => {
+    if (!testInput.trim()) return;
+    if (!initialVoice?.id) {
+      alert('请先创建声音，再进行试听。');
+      return;
+    }
+    try {
+      setIsAuditioning(true);
+      const audioUrl = await previewVoice(initialVoice.id, testInput, sfSpeed, apiKey || undefined);
+      if (testAudioRef.current) {
+        testAudioRef.current.pause();
+      }
+      const audio = new Audio(audioUrl);
+      testAudioRef.current = audio;
+      await audio.play();
+    } catch (error: any) {
+      alert(error?.message || '试听失败');
+    } finally {
+      setIsAuditioning(false);
+    }
+  };
+
+  const handleSubmit = async () => {
+    if (!name) {
+      alert('请填写声音显示名称');
+      return;
+    }
+
+    const newVoice: Voice = {
+      id: initialVoice?.id || `${vendor === '硅基流动' ? 'sf' : 'gen'}-${Date.now()}`,
+      name,
+      vendor,
+      gender,
+      language,
+      description: description || (vendor === '硅基流动' ? `Model: ${sfModel}` : `Model: ${model}`),
+      model: vendor === '硅基流动' ? sfModel : model,
+      voiceKey: vendor === '硅基流动' ? sfVoiceId : voiceKey,
+      apiKey,
+      baseUrl,
+      speed: sfSpeed,
+      gain: sfGain,
+      pitch: sfPitch,
     };
 
-    const handleSubmit = async () => {
-        if (!name) { alert("请填写声音显示名称"); return; }
+    try {
+      setIsSaving(true);
+      await onSuccess(newVoice);
+      setName('');
+      setVendor('硅基流动');
+      setDescription('');
+      setModel('');
+      setVoiceKey('');
+      setApiKey('');
+      setBaseUrl('');
+    } catch (error: any) {
+      alert(error?.message || '保存失败');
+    } finally {
+      setIsSaving(false);
+    }
+  };
 
-        const newVoice: Voice = {
-            id: initialVoice?.id || `${vendor === '硅基流动' ? 'sf' : 'gen'}-${Date.now()}`,
-            name: name,
-            vendor: vendor,
-            gender: gender,
-            language: language,
-            description: description || (vendor === '硅基流动' ? `Model: ${sfModel}` : `Model: ${model}`),
-            model: vendor === '硅基流动' ? sfModel : model,
-            voiceKey: vendor === '硅基流动' ? sfVoiceId : voiceKey,
-            speed: sfSpeed,
-            gain: sfGain,
-            pitch: sfPitch,
-        };
-        try {
-            setIsSaving(true);
-            await onSuccess(newVoice);
-            setName('');
-            setVendor('硅基流动');
-            setDescription('');
-            setModel('');
-            setVoiceKey('');
-        } catch (error: any) {
-            alert(error?.message || '保存失败');
-        } finally {
-            setIsSaving(false);
-        }
-    };
+  return (
+    <Dialog
+      isOpen={isOpen}
+      onClose={onClose}
+      title={initialVoice ? '编辑声音' : '添加声音'}
+      footer={
+        <>
+          <Button variant="ghost" onClick={onClose}>取消</Button>
+          <Button onClick={handleSubmit} className="bg-primary hover:bg-primary/90" disabled={isSaving}>
+            {isSaving ? '保存中...' : initialVoice ? '保存修改' : '确认添加'}
+          </Button>
+        </>
+      }
+    >
+      <div className="space-y-4 max-h-[75vh] overflow-y-auto px-1 custom-scrollbar">
+        <div className="space-y-1.5">
+          <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">厂商 (Vendor)</label>
+          <div className="relative">
+            <select
+              className="flex h-10 w-full rounded-md border border-white/10 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-foreground appearance-none cursor-pointer [&>option]:bg-card"
+              value={vendor}
+              onChange={(e) => setVendor(e.target.value as any)}
+            >
+              <option value="硅基流动">硅基流动 (SiliconFlow)</option>
+              <option value="Ali">阿里 (Ali)</option>
+              <option value="Volcano">火山 (Volcano)</option>
+              <option value="Minimax">Minimax</option>
+            </select>
+            <ChevronDown className="absolute right-3 top-1/2 -translate-y-1/2 h-4 w-4 text-muted-foreground pointer-events-none" />
+          </div>
+        </div>
 
-    return (
-        <Dialog 
-            isOpen={isOpen} 
-            onClose={onClose} 
-            title={initialVoice ? "编辑声音" : "添加声音"}
-            footer={
-                <>
-                    <Button variant="ghost" onClick={onClose}>取消</Button>
-                    <Button onClick={handleSubmit} className="bg-primary hover:bg-primary/90" disabled={isSaving}>
-                        {isSaving ? '保存中...' : (initialVoice ? '保存修改' : '确认添加')}
-                    </Button>
-                </>
-            }
-        >
-            <div className="space-y-4 max-h-[75vh] overflow-y-auto px-1 custom-scrollbar">
-                <div className="space-y-1.5">
-                    <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">厂商 (Vendor)</label>
-                    <div className="relative">
-                        <select 
-                            className="flex h-10 w-full rounded-md border border-white/10 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-foreground appearance-none cursor-pointer [&>option]:bg-card"
-                            value={vendor}
-                            onChange={(e) => setVendor(e.target.value as any)}
-                        >
-                            <option value="硅基流动">硅基流动 (SiliconFlow)</option>
-                            <option value="Ali">阿里 (Ali)</option>
-                            <option value="Volcano">火山 (Volcano)</option>
-                            <option value="Minimax">Minimax</option>
-                        </select>
-                        <ChevronDown className="absolute right-3 top-1/2 -translate-y-1/2 h-4 w-4 text-muted-foreground pointer-events-none" />
-                    </div>
-                </div>
+        <div className="h-px bg-white/5"></div>
 
-                <div className="h-px bg-white/5"></div>
+        <div className="space-y-1.5">
+          <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">声音名称</label>
+          <Input value={name} onChange={(e) => setName(e.target.value)} placeholder="例如: 客服小美" />
+        </div>
 
-                <div className="space-y-1.5">
-                    <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">声音名称</label>
-                    <Input value={name} onChange={e => setName(e.target.value)} placeholder="例如: 客服小美" />
-                </div>
-
-                {vendor === '硅基流动' ? (
-                    <div className="space-y-4 animate-in fade-in slide-in-from-top-1 duration-200">
-                        <div className="grid grid-cols-2 gap-4">
-                            <div className="space-y-1.5">
-                                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">模型 (Model)</label>
-                                <select 
-                                    className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-foreground [&>option]:bg-card"
-                                    value={sfModel}
-                                    onChange={e => setSfModel(e.target.value)}
-                                >
-                                    <option value="FunAudioLLM/CosyVoice2-0.5B">FunAudioLLM/CosyVoice2-0.5B</option>
-                                    <option value="fishaudio/fish-speech-1.5">fishaudio/fish-speech-1.5</option>
-                                    <option value="fishaudio/fish-speech-1.4">fishaudio/fish-speech-1.4</option>
-                                </select>
-                            </div>
-                            <div className="space-y-1.5">
-                                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">声音 ID (Voice)</label>
-                                <Input value={sfVoiceId} onChange={e => setSfVoiceId(e.target.value)} placeholder="fishaudio:amy" />
-                            </div>
-                        </div>
-
-                        <div className="grid grid-cols-2 gap-4">
-                            <div className="space-y-1.5">
-                                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">语速 (Speed)</label>
-                                <div className="flex items-center space-x-2">
-                                    <input type="range" min="0.5" max="2" step="0.1" value={sfSpeed} onChange={e => setSfSpeed(parseFloat(e.target.value))} className="flex-1 accent-primary" />
-                                    <span className="text-[10px] font-mono text-primary bg-primary/10 px-1.5 py-0.5 rounded">{sfSpeed}x</span>
-                                </div>
-                            </div>
-                            <div className="space-y-1.5">
-                                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">增益 (Gain)</label>
-                                <div className="flex items-center space-x-2">
-                                    <input type="range" min="-10" max="10" step="1" value={sfGain} onChange={e => setSfGain(parseInt(e.target.value))} className="flex-1 accent-primary" />
-                                    <span className="text-[10px] font-mono text-primary bg-primary/10 px-1.5 py-0.5 rounded">{sfGain}dB</span>
-                                </div>
-                            </div>
-                            <div className="space-y-1.5">
-                                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">音调 (Pitch)</label>
-                                <div className="flex items-center space-x-2">
-                                    <input type="range" min="-12" max="12" step="1" value={sfPitch} onChange={e => setSfPitch(parseInt(e.target.value))} className="flex-1 accent-primary" />
-                                    <span className="text-[10px] font-mono text-primary bg-primary/10 px-1.5 py-0.5 rounded">{sfPitch}</span>
-                                </div>
-                            </div>
-                        </div>
-                    </div>
-                ) : (
-                    <div className="space-y-4 animate-in fade-in slide-in-from-top-1 duration-200">
-                        <div className="grid grid-cols-2 gap-4">
-                            <div className="space-y-1.5">
-                                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">模型标识</label>
-                                <Input value={model} onChange={e => setModel(e.target.value)} placeholder="API Model Key" />
-                            </div>
-                            <div className="space-y-1.5">
-                                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">发音人标识</label>
-                                <Input value={voiceKey} onChange={e => setVoiceKey(e.target.value)} placeholder="Voice Key" />
-                            </div>
-                        </div>
-                    </div>
-                )}
-
-                <div className="grid grid-cols-2 gap-4">
-                    <div className="space-y-1.5">
-                        <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">性别</label>
-                        <select 
-                            className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-foreground [&>option]:bg-card"
-                            value={gender}
-                            onChange={e => setGender(e.target.value)}
-                        >
-                            <option value="Female">女 (Female)</option>
-                            <option value="Male">男 (Male)</option>
-                        </select>
-                    </div>
-                    <div className="space-y-1.5">
-                        <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">语言</label>
-                        <select 
-                            className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-foreground [&>option]:bg-card"
-                            value={language}
-                            onChange={e => setLanguage(e.target.value)}
-                        >
-                            <option value="zh">中文 (Chinese)</option>
-                            <option value="en">英文 (English)</option>
-                        </select>
-                    </div>
-                </div>
-
-                <div className="space-y-1.5">
-                    <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">备注</label>
-                    <textarea 
-                        className="flex min-h-[60px] w-full rounded-md border-0 bg-white/5 px-3 py-2 text-sm shadow-sm placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-white"
-                        value={description}
-                        onChange={(e) => setDescription(e.target.value)}
-                        placeholder="记录该声音的特点..."
-                    />
-                </div>
-
-                <div className="p-4 rounded-xl border border-primary/20 bg-primary/5 space-y-3">
-                    <div className="flex items-center justify-between">
-                        <h4 className="text-[10px] font-black text-primary flex items-center tracking-widest uppercase">
-                            <Volume2 className="w-3.5 h-3.5 mr-1.5" /> 参数试听 (Preview)
-                        </h4>
-                        {vendor === '硅基流动' && <Badge variant="outline" className="text-[8px] border-primary/20 text-primary/70">SiliconFlow Audio API</Badge>}
-                    </div>
-                    <div className="flex gap-2">
-                        <Input 
-                            value={testInput} 
-                            onChange={e => setTestInput(e.target.value)}
-                            placeholder="输入测试文本..."
-                            className="text-xs bg-black/20"
-                        />
-                        <Button 
-                            variant="primary" 
-                            size="sm" 
-                            onClick={handleAudition} 
-                            disabled={isAuditioning || !initialVoice}
-                            className="shrink-0 h-9"
-                        >
-                            {isAuditioning ? <Pause className="h-3.5 w-3.5 animate-pulse" /> : <Play className="h-3.5 w-3.5" />}
-                        </Button>
-                    </div>
-                </div>
+        {vendor === '硅基流动' ? (
+          <div className="space-y-4 animate-in fade-in slide-in-from-top-1 duration-200">
+            <div className="grid grid-cols-2 gap-4">
+              <div className="space-y-1.5">
+                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">模型 (Model)</label>
+                <select
+                  className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-foreground [&>option]:bg-card"
+                  value={sfModel}
+                  onChange={(e) => setSfModel(e.target.value)}
+                >
+                  <option value="FunAudioLLM/CosyVoice2-0.5B">FunAudioLLM/CosyVoice2-0.5B</option>
+                  <option value="fishaudio/fish-speech-1.5">fishaudio/fish-speech-1.5</option>
+                  <option value="fishaudio/fish-speech-1.4">fishaudio/fish-speech-1.4</option>
+                </select>
+              </div>
+              <div className="space-y-1.5">
+                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">声音 ID (Voice)</label>
+                <Input value={sfVoiceId} onChange={(e) => setSfVoiceId(e.target.value)} placeholder="FunAudioLLM/CosyVoice2-0.5B:anna" />
+              </div>
             </div>
-        </Dialog>
-    );
+
+            <div className="grid grid-cols-2 gap-4">
+              <div className="space-y-1.5">
+                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">语速 (Speed)</label>
+                <div className="flex items-center space-x-2">
+                  <input type="range" min="0.5" max="2" step="0.1" value={sfSpeed} onChange={(e) => setSfSpeed(parseFloat(e.target.value))} className="flex-1 accent-primary" />
+                  <span className="text-[10px] font-mono text-primary bg-primary/10 px-1.5 py-0.5 rounded">{sfSpeed}x</span>
+                </div>
+              </div>
+              <div className="space-y-1.5">
+                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">增益 (Gain)</label>
+                <div className="flex items-center space-x-2">
+                  <input type="range" min="-10" max="10" step="1" value={sfGain} onChange={(e) => setSfGain(parseInt(e.target.value, 10))} className="flex-1 accent-primary" />
+                  <span className="text-[10px] font-mono text-primary bg-primary/10 px-1.5 py-0.5 rounded">{sfGain}dB</span>
+                </div>
+              </div>
+              <div className="space-y-1.5">
+                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">音调 (Pitch)</label>
+                <div className="flex items-center space-x-2">
+                  <input type="range" min="-12" max="12" step="1" value={sfPitch} onChange={(e) => setSfPitch(parseInt(e.target.value, 10))} className="flex-1 accent-primary" />
+                  <span className="text-[10px] font-mono text-primary bg-primary/10 px-1.5 py-0.5 rounded">{sfPitch}</span>
+                </div>
+              </div>
+            </div>
+          </div>
+        ) : (
+          <div className="space-y-4 animate-in fade-in slide-in-from-top-1 duration-200">
+            <div className="grid grid-cols-2 gap-4">
+              <div className="space-y-1.5">
+                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">模型标识</label>
+                <Input value={model} onChange={(e) => setModel(e.target.value)} placeholder="API Model Key" />
+              </div>
+              <div className="space-y-1.5">
+                <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">发音人标识</label>
+                <Input value={voiceKey} onChange={(e) => setVoiceKey(e.target.value)} placeholder="Voice Key" />
+              </div>
+            </div>
+          </div>
+        )}
+
+        <div className="grid grid-cols-2 gap-4">
+          <div className="space-y-1.5">
+            <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">API Key</label>
+            <Input value={apiKey} type="password" onChange={(e) => setApiKey(e.target.value)} placeholder="每个声音独立 API Key" />
+          </div>
+          <div className="space-y-1.5">
+            <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">Base URL</label>
+            <Input value={baseUrl} onChange={(e) => setBaseUrl(e.target.value)} placeholder="https://.../v1" />
+          </div>
+        </div>
+
+        <div className="grid grid-cols-2 gap-4">
+          <div className="space-y-1.5">
+            <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">性别</label>
+            <select
+              className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-foreground [&>option]:bg-card"
+              value={gender}
+              onChange={(e) => setGender(e.target.value)}
+            >
+              <option value="Female">女 (Female)</option>
+              <option value="Male">男 (Male)</option>
+            </select>
+          </div>
+          <div className="space-y-1.5">
+            <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">语言</label>
+            <select
+              className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-foreground [&>option]:bg-card"
+              value={language}
+              onChange={(e) => setLanguage(e.target.value)}
+            >
+              <option value="zh">中文 (Chinese)</option>
+              <option value="en">英文 (English)</option>
+            </select>
+          </div>
+        </div>
+
+        <div className="space-y-1.5">
+          <label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">备注</label>
+          <textarea
+            className="flex min-h-[60px] w-full rounded-md border-0 bg-white/5 px-3 py-2 text-sm shadow-sm placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-white"
+            value={description}
+            onChange={(e) => setDescription(e.target.value)}
+            placeholder="记录该声音的特点..."
+          />
+        </div>
+
+        <div className="p-4 rounded-xl border border-primary/20 bg-primary/5 space-y-3">
+          <div className="flex items-center justify-between">
+            <h4 className="text-[10px] font-black text-primary flex items-center tracking-widest uppercase">
+              <Volume2 className="w-3.5 h-3.5 mr-1.5" /> 参数试听 (Preview)
+            </h4>
+          </div>
+          <div className="flex gap-2">
+            <Input
+              value={testInput}
+              onChange={(e) => setTestInput(e.target.value)}
+              placeholder="输入测试文本..."
+              className="text-xs bg-black/20"
+            />
+            <Button
+              variant="primary"
+              size="sm"
+              onClick={handleAudition}
+              disabled={isAuditioning || !initialVoice}
+              className="shrink-0 h-9"
+            >
+              {isAuditioning ? <Pause className="h-3.5 w-3.5 animate-pulse" /> : <Play className="h-3.5 w-3.5" />}
+            </Button>
+          </div>
+        </div>
+      </div>
+    </Dialog>
+  );
 };
 
-const CloneVoiceModal: React.FC<{ 
-    isOpen: boolean; 
-    onClose: () => void; 
-    onSuccess: (voice: Voice) => Promise<void> 
+const CloneVoiceModal: React.FC<{
+  isOpen: boolean;
+  onClose: () => void;
+  onSuccess: (voice: Voice) => Promise<void>;
 }> = ({ isOpen, onClose, onSuccess }) => {
-    const [name, setName] = useState('');
-    const [description, setDescription] = useState('');
-    const [file, setFile] = useState<File | null>(null);
-    const inputRef = useRef<HTMLInputElement>(null);
+  const [name, setName] = useState('');
+  const [description, setDescription] = useState('');
+  const [file, setFile] = useState<File | null>(null);
+  const inputRef = useRef<HTMLInputElement>(null);
 
-    const handleFileChange = (e: React.ChangeEvent<HTMLInputElement>) => {
-        if (e.target.files && e.target.files[0]) {
-            setFile(e.target.files[0]);
-        }
+  const handleFileChange = (e: React.ChangeEvent<HTMLInputElement>) => {
+    if (e.target.files && e.target.files[0]) {
+      setFile(e.target.files[0]);
+    }
+  };
+
+  const handleSubmit = async () => {
+    if (!name || !file) {
+      alert('请填写名称并上传音频文件');
+      return;
+    }
+
+    const newVoice: Voice = {
+      id: `v-${Date.now()}`,
+      name,
+      vendor: 'Volcano',
+      gender: 'Female',
+      language: 'zh',
+      description: description || 'User cloned voice',
     };
 
-    const handleSubmit = async () => {
-        if (!name || !file) {
-            alert("请填写名称并上传音频文件");
-            return;
-        }
-        
-        const newVoice: Voice = {
-            id: `v-${Date.now()}`,
-            name: name,
-            vendor: 'Volcano', 
-            gender: 'Female', 
-            language: 'zh',
-            description: description || 'User cloned voice'
-        };
+    await onSuccess(newVoice);
+    setName('');
+    setDescription('');
+    setFile(null);
+  };
 
-        await onSuccess(newVoice);
-        setName('');
-        setDescription('');
-        setFile(null);
-    };
+  return (
+    <Dialog
+      isOpen={isOpen}
+      onClose={onClose}
+      title="克隆声音"
+      footer={
+        <>
+          <Button variant="ghost" onClick={onClose}>取消</Button>
+          <Button onClick={handleSubmit}>开始克隆</Button>
+        </>
+      }
+    >
+      <div className="space-y-4">
+        <div className="space-y-2">
+          <label className="text-sm font-medium text-white">语音名称</label>
+          <Input value={name} onChange={(e) => setName(e.target.value)} placeholder="给新声音起个名字" />
+        </div>
 
-    return (
-        <Dialog 
-            isOpen={isOpen} 
-            onClose={onClose} 
-            title="克隆声音"
-            footer={
-                <>
-                    <Button variant="ghost" onClick={onClose}>取消</Button>
-                    <Button onClick={handleSubmit}>开始克隆</Button>
-                </>
-            }
-        >
-            <div className="space-y-4">
-                <div className="space-y-2">
-                    <label className="text-sm font-medium text-white">语音名称</label>
-                    <Input 
-                        value={name}
-                        onChange={(e) => setName(e.target.value)}
-                        placeholder="给新声音起个名字"
-                    />
-                </div>
-                
-                <div className="space-y-2">
-                     <label className="text-sm font-medium text-white">上传音频文件 (参考音频)</label>
-                     <div 
-                        className="flex flex-col items-center justify-center w-full h-32 rounded-lg border-2 border-dashed border-white/10 bg-white/5 hover:bg-white/10 transition-colors cursor-pointer"
-                        onClick={() => inputRef.current?.click()}
-                     >
-                        <input 
-                            ref={inputRef}
-                            type="file"
-                            accept="audio/*"
-                            className="hidden"
-                            onChange={handleFileChange}
-                        />
-                        {file ? (
-                             <div className="flex items-center space-x-2 text-primary">
-                                <Mic2 className="h-6 w-6" />
-                                <span className="text-sm font-medium">{file.name}</span>
-                             </div>
-                        ) : (
-                            <>
-                                <Upload className="h-8 w-8 mb-2 text-muted-foreground" />
-                                <p className="text-sm text-muted-foreground">点击上传 WAV/MP3 文件</p>
-                            </>
-                        )}
-                     </div>
-                </div>
+        <div className="space-y-2">
+          <label className="text-sm font-medium text-white">上传音频文件 (参考音频)</label>
+          <div
+            className="flex flex-col items-center justify-center w-full h-32 rounded-lg border-2 border-dashed border-white/10 bg-white/5 hover:bg-white/10 transition-colors cursor-pointer"
+            onClick={() => inputRef.current?.click()}
+          >
+            <input ref={inputRef} type="file" accept="audio/*" className="hidden" onChange={handleFileChange} />
+            {file ? (
+              <div className="flex items-center space-x-2 text-primary">
+                <Mic2 className="h-6 w-6" />
+                <span className="text-sm font-medium">{file.name}</span>
+              </div>
+            ) : (
+              <>
+                <Upload className="h-8 w-8 mb-2 text-muted-foreground" />
+                <p className="text-sm text-muted-foreground">点击上传 WAV/MP3 文件</p>
+              </>
+            )}
+          </div>
+        </div>
 
-                <div className="space-y-2">
-                    <label className="text-sm font-medium text-white">语音描述</label>
-                    <textarea 
-                        className="flex min-h-[80px] w-full rounded-md border-0 bg-white/5 px-3 py-2 text-sm shadow-sm placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-white"
-                        value={description}
-                        onChange={(e) => setDescription(e.target.value)}
-                        placeholder="描述声音特点（如：年轻、沉稳...）"
-                    />
-                </div>
-            </div>
-        </Dialog>
-    );
+        <div className="space-y-2">
+          <label className="text-sm font-medium text-white">语音描述</label>
+          <textarea
+            className="flex min-h-[80px] w-full rounded-md border-0 bg-white/5 px-3 py-2 text-sm shadow-sm placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-white"
+            value={description}
+            onChange={(e) => setDescription(e.target.value)}
+            placeholder="描述声音特点（如：年轻、沉稳...）"
+          />
+        </div>
+      </div>
+    </Dialog>
+  );
 };
diff --git a/web/services/backendApi.ts b/web/services/backendApi.ts
index ed9fa6c..fc618a5 100644
--- a/web/services/backendApi.ts
+++ b/web/services/backendApi.ts
@@ -1,4 +1,4 @@
-import { Assistant, CallLog, InteractionDetail, KnowledgeBase, KnowledgeDocument, VendorCredential, Voice, Workflow, WorkflowEdge, WorkflowNode } from '../types';
+import { Assistant, CallLog, InteractionDetail, KnowledgeBase, KnowledgeDocument, Voice, Workflow, WorkflowEdge, WorkflowNode } from '../types';
 import { apiRequest } from './apiClient';
 
 type AnyRecord = Record<string, any>;
@@ -55,6 +55,8 @@ const mapVoice = (raw: AnyRecord): Voice => ({
   description: readField(raw, ['description'], ''),
   model: readField(raw, ['model'], ''),
   voiceKey: readField(raw, ['voiceKey', 'voice_key'], ''),
+  apiKey: readField(raw, ['apiKey', 'api_key'], ''),
+  baseUrl: readField(raw, ['baseUrl', 'base_url'], ''),
   speed: Number(readField(raw, ['speed'], 1)),
   gain: Number(readField(raw, ['gain'], 0)),
   pitch: Number(readField(raw, ['pitch'], 0)),
@@ -62,13 +64,6 @@ const mapVoice = (raw: AnyRecord): Voice => ({
   isSystem: Boolean(readField(raw, ['isSystem', 'is_system'], false)),
 });
 
-const mapVendorCredential = (raw: AnyRecord): VendorCredential => ({
-  vendorKey: String(readField(raw, ['vendorKey', 'vendor_key'], '')),
-  vendorName: readField(raw, ['vendorName', 'vendor_name'], ''),
-  apiKey: readField(raw, ['apiKey', 'api_key'], ''),
-  baseUrl: readField(raw, ['baseUrl', 'base_url'], ''),
-});
-
 const mapWorkflowNode = (raw: AnyRecord): WorkflowNode => ({
   name: readField(raw, ['name'], ''),
   type: readField(raw, ['type'], 'conversation') as 'conversation' | 'tool' | 'human' | 'end',
@@ -205,6 +200,8 @@ export const createVoice = async (data: Partial<Voice>): Promise<Voice> => {
     description: data.description || '',
     model: data.model || undefined,
     voice_key: data.voiceKey || undefined,
+    api_key: data.apiKey || undefined,
+    base_url: data.baseUrl || undefined,
     speed: data.speed ?? 1,
     gain: data.gain ?? 0,
     pitch: data.pitch ?? 0,
@@ -223,6 +220,8 @@ export const updateVoice = async (id: string, data: Partial<Voice>): Promise<Voi
     description: data.description,
     model: data.model,
     voice_key: data.voiceKey,
+    api_key: data.apiKey,
+    base_url: data.baseUrl,
     speed: data.speed,
     gain: data.gain,
     pitch: data.pitch,
@@ -247,24 +246,6 @@ export const previewVoice = async (id: string, text: string, speed?: number, api
   return response.audio_url;
 };
 
-export const fetchVendorCredentials = async (): Promise<VendorCredential[]> => {
-  const response = await apiRequest<{ list?: AnyRecord[] }>('/voices/vendors/credentials');
-  const list = response.list || [];
-  return list.map((item) => mapVendorCredential(item));
-};
-
-export const saveVendorCredential = async (vendorKey: string, data: { vendorName: string; apiKey: string; baseUrl?: string }): Promise<VendorCredential> => {
-  const response = await apiRequest<AnyRecord>(`/voices/vendors/credentials/${vendorKey}`, {
-    method: 'PUT',
-    body: {
-      vendor_name: data.vendorName,
-      api_key: data.apiKey,
-      base_url: data.baseUrl || undefined,
-    },
-  });
-  return mapVendorCredential(response);
-};
-
 export const fetchWorkflows = async (): Promise<Workflow[]> => {
   const response = await apiRequest<{ list?: AnyRecord[] } | AnyRecord[]>('/workflows');
   const list = Array.isArray(response) ? response : (response.list || []);
diff --git a/web/types.ts b/web/types.ts
index 61e0f05..667ebe7 100644
--- a/web/types.ts
+++ b/web/types.ts
@@ -30,6 +30,8 @@ export interface Voice {
   description: string;
   model?: string;
   voiceKey?: string;
+  apiKey?: string;
+  baseUrl?: string;
   speed?: number;
   gain?: number;
   pitch?: number;
@@ -37,13 +39,6 @@ export interface Voice {
   isSystem?: boolean;
 }
 
-export interface VendorCredential {
-  vendorKey: string;
-  vendorName: string;
-  apiKey: string;
-  baseUrl?: string;
-}
-
 export interface KnowledgeBase {
   id: string;
   name: string;