Update asr library preview

This commit is contained in:
Xin Wang
2026-02-08 23:38:34 +08:00
parent 97e3236e76
commit 4bf2f788ad
5 changed files with 781 additions and 183 deletions

View File

@@ -1,103 +1,122 @@
import React, { useState } from 'react';
import { Search, Filter, Plus, Trash2, Key, Server, Ear, Globe, Languages } from 'lucide-react';
import React, { useEffect, useRef, useState } from 'react';
import { Search, Filter, Plus, Trash2, Key, Server, Ear, Globe, Languages, Pencil, Mic, Square, Upload } from 'lucide-react';
import { Button, Input, TableHeader, TableRow, TableHead, TableCell, Dialog, Badge } from '../components/UI';
import { mockASRModels } from '../services/mockData';
import { ASRModel } from '../types';
import { createASRModel, deleteASRModel, fetchASRModels, previewASRModel, updateASRModel } from '../services/backendApi';
const maskApiKey = (key?: string) => {
if (!key) return '********';
if (key.length < 8) return '********';
return `${key.slice(0, 3)}****${key.slice(-4)}`;
};
const parseHotwords = (value: string): string[] => {
return value
.split(/[\n,]/)
.map((item) => item.trim())
.filter(Boolean);
};
const toHotwordsValue = (hotwords?: string[]): string => (hotwords || []).join(', ');
export const ASRLibraryPage: React.FC = () => {
const [models, setModels] = useState<ASRModel[]>(mockASRModels);
const [models, setModels] = useState<ASRModel[]>([]);
const [searchTerm, setSearchTerm] = useState('');
const [vendorFilter, setVendorFilter] = useState<string>('all');
const [langFilter, setLangFilter] = useState<string>('all');
const [isAddModalOpen, setIsAddModalOpen] = useState(false);
const [editingModel, setEditingModel] = useState<ASRModel | null>(null);
const [previewingModel, setPreviewingModel] = useState<ASRModel | null>(null);
const [isLoading, setIsLoading] = useState(true);
// Form State
const [newModel, setNewModel] = useState<Partial<ASRModel>>({
vendor: 'OpenAI Compatible',
language: 'zh'
});
const loadModels = async () => {
setIsLoading(true);
try {
setModels(await fetchASRModels());
} catch (error) {
console.error(error);
setModels([]);
} finally {
setIsLoading(false);
}
};
const filteredModels = models.filter(m => {
const matchesSearch = m.name.toLowerCase().includes(searchTerm.toLowerCase());
useEffect(() => {
loadModels();
}, []);
const filteredModels = models.filter((m) => {
const q = searchTerm.toLowerCase();
const matchesSearch = m.name.toLowerCase().includes(q) || (m.modelName || '').toLowerCase().includes(q);
const matchesVendor = vendorFilter === 'all' || m.vendor === vendorFilter;
const matchesLang = langFilter === 'all' || m.language === langFilter || (langFilter !== 'all' && m.language === 'Multi-lingual');
return matchesSearch && matchesVendor && matchesLang;
});
const handleAddModel = () => {
if (!newModel.name || !newModel.baseUrl || !newModel.apiKey) {
alert("请填写完整信息");
return;
}
const model: ASRModel = {
id: `asr_${Date.now()}`,
name: newModel.name,
vendor: newModel.vendor as 'OpenAI Compatible',
language: newModel.language || 'zh',
baseUrl: newModel.baseUrl,
apiKey: newModel.apiKey
};
setModels([model, ...models]);
const handleCreate = async (data: Partial<ASRModel>) => {
const created = await createASRModel(data);
setModels((prev) => [created, ...prev]);
setIsAddModalOpen(false);
setNewModel({ vendor: 'OpenAI Compatible', language: 'zh', name: '', baseUrl: '', apiKey: '' });
};
const handleDeleteModel = (id: string) => {
if (confirm('确认删除该语音识别模型吗?')) {
setModels(prev => prev.filter(m => m.id !== id));
}
const handleUpdate = async (id: string, data: Partial<ASRModel>) => {
const updated = await updateASRModel(id, data);
setModels((prev) => prev.map((m) => (m.id === id ? updated : m)));
setEditingModel(null);
};
const maskApiKey = (key: string) => {
if (!key || key.length < 8) return '********';
return `${key.substring(0, 3)}****${key.substring(key.length - 4)}`;
const handleDelete = async (id: string) => {
if (!confirm('确认删除该语音识别模型吗?')) return;
await deleteASRModel(id);
setModels((prev) => prev.filter((m) => m.id !== id));
};
const vendorOptions = Array.from(new Set(models.map((m) => m.vendor).filter(Boolean)));
return (
<div className="space-y-6 animate-in fade-in py-4 pb-10">
<div className="flex items-center justify-between">
<h1 className="text-2xl font-bold tracking-tight text-white"></h1>
<Button onClick={() => setIsAddModalOpen(true)} className="shadow-[0_0_15px_rgba(6,182,212,0.4)]">
<Plus className="mr-2 h-4 w-4" />
<Plus className="mr-2 h-4 w-4" />
</Button>
</div>
<div className="grid grid-cols-1 md:grid-cols-4 gap-4 bg-card/50 p-4 rounded-lg border border-white/5 shadow-sm">
<div className="relative col-span-1 md:col-span-2">
<Search className="absolute left-2.5 top-2.5 h-4 w-4 text-muted-foreground" />
<Input
placeholder="搜索模型名称..."
className="pl-9 border-0 bg-white/5"
value={searchTerm}
onChange={e => setSearchTerm(e.target.value)}
/>
</div>
<div className="flex items-center space-x-2">
<Filter className="h-4 w-4 text-muted-foreground" />
<select
className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 [&>option]:bg-card text-foreground"
value={vendorFilter}
onChange={(e) => setVendorFilter(e.target.value)}
>
<option value="all"></option>
<option value="OpenAI Compatible">OpenAI Compatible</option>
</select>
</div>
<div className="flex items-center space-x-2">
<select
className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 [&>option]:bg-card text-foreground"
value={langFilter}
onChange={(e) => setLangFilter(e.target.value)}
>
<option value="all"></option>
<option value="zh"> (Chinese)</option>
<option value="en"> (English)</option>
<option value="Multi-lingual"> (Multi-lingual)</option>
</select>
</div>
<div className="relative col-span-1 md:col-span-2">
<Search className="absolute left-2.5 top-2.5 h-4 w-4 text-muted-foreground" />
<Input
placeholder="搜索模型名称/Model Name..."
className="pl-9 border-0 bg-white/5"
value={searchTerm}
onChange={(e) => setSearchTerm(e.target.value)}
/>
</div>
<div className="flex items-center space-x-2">
<Filter className="h-4 w-4 text-muted-foreground" />
<select
className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 [&>option]:bg-card text-foreground"
value={vendorFilter}
onChange={(e) => setVendorFilter(e.target.value)}
>
<option value="all"></option>
{vendorOptions.map((vendor) => (
<option key={vendor} value={vendor}>{vendor}</option>
))}
</select>
</div>
<div className="flex items-center space-x-2">
<select
className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 [&>option]:bg-card text-foreground"
value={langFilter}
onChange={(e) => setLangFilter(e.target.value)}
>
<option value="all"></option>
<option value="zh"> (Chinese)</option>
<option value="en"> (English)</option>
<option value="Multi-lingual"> (Multi-lingual)</option>
</select>
</div>
</div>
<div className="rounded-md border border-white/5 bg-card/40 backdrop-blur-md overflow-hidden">
@@ -105,131 +124,435 @@ export const ASRLibraryPage: React.FC = () => {
<TableHeader>
<TableRow>
<TableHead></TableHead>
<TableHead></TableHead>
<TableHead></TableHead>
<TableHead></TableHead>
<TableHead></TableHead>
<TableHead>Base URL</TableHead>
<TableHead>API Key</TableHead>
<TableHead className="text-right"></TableHead>
</TableRow>
</TableHeader>
<tbody>
{filteredModels.map(model => (
{!isLoading && filteredModels.map((model) => (
<TableRow key={model.id}>
<TableCell className="font-medium text-white flex items-center">
<Ear className="w-4 h-4 mr-2 text-primary" />
{model.name}
</TableCell>
<TableCell>
<Badge variant="outline">{model.vendor}</Badge>
</TableCell>
<TableCell>
<Badge variant="default" className="bg-purple-500/10 text-purple-400 border-purple-500/20">
{model.language}
</Badge>
</TableCell>
<TableCell className="font-mono text-xs text-muted-foreground">
{model.baseUrl}
</TableCell>
<TableCell className="font-mono text-xs text-muted-foreground">
{maskApiKey(model.apiKey)}
<TableCell className="font-medium text-white">
<div className="flex flex-col">
<span className="flex items-center">
<Ear className="w-4 h-4 mr-2 text-primary" />
{model.name}
</span>
{model.hotwords && model.hotwords.length > 0 && (
<span className="text-xs text-muted-foreground">: {model.hotwords.join(', ')}</span>
)}
</div>
</TableCell>
<TableCell><Badge variant="outline">{model.vendor}</Badge></TableCell>
<TableCell>{model.language}</TableCell>
<TableCell className="font-mono text-xs text-muted-foreground">{model.modelName || '-'}</TableCell>
<TableCell className="font-mono text-xs text-muted-foreground max-w-[220px] truncate">{model.baseUrl}</TableCell>
<TableCell className="font-mono text-xs text-muted-foreground">{maskApiKey(model.apiKey)}</TableCell>
<TableCell className="text-right">
<Button
variant="ghost"
size="icon"
onClick={() => handleDeleteModel(model.id)}
className="text-muted-foreground hover:text-destructive transition-colors"
>
<Trash2 className="h-4 w-4" />
</Button>
<Button variant="ghost" size="icon" onClick={() => setPreviewingModel(model)}>
<Ear className="h-4 w-4" />
</Button>
<Button variant="ghost" size="icon" onClick={() => setEditingModel(model)}>
<Pencil className="h-4 w-4" />
</Button>
<Button variant="ghost" size="icon" onClick={() => handleDelete(model.id)} className="text-red-400">
<Trash2 className="h-4 w-4" />
</Button>
</TableCell>
</TableRow>
))}
{filteredModels.length === 0 && (
<TableRow>
<TableCell colSpan={6} className="text-center py-8 text-muted-foreground"></TableCell>
</TableRow>
)}
{!isLoading && filteredModels.length === 0 && (
<TableRow>
<TableCell colSpan={7} className="text-center py-8 text-muted-foreground"></TableCell>
</TableRow>
)}
{isLoading && (
<TableRow>
<TableCell colSpan={7} className="text-center py-8 text-muted-foreground">...</TableCell>
</TableRow>
)}
</tbody>
</table>
</div>
<Dialog
<ASRModelModal
isOpen={isAddModalOpen}
onClose={() => setIsAddModalOpen(false)}
title="添加语音识别模型"
footer={
<>
<Button variant="ghost" onClick={() => setIsAddModalOpen(false)}></Button>
<Button onClick={handleAddModel}></Button>
</>
}
>
<div className="space-y-4">
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block"> (Interface Type)</label>
<select
className="flex h-10 w-full rounded-md border border-white/10 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-foreground appearance-none cursor-pointer [&>option]:bg-card"
value={newModel.vendor}
onChange={e => setNewModel({...newModel, vendor: e.target.value as any})}
>
<option value="OpenAI Compatible">OpenAI Compatible</option>
</select>
</div>
onSubmit={handleCreate}
/>
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block"> (Language)</label>
<div className="flex bg-white/5 p-1 rounded-lg border border-white/10">
{(['zh', 'en', 'Multi-lingual'] as const).map(l => (
<button
key={l}
onClick={() => setNewModel({...newModel, language: l})}
className={`flex-1 flex items-center justify-center py-1.5 text-xs font-bold rounded-md transition-all ${newModel.language === l ? 'bg-primary text-primary-foreground shadow-lg' : 'text-muted-foreground hover:text-foreground'}`}
>
{l === 'zh' && <span className="mr-1">🇨🇳</span>}
{l === 'en' && <span className="mr-1">🇺🇸</span>}
{l === 'Multi-lingual' && <Globe className="w-3 h-3 mr-1.5" />}
{l === 'zh' ? '中文' : l === 'en' ? '英文' : '多语言'}
</button>
))}
</div>
</div>
<ASRModelModal
isOpen={!!editingModel}
onClose={() => setEditingModel(null)}
onSubmit={(data) => handleUpdate(editingModel!.id, data)}
initialModel={editingModel || undefined}
/>
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block"> (Model Name)</label>
<Input
value={newModel.name}
onChange={e => setNewModel({...newModel, name: e.target.value})}
placeholder="例如: whisper-1, funasr"
/>
</div>
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block flex items-center">
<Server className="w-3 h-3 mr-1.5" /> Base URL
</label>
<Input
value={newModel.baseUrl}
onChange={e => setNewModel({...newModel, baseUrl: e.target.value})}
placeholder="https://api.openai.com/v1"
className="font-mono text-xs"
/>
</div>
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block flex items-center">
<Key className="w-3 h-3 mr-1.5" /> API Key
</label>
<Input
type="password"
value={newModel.apiKey}
onChange={e => setNewModel({...newModel, apiKey: e.target.value})}
placeholder="sk-..."
className="font-mono text-xs"
/>
</div>
</div>
</Dialog>
<ASRPreviewModal
isOpen={!!previewingModel}
onClose={() => setPreviewingModel(null)}
model={previewingModel}
/>
</div>
);
};
const ASRModelModal: React.FC<{
isOpen: boolean;
onClose: () => void;
onSubmit: (model: Partial<ASRModel>) => Promise<void>;
initialModel?: ASRModel;
}> = ({ isOpen, onClose, onSubmit, initialModel }) => {
const [name, setName] = useState('');
const [vendor, setVendor] = useState('OpenAI Compatible');
const [language, setLanguage] = useState('zh');
const [modelName, setModelName] = useState('FunAudioLLM/SenseVoiceSmall');
const [baseUrl, setBaseUrl] = useState('https://api.siliconflow.cn/v1');
const [apiKey, setApiKey] = useState('');
const [hotwords, setHotwords] = useState('');
const [enablePunctuation, setEnablePunctuation] = useState(true);
const [enableNormalization, setEnableNormalization] = useState(true);
const [enabled, setEnabled] = useState(true);
const [saving, setSaving] = useState(false);
useEffect(() => {
if (!isOpen) return;
if (initialModel) {
setName(initialModel.name || '');
setVendor(initialModel.vendor || 'OpenAI Compatible');
setLanguage(initialModel.language || 'zh');
setModelName(initialModel.modelName || 'FunAudioLLM/SenseVoiceSmall');
setBaseUrl(initialModel.baseUrl || 'https://api.siliconflow.cn/v1');
setApiKey(initialModel.apiKey || '');
setHotwords(toHotwordsValue(initialModel.hotwords));
setEnablePunctuation(initialModel.enablePunctuation ?? true);
setEnableNormalization(initialModel.enableNormalization ?? true);
setEnabled(initialModel.enabled ?? true);
return;
}
setName('');
setVendor('OpenAI Compatible');
setLanguage('zh');
setModelName('FunAudioLLM/SenseVoiceSmall');
setBaseUrl('https://api.siliconflow.cn/v1');
setApiKey('');
setHotwords('');
setEnablePunctuation(true);
setEnableNormalization(true);
setEnabled(true);
}, [initialModel, isOpen]);
const handleSubmit = async () => {
if (!name.trim()) {
alert('请填写模型名称');
return;
}
if (!baseUrl.trim()) {
alert('请填写 Base URL');
return;
}
if (!apiKey.trim()) {
alert('请填写 API Key');
return;
}
try {
setSaving(true);
await onSubmit({
name: name.trim(),
vendor: vendor.trim(),
language,
modelName: modelName.trim(),
baseUrl: baseUrl.trim(),
apiKey: apiKey.trim(),
hotwords: parseHotwords(hotwords),
enablePunctuation,
enableNormalization,
enabled,
});
} catch (error: any) {
alert(error?.message || '保存失败');
} finally {
setSaving(false);
}
};
return (
<Dialog
isOpen={isOpen}
onClose={onClose}
title={initialModel ? '编辑语音识别模型' : '添加语音识别模型'}
footer={
<>
<Button variant="ghost" onClick={onClose}></Button>
<Button onClick={handleSubmit} disabled={saving}>{saving ? '保存中...' : (initialModel ? '保存修改' : '确认添加')}</Button>
</>
}
>
<div className="space-y-4 max-h-[75vh] overflow-y-auto px-1 custom-scrollbar">
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block"></label>
<Input value={name} onChange={(e) => setName(e.target.value)} placeholder="例如: SenseVoice CN" />
</div>
<div className="grid grid-cols-1 md:grid-cols-2 gap-4">
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block"></label>
<select
className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-foreground [&>option]:bg-card"
value={vendor}
onChange={(e) => setVendor(e.target.value)}
>
<option value="OpenAI Compatible">OpenAI Compatible</option>
<option value="SiliconFlow">SiliconFlow</option>
</select>
</div>
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block flex items-center"><Languages className="w-3 h-3 mr-1.5" /></label>
<select
className="flex h-9 w-full rounded-md border-0 bg-white/5 px-3 py-1 text-sm shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-primary/50 text-foreground [&>option]:bg-card"
value={language}
onChange={(e) => setLanguage(e.target.value)}
>
<option value="zh"> (Chinese)</option>
<option value="en"> (English)</option>
<option value="Multi-lingual"> (Multi-lingual)</option>
</select>
</div>
</div>
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block">Model Name</label>
<Input value={modelName} onChange={(e) => setModelName(e.target.value)} placeholder="FunAudioLLM/SenseVoiceSmall" />
</div>
<div className="grid grid-cols-1 md:grid-cols-2 gap-4">
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block flex items-center"><Server className="w-3 h-3 mr-1.5" />Base URL</label>
<Input value={baseUrl} onChange={(e) => setBaseUrl(e.target.value)} placeholder="https://api.siliconflow.cn/v1" className="font-mono text-xs" />
</div>
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block flex items-center"><Key className="w-3 h-3 mr-1.5" />API Key</label>
<Input value={apiKey} onChange={(e) => setApiKey(e.target.value)} type="password" placeholder="sk-..." className="font-mono text-xs" />
</div>
</div>
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block"> (comma separated)</label>
<Input value={hotwords} onChange={(e) => setHotwords(e.target.value)} placeholder="品牌名, 人名, 专有词" />
</div>
<div className="grid grid-cols-1 md:grid-cols-3 gap-2">
<label className="flex items-center space-x-2 text-xs text-muted-foreground">
<input type="checkbox" checked={enablePunctuation} onChange={(e) => setEnablePunctuation(e.target.checked)} />
<span></span>
</label>
<label className="flex items-center space-x-2 text-xs text-muted-foreground">
<input type="checkbox" checked={enableNormalization} onChange={(e) => setEnableNormalization(e.target.checked)} />
<span></span>
</label>
<label className="flex items-center space-x-2 text-xs text-muted-foreground">
<input type="checkbox" checked={enabled} onChange={(e) => setEnabled(e.target.checked)} />
<span></span>
</label>
</div>
</div>
</Dialog>
);
};
const ASRPreviewModal: React.FC<{
isOpen: boolean;
onClose: () => void;
model: ASRModel | null;
}> = ({ isOpen, onClose, model }) => {
const [selectedFile, setSelectedFile] = useState<File | null>(null);
const [isDragging, setIsDragging] = useState(false);
const [isTranscribing, setIsTranscribing] = useState(false);
const [transcript, setTranscript] = useState('');
const [latency, setLatency] = useState<number | null>(null);
const [confidence, setConfidence] = useState<number | null>(null);
const [language, setLanguage] = useState('');
const [isRecording, setIsRecording] = useState(false);
const inputRef = useRef<HTMLInputElement>(null);
const mediaRecorderRef = useRef<MediaRecorder | null>(null);
const streamRef = useRef<MediaStream | null>(null);
const chunksRef = useRef<Blob[]>([]);
useEffect(() => {
if (!isOpen) return;
setSelectedFile(null);
setTranscript('');
setLatency(null);
setConfidence(null);
setLanguage(model?.language || '');
setIsTranscribing(false);
setIsRecording(false);
}, [isOpen, model]);
useEffect(() => {
return () => {
if (streamRef.current) {
streamRef.current.getTracks().forEach((track) => track.stop());
}
};
}, []);
const pickFile = (file: File | null) => {
if (!file) return;
if (!file.type.startsWith('audio/')) {
alert('仅支持音频文件');
return;
}
setSelectedFile(file);
};
const handleDrop = (event: React.DragEvent<HTMLDivElement>) => {
event.preventDefault();
setIsDragging(false);
const file = event.dataTransfer.files?.[0] || null;
pickFile(file);
};
const startRecording = async () => {
if (!navigator.mediaDevices?.getUserMedia) {
alert('当前浏览器不支持麦克风录音');
return;
}
try {
const stream = await navigator.mediaDevices.getUserMedia({ audio: true });
const recorder = new MediaRecorder(stream);
chunksRef.current = [];
streamRef.current = stream;
mediaRecorderRef.current = recorder;
recorder.ondataavailable = (event) => {
if (event.data.size > 0) {
chunksRef.current.push(event.data);
}
};
recorder.onstop = () => {
const blob = new Blob(chunksRef.current, { type: recorder.mimeType || 'audio/webm' });
const file = new File([blob], `mic-preview-${Date.now()}.webm`, { type: blob.type || 'audio/webm' });
setSelectedFile(file);
if (streamRef.current) {
streamRef.current.getTracks().forEach((track) => track.stop());
streamRef.current = null;
}
};
recorder.start();
setIsRecording(true);
} catch (error: any) {
alert(error?.message || '无法访问麦克风');
}
};
const stopRecording = () => {
if (!mediaRecorderRef.current) return;
mediaRecorderRef.current.stop();
setIsRecording(false);
};
const runPreview = async () => {
if (!model?.id) return;
if (!selectedFile) {
alert('请先上传或录制音频');
return;
}
try {
setIsTranscribing(true);
const result = await previewASRModel(model.id, selectedFile, { language: language || undefined });
setTranscript(result.transcript || result.message || '无识别内容');
setLatency(result.latency_ms ?? null);
setConfidence(result.confidence ?? null);
} catch (error: any) {
alert(error?.message || '识别失败');
} finally {
setIsTranscribing(false);
}
};
return (
<Dialog
isOpen={isOpen}
onClose={onClose}
title={`试听识别: ${model?.name || ''}`}
footer={
<>
<Button variant="ghost" onClick={onClose}></Button>
<Button onClick={runPreview} disabled={isTranscribing || !selectedFile}>
{isTranscribing ? '识别中...' : '开始识别'}
</Button>
</>
}
>
<div className="space-y-4">
<div
className={`rounded-lg border-2 border-dashed p-4 transition-colors ${isDragging ? 'border-primary bg-primary/10' : 'border-white/10 bg-white/5'}`}
onDragOver={(e) => {
e.preventDefault();
setIsDragging(true);
}}
onDragLeave={() => setIsDragging(false)}
onDrop={handleDrop}
>
<input
ref={inputRef}
type="file"
accept="audio/*"
className="hidden"
onChange={(e) => pickFile(e.target.files?.[0] || null)}
/>
<div className="flex flex-col items-center justify-center gap-2 text-sm text-muted-foreground">
<Upload className="h-6 w-6 text-primary" />
<p></p>
<Button variant="outline" size="sm" onClick={() => inputRef.current?.click()}></Button>
{selectedFile && <p className="text-primary text-xs">: {selectedFile.name}</p>}
</div>
</div>
<div className="flex items-center justify-between rounded-lg border border-white/10 bg-white/5 p-3">
<div className="text-sm text-muted-foreground"></div>
{!isRecording ? (
<Button size="sm" variant="outline" onClick={startRecording}><Mic className="h-4 w-4 mr-1" /></Button>
) : (
<Button size="sm" variant="destructive" onClick={stopRecording}><Square className="h-4 w-4 mr-1" /></Button>
)}
</div>
<div className="space-y-1.5">
<label className="text-[10px] font-black text-muted-foreground uppercase tracking-widest block flex items-center">
<Globe className="w-3 h-3 mr-1.5" /> (Optional)
</label>
<Input value={language} onChange={(e) => setLanguage(e.target.value)} placeholder="zh / en / auto" />
</div>
<div className="rounded-lg border border-primary/20 bg-primary/5 p-3 space-y-2">
<div className="flex items-center justify-between text-xs text-primary">
<span></span>
<span>
{latency !== null ? `Latency: ${latency}ms` : ''}
{confidence !== null ? ` Confidence: ${confidence.toFixed(3)}` : ''}
</span>
</div>
<textarea
readOnly
value={transcript}
className="flex min-h-[120px] w-full rounded-md border-0 bg-black/20 px-3 py-2 text-sm shadow-sm text-white"
placeholder="识别结果会显示在这里"
/>
</div>
</div>
</Dialog>
);
};