feat: Phase 5 STT — DashScope Gummy 实时语音识别 + 本地 Whisper 回退
- DashScope WebSocket STT 客户端 (gummy-chat-v1)
- 双引擎架构: DashScope 优先, Whisper 本地回退
- 实时流式 STT WebSocket 端点
- DevTools 模型搜索框焦点修复

Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
This commit is contained in:
@@ -14,44 +14,50 @@ import (
|
||||
|
||||
func main() {
|
||||
logger.SetDefault(logger.New("voice-service"))
|
||||
logger.Println("🎤 Voice-Service (STT + TTS) 启动中...")
|
||||
logger.Println("Voice-Service (STT + TTS) 启动中...")
|
||||
|
||||
// 加载配置
|
||||
cfg := config.Load()
|
||||
|
||||
logger.Printf("配置: 端口=%s, WhisperBinary=%s, WhisperModel=%s, Language=%s",
|
||||
cfg.Port, cfg.WhisperBinary, cfg.WhisperModel, cfg.WhisperLanguage)
|
||||
logger.Printf("配置: 端口=%s, DashScope=%v, WhisperBinary=%s, WhisperModel=%s, Language=%s",
|
||||
cfg.Port, cfg.DashScopeAPIKey != "", cfg.WhisperBinary, cfg.WhisperModel, cfg.WhisperLanguage)
|
||||
|
||||
// 初始化 STT 服务
|
||||
// 初始化 STT 服务 (DashScope 优先, Whisper 回退)
|
||||
sttSvc := service.NewSTTService(cfg)
|
||||
|
||||
// 检查 whisper 引擎是否可用
|
||||
if !sttSvc.IsAvailable() {
|
||||
logger.Printf("⚠️ Whisper 引擎未安装 (%s),STT 功能不可用", cfg.WhisperBinary)
|
||||
logger.Printf(" 请运行: bash scripts/setup-whisper.sh")
|
||||
if sttSvc.IsAvailable() {
|
||||
dashAvailable := cfg.DashScopeAPIKey != ""
|
||||
if dashAvailable {
|
||||
logger.Println("STT: DashScope Gummy (主) + Whisper (回退)")
|
||||
} else {
|
||||
logger.Println("STT: Whisper 本地引擎")
|
||||
}
|
||||
} else {
|
||||
logger.Println("✅ Whisper 引擎已就绪")
|
||||
logger.Printf("STT 引擎不可用。请配置 DASHSCOPE_API_KEY 或安装 Whisper")
|
||||
logger.Printf(" Whisper 安装: bash scripts/setup-whisper.sh")
|
||||
}
|
||||
|
||||
// 初始化 TTS 服务
|
||||
ttsSvc := service.NewTTSService()
|
||||
|
||||
if !ttsSvc.IsAvailable() {
|
||||
logger.Println("⚠️ TTS 引擎不可用 (请安装: pip install edge-tts)")
|
||||
logger.Println("TTS 引擎不可用 (请安装: pip install edge-tts)")
|
||||
} else {
|
||||
ttsStatus := ttsSvc.GetEngineStatus()
|
||||
logger.Printf("✅ TTS 引擎已就绪 (引擎: %s)", ttsStatus["engine"])
|
||||
logger.Printf("TTS 引擎已就绪 (引擎: %s)", ttsStatus["engine"])
|
||||
}
|
||||
|
||||
// 初始化 HTTP 处理器
|
||||
sttHandler := handler.NewSTTHandler(sttSvc, cfg)
|
||||
sttHandler.SetTTSService(ttsSvc)
|
||||
ttsHandler := handler.NewTTSHandler(ttsSvc)
|
||||
streamingHandler := handler.NewStreamingSTTHandler(sttSvc)
|
||||
|
||||
// 注册路由
|
||||
mux := http.NewServeMux()
|
||||
sttHandler.RegisterRoutes(mux)
|
||||
ttsHandler.RegisterRoutes(mux)
|
||||
streamingHandler.RegisterStreamingRoutes(mux)
|
||||
|
||||
// 启动 HTTP 服务
|
||||
srv := &http.Server{
|
||||
@@ -60,7 +66,7 @@ func main() {
|
||||
}
|
||||
|
||||
go func() {
|
||||
logger.Printf("🚀 Voice-Service 已启动在端口 %s", cfg.Port)
|
||||
logger.Printf("Voice-Service 已启动在端口 %s", cfg.Port)
|
||||
if err := srv.ListenAndServe(); err != nil && err != http.ErrServerClosed {
|
||||
logger.Fatalf("服务启动失败: %v", err)
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user