Files
Cyrene/backend/ai-core/internal/llm/selector.go
T
AskaEth 91c9ee4b2d fix: 修复 AI 回复无法送达发送者 + 重复消息 + action角色泄露 + OS环境支持
广播逻辑重构:
- AI 回复 (stream_start/response/stream_segments/multi_message/stream_end) 改用 broadcastToUser 发送给所有客户端
- 用户消息回显保持 broadcastToUserExcept 排除发送者

消息去重与角色修复:
- CacheMessage(user) 移至回复生成后,避免本轮 LLM 调用出现重复用户消息
- action 角色消息在 DB 存储时映射为 assistant,DeepSeek 等模型不支持自定义角色
- stream_end defer 机制确保错误路径也会终止客户端思考指示器

OS 完整环境支持:
- host 包重构为 HostBackend 接口 + Direct/WSL/Docker 三种后端
- 新增 os_exec/os_file/os_system 工具供 AI 在完整 Linux 环境中自由操作

其他:
- 视觉模型注入 + 图片预处理后清空 Images 避免传给 Chat 模型
- 图片 URL 相对路径→绝对 URL 转换
- DevTools 链路追踪页面 + 重启修复
- 记忆搜索模糊匹配增强
- 后台思考定时调度支持
- 管理后台页面 (模型配置/用户管理等)
- docs/api 更新广播机制说明

Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
2026-05-29 12:46:17 +08:00

140 lines
3.7 KiB
Go

package llm
import (
"context"
"fmt"
"sync"
"time"
"github.com/yourname/cyrene-ai/ai-core/internal/config"
)
// ModelPurpose names a category of LLM work. Its string value is the key used
// to look up a route in the configuration's Routing table.
type ModelPurpose string

// Known purposes. The string values are part of the configuration contract
// and must not change.
const (
	PurposeChat             = ModelPurpose("chat")
	PurposeDeepThinking     = ModelPurpose("deep_thinking")
	PurposeIntentAnalysis   = ModelPurpose("intent_analysis")
	PurposeToolCalling      = ModelPurpose("tool_calling")
	PurposeMemoryExtraction = ModelPurpose("memory_extraction")
	PurposeVision           = ModelPurpose("vision")
	PurposeOCR              = ModelPurpose("ocr")
)

// ErrModelNotRequired is a sentinel telling the caller that an optional model
// is unavailable and that it should degrade gracefully instead of failing.
// NOTE(review): nothing in this file returns it; confirm which callers
// elsewhere in the package produce or check for it.
var ErrModelNotRequired = fmt.Errorf("model not required, caller should degrade gracefully")
// ModelSelector chooses an LLMProvider for a given ModelPurpose. It consults
// the routing table exposed by its config loader and, when no route can be
// served, falls back to a single provider built from envCfg.
type ModelSelector struct {
	loader *config.Loader // source of routing/model/provider config; may be nil
	envCfg OpenAIConfig   // settings used to build the env fallback provider

	// mu guards cache and cachedEnv.
	mu        sync.RWMutex
	cache     map[string]LLMProvider // providers built so far, keyed by model ID
	cachedEnv LLMProvider            // env fallback provider, created on first use
}
// NewModelSelector builds a ModelSelector with an empty provider cache.
//
// loader may be nil; in that case (or when it holds no config) every Select
// call resolves to the provider built from envFallback.
func NewModelSelector(loader *config.Loader, envFallback OpenAIConfig) *ModelSelector {
	sel := new(ModelSelector)
	sel.loader = loader
	sel.envCfg = envFallback
	sel.cache = map[string]LLMProvider{}
	return sel
}
// Select returns the LLMProvider that should serve requests of the given
// purpose.
//
// Resolution order:
//  1. With no loader, no loaded config, no routing entry for purpose, or an
//     empty fallback chain, the env provider is returned.
//  2. Otherwise the route's fallback chain is walked in order and the first
//     model for which a provider can be obtained is returned.
//  3. If every model in the chain fails, a route marked Required yields an
//     error that wraps the last failure (inspect it with errors.Is/As or
//     errors.Unwrap); any other route falls back to the env provider.
//
// ctx is not consulted by the current implementation.
func (s *ModelSelector) Select(ctx context.Context, purpose ModelPurpose) (LLMProvider, error) {
	if s.loader == nil || !s.loader.HasConfig() {
		return s.envProvider(), nil
	}
	cfg := s.loader.GetConfig()
	if cfg == nil {
		return s.envProvider(), nil
	}
	route, ok := cfg.Routing[string(purpose)]
	if !ok || len(route.FallbackChain) == 0 {
		return s.envProvider(), nil
	}

	// Remember why the most recent candidate was rejected so that a hard
	// failure below is diagnosable instead of a bare "all unavailable".
	var lastErr error
	for _, modelID := range route.FallbackChain {
		provider, err := s.getOrCreateProvider(modelID, cfg)
		if err != nil {
			lastErr = err
			continue
		}
		return provider, nil
	}

	if route.Required {
		// The chain is non-empty here, so lastErr is always set.
		return nil, fmt.Errorf("all models unavailable for purpose %s: %w", purpose, lastErr)
	}
	return s.envProvider(), nil
}
// DefaultAdapter returns an *Adapter backed by the chat-purpose provider.
// This is the backward-compatible entry point: all existing consumers
// (Orchestrator, Synthesizer, BackgroundThinker, etc.) use this.
//
// The method has no error return, so when Select fails (a Required chat route
// whose whole fallback chain is unavailable) it uses the env provider rather
// than wrapping a nil provider in the adapter.
func (s *ModelSelector) DefaultAdapter() *Adapter {
	provider, err := s.Select(context.Background(), PurposeChat)
	if err != nil || provider == nil {
		// Never hand NewAdapter a nil provider; the env provider is the
		// selector's last-resort fallback everywhere else as well.
		provider = s.envProvider()
	}
	return NewAdapter(provider)
}
// envProvider returns the fallback provider built from s.envCfg. The provider
// is constructed on the first call and the same instance is returned on every
// later call; access is serialized by s.mu.
func (s *ModelSelector) envProvider() LLMProvider {
	s.mu.Lock()
	defer s.mu.Unlock()

	if s.cachedEnv != nil {
		return s.cachedEnv
	}
	s.cachedEnv = NewOpenAIProvider(s.envCfg)
	return s.cachedEnv
}
// getOrCreateProvider returns the provider for modelID, building and caching
// it on first use.
//
// The model must exist in cfg.Models and be enabled; this is checked against
// the supplied config snapshot on every call, before the cache is consulted,
// so a model that has been removed or disabled is rejected even if a provider
// for it was cached earlier. A cached provider keeps the settings it was built
// with: later changes to base URL, API key, timeout or retries are not picked
// up, because cache entries are never invalidated.
//
// When building, a non-positive TimeoutSec defaults to 120 seconds and a
// non-positive MaxRetries defaults to 3.
//
// It returns an error when the model is unknown, the model is disabled, or the
// model's provider is missing from cfg.Providers.
func (s *ModelSelector) getOrCreateProvider(modelID string, cfg *config.ModelsConfigData) (LLMProvider, error) {
	modelCfg, ok := cfg.Models[modelID]
	if !ok {
		return nil, fmt.Errorf("model %s not found", modelID)
	}
	if !modelCfg.Enabled {
		return nil, fmt.Errorf("model %s is disabled", modelID)
	}

	// Fast path: shared lock only.
	s.mu.RLock()
	cached, hit := s.cache[modelID]
	s.mu.RUnlock()
	if hit {
		return cached, nil
	}

	provCfg, ok := cfg.Providers[modelCfg.Provider]
	if !ok {
		return nil, fmt.Errorf("provider %s not found for model %s", modelCfg.Provider, modelID)
	}

	timeout := time.Duration(provCfg.TimeoutSec) * time.Second
	if timeout <= 0 {
		timeout = 120 * time.Second
	}
	maxRetries := provCfg.MaxRetries
	if maxRetries <= 0 {
		maxRetries = 3
	}

	// Build outside the lock so construction never blocks other lookups.
	provider := NewOpenAIProvider(OpenAIConfig{
		BaseURL:       provCfg.BaseURL,
		APIKey:        provCfg.APIKey,
		Model:         modelCfg.Name,
		FallbackModel: modelCfg.Name,
		MaxRetries:    maxRetries,
		Timeout:       timeout,
	})

	s.mu.Lock()
	defer s.mu.Unlock()
	// Another goroutine may have stored a provider for this model while we
	// were building ours; keep the stored one so all callers share it.
	if existing, ok := s.cache[modelID]; ok {
		return existing, nil
	}
	s.cache[modelID] = provider
	return provider, nil
}