Version: 0.9.65.dev.260503
Backend: 1. Phases 1.5/1.6: close out llm-service / rag-service, unifying the model egress and the retrieval-infrastructure entry point, and retiring the legacy backend/infra/llm and backend/infra/rag implementations; 2. Update the affected call chains and the microservice migration plan document accordingly.
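The diff below is a pure import-path swap: call sites replace the infrallm alias with llmservice, while the exported surface (Client, BuildSystemUserMessages, GenerateJSON, GenerateOptions, ThinkingMode, TextResult) stays the same. A minimal caller-side sketch under that assumption; only the import path and the names just listed are confirmed by this diff, and the NewClient constructor and the reply type are hypothetical:

    package main

    import (
        "context"
        "fmt"

        llmservice "github.com/LoveLosita/smartflow/backend/services/llm"
    )

    // reply is an illustrative target type for structured JSON output.
    type reply struct {
        Answer string `json:"answer"`
    }

    func main() {
        // Hypothetical constructor: the diff only shows *llmservice.Client being injected.
        client := llmservice.NewClient()

        messages := llmservice.BuildSystemUserMessages("Answer tersely.", nil, "Say hi.")
        resp, _, err := llmservice.GenerateJSON[reply](context.Background(), client, messages,
            llmservice.GenerateOptions{Temperature: 0.1, MaxTokens: 64})
        if err != nil {
            fmt.Println("llm call failed:", err)
            return
        }
        fmt.Println(resp.Answer)
    }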
@@ -6,8 +6,8 @@ import (
 	"log"
 	"strings"

-	infrallm "github.com/LoveLosita/smartflow/backend/infra/llm"
 	memorymodel "github.com/LoveLosita/smartflow/backend/memory/model"
+	llmservice "github.com/LoveLosita/smartflow/backend/services/llm"
 )

 const defaultDecisionCompareMaxTokens = 600
@@ -19,13 +19,13 @@ const defaultDecisionCompareMaxTokens = 600
 // 2. The LLM outputs only relation (the relation type), never an action or a target ID;
 // 3. When the LLM call fails, return an error; the caller decides whether to treat it as unrelated.
 type LLMDecisionOrchestrator struct {
-	client *infrallm.Client
+	client *llmservice.Client
 	cfg    memorymodel.Config
 	logger *log.Logger
 }

 // NewLLMDecisionOrchestrator constructs the decision-compare orchestrator.
-func NewLLMDecisionOrchestrator(client *infrallm.Client, cfg memorymodel.Config) *LLMDecisionOrchestrator {
+func NewLLMDecisionOrchestrator(client *llmservice.Client, cfg memorymodel.Config) *LLMDecisionOrchestrator {
 	return &LLMDecisionOrchestrator{
 		client: client,
 		cfg:    cfg,
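Wiring is otherwise untouched; only the injected client's type changes. A sketch of constructing the orchestrator after the migration — the Config field LLMThinking appears later in this diff, and the *llmservice.Client is assumed to come from llm-service initialization:

    // Assumes service wiring already yields a *llmservice.Client.
    var client *llmservice.Client

    cfg := memorymodel.Config{LLMThinking: true} // field name taken from this diff
    orch := NewLLMDecisionOrchestrator(client, cfg)
    _ = orch // used by the Compare flow shown in the next hunk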
@@ -52,14 +52,14 @@ func (o *LLMDecisionOrchestrator) Compare(
 	systemPrompt := buildDecisionCompareSystemPrompt()
 	userPrompt := buildDecisionCompareUserPrompt(fact, candidate)

-	messages := infrallm.BuildSystemUserMessages(systemPrompt, nil, userPrompt)
+	messages := llmservice.BuildSystemUserMessages(systemPrompt, nil, userPrompt)

 	// 2. Call the LLM for structured output; a low temperature keeps the judgment stable.
-	resp, _, err := infrallm.GenerateJSON[decisionCompareResponse](
+	resp, _, err := llmservice.GenerateJSON[decisionCompareResponse](
 		ctx,
 		o.client,
 		messages,
-		infrallm.GenerateOptions{
+		llmservice.GenerateOptions{
 			Temperature: 0.1,
 			MaxTokens:   defaultDecisionCompareMaxTokens,
 			Thinking:    resolveMemoryThinkingMode(o.cfg.LLMThinking),
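The doc comment above fixes the contract: the model returns only a relation, and mapping it to an action or target happens upstream. A plausible shape for decisionCompareResponse, purely illustrative — the diff confirms only that GenerateJSON unmarshals into this type, not its fields:

    // Hypothetical: field names and example values are assumptions, not from the diff.
    type decisionCompareResponse struct {
        Relation string `json:"relation"` // e.g. "duplicate", "updates", "unrelated"
        Reason   string `json:"reason,omitempty"`
    }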
@@ -127,9 +127,9 @@ func buildDecisionCompareUserPrompt(fact memorymodel.NormalizedFact, candidate m
 }

 // resolveMemoryThinkingMode maps the config boolean to the corresponding ThinkingMode.
-func resolveMemoryThinkingMode(enabled bool) infrallm.ThinkingMode {
+func resolveMemoryThinkingMode(enabled bool) llmservice.ThinkingMode {
 	if enabled {
-		return infrallm.ThinkingModeEnabled
+		return llmservice.ThinkingModeEnabled
 	}
-	return infrallm.ThinkingModeDisabled
+	return llmservice.ThinkingModeDisabled
 }
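resolveMemoryThinkingMode keeps the boolean-to-enum mapping in one place; both orchestrators feed it into GenerateOptions. Usage as it appears at the call sites in this diff:

    opts := llmservice.GenerateOptions{
        Temperature: 0.1,
        Thinking:    resolveMemoryThinkingMode(true), // -> llmservice.ThinkingModeEnabled
    }
    _ = opts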
@@ -7,9 +7,9 @@ import (
 	"log"
 	"strings"

-	infrallm "github.com/LoveLosita/smartflow/backend/infra/llm"
 	memorymodel "github.com/LoveLosita/smartflow/backend/memory/model"
 	memoryutils "github.com/LoveLosita/smartflow/backend/memory/utils"
+	llmservice "github.com/LoveLosita/smartflow/backend/services/llm"
 )

 const (
@@ -24,13 +24,13 @@ const (
 // 2. Not responsible for persistence or for advancing the task state machine;
 // 3. When the LLM is unavailable or returns malformed output, fall back to conservative local extraction so the pipeline never fully breaks.
 type LLMWriteOrchestrator struct {
-	client *infrallm.Client
+	client *llmservice.Client
 	cfg    memorymodel.Config
 	logger *log.Logger
 }

 // NewLLMWriteOrchestrator constructs the LLM-backed memory-write orchestrator.
-func NewLLMWriteOrchestrator(client *infrallm.Client, cfg memorymodel.Config) *LLMWriteOrchestrator {
+func NewLLMWriteOrchestrator(client *llmservice.Client, cfg memorymodel.Config) *LLMWriteOrchestrator {
 	return &LLMWriteOrchestrator{
 		client: client,
 		cfg:    cfg,
@@ -54,17 +54,17 @@ func (o *LLMWriteOrchestrator) ExtractFacts(ctx context.Context, payload memorym
 		return fallbackNormalizedFacts(payload), nil
 	}

-	messages := infrallm.BuildSystemUserMessages(
+	messages := llmservice.BuildSystemUserMessages(
 		buildMemoryExtractSystemPrompt(o.cfg.ExtractPrompt),
 		nil,
 		buildMemoryExtractUserPrompt(payload),
 	)

-	resp, rawResult, err := infrallm.GenerateJSON[memoryExtractResponse](
+	resp, rawResult, err := llmservice.GenerateJSON[memoryExtractResponse](
 		ctx,
 		o.client,
 		messages,
-		infrallm.GenerateOptions{
+		llmservice.GenerateOptions{
 			Temperature: clampTemperature(o.cfg.LLMTemperature),
 			MaxTokens:   defaultMemoryExtractMaxTokens,
 			Thinking:    resolveMemoryThinkingMode(o.cfg.LLMThinking),
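Per the orchestrator's doc comment, extraction degrades instead of failing hard. A sketch of the error branch that would follow the call above — fallbackNormalizedFacts, truncateForLog, rawResult, and o.logger are all names from this diff; the exact log wording is an assumption:

    if err != nil {
        // Conservative local extraction keeps the write path alive when the LLM is down.
        o.logger.Printf("memory extract: LLM call failed, falling back: %v (raw=%q)",
            err, truncateForLog(rawResult))
        return fallbackNormalizedFacts(payload), nil
    }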
@@ -319,7 +319,7 @@ func isSkipIntent(intent string) bool {
 	}
 }

-func truncateForLog(raw *infrallm.TextResult) string {
+func truncateForLog(raw *llmservice.TextResult) string {
 	if raw == nil {
 		return ""
 	}