Version: 0.9.16.dev.260413

后端： 1. RAG embedding 接入修正，并兼容 Ark 多模态 embedding 链路 - 更新 backend/infra/rag/embed/eino_embedder.go：文本 embedding 继续走 Eino OpenAI 兼容链路；`doubao-embedding-vision-*` 模型切到 Ark 原生 `/embeddings/multimodal` - 增加 embedding baseURL 归一化：兼容把 `.../embeddings` 或 `.../embeddings/multimodal` 误填进配置的情况，统一回退到 `/api/v3` - 为第三方 embedding 调用增加 panic recover，避免向量检索/写入异常直接打崩主进程 2. RAG runtime / pipeline / store 稳定性加固，统一降级为 error 语义 - 更新 backend/infra/rag/runtime.go：runtime 对外入口增加 panic recover 与观测打点 - 更新 backend/infra/rag/core/pipeline.go：ingest / retrieve 编排边界增加 panic recover - 更新 backend/infra/rag/retrieve/vector_retriever.go：向量检索边界补充 panic recover - 更新 backend/infra/rag/store/milvus_store.go、backend/infra/rag/store/inmemory_store.go：补齐未初始化保护，避免 nil 依赖直接异常退出 3. RAG embedding 配置口径与普通 LLM 链路对齐 - 更新 backend/infra/rag/factory.go：RAG embedding API Key 不再走 `apiKeyEnv` 间接映射，统一直接读取 `ARK_API_KEY` - 更新 backend/infra/rag/config/config.go：删除 `rag.embed.apiKeyEnv` 配置字段，收敛配置分叉 - 更新 backend/config.example.yaml：示例配置切到当前联调口径，保持 `rag.enabled=true`、`memory.rag.enabled=true`，并对齐 Milvus / embed 配置 4. Memory + RAG 联调链路可运行态修正 - 当前已验证 memory 抽取写库、RAG ingest 写入 Milvus、后续语义召回链路可继续联调 - 检索失败场景已从“直接 panic”收敛为“记录日志并降级”，不再阻断主聊天链路 前端：无 仓库：无 undo： 1. 增删改查的 mysql 记忆去重没实现 2. 提取用户话为记忆的过滤机制不足，有点无脑 3. RAG 召回也有问题
2026-04-13 23:18:59 +08:00
parent 070d4c3459
commit 863cba4e4e
9 changed files with 297 additions and 53 deletions
--- a/backend/infra/rag/core/pipeline.go
+++ b/backend/infra/rag/core/pipeline.go
@@ -5,6 +5,7 @@ import (
 	"errors"
 	"fmt"
 	"log"
+	"runtime/debug"
 	"strings"
 	"time"
 )
@@ -69,7 +70,9 @@ func (p *Pipeline) Ingest(
 	corpus CorpusAdapter,
 	input any,
 	opt IngestOption,
-) (*IngestResult, error) {
+) (result *IngestResult, err error) {
+	defer p.recoverExecutionPanic(ctx, "ingest", &err)
+
 	if p == nil || p.chunker == nil || p.embedder == nil || p.store == nil {
 		return nil, ErrNilDependency
 	}
@@ -95,7 +98,9 @@ func (p *Pipeline) IngestDocuments(
 	corpusName string,
 	docs []SourceDocument,
 	opt IngestOption,
-) (*IngestResult, error) {
+) (result *IngestResult, err error) {
+	defer p.recoverExecutionPanic(ctx, "ingest_documents", &err)
+
 	if p == nil || p.chunker == nil || p.embedder == nil || p.store == nil {
 		return nil, ErrNilDependency
 	}
@@ -170,7 +175,9 @@ func (p *Pipeline) Retrieve(
 	ctx context.Context,
 	corpus CorpusAdapter,
 	req RetrieveRequest,
-) (*RetrieveResult, error) {
+) (result *RetrieveResult, err error) {
+	defer p.recoverExecutionPanic(ctx, "retrieve", &err)
+
 	if p == nil || p.embedder == nil || p.store == nil {
 		return nil, ErrNilDependency
 	}
@@ -236,7 +243,7 @@ func (p *Pipeline) Retrieve(
 		})
 	}

-	result := &RetrieveResult{
+	result = &RetrieveResult{
 		Items:        candidates,
 		RawCount:     rawCount,
 		FallbackUsed: false,
@@ -273,6 +280,39 @@ func (p *Pipeline) Retrieve(
 	return result, nil
 }

+func (p *Pipeline) recoverExecutionPanic(ctx context.Context, operation string, errPtr *error) { // Deferred panic guard: converts a panic raised during operation into an error stored in *errPtr.
+	recovered := recover() // Effective only because this method is itself the deferred call (`defer p.recoverExecutionPanic(...)`).
+	if recovered == nil || errPtr == nil { // No panic in flight, or nowhere to store the error; NOTE: with a nil errPtr a recovered panic is dropped without any report.
+		return
+	}
+
+	panicErr := fmt.Errorf("rag pipeline panic recovered: operation=%s panic=%v", operation, recovered)
+	*errPtr = panicErr // Overwrites whatever error value the caller's named result held.
+
+	// 1. The pipeline is the single orchestration boundary for chunk/embed/store/rerank; a failure in a third-party dependency must not kill the caller's request outright.
+	// 2. Recover here and carry on with ordinary error semantics so the runtime/service layer decides whether to degrade, fall back, or log.
+	// 3. The stack goes only to the observability layer, never into the returned error, so long stack traces do not leak into business-facing error text.
+	if p != nil && p.observer != nil {
+		p.observer.Observe(ctx, ObserveEvent{
+			Level:     ObserveLevelError,
+			Component: "pipeline",
+			Operation: operation + "_panic_recovered",
+			Fields: map[string]any{
+				"status":     "failed",
+				"panic":      fmt.Sprintf("%v", recovered),
+				"panic_type": fmt.Sprintf("%T", recovered),
+				"error":      panicErr,
+				"error_code": ClassifyErrorCode(panicErr),
+				"stack":      string(debug.Stack()),
+			},
+		})
+		return // The observer takes precedence: when it is set, the logger below is not used.
+	}
+	if p != nil && p.logger != nil { // Fallback when no observer is configured; if the logger is nil too (or p is nil), the stack is not recorded anywhere.
+		p.logger.Printf("rag pipeline panic recovered: operation=%s panic=%v stack=%s", operation, recovered, string(debug.Stack()))
+	}
+}
+
 func normalizeChunkOption(opt ChunkOption) ChunkOption {
 	if opt.ChunkSize <= 0 {
 		opt.ChunkSize = defaultChunkSize