后端: 1. 品牌文案与聊天定位统一切到 SmartMate,并放宽非排程问答能力 - 系统人设、路由、排程、查询、交付提示统一从 SmartFlow 改为 SmartMate - 明确普通问答/生活建议/开放讨论可正常回答,deep_answer 不再输出“让我想想”等占位话术 - thinkingMode=auto 时,deep_answer 默认开启 thinking,execute 继续跟随路由决策,其余路由默认关闭 2. Memory 读取链路升级为“结构化强约束 + 语义候选”hybrid 模式,并补齐注入渲染 / Execute 消费 - 新增 read.mode、四类记忆预算、inject.renderMode 等配置及默认值 - 落地 HybridRetrieve,统一 MySQL/RAG 读侧作用域、三级去重(ID/hash/text)、统一重排与按类型预算裁剪 - 新增 FindPinnedByUser、content_hash DTO/兜底补算、legacy/RAG 共用读侧查询口径与 fallback 逻辑 - 记忆注入支持 flat/typed_v2 两种渲染,execute msg3 正式消费 memory_context,主链路注入 MemoryReader 时同步透传 memory 配置 3. Memory 第二步/第三步 handoff 与治理文档补齐 - HANDOFF_Memory向Mem0靠拢三步冲刺计划.md 从 newAgent 迁到 memory 目录,并补充“我的记忆”增删改查与最小留痕口径 - 新增 backend/memory/记忆模块第二步计划.md、backend/memory/第三步治理与观测落地计划.md,分别拆解 hybrid 读取注入闭环与治理/观测/清理路线 - 同步更新 backend/memory/Log.txt 调试日志 前端: 1. 助手输入区新增“智能编排”任务类选择器,并把 task_class_ids 作为请求 extra 透传 - 新建 frontend/src/components/assistant/TaskClassPlanningPicker.vue,支持拉取任务类列表、临时勾选、已选标签回显与清空 - 更新 frontend/src/components/dashboard/AssistantPanel.vue、frontend/src/types/dashboard.ts:Chat extra 正式建模 task_class_ids / retry 字段;当本轮带编排任务类时强制新起会话,避免把现有会话历史误混入新编排 2. 会话上下文窗口统计接入前端展示 - 更新 frontend/src/api/agent.ts、新建 frontend/src/components/assistant/ContextWindowMeter.vue、更新 frontend/src/components/dashboard/AssistantPanel.vue、frontend/src/types/dashboard.ts:接入 /agent/context-stats,兼容 object/string/null 三种返回;在输入工具栏展示 msg0~msg3 占比与预算使用率 3. 助手面板交互细节优化 - 更新 frontend/src/components/dashboard/AssistantPanel.vue:thinking 开关改为 auto/true/false 三态选择;切会话与重试后同步刷新 context stats;历史列表首屏不足时自动继续分页直到形成滚动区 仓库:无
89 lines
3.4 KiB
Go
89 lines
3.4 KiB
Go
package service
|
|
|
|
import (
|
|
"time"
|
|
|
|
memorymodel "github.com/LoveLosita/smartflow/backend/memory/model"
|
|
"github.com/spf13/viper"
|
|
)
|
|
|
|
// LoadConfigFromViper 读取记忆模块配置并做默认值兜底。
|
|
//
|
|
// 默认策略:
|
|
// 1. temperature/top_p 使用低随机参数,提升可复现性;
|
|
// 2. Day1 先提供参数位,不强制所有参数立即生效;
|
|
// 3. 轮询与重试参数给出保守默认值,避免对主链路造成压力。
|
|
func LoadConfigFromViper() memorymodel.Config {
|
|
cfg := memorymodel.Config{
|
|
Enabled: viper.GetBool("memory.enabled"),
|
|
RAGEnabled: viper.GetBool("memory.rag.enabled"),
|
|
ReadMode: memorymodel.NormalizeReadMode(viper.GetString("memory.read.mode")),
|
|
InjectRenderMode: memorymodel.NormalizeInjectRenderMode(viper.GetString("memory.inject.renderMode")),
|
|
ExtractPrompt: viper.GetString("memory.prompt.extract"),
|
|
DecisionPrompt: viper.GetString("memory.prompt.decision"),
|
|
Threshold: viper.GetFloat64("memory.threshold"),
|
|
EnableReranker: viper.GetBool("memory.enableReranker"),
|
|
LLMTemperature: viper.GetFloat64("memory.llm.temperature"),
|
|
LLMTopP: viper.GetFloat64("memory.llm.topP"),
|
|
JobMaxRetry: viper.GetInt("memory.job.maxRetry"),
|
|
WorkerPollEvery: viper.GetDuration("memory.worker.pollEvery"),
|
|
WorkerClaimBatch: viper.GetInt("memory.worker.claimBatch"),
|
|
ReadConstraintLimit: viper.GetInt("memory.read.constraintLimit"),
|
|
ReadPreferenceLimit: viper.GetInt("memory.read.preferenceLimit"),
|
|
ReadFactLimit: viper.GetInt("memory.read.factLimit"),
|
|
ReadTodoHintLimit: viper.GetInt("memory.read.todoHintLimit"),
|
|
|
|
// 决策层配置:默认关闭,灰度开启后才会生效。
|
|
DecisionEnabled: viper.GetBool("memory.decision.enabled"),
|
|
DecisionCandidateTopK: viper.GetInt("memory.decision.candidateTopK"),
|
|
DecisionCandidateMinScore: viper.GetFloat64("memory.decision.candidateMinScore"),
|
|
DecisionFallbackMode: viper.GetString("memory.decision.fallbackMode"),
|
|
WriteMode: viper.GetString("memory.write.mode"),
|
|
}
|
|
|
|
if cfg.Threshold <= 0 {
|
|
cfg.Threshold = 0.55
|
|
}
|
|
if cfg.LLMTemperature <= 0 {
|
|
cfg.LLMTemperature = 0.1
|
|
}
|
|
if cfg.LLMTopP <= 0 {
|
|
cfg.LLMTopP = 0.2
|
|
}
|
|
if cfg.JobMaxRetry <= 0 {
|
|
cfg.JobMaxRetry = 6
|
|
}
|
|
if cfg.WorkerPollEvery <= 0 {
|
|
cfg.WorkerPollEvery = 2 * time.Second
|
|
}
|
|
if cfg.WorkerClaimBatch <= 0 {
|
|
cfg.WorkerClaimBatch = 1
|
|
}
|
|
cfg.ReadConstraintLimit = cfg.EffectiveReadConstraintLimit()
|
|
cfg.ReadPreferenceLimit = cfg.EffectiveReadPreferenceLimit()
|
|
cfg.ReadFactLimit = cfg.EffectiveReadFactLimit()
|
|
cfg.ReadTodoHintLimit = cfg.EffectiveReadTodoHintLimit()
|
|
cfg.ReadMode = cfg.EffectiveReadMode()
|
|
cfg.InjectRenderMode = cfg.EffectiveInjectRenderMode()
|
|
|
|
// 决策层配置默认值兜底。
|
|
// 说明:
|
|
// 1. TopK 和 MinScore 是 Milvus 召回参数,需要保守默认值避免召回过多噪声候选;
|
|
// 2. FallbackMode 默认退回旧路径新增,保证决策流程异常时不丢数据;
|
|
// 3. WriteMode 由 DecisionEnabled 隐式决定,这里不做强制联动。
|
|
if cfg.DecisionCandidateTopK <= 0 {
|
|
cfg.DecisionCandidateTopK = 5
|
|
}
|
|
if cfg.DecisionCandidateMinScore <= 0 {
|
|
cfg.DecisionCandidateMinScore = 0.6
|
|
}
|
|
if cfg.DecisionFallbackMode == "" {
|
|
cfg.DecisionFallbackMode = "legacy_add"
|
|
}
|
|
if cfg.WriteMode == "" {
|
|
cfg.WriteMode = "legacy"
|
|
}
|
|
|
|
return cfg
|
|
}
|