Version: 0.9.3.dev.260407

后端： 1.Execute 上下文修复（无限循环 / 重复确认根治） - 更新node/execute.go：speak 写入历史（修复旧 TODO）；confirm 动作 speak 不再丢失； continue 无工具调用时写 reason 保证上下文推进；区分 tool_call 数组/JSON损坏两种 correction hint；goal_check hint 区分 plan/ReAct 模式 - 更新node/execute.go：新增 AlwaysExecute 字段，extra.always_execute=true 时写工具跳过确认闸门直接执行并持久化 - 更新model/graph_run_state.go：AgentGraphRequest 新增 AlwaysExecute；新增 WriteSchedulePreviewFunc 类型和 WriteSchedulePreview Dep - 更新service/agentsvc/agent.go：新增 readAgentExtraBool 辅助 2.粗排全链路修复 - 更新service/agentsvc/agent_newagent.go：makeRoughBuildFunc 改用 HybridScheduleEntry 而非 TaskClassItem.EmbeddedTime，普通时段放置不再被丢弃 - 更新conv/schedule_provider.go：LoadScheduleState 从 task class 日期范围推算多周规划窗口，不再硬编码当前周 7 天；DayMapping 覆盖全部相关周，粗排跨周结果不再被 WeekDayToDay 静默丢弃 - 更新node/rough_build.go：pinned block 区分有/无未覆盖 pending 任务两种情况，有 pending 时明确操作顺序（find_free→place）和完成判定，防止 LLM 重复调 list_tasks；新增 countPendingTasks 辅助（只统计 Slots 为空的真正未覆盖任务） - 更新model/common_state.go：新增 StartDirectExecute()，Chat 直接路由 execute 时清空旧 PlanSteps，修复跨会话 HasPlan() 误判导致 ReAct 走 plan 模式的 bug - 更新node/chat.go：handleRouteExecute 改用 StartDirectExecute() 3.排程预览缓存迁移至 Deliver 节点 - 更新node/agent_nodes.go：Deliver 节点完成后调用 WriteSchedulePreview，只有任务真正完成才写预览缓存，中断路径不写中间态 - 更新service/agentsvc/agent_newagent.go：注入 makeWriteSchedulePreviewFunc；移除 graph 结束后的内联写入；makeRoughBuildFunc 注释修正 - 更新conv/schedule_preview.go：ScheduleStateToPreview 补设 GeneratedAt - 更新model/agent.go：GetSchedulePlanPreviewResponse 新增 HybridEntries 字段 - 更新service/agentsvc/agent_schedule_preview.go：GET handler Redis/MySQL 两条路径均透传 HybridEntries 4.Execute thinking 模式修复 - 更新newAgent/llm/ark_adapter.go：thinking 开启时强制 temperature=1，MaxTokens 自动托底至 16000，调用方与适配层行为对齐 - 更新node/execute.go：调用参数同步改为 temperature=1.0 / MaxTokens=16000 undo: 1.流式推送换行未修复(undo) 2.上下文依然待审视前端：无仓库：无
2026-04-07 12:10:56 +08:00
parent 2038185730
commit 32bb740b75
17 changed files with 410 additions and 148 deletions
--- a/backend/newAgent/node/agent_nodes.go
+++ b/backend/newAgent/node/agent_nodes.go
@@ -4,6 +4,7 @@ import (
 	"context"
 	"errors"
 	"fmt"
+	"log"

 	newagentmodel "github.com/LoveLosita/smartflow/backend/newAgent/model"
 	newagenttools "github.com/LoveLosita/smartflow/backend/newAgent/tools"
@@ -214,6 +215,7 @@ func (n *AgentNodes) Execute(ctx context.Context, st *newagentmodel.AgentGraphSt
 			ScheduleState:         scheduleState,
 			SchedulePersistor:     st.Deps.SchedulePersistor,
 			OriginalScheduleState: st.OriginalScheduleState,
+			AlwaysExecute:         st.Request.AlwaysExecute,
 		},
 	); err != nil {
 		return nil, err
@@ -247,6 +249,16 @@ func (n *AgentNodes) Deliver(ctx context.Context, st *newagentmodel.AgentGraphSt
 		return nil, err
 	}

+	// 任务完成后写排程预览缓存：只有走到 Deliver 才代表排程结果已稳定，
+	// 中断（confirm/ask_user）路径不写，避免把中间态暴露给前端。
+	if st.Deps.WriteSchedulePreview != nil && st.ScheduleState != nil {
+		flowState := st.EnsureFlowState()
+		if err := st.Deps.WriteSchedulePreview(ctx, st.ScheduleState, flowState.UserID, flowState.ConversationID, flowState.TaskClassIDs); err != nil {
+			// 写缓存失败不阻断主流程，降级为仅 log。
+			log.Printf("[WARN] deliver: 写入排程预览缓存失败 chat=%s: %v", flowState.ConversationID, err)
+		}
+	}
+
 	saveAgentState(ctx, st)
 	return st, nil
 }
--- a/backend/newAgent/node/chat.go
+++ b/backend/newAgent/node/chat.go
@@ -158,7 +158,8 @@ func handleRouteExecute(
 	// 推送轻量状态通知，让前端知道请求已接收。
 	_ = emitter.EmitStatus(chatStatusBlockID, chatStageName, "accepted", speak, false)

-	flowState.Phase = newagentmodel.PhaseExecuting
+	// 清空旧 PlanSteps 并设 PhaseExecuting，避免上一次任务残留的步骤被 HasPlan() 误判。
+	flowState.StartDirectExecute()

 	// 安全兜底：只有真正持有 task_class_ids 时才开粗排。
 	if decision.NeedsRoughBuild && len(flowState.TaskClassIDs) > 0 {
--- a/backend/newAgent/node/deliver.go
+++ b/backend/newAgent/node/deliver.go
@@ -122,7 +122,7 @@ func generateDeliverSummary(
 		return buildMechanicalSummary(flowState)
 	}

-	return strings.TrimSpace(result.Text)
+	return normalizeSpeak(result.Text)
 }

 // buildMechanicalSummary 在 LLM 不可用时，机械拼接一份最小可用总结。
--- a/backend/newAgent/node/execute.go
+++ b/backend/newAgent/node/execute.go
@@ -5,6 +5,7 @@ import (
 	"encoding/json"
 	"fmt"
 	"log"
+	"regexp"
 	"strings"
 	"time"

@@ -50,6 +51,7 @@ type ExecuteNodeInput struct {
 	ScheduleState         *newagenttools.ScheduleState
 	SchedulePersistor     newagentmodel.SchedulePersistor
 	OriginalScheduleState *newagenttools.ScheduleState
+	AlwaysExecute         bool // true 时写工具跳过确认闸门直接执行
 }

 // ExecuteRoundObservation 记录执行阶段每轮的关键观察。
@@ -141,9 +143,9 @@ func RunExecuteNode(ctx context.Context, input ExecuteNodeInput) error {
 		input.Client,
 		messages,
 		newagentllm.GenerateOptions{
-			Temperature: 0.3,
-			MaxTokens:   1200,
-			Thinking:    newagentllm.ThinkingModeDisabled,
+			Temperature: 1.0,   // thinking 模式强制要求 temperature=1
+			MaxTokens:   16000, // 需为 thinking chain 留出足够预算
+			Thinking:    newagentllm.ThinkingModeEnabled,
 			Metadata: map[string]any{
 				"stage":      executeStageName,
 				"step_index": flowState.CurrentStep,
@@ -166,12 +168,18 @@ func RunExecuteNode(ctx context.Context, input ExecuteNodeInput) error {
 				return fmt.Errorf("连续 %d 次输出非 JSON，终止执行: 原始输出=%s",
 					flowState.ConsecutiveCorrections, rawText)
 			}
-			AppendLLMCorrectionWithHint(
-				conversationContext,
-				rawText,
-				"你的输出不是合法 JSON，无法解析。",
-				"你必须输出严格的 JSON 格式，不要使用 [NEXT_PLAN] 等纯文本标记。合法格式示例：{\"speak\":\"...\",\"action\":\"next_plan\",\"goal_check\":\"...\",\"reason\":\"...\"}",
-			)
+			// 区分两种常见失败：
+			// 1. tool_call 是数组（LLM 想批量调工具）→ 告知只能单次调用，保留已有上下文；
+			// 2. 真正的 JSON 格式损坏 → 要求重新输出合法 JSON。
+			var errorDesc, optionHint string
+			if strings.Contains(rawText, `"tool_call": [`) || strings.Contains(rawText, `"tool_call":[`) {
+				errorDesc = "你在 tool_call 字段传入了数组，但每轮只能调用一个工具，不支持批量格式。"
+				optionHint = "请把多个工具调用拆开，每轮只调一个，拿到结果后再继续下一步。示例：{\"speak\":\"...\",\"action\":\"continue\",\"reason\":\"...\",\"tool_call\":{\"name\":\"get_task_info\",\"arguments\":{\"task_id\":1}}}"
+			} else {
+				errorDesc = "你的输出不是合法 JSON，无法解析。"
+				optionHint = "你必须输出严格的 JSON 格式。合法格式示例：{\"speak\":\"...\",\"action\":\"continue\",\"reason\":\"...\",\"tool_call\":{\"name\":\"工具名\",\"arguments\":{}}}"
+			}
+			AppendLLMCorrectionWithHint(conversationContext, rawText, errorDesc, optionHint)
 			return nil
 		}

@@ -223,6 +231,9 @@ func RunExecuteNode(ctx context.Context, input ExecuteNodeInput) error {
 	// 决策合法，重置连续修正计数。
 	flowState.ConsecutiveCorrections = 0

+	// speak 后处理：补列表序号换行 + 末尾加 \n 防止连续 speak 在前端粘连。
+	decision.Speak = normalizeSpeak(decision.Speak) // 末尾已含 \n
+
 	// 自省校验：next_plan / done 必须附带 goal_check，否则不推进，追加修正让 LLM 重试。
 	if decision.Action == newagentmodel.ExecuteActionNextPlan ||
 		decision.Action == newagentmodel.ExecuteActionDone {
@@ -231,31 +242,52 @@ func RunExecuteNode(ctx context.Context, input ExecuteNodeInput) error {
 			if flowState.ConsecutiveCorrections >= maxConsecutiveCorrections {
 				return fmt.Errorf("连续 %d 次 goal_check 为空，终止执行", flowState.ConsecutiveCorrections)
 			}
+			// hint 区分有 plan / ReAct 两种模式：
+			// - 有 plan：要求对照 done_when 逐条验证；
+			// - ReAct：没有 done_when，只要求总结完成事实。
+			var goalCheckHint string
+			if flowState.HasPlan() {
+				goalCheckHint = fmt.Sprintf("输出 %s 时，必须在 goal_check 中对照 done_when 逐条说明完成依据。", decision.Action)
+			} else {
+				goalCheckHint = fmt.Sprintf("输出 %s 时，必须在 goal_check 中总结任务已完成的事实证据（调用了哪些工具、得到了什么结果）。", decision.Action)
+			}
 			AppendLLMCorrectionWithHint(
 				conversationContext,
 				decision.Speak,
 				fmt.Sprintf("你输出了 action=%s，但 goal_check 为空。", decision.Action),
-				fmt.Sprintf("输出 %s 时，必须在 goal_check 中对照 done_when 逐条说明完成依据。", decision.Action),
+				goalCheckHint,
 			)
 			return nil
 		}
 	}

-	// 6. 若 LLM 先对用户说话，且不是 ask_user / confirm（二者交给下游节点收口），则伪流式推送。
-	if strings.TrimSpace(decision.Speak) != "" &&
-		decision.Action != newagentmodel.ExecuteActionAskUser &&
-		decision.Action != newagentmodel.ExecuteActionConfirm {
-		if err := emitter.EmitPseudoAssistantText(
-			ctx,
-			executeSpeakBlockID,
-			executeStageName,
-			decision.Speak,
-			newagentstream.DefaultPseudoStreamOptions(),
-		); err != nil {
-			return fmt.Errorf("执行文案推送失败: %w", err)
+	// 6. speak 推流与历史写入。
+	//
+	// AlwaysExecute=true 时，confirm 动作不走确认卡片，speak 和 continue 一样直接推流；
+	// AlwaysExecute=false 时，confirm 的 speak 不推流（由确认卡片展示），但仍写入历史，
+	// 防止 LLM 下一轮忘记自己的计划，形成重复确认循环。
+	speakText := decision.Speak // 已由 normalizeSpeak 处理，末尾含 \n
+	if speakText != "" {
+		isConfirmWithCard := decision.Action == newagentmodel.ExecuteActionConfirm && !input.AlwaysExecute
+		isAskUser := decision.Action == newagentmodel.ExecuteActionAskUser
+
+		if !isConfirmWithCard && !isAskUser {
+			// 推流给前端
+			if err := emitter.EmitPseudoAssistantText(
+				ctx,
+				executeSpeakBlockID,
+				executeStageName,
+				speakText,
+				newagentstream.DefaultPseudoStreamOptions(),
+			); err != nil {
+				return fmt.Errorf("执行文案推送失败: %w", err)
+			}
 		}
-		// 将 LLM 的话追加到对话历史，保证下一轮上下文连续。
-		// TODO: 后续需要把工具调用结果也追加到历史，这里先留占位。
+		// 始终写入历史（confirm 卡片场景下也写，保证上下文连续）
+		conversationContext.AppendHistory(&schema.Message{
+			Role:    schema.Assistant,
+			Content: speakText,
+		})
 	}

 	// 7. 按 LLM 决策执行动作，后端信任 LLM 判断，不做语义校验。
@@ -266,7 +298,15 @@ func RunExecuteNode(ctx context.Context, input ExecuteNodeInput) error {
 		if decision.ToolCall != nil {
 			return executeToolCall(ctx, flowState, conversationContext, decision.ToolCall, emitter, input.ToolRegistry, input.ScheduleState)
 		}
-		// 无工具调用，仅对话，继续下一轮。
+		// 无工具调用且 speak 为空（speak 非空时已在步骤 6 写入历史）。
+		// 若 history 本轮完全没有更新，下一轮 LLM 会收到完全相同的上下文，容易死循环。
+		// 把 reason 写入历史，保证上下文向前推进。
+		if strings.TrimSpace(decision.Speak) == "" && strings.TrimSpace(decision.Reason) != "" {
+			conversationContext.AppendHistory(&schema.Message{
+				Role:    schema.Assistant,
+				Content: decision.Reason,
+			})
+		}
 		return nil

 	case newagentmodel.ExecuteActionAskUser:
@@ -276,8 +316,20 @@ func RunExecuteNode(ctx context.Context, input ExecuteNodeInput) error {
 		return nil

 	case newagentmodel.ExecuteActionConfirm:
-		// LLM 申报了写操作意图，需要用户确认后才能真正执行。
-		// 步骤：1) 把 ToolCallIntent 转成快照暂存；2) 设 Phase → 下游 confirm 节点接管。
+		// AlwaysExecute=true：跳过确认闸门，直接执行写工具并持久化，不走 confirm 节点。
+		if input.AlwaysExecute && decision.ToolCall != nil {
+			if err := executeToolCall(ctx, flowState, conversationContext, decision.ToolCall, emitter, input.ToolRegistry, input.ScheduleState); err != nil {
+				return err
+			}
+			if input.SchedulePersistor != nil && input.OriginalScheduleState != nil {
+				cs := runtimeState.EnsureCommonState()
+				if persistErr := input.SchedulePersistor.PersistScheduleChanges(ctx, input.OriginalScheduleState, input.ScheduleState, cs.UserID); persistErr != nil {
+					log.Printf("[WARN] execute always-execute 持久化失败: %v", persistErr)
+				}
+			}
+			return nil
+		}
+		// AlwaysExecute=false（默认）：暂存工具意图，设 Phase → 下游 confirm 节点接管。
 		return handleExecuteActionConfirm(decision, runtimeState, flowState)

 	case newagentmodel.ExecuteActionNextPlan:
@@ -588,6 +640,24 @@ func executePendingTool(
 	return nil
 }

+// listItemRe 匹配被粘连在一起的列表序号（如 "）2. " "水课3. "），用于自动补换行。
+// 规则：非换行字符后紧跟 2-9 的序号（"2. " "3、" 等），说明 LLM 漏写了换行。
+var listItemRe = regexp.MustCompile(`([^\n])([2-9][\.、]\s)`)
+
+// normalizeSpeak 对 LLM 输出的 speak 做后处理：
+// 1. 在列表序号（2. 3. …）前补 \n，防止列表项粘连；
+// 2. 统一补尾部 \n，防止多轮 speak 推流时文字头尾粘连。
+func normalizeSpeak(speak string) string {
+	speak = strings.TrimSpace(speak)
+	if speak == "" {
+		return speak
+	}
+	if !strings.Contains(speak, "\n") {
+		speak = listItemRe.ReplaceAllString(speak, "$1\n$2")
+	}
+	return speak + "\n"
+}
+
 // truncateText 截断文本到指定长度。
 //
 // 用于状态推送时避免超长文本影响前端展示。
--- a/backend/newAgent/node/rough_build.go
+++ b/backend/newAgent/node/rough_build.go
@@ -80,17 +80,33 @@ func RunRoughBuildNode(ctx context.Context, st *newagentmodel.AgentGraphState) e
 		false,
 	)

-	// 8. 把粗排完成信息写入 pinned context，让 Execute 阶段的 LLM 直接跳过"触发粗排"，
-	//    进入验证和微调，避免 LLM 误以为需要自己运行算法而浪费一轮工具调用。
-	st.EnsureConversationContext().UpsertPinnedBlock(newagentmodel.ContextBlock{
-		Key:   "rough_build_done",
-		Title: "粗排已完成",
-		Content: fmt.Sprintf(
+	// 8. 把粗排完成信息写入 pinned context，让 Execute 阶段的 LLM 直接进入验证和微调。
+	stillPending := countPendingTasks(scheduleState)
+	var pinnedContent string
+	if stillPending > 0 {
+		pinnedContent = fmt.Sprintf(
 			"后端已自动运行粗排算法，初始排课方案已写入日程状态（共 %d 个任务已预排）。\n"+
+				"注意：仍有 %d 个任务未被粗排覆盖，处于待安排（pending）状态，必须在微调阶段手动安排完毕。\n\n"+
+				"处理 pending 任务的正确操作顺序：\n"+
+				"1. 调用 get_overview 或 find_free 确认可用空位（不要反复调用 list_tasks，list_tasks 只能看任务列表，看不出空位）\n"+
+				"2. 调用 place 将 pending 任务放入空位\n"+
+				"3. 重复上述步骤，直到 get_overview 显示待安排任务剩余为 0\n\n"+
+				"微调完成的判定标准：所有 pending 任务均已 place（待安排任务剩余=0），且现有排课无明显失衡。\n"+
+				"无需再次触发粗排。",
+			len(placements), stillPending,
+		)
+	} else {
+		pinnedContent = fmt.Sprintf(
+			"后端已自动运行粗排算法，初始排课方案已写入日程状态（共 %d 个任务已预排，无待安排任务）。\n"+
 				"请直接调用 get_overview 查看预排结果，然后用 move/swap 微调不合理的位置。\n"+
-				"无需再次触发粗排，也不要在 plan_steps 里描述触发粗排相关的操作。",
+				"无需再次触发粗排。",
 			len(placements),
-		),
+		)
+	}
+	st.EnsureConversationContext().UpsertPinnedBlock(newagentmodel.ContextBlock{
+		Key:     "rough_build_done",
+		Title:   "粗排已完成",
+		Content: pinnedContent,
 	})

 	// 9. 清除标记，进入执行阶段。
@@ -99,6 +115,24 @@ func RunRoughBuildNode(ctx context.Context, st *newagentmodel.AgentGraphState) e
 	return nil
 }

+// countPendingTasks 统计粗排后仍无位置的待安排任务数。
+//
+// 粗排只设 Slots，不改 Status（仍为 "pending"），
+// 所以"真正未覆盖"= pending 且 Slots 为空，需要手动 place。
+func countPendingTasks(state *newagenttools.ScheduleState) int {
+	if state == nil {
+		return 0
+	}
+	count := 0
+	for i := range state.Tasks {
+		t := &state.Tasks[i]
+		if t.Status == "pending" && len(t.Slots) == 0 {
+			count++
+		}
+	}
+	return count
+}
+
 // applyRoughBuildPlacements 把粗排结果写入 ScheduleState 对应任务的 Slots。
 //
 // 设计说明：