Version: 0.8.7.dev.260402

后端： 1.Plan节点实现两阶段LLM调用：Phase1无thinking快速评估复杂度，复杂任务自动开启Phase2深度规划 2.Execute节点新增GoalCheck自省机制：LLM输出next_plan/done时必须附带对照done_when的完成验证，为空则追加修正重试前端：无仓库：无
2026-04-02 22:56:06 +08:00
parent 2c64b37d00
commit 64b946816f
6 changed files with 136 additions and 41 deletions
--- a/backend/newAgent/node/execute.go
+++ b/backend/newAgent/node/execute.go
@@ -131,6 +131,20 @@ func RunExecuteNode(ctx context.Context, input ExecuteNodeInput) error {
 		return fmt.Errorf("执行决策不合法: %w", err)
 	}

+	// 自省校验：next_plan / done 必须附带 goal_check，否则不推进，追加修正让 LLM 重试。
+	if decision.Action == newagentmodel.ExecuteActionNextPlan ||
+		decision.Action == newagentmodel.ExecuteActionDone {
+		if strings.TrimSpace(decision.GoalCheck) == "" {
+			AppendLLMCorrectionWithHint(
+				conversationContext,
+				decision.Speak,
+				fmt.Sprintf("你输出了 action=%s，但 goal_check 为空。", decision.Action),
+				fmt.Sprintf("输出 %s 时，必须在 goal_check 中对照 done_when 逐条说明完成依据。", decision.Action),
+			)
+			return nil
+		}
+	}
+
 	// 6. 若 LLM 先对用户说话，则伪流式推送并写回历史。
 	if strings.TrimSpace(decision.Speak) != "" {
 		if err := emitter.EmitPseudoAssistantText(
--- a/backend/newAgent/node/plan.go
+++ b/backend/newAgent/node/plan.go
@@ -38,13 +38,14 @@ type PlanNodeInput struct {
 // RunPlanNode 执行一轮规划节点逻辑。
 //
 // 步骤说明：
-//  1. 先校验最小依赖，并推送一条“正在规划”的状态，避免用户空等；
-//  2. 再用 prompt/plan.go 组装 messages，请模型严格输出 PlanDecision JSON；
-//  3. 若模型先对用户说了话，则先把 speak 伪流式推给前端，并写回 history；
-//  4. 最后按 action 推进流程：
-//     4.1 continue：继续停留在 planning；
-//     4.2 ask_user：打开 pending interaction，后续交给 interrupt 收口；
-//     4.3 plan_done：固化完整计划，刷新 pinned context，并进入 waiting_confirm。
+//  1. 先校验最小依赖，并推送一条”正在规划”的状态，避免用户空等；
+//  2. Phase 1（快速评估）：不开 thinking，让 LLM 同时产出复杂度评估和规划结果；
+//  3. Phase 2（深度规划）：若 LLM 自评需要深度思考且规划已完成，开 thinking 重跑；
+//  4. 若模型先对用户说了话，则先把 speak 伪流式推给前端，并写回 history；
+//  5. 最后按 action 推进流程：
+//     5.1 continue：继续停留在 planning；
+//     5.2 ask_user：打开 pending interaction，后续交给 interrupt 收口；
+//     5.3 plan_done：固化完整计划，刷新 pinned context，并进入 waiting_confirm。
 func RunPlanNode(ctx context.Context, input PlanNodeInput) error {
 	runtimeState, conversationContext, emitter, err := preparePlanNodeInput(input)
 	if err != nil {
@@ -63,8 +64,10 @@ func RunPlanNode(ctx context.Context, input PlanNodeInput) error {
 		return fmt.Errorf("规划阶段状态推送失败: %w", err)
 	}

-	// 2. 构造本轮规划输入，并要求模型输出结构化 PlanDecision。
+	// 2. 构造本轮规划输入。
 	messages := newagentprompt.BuildPlanMessages(flowState, conversationContext, input.UserInput)
+
+	// 3. Phase 1：快速评估（不开 thinking），让 LLM 同时产出复杂度评估和规划结果。
 	decision, rawResult, err := newagentllm.GenerateJSON[newagentmodel.PlanDecision](
 		ctx,
 		input.Client,
@@ -72,23 +75,60 @@ func RunPlanNode(ctx context.Context, input PlanNodeInput) error {
 		newagentllm.GenerateOptions{
 			Temperature: 0.2,
 			MaxTokens:   1600,
-			Thinking:    newagentllm.ThinkingModeEnabled,
+			Thinking:    newagentllm.ThinkingModeDisabled,
 			Metadata: map[string]any{
 				"stage": planStageName,
+				"phase": "assessment",
 			},
 		},
 	)
 	if err != nil {
 		if rawResult != nil && strings.TrimSpace(rawResult.Text) != "" {
-			return fmt.Errorf("规划输出解析失败，原始输出=%s，错误=%w", strings.TrimSpace(rawResult.Text), err)
+			return fmt.Errorf("规划评估解析失败，原始输出=%s，错误=%w", strings.TrimSpace(rawResult.Text), err)
 		}
-		return fmt.Errorf("规划阶段模型调用失败: %w", err)
+		return fmt.Errorf("规划评估阶段模型调用失败: %w", err)
 	}
 	if err := decision.Validate(); err != nil {
-		return fmt.Errorf("规划决策不合法: %w", err)
+		return fmt.Errorf("规划评估决策不合法: %w", err)
 	}

-	// 3. 若模型先对用户说了话，则先以伪流式推送，再写回 history，保证上下文连续。
+	// 4. Phase 2：若 LLM 自评需要深度思考且本轮规划已完成，则开启 thinking 重跑。
+	//    条件：NeedThinking=true + Action=plan_done → 说明 LLM 认为当前无 thinking 的计划质量不够。
+	//    其他 action（continue / ask_user）不需要 thinking，直接用 Phase 1 结果。
+	if decision.NeedThinking && decision.Action == newagentmodel.PlanActionDone {
+		if err := emitter.EmitStatus(
+			planStatusBlockID,
+			planStageName,
+			"deep_planning",
+			"正在深入思考，生成更完善的计划。",
+			false,
+		); err != nil {
+			return fmt.Errorf("深度规划状态推送失败: %w", err)
+		}
+
+		deepDecision, _, deepErr := newagentllm.GenerateJSON[newagentmodel.PlanDecision](
+			ctx,
+			input.Client,
+			messages,
+			newagentllm.GenerateOptions{
+				Temperature: 0.2,
+				MaxTokens:   3200,
+				Thinking:    newagentllm.ThinkingModeEnabled,
+				Metadata: map[string]any{
+					"stage": planStageName,
+					"phase": "deep_planning",
+				},
+			},
+		)
+		if deepErr == nil && deepDecision != nil {
+			if validateErr := deepDecision.Validate(); validateErr == nil {
+				decision = deepDecision
+			}
+		}
+		// 深度规划失败时静默降级到 Phase 1 结果，不中断流程。
+	}
+
+	// 5. 若模型先对用户说了话，则先以伪流式推送，再写回 history，保证上下文连续。
 	if strings.TrimSpace(decision.Speak) != "" {
 		if err := emitter.EmitPseudoAssistantText(
 			ctx,
@@ -102,7 +142,7 @@ func RunPlanNode(ctx context.Context, input PlanNodeInput) error {
 		conversationContext.AppendHistory(schema.AssistantMessage(decision.Speak, nil))
 	}

-	// 4. 按规划动作推进流程状态。
+	// 6. 按规划动作推进流程状态。
 	switch decision.Action {
 	case newagentmodel.PlanActionContinue:
 		flowState.Phase = newagentmodel.PhasePlanning