feat：新增 sequential 模型选择策略（按配置顺序优先选择）；fix：修复 Timing Gate 返回非法工具时仍默认 continue 的问题（改为按 no_reply 处理）

2026-04-27 10:53:13 +08:00
parent 859bbb9cbf
commit d32be4741a
7 changed files with 247 additions and 8 deletions
--- a/pytests/test_maisaka_timing_gate.py
+++ b/pytests/test_maisaka_timing_gate.py
@@ -0,0 +1,148 @@
+from datetime import datetime
+from types import SimpleNamespace
+
+import pytest
+
+from src.core.tooling import ToolExecutionResult
+from src.llm_models.payload_content.tool_option import ToolCall
+from src.maisaka.chat_loop_service import ChatResponse, MaisakaChatLoopService
+from src.maisaka.context_messages import AssistantMessage, TIMING_GATE_INVALID_TOOL_HINT_SOURCE
+from src.maisaka.reasoning_engine import MaisakaReasoningEngine
+
+
+def _build_chat_response(tool_calls: list[ToolCall]) -> ChatResponse:
+    return ChatResponse(
+        content="The model returned an invalid timing tool.",
+        tool_calls=tool_calls,
+        request_messages=[],
+        raw_message=AssistantMessage(
+            content="",
+            timestamp=datetime.now(),
+            source_kind="perception",
+        ),
+        selected_history_count=1,
+        tool_count=len(tool_calls),
+        prompt_tokens=10,
+        built_message_count=1,
+        completion_tokens=3,
+        total_tokens=13,
+        prompt_section=None,
+    )
+
+
+@pytest.mark.asyncio
+async def test_timing_gate_invalid_tool_defaults_to_no_reply(monkeypatch: pytest.MonkeyPatch) -> None:
+    runtime = SimpleNamespace(
+        _force_next_timing_continue=False,
+        _chat_history=[],
+        log_prefix="[test]",
+        stopped=False,
+    )
+
+    def _enter_stop_state() -> None:
+        runtime.stopped = True
+
+    runtime._enter_stop_state = _enter_stop_state
+    engine = MaisakaReasoningEngine(runtime)  # type: ignore[arg-type]
+
+    async def _fake_timing_gate_sub_agent(**kwargs: object) -> ChatResponse:
+        del kwargs
+        return _build_chat_response([
+            ToolCall(call_id="invalid-timing-tool", func_name="finish", args={}),
+        ])
+
+    async def _fail_invoke_tool_call(*args: object, **kwargs: object) -> None:
+        del args, kwargs
+        raise AssertionError("invalid timing tools must not be executed")
+
+    monkeypatch.setattr(engine, "_run_timing_gate_sub_agent", _fake_timing_gate_sub_agent)
+    monkeypatch.setattr(engine, "_invoke_tool_call", _fail_invoke_tool_call)
+
+    action, response, tool_results, tool_monitor_results = await engine._run_timing_gate(object())  # type: ignore[arg-type]
+
+    assert action == "no_reply"
+    assert response.tool_calls[0].func_name == "finish"
+    assert runtime.stopped is True
+    assert tool_monitor_results == []
+    assert len(runtime._chat_history) == 1
+    assert runtime._chat_history[0].source == TIMING_GATE_INVALID_TOOL_HINT_SOURCE
+    assert "finish" in runtime._chat_history[0].processed_plain_text
+    assert tool_results == [
+        "- no_reply [非法 Timing 工具]: 返回了 finish，已停止本轮并等待新消息",
+    ]
+
+
+def test_timing_gate_invalid_tool_hint_keeps_only_latest() -> None:
+    old_hint = SimpleNamespace(source=TIMING_GATE_INVALID_TOOL_HINT_SOURCE)
+    runtime = SimpleNamespace(_chat_history=[old_hint])
+    engine = MaisakaReasoningEngine(runtime)  # type: ignore[arg-type]
+
+    engine._append_timing_gate_invalid_tool_hint("finish")
+    engine._append_timing_gate_invalid_tool_hint("reply")
+
+    assert len(runtime._chat_history) == 1
+    hint_message = runtime._chat_history[0]
+    assert hint_message.source == TIMING_GATE_INVALID_TOOL_HINT_SOURCE
+    assert "reply" in hint_message.processed_plain_text
+    assert "finish" not in hint_message.processed_plain_text
+
+
+def test_timing_gate_invalid_tool_hint_only_visible_to_timing_gate() -> None:
+    runtime = SimpleNamespace(_chat_history=[])
+    engine = MaisakaReasoningEngine(runtime)  # type: ignore[arg-type]
+    engine._append_timing_gate_invalid_tool_hint("finish")
+    hint_message = runtime._chat_history[0]
+
+    timing_history = MaisakaChatLoopService._filter_history_for_request_kind(
+        [hint_message],
+        request_kind="timing_gate",
+    )
+    planner_history = MaisakaChatLoopService._filter_history_for_request_kind(
+        [hint_message],
+        request_kind="planner",
+    )
+
+    assert timing_history == [hint_message]
+    assert planner_history == []
+
+
+def test_finish_tool_is_not_written_back_to_history() -> None:
+    finish_call = ToolCall(call_id="finish-call", func_name="finish", args={})
+    reply_call = ToolCall(call_id="reply-call", func_name="reply", args={})
+    assistant_message = AssistantMessage(
+        content="当前不需要继续回复。",
+        timestamp=datetime.now(),
+        tool_calls=[finish_call, reply_call],
+    )
+    runtime = SimpleNamespace(_chat_history=[assistant_message])
+    engine = MaisakaReasoningEngine(runtime)  # type: ignore[arg-type]
+
+    engine._append_tool_execution_result(
+        finish_call,
+        ToolExecutionResult(
+            tool_name="finish",
+            success=True,
+            content="当前对话循环已结束本轮思考，等待新的消息到来。",
+        ),
+    )
+
+    assert runtime._chat_history == [assistant_message]
+    assert [tool_call.func_name for tool_call in assistant_message.tool_calls] == ["reply"]
+
+
+def test_finish_tool_removes_empty_assistant_history_message() -> None:
+    finish_call = ToolCall(call_id="finish-call", func_name="finish", args={})
+    assistant_message = AssistantMessage(
+        content="",
+        timestamp=datetime.now(),
+        tool_calls=[finish_call],
+    )
+    runtime = SimpleNamespace(_chat_history=[assistant_message])
+    engine = MaisakaReasoningEngine(runtime)  # type: ignore[arg-type]
+
+    engine._append_tool_execution_result(
+        finish_call,
+        ToolExecutionResult(tool_name="finish", success=True),
+    )
+
+    assert runtime._chat_history == []
--- a/src/config/config.py
+++ b/src/config/config.py
@@ -57,7 +57,7 @@ MODEL_CONFIG_PATH: Path = (CONFIG_DIR / "model_config.toml").resolve().absolute(
 LEGACY_ENV_PATH: Path = (PROJECT_ROOT / ".env").resolve().absolute()
 MMC_VERSION: str = "1.0.0"
 CONFIG_VERSION: str = "8.9.17"
-MODEL_CONFIG_VERSION: str = "1.14.2"
+MODEL_CONFIG_VERSION: str = "1.14.3"

 logger = get_logger("config")

--- a/src/config/model_configs.py
+++ b/src/config/model_configs.py
@@ -406,9 +406,10 @@ class TaskConfig(ConfigBase):
        json_schema_extra={
            "x-widget": "select",
            "x-icon": "shuffle",
+            "options": ["balance", "random", "sequential"],
        },
    )
-    """模型选择策略：balance（负载均衡）或 random（随机选择）"""
+    """模型选择策略：balance（负载均衡）、random（随机选择）或 sequential（按配置顺序优先选择）"""


 class ModelTaskConfig(ConfigBase):
--- a/src/llm_models/utils_model.py
+++ b/src/llm_models/utils_model.py
@@ -683,11 +683,16 @@ class LLMOrchestrator:

        ensure_configured_clients_loaded()

-        strategy = self.model_for_task.selection_strategy.lower()
+        strategy = self.model_for_task.selection_strategy.strip().lower()

        if strategy == "random":
            # 随机选择策略
            selected_model_name = random.choice(list(available_models.keys()))
+        elif strategy == "sequential":
+            # 顺序优先策略：按照配置顺序选择第一个尚未失败的模型。
+            selected_model_name = next(
+                model_name for model_name in self.model_for_task.model_list if model_name in available_models
+            )
        elif strategy == "balance":
            # 负载均衡策略：根据总tokens和惩罚值选择
            selected_model_name = min(
--- a/src/maisaka/chat_loop_service.py
+++ b/src/maisaka/chat_loop_service.py
@@ -32,6 +32,7 @@ from .builtin_tool import get_builtin_tools
 from .context_messages import (
    AssistantMessage,
    LLMContextMessage,
+    TIMING_GATE_INVALID_TOOL_HINT_SOURCE,
    ToolResultMessage,
    build_llm_message_from_context,
 )
@@ -704,6 +705,15 @@ class MaisakaChatLoopService:
    ) -> List[LLMContextMessage]:
        """按请求类型过滤不应暴露的历史工具链。"""

+        if request_kind == "timing_gate":
+            return selected_history
+
+        selected_history = [
+            message
+            for message in selected_history
+            if message.source != TIMING_GATE_INVALID_TOOL_HINT_SOURCE
+        ]
+
        if request_kind != "planner":
            return selected_history

--- a/src/maisaka/context_messages.py
+++ b/src/maisaka/context_messages.py
@@ -29,6 +29,7 @@ from src.llm_models.payload_content.tool_option import ToolCall
 from .message_adapter import parse_speaker_content

 FORWARD_PREVIEW_LIMIT = 4
+TIMING_GATE_INVALID_TOOL_HINT_SOURCE = "timing_gate_invalid_tool_hint"


 def _guess_image_format(image_bytes: bytes) -> Optional[str]:
--- a/src/maisaka/reasoning_engine.py
+++ b/src/maisaka/reasoning_engine.py
@@ -11,7 +11,7 @@ import traceback

 from src.chat.heart_flow.heartFC_utils import CycleDetail
 from src.chat.message_receive.message import SessionMessage
-from src.common.data_models.message_component_data_model import EmojiComponent, ImageComponent, MessageSequence
+from src.common.data_models.message_component_data_model import EmojiComponent, ImageComponent, MessageSequence, TextComponent
 from src.common.logger import get_logger
 from src.common.prompt_i18n import load_prompt
 from src.core.tooling import ToolAvailabilityContext, ToolExecutionContext, ToolExecutionResult, ToolInvocation, ToolSpec
@@ -31,6 +31,7 @@ from .context_messages import (
    ComplexSessionMessage,
    LLMContextMessage,
    SessionBackedMessage,
+    TIMING_GATE_INVALID_TOOL_HINT_SOURCE,
    ToolResultMessage,
    contains_complex_message,
 )
@@ -54,6 +55,7 @@ logger = get_logger("maisaka_reasoning_engine")
 TIMING_GATE_CONTEXT_LIMIT = 24
 TIMING_GATE_MAX_TOKENS = 384
 TIMING_GATE_TOOL_NAMES = {"continue", "no_reply", "wait"}
+HISTORY_SILENT_TOOL_NAMES = {"finish"}


 class MaisakaReasoningEngine:
@@ -259,8 +261,21 @@ class MaisakaReasoningEngine:
                break

        if selected_tool_call is None:
-            logger.warning(f"{self._runtime.log_prefix} Timing Gate 未返回有效控制工具，默认继续执行 Action Loop")
-            return "continue", response, tool_result_summaries, tool_monitor_results
+            invalid_tool_names = [
+                str(tool_call.func_name).strip()
+                for tool_call in response.tool_calls
+                if str(tool_call.func_name).strip()
+            ]
+            invalid_tool_text = "、".join(invalid_tool_names) if invalid_tool_names else "无工具"
+            logger.warning(
+                f"{self._runtime.log_prefix} Timing Gate 未返回有效控制工具：{invalid_tool_text}，将按 no_reply 处理"
+            )
+            self._append_timing_gate_invalid_tool_hint(invalid_tool_text)
+            self._runtime._enter_stop_state()
+            tool_result_summaries.append(
+                f"- no_reply [非法 Timing 工具]: 返回了 {invalid_tool_text}，已停止本轮并等待新消息"
+            )
+            return "no_reply", response, tool_result_summaries, tool_monitor_results

        append_history = False
        store_record = selected_tool_call.func_name != "continue"
@@ -286,9 +301,13 @@ class MaisakaReasoningEngine:
        timing_action = str(result.metadata.get("timing_action") or selected_tool_call.func_name).strip()
        if timing_action not in TIMING_GATE_TOOL_NAMES:
            logger.warning(
-                f"{self._runtime.log_prefix} Timing Gate 返回未知动作 {timing_action!r}，将按 continue 处理"
+                f"{self._runtime.log_prefix} Timing Gate 返回未知动作 {timing_action!r}，将按 no_reply 处理"
            )
-            return "continue", response, tool_result_summaries, tool_monitor_results
+            self._runtime._enter_stop_state()
+            tool_result_summaries.append(
+                f"- no_reply [未知 Timing 动作]: 返回了 {timing_action!r}，已停止本轮并等待新消息"
+            )
+            return "no_reply", response, tool_result_summaries, tool_monitor_results
        return timing_action, response, tool_result_summaries, tool_monitor_results

    def _build_forced_continue_timing_result(
@@ -324,6 +343,29 @@ class MaisakaReasoningEngine:
            [],
        )

+    def _append_timing_gate_invalid_tool_hint(self, invalid_tool_text: str) -> None:
+        """写入一条仅 Timing Gate 可见的非法工具提示，并保证最多保留最新一条。"""
+
+        self._runtime._chat_history = [
+            message
+            for message in self._runtime._chat_history
+            if message.source != TIMING_GATE_INVALID_TOOL_HINT_SOURCE
+        ]
+        normalized_tool_text = invalid_tool_text.strip() or "无工具"
+        hint_content = (
+            "Timing Gate 上一轮选择了非法工具："
+            f"{normalized_tool_text}。\n"
+            "Timing Gate 只能调用 continue、wait 或 no_reply 中的一个工具。"
+        )
+        self._runtime._chat_history.append(
+            SessionBackedMessage(
+                raw_message=MessageSequence([TextComponent(hint_content)]),
+                visible_text=hint_content,
+                timestamp=datetime.now(),
+                source_kind=TIMING_GATE_INVALID_TOOL_HINT_SOURCE,
+            )
+        )
+
    @staticmethod
    def _mark_timing_gate_completed(timing_action: str) -> bool:
        """根据门控动作决定下一轮是否还需要重新执行 timing。"""
@@ -1210,6 +1252,10 @@ class MaisakaReasoningEngine:
            result: 统一工具执行结果。
        """

+        if tool_call.func_name in HISTORY_SILENT_TOOL_NAMES:
+            self._remove_tool_call_from_history(tool_call)
+            return
+
        history_content = result.get_history_content()
        if not history_content:
            history_content = "工具执行成功。" if result.success else f"工具 {tool_call.func_name} 执行失败。"
@@ -1224,6 +1270,34 @@ class MaisakaReasoningEngine:
            )
        )

+    def _remove_tool_call_from_history(self, tool_call: ToolCall) -> None:
+        """从历史里的 assistant 消息中移除控制类工具调用。"""
+
+        tool_call_id = str(tool_call.call_id or "").strip()
+        if not tool_call_id:
+            return
+
+        for index in range(len(self._runtime._chat_history) - 1, -1, -1):
+            message = self._runtime._chat_history[index]
+            if not isinstance(message, AssistantMessage) or not message.tool_calls:
+                continue
+
+            remaining_tool_calls = [
+                existing_tool_call
+                for existing_tool_call in message.tool_calls
+                if str(existing_tool_call.call_id or "").strip() != tool_call_id
+            ]
+            if len(remaining_tool_calls) == len(message.tool_calls):
+                continue
+
+            if remaining_tool_calls:
+                message.tool_calls = remaining_tool_calls
+            elif message.content.strip():
+                message.tool_calls = []
+            else:
+                del self._runtime._chat_history[index]
+            return
+
    def _append_timing_gate_execution_result(
        self,
        response: ChatResponse,