tests/gateway/test_auto_continue.py

"""Tests for the auto-continue feature (#4493).

When the gateway restarts mid-agent-work, the session transcript ends on a
tool result that the agent never processed.  The auto-continue logic detects
this and prepends a system note to the next user message so the model
finishes the interrupted work before addressing the new input.
"""

import pytest


def _simulate_auto_continue(agent_history: list, user_message: str) -> str:
    """Return the text the agent would receive once auto-continue has run.

    Stand-in for the injection step of _run_agent() in gateway/run.py, so
    the detection and the message rewrite can be exercised without starting
    a full gateway runner.

    Args:
        agent_history: Loaded session transcript as a list of message dicts.
        user_message: The newly arrived user text.

    Returns:
        ``user_message`` unchanged, unless the final transcript entry has
        ``role == "tool"``; in that case the interruption note, a blank
        line, and then ``user_message``.
    """
    # Nothing loaded means nothing can be pending.
    if not agent_history:
        return user_message

    # Only a dangling tool result marks an interrupted turn.
    if agent_history[-1].get("role") != "tool":
        return user_message

    interruption_note = (
        "[System note: Your previous turn was interrupted before you could "
        "process the last tool result(s). The conversation history contains "
        "tool outputs you haven't responded to yet. Please finish processing "
        "those results and summarize what was accomplished, then address the "
        "user's new message below.]\n\n"
    )
    return interruption_note + user_message


class TestAutoDetection:
    """Checks when the interruption note is, and is not, injected."""

    def test_trailing_tool_result_triggers_note(self):
        """A transcript ending on a tool result yields the note plus the user text."""
        pending_call = {"id": "call_1", "function": {"name": "terminal", "arguments": "{}"}}
        transcript = [
            {"role": "user", "content": "deploy the app"},
            {"role": "assistant", "content": None, "tool_calls": [pending_call]},
            {"role": "tool", "tool_call_id": "call_1", "content": "deployed successfully"},
        ]
        outcome = _simulate_auto_continue(transcript, "what happened?")
        for fragment in ("[System note:", "interrupted", "what happened?"):
            assert fragment in outcome

    def test_trailing_assistant_message_no_note(self):
        """A transcript ending on an assistant reply leaves the message untouched."""
        transcript = [
            {"role": "user", "content": "hello"},
            {"role": "assistant", "content": "Hi there!"},
        ]
        outcome = _simulate_auto_continue(transcript, "how are you?")
        assert "[System note:" not in outcome
        assert outcome == "how are you?"

    def test_empty_history_no_note(self):
        """With no transcript at all the message passes through as-is."""
        assert _simulate_auto_continue([], "hello") == "hello"

    def test_trailing_user_message_no_note(self):
        """Not expected in practice; guards against a false positive on role=user."""
        transcript = [{"role": "user", "content": "hello"}]
        outcome = _simulate_auto_continue(transcript, "hello again")
        assert outcome == "hello again"

    def test_multiple_tool_results_still_triggers(self):
        """Several consecutive tool results: the final entry is still role=tool."""
        search_call = {"id": "call_1", "function": {"name": "search", "arguments": "{}"}}
        read_call = {"id": "call_2", "function": {"name": "read", "arguments": "{}"}}
        transcript = [
            {"role": "user", "content": "search and read"},
            {"role": "assistant", "content": None, "tool_calls": [search_call, read_call]},
            {"role": "tool", "tool_call_id": "call_1", "content": "found it"},
            {"role": "tool", "tool_call_id": "call_2", "content": "file content here"},
        ]
        outcome = _simulate_auto_continue(transcript, "continue")
        assert "[System note:" in outcome

    def test_original_message_preserved_after_note(self):
        """The user's own text must be positioned after the injected note."""
        only_call = {"id": "c1", "function": {"name": "t", "arguments": "{}"}}
        transcript = [
            {"role": "assistant", "content": None, "tool_calls": [only_call]},
            {"role": "tool", "tool_call_id": "c1", "content": "done"},
        ]
        outcome = _simulate_auto_continue(transcript, "now do X")
        # Locate where the note closes and where the user text begins;
        # str.index raises if either marker is missing.
        note_end = outcome.index("]\n\n")
        user_msg_start = outcome.index("now do X")
        assert note_end < user_msg_start
feat: auto-continue interrupted agent work after gateway restart (#4493)

When the gateway restarts mid-agent-work, the session transcript ends on a tool result the agent never processed. Previously, the user had to type 'continue' or use /retry (which replays from scratch, losing all prior work).

Now, when the next user message arrives and the loaded history ends with role='tool', a system note is prepended:

[System note: Your previous turn was interrupted before you could process the last tool result(s). Please finish processing those results and summarize what was accomplished, then address the user's new message below.]

This is injected in _run_agent()'s run_sync closure, right before calling agent.run_conversation(). The agent sees the full history (including the pending tool results) and the system note, so it can summarize what was accomplished and then handle the user's new input.

Design decisions:
- No new session flags or schema changes — purely detects trailing tool messages in the loaded history
- Works for any restart scenario (clean, crash, SIGTERM, drain timeout) as long as the session wasn't suspended (suspended = fresh start)
- The user's actual message is preserved after the note
- If the session WAS suspended (unclean shutdown), the old history is abandoned and the user starts fresh — no false auto-continue

Also updates the shutdown notification message from 'Use /retry after restart to continue' to 'Send any message after restart to resume where it left off' — which is now accurate.

Test plan:
- 6 new auto-continue tests (trailing tool detection, no false positives for assistant/user/empty history, multi-tool, message preservation)
- All 13 restart drain tests pass (updated /retry assertion)

2026-04-14 16:55:30 -07:00			`"""Tests for the auto-continue feature (#4493).`

			`When the gateway restarts mid-agent-work, the session transcript ends on a`
			`tool result that the agent never processed. The auto-continue logic detects`
			`this and prepends a system note to the next user message so the model`
			`finishes the interrupted work before addressing the new input.`
			`"""`

			`import pytest`


			`def _simulate_auto_continue(agent_history: list, user_message: str) -> str:`
			`"""Reproduce the auto-continue injection logic from _run_agent().`

			`This mirrors the exact code in gateway/run.py so we can test the`
			`detection and message transformation without spinning up a full`
			`gateway runner.`
			`"""`
			`message = user_message`
			`if agent_history and agent_history[-1].get("role") == "tool":`
			`message = (`
			`"[System note: Your previous turn was interrupted before you could "`
			`"process the last tool result(s). The conversation history contains "`
			`"tool outputs you haven't responded to yet. Please finish processing "`
			`"those results and summarize what was accomplished, then address the "`
			`"user's new message below.]\n\n"`
			`+ message`
			`)`
			`return message`


			`class TestAutoDetection:`
			`"""Test that trailing tool results are correctly detected."""`

			`def test_trailing_tool_result_triggers_note(self):`
			`history = [`
			`{"role": "user", "content": "deploy the app"},`
			`{"role": "assistant", "content": None, "tool_calls": [`
			`{"id": "call_1", "function": {"name": "terminal", "arguments": "{}"}}`
			`]},`
			`{"role": "tool", "tool_call_id": "call_1", "content": "deployed successfully"},`
			`]`
			`result = _simulate_auto_continue(history, "what happened?")`
			`assert "[System note:" in result`
			`assert "interrupted" in result`
			`assert "what happened?" in result`

			`def test_trailing_assistant_message_no_note(self):`
			`history = [`
			`{"role": "user", "content": "hello"},`
			`{"role": "assistant", "content": "Hi there!"},`
			`]`
			`result = _simulate_auto_continue(history, "how are you?")`
			`assert "[System note:" not in result`
			`assert result == "how are you?"`

			`def test_empty_history_no_note(self):`
			`result = _simulate_auto_continue([], "hello")`
			`assert result == "hello"`

			`def test_trailing_user_message_no_note(self):`
			`"""Shouldn't happen in practice, but ensure no false positive."""`
			`history = [`
			`{"role": "user", "content": "hello"},`
			`]`
			`result = _simulate_auto_continue(history, "hello again")`
			`assert result == "hello again"`

			`def test_multiple_tool_results_still_triggers(self):`
			`"""Multiple tool calls in a row — last one is still role=tool."""`
			`history = [`
			`{"role": "user", "content": "search and read"},`
			`{"role": "assistant", "content": None, "tool_calls": [`
			`{"id": "call_1", "function": {"name": "search", "arguments": "{}"}},`
			`{"id": "call_2", "function": {"name": "read", "arguments": "{}"}},`
			`]},`
			`{"role": "tool", "tool_call_id": "call_1", "content": "found it"},`
			`{"role": "tool", "tool_call_id": "call_2", "content": "file content here"},`
			`]`
			`result = _simulate_auto_continue(history, "continue")`
			`assert "[System note:" in result`

			`def test_original_message_preserved_after_note(self):`
			`"""The user's actual message must appear after the system note."""`
			`history = [`
			`{"role": "assistant", "content": None, "tool_calls": [`
			`{"id": "c1", "function": {"name": "t", "arguments": "{}"}}`
			`]},`
			`{"role": "tool", "tool_call_id": "c1", "content": "done"},`
			`]`
			`result = _simulate_auto_continue(history, "now do X")`
			`# System note comes first, then user's message`
			`note_end = result.index("]\n\n")`
			`user_msg_start = result.index("now do X")`
			`assert user_msg_start > note_end`