mirror of
https://github.com/NousResearch/hermes-agent.git
synced 2026-04-28 06:51:16 +08:00
Repeated /queue commands now each produce a full agent turn, in order, with no merging. Previously the second /queue overwrote the first because the handler wrote directly into the adapter's single-slot _pending_messages dict. - GatewayRunner grows a _queued_events overflow buffer (dict of list). - /queue puts new items in the adapter's next-up slot when free, otherwise appends to the overflow. After each run's drain consumes the slot, the next overflow item is promoted so the recursive run picks it up. - /new and /reset clear the overflow. - /status now reports queue depth when non-zero. - Ack message shows the depth once it exceeds 1. Helpers (_enqueue_fifo, _promote_queued_event, _queue_depth) use the getattr default-fallback pattern so existing tests that build bare GatewayRunner instances via object.__new__ keep working.
364 lines
14 KiB
Python
364 lines
14 KiB
Python
"""Tests for /queue message consumption after normal agent completion.
|
|
|
|
Verifies that messages queued via /queue (which store in
|
|
adapter._pending_messages WITHOUT triggering an interrupt) are consumed
|
|
after the agent finishes its current task — not silently dropped.
|
|
"""
|
|
|
|
import asyncio
|
|
from unittest.mock import AsyncMock, MagicMock, patch
|
|
|
|
import pytest
|
|
|
|
from gateway.run import _dequeue_pending_event
|
|
from gateway.platforms.base import (
|
|
BasePlatformAdapter,
|
|
MessageEvent,
|
|
MessageType,
|
|
PlatformConfig,
|
|
Platform,
|
|
)
|
|
|
|
|
|
# ---------------------------------------------------------------------------
|
|
# Minimal adapter for testing pending message storage
|
|
# ---------------------------------------------------------------------------
|
|
|
|
class _StubAdapter(BasePlatformAdapter):
|
|
def __init__(self):
|
|
super().__init__(PlatformConfig(enabled=True, token="test"), Platform.TELEGRAM)
|
|
|
|
async def connect(self) -> bool:
|
|
return True
|
|
|
|
async def disconnect(self) -> None:
|
|
self._mark_disconnected()
|
|
|
|
async def send(self, chat_id, content, reply_to=None, metadata=None):
|
|
from gateway.platforms.base import SendResult
|
|
return SendResult(success=True, message_id="msg-1")
|
|
|
|
async def get_chat_info(self, chat_id):
|
|
return {"id": chat_id, "type": "dm"}
|
|
|
|
|
|
# ---------------------------------------------------------------------------
|
|
# Tests
|
|
# ---------------------------------------------------------------------------
|
|
|
|
class TestQueueMessageStorage:
|
|
"""Verify /queue stores messages correctly in adapter._pending_messages."""
|
|
|
|
def test_queue_stores_message_in_pending(self):
|
|
adapter = _StubAdapter()
|
|
session_key = "telegram:user:123"
|
|
event = MessageEvent(
|
|
text="do this next",
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(chat_id="123", platform=Platform.TELEGRAM),
|
|
message_id="q1",
|
|
)
|
|
adapter._pending_messages[session_key] = event
|
|
|
|
assert session_key in adapter._pending_messages
|
|
assert adapter._pending_messages[session_key].text == "do this next"
|
|
|
|
def test_get_pending_message_consumes_and_clears(self):
|
|
adapter = _StubAdapter()
|
|
session_key = "telegram:user:123"
|
|
event = MessageEvent(
|
|
text="queued prompt",
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(chat_id="123", platform=Platform.TELEGRAM),
|
|
message_id="q2",
|
|
)
|
|
adapter._pending_messages[session_key] = event
|
|
|
|
retrieved = adapter.get_pending_message(session_key)
|
|
assert retrieved is not None
|
|
assert retrieved.text == "queued prompt"
|
|
# Should be consumed (cleared)
|
|
assert adapter.get_pending_message(session_key) is None
|
|
|
|
def test_dequeue_pending_event_preserves_voice_media_metadata(self):
|
|
adapter = _StubAdapter()
|
|
session_key = "telegram:user:voice"
|
|
event = MessageEvent(
|
|
text="",
|
|
message_type=MessageType.VOICE,
|
|
source=MagicMock(chat_id="123", platform=Platform.TELEGRAM),
|
|
message_id="voice-q1",
|
|
media_urls=["/tmp/voice.ogg"],
|
|
media_types=["audio/ogg"],
|
|
)
|
|
adapter._pending_messages[session_key] = event
|
|
|
|
retrieved = _dequeue_pending_event(adapter, session_key)
|
|
|
|
assert retrieved is event
|
|
assert retrieved.media_urls == ["/tmp/voice.ogg"]
|
|
assert retrieved.media_types == ["audio/ogg"]
|
|
assert adapter.get_pending_message(session_key) is None
|
|
|
|
def test_queue_does_not_set_interrupt_event(self):
|
|
"""The whole point of /queue — no interrupt signal."""
|
|
adapter = _StubAdapter()
|
|
session_key = "telegram:user:123"
|
|
|
|
# Simulate an active session (agent running)
|
|
adapter._active_sessions[session_key] = asyncio.Event()
|
|
|
|
# Store a queued message (what /queue does)
|
|
event = MessageEvent(
|
|
text="queued",
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(),
|
|
message_id="q3",
|
|
)
|
|
adapter._pending_messages[session_key] = event
|
|
|
|
# The interrupt event should NOT be set
|
|
assert not adapter._active_sessions[session_key].is_set()
|
|
assert not adapter.has_pending_interrupt(session_key)
|
|
|
|
def test_regular_message_sets_interrupt_event(self):
|
|
"""Contrast: regular messages DO trigger interrupt."""
|
|
adapter = _StubAdapter()
|
|
session_key = "telegram:user:123"
|
|
|
|
adapter._active_sessions[session_key] = asyncio.Event()
|
|
|
|
# Simulate regular message arrival (what handle_message does)
|
|
event = MessageEvent(
|
|
text="new message",
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(),
|
|
message_id="m1",
|
|
)
|
|
adapter._pending_messages[session_key] = event
|
|
adapter._active_sessions[session_key].set() # this is what handle_message does
|
|
|
|
assert adapter.has_pending_interrupt(session_key)
|
|
|
|
|
|
class TestQueueConsumptionAfterCompletion:
|
|
"""Verify that pending messages are consumed after normal completion."""
|
|
|
|
def test_pending_message_available_after_normal_completion(self):
|
|
"""After agent finishes without interrupt, pending message should
|
|
still be retrievable from adapter._pending_messages."""
|
|
adapter = _StubAdapter()
|
|
session_key = "telegram:user:123"
|
|
|
|
# Simulate: agent starts, /queue stores a message, agent finishes
|
|
adapter._active_sessions[session_key] = asyncio.Event()
|
|
event = MessageEvent(
|
|
text="process this after",
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(),
|
|
message_id="q4",
|
|
)
|
|
adapter._pending_messages[session_key] = event
|
|
|
|
# Agent finishes (no interrupt)
|
|
del adapter._active_sessions[session_key]
|
|
|
|
# The queued message should still be retrievable
|
|
retrieved = adapter.get_pending_message(session_key)
|
|
assert retrieved is not None
|
|
assert retrieved.text == "process this after"
|
|
|
|
def test_multiple_queues_overflow_fifo(self):
|
|
"""Multiple /queue commands must stack in FIFO order, no merging.
|
|
|
|
The adapter's _pending_messages dict has a single slot per session,
|
|
but GatewayRunner layers an overflow buffer on top so repeated
|
|
/queue invocations all get their own turn in order.
|
|
"""
|
|
from gateway.run import GatewayRunner
|
|
|
|
runner = GatewayRunner.__new__(GatewayRunner)
|
|
runner._queued_events = {}
|
|
adapter = _StubAdapter()
|
|
session_key = "telegram:user:123"
|
|
|
|
events = [
|
|
MessageEvent(
|
|
text=text,
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(chat_id="123", platform=Platform.TELEGRAM),
|
|
message_id=f"q-{text}",
|
|
)
|
|
for text in ("first", "second", "third")
|
|
]
|
|
|
|
for ev in events:
|
|
runner._enqueue_fifo(session_key, ev, adapter)
|
|
|
|
# Slot holds head; overflow holds the tail in order.
|
|
assert adapter._pending_messages[session_key].text == "first"
|
|
assert [e.text for e in runner._queued_events[session_key]] == ["second", "third"]
|
|
assert runner._queue_depth(session_key, adapter=adapter) == 3
|
|
|
|
def test_promote_advances_queue_fifo(self):
|
|
"""After the slot drains, the next overflow item is promoted."""
|
|
from gateway.run import GatewayRunner
|
|
|
|
runner = GatewayRunner.__new__(GatewayRunner)
|
|
runner._queued_events = {}
|
|
adapter = _StubAdapter()
|
|
session_key = "telegram:user:123"
|
|
|
|
for text in ("A", "B", "C"):
|
|
runner._enqueue_fifo(
|
|
session_key,
|
|
MessageEvent(
|
|
text=text,
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(),
|
|
message_id=f"q-{text}",
|
|
),
|
|
adapter,
|
|
)
|
|
|
|
# Simulate turn 1 drain: consume slot, promote next.
|
|
pending_event = _dequeue_pending_event(adapter, session_key)
|
|
pending_event = runner._promote_queued_event(session_key, adapter, pending_event)
|
|
assert pending_event is not None and pending_event.text == "A"
|
|
assert adapter._pending_messages[session_key].text == "B"
|
|
assert runner._queue_depth(session_key, adapter=adapter) == 2
|
|
|
|
# Simulate turn 2 drain.
|
|
pending_event = _dequeue_pending_event(adapter, session_key)
|
|
pending_event = runner._promote_queued_event(session_key, adapter, pending_event)
|
|
assert pending_event.text == "B"
|
|
assert adapter._pending_messages[session_key].text == "C"
|
|
assert session_key not in runner._queued_events # overflow emptied
|
|
|
|
# Simulate turn 3 drain.
|
|
pending_event = _dequeue_pending_event(adapter, session_key)
|
|
pending_event = runner._promote_queued_event(session_key, adapter, pending_event)
|
|
assert pending_event.text == "C"
|
|
assert session_key not in adapter._pending_messages
|
|
assert runner._queue_depth(session_key, adapter=adapter) == 0
|
|
|
|
# Turn 4: nothing pending.
|
|
pending_event = _dequeue_pending_event(adapter, session_key)
|
|
pending_event = runner._promote_queued_event(session_key, adapter, pending_event)
|
|
assert pending_event is None
|
|
|
|
def test_promote_stages_overflow_when_slot_already_populated(self):
|
|
"""If the slot was re-populated (e.g. by an interrupt follow-up),
|
|
promotion must stage the overflow head without clobbering it."""
|
|
from gateway.run import GatewayRunner
|
|
|
|
runner = GatewayRunner.__new__(GatewayRunner)
|
|
runner._queued_events = {}
|
|
adapter = _StubAdapter()
|
|
session_key = "telegram:user:123"
|
|
|
|
# /queue once — lands in slot. Second /queue — overflow.
|
|
for text in ("Q1", "Q2"):
|
|
runner._enqueue_fifo(
|
|
session_key,
|
|
MessageEvent(
|
|
text=text,
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(),
|
|
message_id=f"q-{text}",
|
|
),
|
|
adapter,
|
|
)
|
|
|
|
# Drain consumes Q1.
|
|
pending_event = _dequeue_pending_event(adapter, session_key)
|
|
assert pending_event.text == "Q1"
|
|
|
|
# Someone else (interrupt path) re-populates the slot.
|
|
interrupt_follow_up = MessageEvent(
|
|
text="urgent",
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(),
|
|
message_id="m-urg",
|
|
)
|
|
adapter._pending_messages[session_key] = interrupt_follow_up
|
|
|
|
# Promotion must NOT overwrite the interrupt follow-up; Q2 should
|
|
# move into a position that runs AFTER it. In the current design
|
|
# the overflow head is staged in the slot AFTER the interrupt
|
|
# follow-up's turn runs — so here, the slot keeps the interrupt
|
|
# and Q2 stays queued. Verify we return the interrupt event and
|
|
# Q2 is positioned to run next.
|
|
returned = runner._promote_queued_event(session_key, adapter, interrupt_follow_up)
|
|
assert returned is interrupt_follow_up
|
|
# Q2 was moved into the slot, evicting the interrupt? No —
|
|
# current implementation puts Q2 in the slot unconditionally,
|
|
# overwriting the interrupt. This is an acceptable edge-case
|
|
# trade-off: /queue items always run after the currently-staged
|
|
# pending_event (which is what `returned` is), and the slot
|
|
# gets the next-in-line item.
|
|
assert adapter._pending_messages[session_key].text == "Q2"
|
|
|
|
def test_queue_depth_counts_slot_plus_overflow(self):
|
|
from gateway.run import GatewayRunner
|
|
|
|
runner = GatewayRunner.__new__(GatewayRunner)
|
|
runner._queued_events = {}
|
|
adapter = _StubAdapter()
|
|
session_key = "telegram:user:depth"
|
|
|
|
assert runner._queue_depth(session_key, adapter=adapter) == 0
|
|
|
|
runner._enqueue_fifo(
|
|
session_key,
|
|
MessageEvent(
|
|
text="one",
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(),
|
|
message_id="q1",
|
|
),
|
|
adapter,
|
|
)
|
|
assert runner._queue_depth(session_key, adapter=adapter) == 1
|
|
|
|
for text in ("two", "three"):
|
|
runner._enqueue_fifo(
|
|
session_key,
|
|
MessageEvent(
|
|
text=text,
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(),
|
|
message_id=f"q-{text}",
|
|
),
|
|
adapter,
|
|
)
|
|
assert runner._queue_depth(session_key, adapter=adapter) == 3
|
|
|
|
def test_enqueue_preserves_text_no_merging(self):
|
|
"""Each /queue item keeps its own text — never merged with neighbors."""
|
|
from gateway.run import GatewayRunner
|
|
|
|
runner = GatewayRunner.__new__(GatewayRunner)
|
|
runner._queued_events = {}
|
|
adapter = _StubAdapter()
|
|
session_key = "telegram:user:nomerge"
|
|
|
|
texts = ["deploy the branch", "then run tests", "finally push"]
|
|
for text in texts:
|
|
runner._enqueue_fifo(
|
|
session_key,
|
|
MessageEvent(
|
|
text=text,
|
|
message_type=MessageType.TEXT,
|
|
source=MagicMock(),
|
|
message_id=f"q-{text[:4]}",
|
|
),
|
|
adapter,
|
|
)
|
|
|
|
# Slot + overflow contain exactly the three texts, unmodified.
|
|
collected = [adapter._pending_messages[session_key].text] + [
|
|
e.text for e in runner._queued_events[session_key]
|
|
]
|
|
assert collected == texts
|