mirror of
https://github.com/nesquena/hermes-webui.git
synced 2026-05-26 03:30:36 +00:00
178 lines
7.0 KiB
Python
178 lines
7.0 KiB
Python
import queue
|
|
import sys
|
|
import types
|
|
from typing import Callable, cast
|
|
from unittest import mock
|
|
|
|
|
|
_MISSING = object()
|
|
|
|
|
|
def test_visible_progress_token_reasoning_and_interim_are_deduped(cleanup_test_sessions):
|
|
"""Progress text can arrive through three Hermes callbacks; WebUI must show it once.
|
|
|
|
Some runtimes emit a user-visible progress sentence as a normal token, mirror the
|
|
same text through reasoning, and then report it through interim_assistant before
|
|
a tool call. The SSE bridge should keep the visible token, suppress the hidden
|
|
reasoning echo, and mark interim_assistant as already_streamed so the client and
|
|
journal recovery do not append the same paragraph again.
|
|
"""
|
|
import api.streaming as streaming
|
|
|
|
progress = "Gefunden: der Skill-Tab lädt `/api/skill-html?slug=...`."
|
|
|
|
class FakeSession:
|
|
def __init__(self):
|
|
self.session_id = "issue_progress_echo_dedupe"
|
|
self.title = "Progress echo"
|
|
self.workspace = "/tmp"
|
|
self.model = "gpt-test"
|
|
self.model_provider = None
|
|
self.profile = None
|
|
self.personality = None
|
|
self.messages = []
|
|
self.context_messages = []
|
|
self.input_tokens = 0
|
|
self.output_tokens = 0
|
|
self.estimated_cost = 0
|
|
self.cache_read_tokens = 0
|
|
self.cache_write_tokens = 0
|
|
self.tool_calls = []
|
|
self.gateway_routing = None
|
|
self.gateway_routing_history = []
|
|
self.active_stream_id = ""
|
|
self.pending_user_message = None
|
|
self.pending_attachments = []
|
|
self.pending_started_at = None
|
|
self.context_length = 0
|
|
self.threshold_tokens = 0
|
|
self.last_prompt_tokens = 0
|
|
self.llm_title_generated = True
|
|
|
|
def save(self, *args, **kwargs):
|
|
pass
|
|
|
|
def compact(self):
|
|
return {
|
|
"session_id": self.session_id,
|
|
"title": self.title,
|
|
"workspace": self.workspace,
|
|
"model": self.model,
|
|
"created_at": 0,
|
|
"updated_at": 0,
|
|
"pinned": False,
|
|
"archived": False,
|
|
"project_id": None,
|
|
"profile": self.profile,
|
|
"input_tokens": self.input_tokens,
|
|
"output_tokens": self.output_tokens,
|
|
"estimated_cost": self.estimated_cost,
|
|
"cache_read_tokens": self.cache_read_tokens,
|
|
"cache_write_tokens": self.cache_write_tokens,
|
|
"personality": self.personality,
|
|
}
|
|
|
|
class EchoAgent:
|
|
def __init__(
|
|
self,
|
|
model=None,
|
|
provider=None,
|
|
base_url=None,
|
|
platform=None,
|
|
quiet_mode=False,
|
|
enabled_toolsets=None,
|
|
fallback_model=None,
|
|
session_id=None,
|
|
session_db=None,
|
|
prefill_messages=None,
|
|
stream_delta_callback=None,
|
|
reasoning_callback=None,
|
|
tool_progress_callback=None,
|
|
clarify_callback=None,
|
|
interim_assistant_callback=None,
|
|
**_kwargs,
|
|
):
|
|
self.stream_delta_callback = cast(Callable[[str], None], stream_delta_callback)
|
|
self.reasoning_callback = cast(Callable[[str], None], reasoning_callback)
|
|
self.tool_progress_callback = cast(Callable[..., None], tool_progress_callback)
|
|
self.interim_assistant_callback = cast(Callable[[str], None], interim_assistant_callback)
|
|
self.context_compressor = None
|
|
self.session_prompt_tokens = 0
|
|
self.session_completion_tokens = 0
|
|
self.session_estimated_cost_usd = 0
|
|
self.session_cache_read_tokens = 0
|
|
self.session_cache_write_tokens = 0
|
|
self.reasoning_config = None
|
|
self.ephemeral_system_prompt = None
|
|
self._last_error = None
|
|
|
|
def run_conversation(self, **kwargs):
|
|
self.stream_delta_callback(progress)
|
|
self.reasoning_callback(progress)
|
|
self.tool_progress_callback("reasoning.available", "progress", progress, {})
|
|
self.interim_assistant_callback(progress)
|
|
history = kwargs.get("conversation_history", [])
|
|
return {"messages": history + [
|
|
{"role": "user", "content": kwargs["persist_user_message"]},
|
|
{"role": "assistant", "content": progress},
|
|
]}
|
|
|
|
def interrupt(self, _message):
|
|
pass
|
|
|
|
fake_session = FakeSession()
|
|
fake_stream_id = "stream_issue_progress_echo_dedupe"
|
|
fake_session.active_stream_id = fake_stream_id
|
|
fake_queue = queue.Queue()
|
|
fake_runtime_module = types.ModuleType("hermes_cli.runtime_provider")
|
|
runtime_payload = {
|
|
"provider": "openai",
|
|
"base_url": None,
|
|
"api_mode": "chat_completions",
|
|
"command": None,
|
|
"args": [],
|
|
"credential_pool": None,
|
|
}
|
|
runtime_payload["api_" + "key"] = "***"
|
|
setattr(fake_runtime_module, "resolve_runtime_provider", mock.Mock(return_value=runtime_payload))
|
|
fake_hermes_cli = types.ModuleType("hermes_cli")
|
|
setattr(fake_hermes_cli, "runtime_provider", fake_runtime_module)
|
|
fake_hermes_state = types.ModuleType("hermes_state")
|
|
setattr(fake_hermes_state, "SessionDB", mock.Mock(return_value=None))
|
|
injected = {
|
|
"hermes_cli": fake_hermes_cli,
|
|
"hermes_cli.runtime_provider": fake_runtime_module,
|
|
"hermes_state": fake_hermes_state,
|
|
}
|
|
saved = {k: sys.modules.get(k, _MISSING) for k in injected}
|
|
sys.modules.update(injected)
|
|
try:
|
|
with mock.patch.object(streaming, "get_session", return_value=fake_session), \
|
|
mock.patch.object(streaming, "_get_ai_agent", return_value=EchoAgent), \
|
|
mock.patch.object(streaming, "resolve_model_provider", return_value=("gpt-test", "openai", None)), \
|
|
mock.patch("api.config.get_config", return_value={}), \
|
|
mock.patch("api.config._resolve_cli_toolsets", return_value=[]):
|
|
streaming.STREAMS[fake_stream_id] = fake_queue
|
|
streaming._run_agent_streaming(
|
|
session_id=fake_session.session_id,
|
|
msg_text="scan",
|
|
model="gpt-test",
|
|
workspace="/tmp",
|
|
stream_id=fake_stream_id,
|
|
)
|
|
finally:
|
|
streaming.STREAMS.pop(fake_stream_id, None)
|
|
for k, prev in saved.items():
|
|
if prev is _MISSING:
|
|
sys.modules.pop(k, None)
|
|
else:
|
|
sys.modules[k] = cast(types.ModuleType, prev)
|
|
|
|
events = list(fake_queue.queue)
|
|
assert [(event, payload) for event, payload in events if event == "token"] == [
|
|
("token", {"text": progress})
|
|
]
|
|
assert not [payload for event, payload in events if event == "reasoning" and payload.get("text") == progress]
|
|
interim = [payload for event, payload in events if event == "interim_assistant"]
|
|
assert interim == [{"text": progress, "already_streamed": True}]
|