mirror of
https://github.com/nesquena/hermes-webui.git
synced 2026-05-24 02:36:27 +00:00
418 lines
22 KiB
Python
418 lines
22 KiB
Python
"""Regression checks for #856 background completion unread markers."""
|
|
|
|
from pathlib import Path
|
|
|
|
|
|
REPO = Path(__file__).resolve().parent.parent
|
|
SESSIONS_JS = (REPO / "static" / "sessions.js").read_text(encoding="utf-8")
|
|
MESSAGES_JS = (REPO / "static" / "messages.js").read_text(encoding="utf-8")
|
|
|
|
|
|
def _done_block() -> str:
|
|
start = MESSAGES_JS.find("source.addEventListener('done'")
|
|
assert start != -1, "done handler not found in messages.js"
|
|
end = MESSAGES_JS.find("source.addEventListener('stream_end'", start)
|
|
assert end != -1, "stream_end handler not found after done handler"
|
|
return MESSAGES_JS[start:end]
|
|
|
|
|
|
def _sessions_function_block(name: str, next_name: str) -> str:
|
|
start = SESSIONS_JS.find(f"function {name}")
|
|
assert start != -1, f"{name} not found in sessions.js"
|
|
end = SESSIONS_JS.find(f"function {next_name}", start)
|
|
assert end != -1, f"{next_name} not found after {name}"
|
|
return SESSIONS_JS[start:end]
|
|
|
|
|
|
def test_background_completion_unread_uses_explicit_marker_not_message_delta():
|
|
"""A background completion must stay unread even when message_count has no delta."""
|
|
assert "SESSION_COMPLETION_UNREAD_KEY = 'hermes-session-completion-unread'" in SESSIONS_JS
|
|
assert "function _markSessionCompletionUnread(" in SESSIONS_JS
|
|
assert "function _clearSessionCompletionUnread(" in SESSIONS_JS
|
|
assert "function _hasSessionCompletionUnread(" in SESSIONS_JS
|
|
|
|
has_unread_idx = SESSIONS_JS.find("function _hasUnreadForSession(s)")
|
|
assert has_unread_idx != -1, "_hasUnreadForSession not found"
|
|
has_unread_block = SESSIONS_JS[has_unread_idx:SESSIONS_JS.find("async function newSession", has_unread_idx)]
|
|
|
|
marker_idx = has_unread_block.find("_hasSessionCompletionUnread(s.session_id)")
|
|
count_idx = has_unread_block.find("s.message_count > Number")
|
|
assert marker_idx != -1, "_hasUnreadForSession must check explicit completion unread marker"
|
|
assert count_idx != -1, "_hasUnreadForSession must keep the existing message_count fallback"
|
|
assert marker_idx < count_idx, (
|
|
"explicit completion unread marker must be checked before message_count delta, "
|
|
"because completed streams can have viewed_count == message_count"
|
|
)
|
|
|
|
|
|
def test_background_done_sets_marker_when_session_not_actively_viewed():
|
|
done_block = _done_block()
|
|
assert "const isSessionViewed=_isSessionActivelyViewed(activeSid);" in done_block
|
|
assert "const completedSession=d.session||{session_id:activeSid};" in done_block
|
|
assert "const completedSid=completedSession.session_id||activeSid;" in done_block
|
|
assert "if(!isSessionViewed && typeof _markSessionCompletionUnread==='function')" in done_block
|
|
assert "_markSessionCompletionUnread(completedSid, completedSession.message_count);" in done_block
|
|
|
|
|
|
def test_background_done_uses_rotated_session_id_for_completion_unread():
|
|
done_block = _done_block()
|
|
|
|
completed_sid_idx = done_block.find("const completedSid=completedSession.session_id||activeSid;")
|
|
marker_idx = done_block.find("_markSessionCompletionUnread(completedSid, completedSession.message_count);")
|
|
viewed_idx = done_block.find("_markSessionViewed(completedSid, completedSession.message_count")
|
|
|
|
assert completed_sid_idx != -1, "done handler must derive the final post-compression session id"
|
|
assert marker_idx != -1, "background completion marker must be stored on the final session id"
|
|
assert viewed_idx != -1, "visible completions must mark the final session id as read"
|
|
assert completed_sid_idx < marker_idx < viewed_idx, (
|
|
"context compression can rotate session_id before done; unread/read state must "
|
|
"attach to the visible final row, not the old SSE activeSid"
|
|
)
|
|
|
|
|
|
def test_done_event_updates_sidebar_cache_immediately_after_completion_marker():
|
|
done_block = _done_block()
|
|
|
|
marker_idx = done_block.find("_markSessionCompletionUnread(completedSid")
|
|
cleanup_idx = done_block.find("_clearOwnerInflightState();")
|
|
if cleanup_idx == -1:
|
|
cleanup_idx = done_block.find("delete INFLIGHT[activeSid];")
|
|
cache_idx = done_block.find("_markSessionCompletedInList(completedSession, activeSid);")
|
|
refresh_idx = done_block.find("renderSessionList();", cache_idx)
|
|
sound_idx = done_block.find("playNotificationSound();", cache_idx)
|
|
|
|
assert "function _markSessionCompletedInList(" in SESSIONS_JS
|
|
assert marker_idx != -1, "done handler must write the completion-unread marker first"
|
|
assert cleanup_idx != -1, "done handler must clear local INFLIGHT before rendering idle state"
|
|
assert cache_idx != -1, "done handler must update the sidebar cache immediately"
|
|
assert refresh_idx != -1 and sound_idx != -1
|
|
assert marker_idx < cleanup_idx < cache_idx < refresh_idx < sound_idx, (
|
|
"the sidebar should flip from spinner to dot from the done payload before "
|
|
"waiting for /api/sessions or playing the completion cue"
|
|
)
|
|
|
|
|
|
def test_sidebar_cache_completion_handles_compression_session_rotation():
|
|
helper_block = _sessions_function_block(
|
|
"_markSessionCompletedInList",
|
|
"_markPollingCompletionUnreadTransitions",
|
|
)
|
|
|
|
assert "function _markSessionCompletedInList(session, previousSid = null)" in helper_block
|
|
assert "const finalSid = session.session_id || previousSid;" in helper_block
|
|
assert "s.session_id === finalSid || s.session_id === previousSid" in helper_block
|
|
assert "const {messages: _messages, tool_calls: _toolCalls, ...sessionMeta} = session;" in helper_block
|
|
assert "...sessionMeta" in helper_block
|
|
assert "session_id: finalSid" in helper_block
|
|
assert "_sessionStreamingById.set(finalSid, false);" in helper_block
|
|
assert "if (previousSid && previousSid !== finalSid)" in helper_block
|
|
assert "_sessionStreamingById.delete(previousSid);" in helper_block
|
|
assert "_sessionListSnapshotById.delete(previousSid);" in helper_block
|
|
|
|
|
|
def test_polling_transition_marks_completion_unread_without_sse_done():
|
|
transition_block = _sessions_function_block(
|
|
"_markPollingCompletionUnreadTransitions",
|
|
"newSession",
|
|
)
|
|
effective_block = _sessions_function_block(
|
|
"_isSessionEffectivelyStreaming",
|
|
"_markPollingCompletionUnreadTransitions",
|
|
)
|
|
render_idx = SESSIONS_JS.find("async function renderSessionList()")
|
|
assert render_idx != -1, "renderSessionList not found"
|
|
render_block = SESSIONS_JS[render_idx:SESSIONS_JS.find("// ── Gateway session SSE", render_idx)]
|
|
|
|
assert "const _sessionStreamingById = new Map();" in SESSIONS_JS
|
|
assert "const wasStreaming = _sessionStreamingById.get(sid);" in transition_block
|
|
assert "const isStreaming = _isSessionEffectivelyStreaming(s);" in transition_block
|
|
assert "s.is_streaming || _isSessionLocallyStreaming(s)" in effective_block
|
|
assert "wasStreaming === true && !isStreaming" in transition_block, (
|
|
"polling fallback must only fire on an observed streaming -> stopped transition"
|
|
)
|
|
assert "_markSessionCompletionUnread(sid, s.message_count);" in transition_block
|
|
assert "_sessionStreamingById.set(sid, isStreaming);" in transition_block
|
|
assert "_markPollingCompletionUnreadTransitions(_allSessions);" in render_block
|
|
|
|
|
|
def test_polling_transition_does_not_mark_historical_first_render():
|
|
transition_block = _sessions_function_block(
|
|
"_markPollingCompletionUnreadTransitions",
|
|
"newSession",
|
|
)
|
|
|
|
assert "wasStreaming === true && !isStreaming" in transition_block
|
|
assert "wasStreaming && !isStreaming" not in transition_block, (
|
|
"first-render undefined state must not be treated as a completed stream"
|
|
)
|
|
mark_idx = transition_block.find("_markSessionCompletionUnread(sid")
|
|
set_idx = transition_block.find("_sessionStreamingById.set(sid, isStreaming)")
|
|
assert mark_idx != -1 and set_idx != -1 and mark_idx < set_idx, (
|
|
"the current render should seed streaming state only after checking for "
|
|
"a prior observed streaming state"
|
|
)
|
|
|
|
|
|
def test_polling_transition_skips_visible_focused_active_session():
|
|
helper_block = _sessions_function_block(
|
|
"_isSessionActivelyViewedForList",
|
|
"_markPollingCompletionUnreadTransitions",
|
|
)
|
|
transition_block = _sessions_function_block(
|
|
"_markPollingCompletionUnreadTransitions",
|
|
"newSession",
|
|
)
|
|
|
|
assert "S.session.session_id !== sid" in helper_block
|
|
assert "_loadingSessionId !== sid" in helper_block
|
|
assert "document.visibilityState !== 'visible'" in helper_block
|
|
assert "!document.hasFocus()" in helper_block
|
|
assert "!_isSessionActivelyViewedForList(sid)" in transition_block, (
|
|
"polling fallback must not create an unread marker for a session the "
|
|
"user is visibly and focusedly reading"
|
|
)
|
|
|
|
|
|
def test_polling_transition_tracks_the_same_effective_streaming_state_as_sidebar():
|
|
local_block = _sessions_function_block(
|
|
"_isSessionLocallyStreaming",
|
|
"_isSessionEffectivelyStreaming",
|
|
)
|
|
effective_block = _sessions_function_block(
|
|
"_isSessionEffectivelyStreaming",
|
|
"_markPollingCompletionUnreadTransitions",
|
|
)
|
|
render_idx = SESSIONS_JS.find("function _renderOneSession")
|
|
assert render_idx != -1, "_renderOneSession not found"
|
|
render_block = SESSIONS_JS[render_idx:SESSIONS_JS.find("const hasUnread=", render_idx)]
|
|
|
|
assert "isActive && Boolean(S.busy)" in local_block
|
|
assert "INFLIGHT && INFLIGHT[s.session_id]" not in local_block
|
|
assert "s.is_streaming || _isSessionLocallyStreaming(s)" in effective_block
|
|
assert "const isStreaming=_isSessionEffectivelyStreaming(s);" in render_block, (
|
|
"the row spinner and polling completion transition must use the same "
|
|
"effective streaming source, including local INFLIGHT-only streams"
|
|
)
|
|
|
|
|
|
def test_cache_render_seeds_streaming_transition_state_for_visible_spinners():
|
|
remember_block = _sessions_function_block(
|
|
"_rememberRenderedStreamingState",
|
|
"_rememberRenderedSessionSnapshot",
|
|
)
|
|
render_idx = SESSIONS_JS.find("function _renderOneSession")
|
|
assert render_idx != -1, "_renderOneSession not found"
|
|
render_block = SESSIONS_JS[render_idx:SESSIONS_JS.find("const hasUnread=", render_idx)]
|
|
|
|
assert "if (!s || !s.session_id || !isStreaming) return;" in remember_block
|
|
assert "_sessionStreamingById.set(s.session_id, true);" in remember_block
|
|
assert "const isStreaming=_isSessionEffectivelyStreaming(s);" in render_block
|
|
assert "_rememberRenderedStreamingState(s, isStreaming);" in render_block, (
|
|
"renderSessionListFromCache can display a spinner from local INFLIGHT "
|
|
"state before a full poll runs, so it must seed the transition map too"
|
|
)
|
|
|
|
|
|
def test_polling_transition_marks_completion_when_long_running_stream_snapshot_advances():
|
|
transition_block = _sessions_function_block(
|
|
"_markPollingCompletionUnreadTransitions",
|
|
"newSession",
|
|
)
|
|
render_idx = SESSIONS_JS.find("function _renderOneSession")
|
|
assert render_idx != -1, "_renderOneSession not found"
|
|
render_block = SESSIONS_JS[render_idx:SESSIONS_JS.find("const hasUnread=", render_idx)]
|
|
|
|
assert "const _sessionListSnapshotById = new Map();" in SESSIONS_JS
|
|
assert "SESSION_OBSERVED_STREAMING_KEY = 'hermes-session-observed-streaming'" in SESSIONS_JS
|
|
assert "function _rememberObservedStreamingSession(" in SESSIONS_JS
|
|
assert "function _forgetObservedStreamingSession(" in SESSIONS_JS
|
|
assert "const previousSnapshot = _sessionListSnapshotById.get(sid);" in transition_block
|
|
assert "const observedStreaming = _getSessionObservedStreaming()[sid];" in transition_block
|
|
assert "const completedWithNewMessages = Boolean(" in transition_block
|
|
assert "(previousSnapshot || observedStreaming)" in transition_block
|
|
assert "messageCount > Number((previousSnapshot || observedStreaming).message_count || 0)" in transition_block
|
|
assert "lastMessageAt > Number((previousSnapshot || observedStreaming).last_message_at || 0)" in transition_block
|
|
assert "const completedPersistedObservedStream = Boolean(observedStreaming && !isStreaming);" in transition_block
|
|
assert "completedObservedStream || completedPersistedObservedStream || completedWithNewMessages" in transition_block
|
|
assert "_sessionListSnapshotById.set(sid, {" in transition_block
|
|
assert "_rememberRenderedSessionSnapshot(s);" in render_block, (
|
|
"a visible sidebar spinner can outlive the original SSE context for "
|
|
"long-running tasks, so rendered rows must seed the message snapshot "
|
|
"used by the polling fallback"
|
|
)
|
|
|
|
|
|
def test_polling_snapshot_fallback_does_not_mark_first_seen_historical_sessions():
|
|
transition_block = _sessions_function_block(
|
|
"_markPollingCompletionUnreadTransitions",
|
|
"newSession",
|
|
)
|
|
|
|
prev_idx = transition_block.find("const previousSnapshot = _sessionListSnapshotById.get(sid);")
|
|
fallback_idx = transition_block.find("const completedWithNewMessages = Boolean(")
|
|
mark_idx = transition_block.find("_markSessionCompletionUnread(sid")
|
|
snapshot_set_idx = transition_block.find("_sessionListSnapshotById.set(sid, {")
|
|
|
|
assert prev_idx != -1 and fallback_idx != -1 and mark_idx != -1 and snapshot_set_idx != -1
|
|
assert "(previousSnapshot || observedStreaming)\n && !isStreaming" in transition_block, (
|
|
"snapshot-delta fallback must require a previous in-memory or persisted "
|
|
"observation so old completed sessions do not become unread on first render"
|
|
)
|
|
assert prev_idx < fallback_idx < mark_idx < snapshot_set_idx, (
|
|
"the old snapshot must be checked before writing the current snapshot"
|
|
)
|
|
|
|
|
|
def test_rendered_streaming_rows_persist_observation_across_reload():
|
|
remember_block = _sessions_function_block(
|
|
"_rememberRenderedStreamingState",
|
|
"_rememberRenderedSessionSnapshot",
|
|
)
|
|
transition_block = _sessions_function_block(
|
|
"_markPollingCompletionUnreadTransitions",
|
|
"newSession",
|
|
)
|
|
|
|
assert "_rememberObservedStreamingSession(s);" in remember_block, (
|
|
"visible spinner rows must persist an observed-running marker so long "
|
|
"tasks still become unread if the original SSE/in-memory state is lost"
|
|
)
|
|
assert "if (isStreaming) {" in transition_block
|
|
assert "_rememberObservedStreamingSession(s);" in transition_block
|
|
assert "} else {\n _forgetObservedStreamingSession(sid);" in transition_block
|
|
|
|
|
|
def test_active_done_marks_viewed_without_setting_unread_marker():
|
|
done_block = _done_block()
|
|
marker_idx = done_block.find("_markSessionCompletionUnread(completedSid")
|
|
active_guard_idx = done_block.find("if(isActiveSession){", marker_idx)
|
|
viewed_guard_idx = done_block.find("if(isSessionViewed) _markSessionViewed(completedSid", active_guard_idx)
|
|
|
|
assert marker_idx != -1, "background completion marker call missing"
|
|
assert active_guard_idx != -1, "done handler must guard active-session UI updates"
|
|
assert viewed_guard_idx != -1, "active/current completion must still mark session viewed when visible/focused"
|
|
assert active_guard_idx < viewed_guard_idx, (
|
|
"active-session viewed write must remain inside isSessionViewed guard so "
|
|
"switch-away races cannot mark a background completion read"
|
|
)
|
|
|
|
|
|
def test_hidden_active_done_still_updates_current_pane_but_not_read_state():
|
|
done_block = _done_block()
|
|
|
|
active_const_idx = done_block.find("const isActiveSession=_isSessionCurrentPane(activeSid);")
|
|
viewed_const_idx = done_block.find("const isSessionViewed=_isSessionActivelyViewed(activeSid);")
|
|
active_guard_idx = done_block.find("if(isActiveSession){", viewed_const_idx)
|
|
session_update_idx = done_block.find("S.session=d.session", active_guard_idx)
|
|
render_idx = done_block.find("renderMessages(", active_guard_idx)
|
|
load_dir_idx = done_block.find("loadDir('.')", active_guard_idx)
|
|
mark_viewed_idx = done_block.find("if(isSessionViewed) _markSessionViewed(completedSid", active_guard_idx)
|
|
|
|
assert active_const_idx != -1, "done handler must compute active/current pane separately"
|
|
assert viewed_const_idx != -1, "done handler must still compute visible/focused read state"
|
|
assert active_const_idx < viewed_const_idx
|
|
assert session_update_idx != -1, "active hidden completion must still refresh S.session"
|
|
assert render_idx != -1, "active hidden completion must still render the final assistant response"
|
|
assert load_dir_idx != -1, "active hidden completion must keep normal active-session finalization"
|
|
assert mark_viewed_idx != -1, "read-state write must stay gated by visible/focused viewing"
|
|
assert session_update_idx < mark_viewed_idx < render_idx, (
|
|
"hidden active completion should update the pane, but only mark read when "
|
|
"isSessionViewed is true"
|
|
)
|
|
|
|
|
|
def test_hidden_or_unfocused_active_session_counts_as_background_completion():
|
|
helper_idx = MESSAGES_JS.find("function _isSessionActivelyViewed(sid)")
|
|
assert helper_idx != -1, "_isSessionActivelyViewed helper missing"
|
|
helper_block = MESSAGES_JS[helper_idx:MESSAGES_JS.find("function _markActiveSessionViewedOnReturn", helper_idx)]
|
|
|
|
current_idx = MESSAGES_JS.find("function _isSessionCurrentPane(sid)")
|
|
assert current_idx != -1, "_isSessionCurrentPane helper missing"
|
|
assert "function _isDocumentVisibleAndFocused()" in MESSAGES_JS
|
|
assert "document.visibilityState" in MESSAGES_JS
|
|
assert "document.visibilityState!=='visible'" in MESSAGES_JS
|
|
assert "document.hasFocus" in MESSAGES_JS
|
|
assert "!document.hasFocus()" in MESSAGES_JS
|
|
assert "if(!_isSessionCurrentPane(sid)) return false;" in helper_block
|
|
assert "if(!_isDocumentVisibleAndFocused()) return false;" in helper_block, (
|
|
"active session completion must be treated as unread when the tab is "
|
|
"hidden or the window is unfocused"
|
|
)
|
|
|
|
|
|
def test_switching_away_counts_as_background_completion():
|
|
helper_idx = MESSAGES_JS.find("function _isSessionCurrentPane(sid)")
|
|
assert helper_idx != -1, "_isSessionCurrentPane helper missing"
|
|
helper_block = MESSAGES_JS[helper_idx:MESSAGES_JS.find("function _isSessionActivelyViewed", helper_idx)]
|
|
|
|
assert "S.session.session_id!==sid" in helper_block
|
|
assert "_loadingSessionId" in helper_block
|
|
assert "_loadingSessionId!==sid" in helper_block, (
|
|
"if loadSession(B) is in flight while done(A) arrives, A must be treated "
|
|
"as background even though S.session can still temporarily point at A"
|
|
)
|
|
|
|
|
|
def test_restore_settled_background_stream_marks_completion_unread():
|
|
restore_idx = MESSAGES_JS.find("async function _restoreSettledSession()")
|
|
assert restore_idx != -1, "_restoreSettledSession not found"
|
|
restore_block = MESSAGES_JS[restore_idx:MESSAGES_JS.find("function _handleStreamError", restore_idx)]
|
|
|
|
assert "const isSessionViewed=_isSessionActivelyViewed(activeSid);" in restore_block
|
|
assert "const completedSid=session.session_id||activeSid;" in restore_block
|
|
assert "if(!isSessionViewed && typeof _markSessionCompletionUnread==='function')" in restore_block
|
|
assert "_markSessionCompletionUnread(completedSid, session.message_count);" in restore_block
|
|
assert "if(isSessionViewed) _markSessionViewed(completedSid" in restore_block, (
|
|
"restore-settled fallback must not mark a hidden/background completion read"
|
|
)
|
|
|
|
|
|
def test_focus_visibility_return_marks_active_session_viewed_and_clears_marker():
|
|
return_idx = MESSAGES_JS.find("function _markActiveSessionViewedOnReturn()")
|
|
assert return_idx != -1, "_markActiveSessionViewedOnReturn helper missing"
|
|
return_block = MESSAGES_JS[return_idx:MESSAGES_JS.find("async function send()", return_idx)]
|
|
|
|
assert "if(!_isDocumentVisibleAndFocused() || !S.session || !S.session.session_id) return;" in return_block
|
|
assert "_markSessionViewed(S.session.session_id" in return_block
|
|
assert "_clearSessionCompletionUnread(S.session.session_id)" in return_block, (
|
|
"returning to a visible/focused tab must clear the explicit unread marker "
|
|
"for the active session the user is now viewing"
|
|
)
|
|
assert "renderSessionListFromCache()" in return_block
|
|
assert "document.addEventListener('visibilitychange', _markActiveSessionViewedOnReturn);" in MESSAGES_JS
|
|
assert "window.addEventListener('focus', _markActiveSessionViewedOnReturn);" in MESSAGES_JS
|
|
|
|
|
|
def test_completion_unread_clears_only_when_session_is_opened():
|
|
load_idx = SESSIONS_JS.find("async function loadSession(sid)")
|
|
assert load_idx != -1, "loadSession not found"
|
|
load_block = SESSIONS_JS[load_idx:SESSIONS_JS.find("function _resolveSessionModelForDisplaySoon", load_idx)]
|
|
|
|
stale_guard_idx = load_block.find("if (_loadingSessionId !== sid) return;")
|
|
clear_idx = load_block.find("_clearSessionCompletionUnread(S.session.session_id);")
|
|
set_viewed_idx = load_block.find("_setSessionViewedCount(S.session.session_id")
|
|
|
|
assert clear_idx != -1, "loadSession must clear explicit completion unread when the user opens the session"
|
|
assert stale_guard_idx != -1 and stale_guard_idx < clear_idx, (
|
|
"stale loadSession responses must not clear unread markers for sessions the user did not actually open"
|
|
)
|
|
assert set_viewed_idx != -1 and set_viewed_idx < clear_idx, (
|
|
"completion unread should clear at the same point the session is marked viewed"
|
|
)
|
|
|
|
|
|
def test_historical_sessions_are_not_marked_unread_on_list_render():
|
|
"""The explicit unread marker must be event-driven, not initialized by _hasUnreadForSession."""
|
|
has_unread_idx = SESSIONS_JS.find("function _hasUnreadForSession(s)")
|
|
assert has_unread_idx != -1
|
|
has_unread_block = SESSIONS_JS[
|
|
has_unread_idx:SESSIONS_JS.find("function _isSessionActivelyViewedForList", has_unread_idx)
|
|
]
|
|
|
|
assert "_markSessionCompletionUnread" not in has_unread_block, (
|
|
"rendering old historical sessions must not create completion-unread markers"
|
|
)
|
|
assert "_setSessionViewedCount(s.session_id, Number(s.message_count || 0));" in has_unread_block, (
|
|
"missing viewed-count baseline should still initialize as read for historical sessions"
|
|
)
|