457 lines
20 KiB
Python
457 lines
20 KiB
Python
"""
|
|
Sprint 42 Tests: SessionDB injection into AIAgent for WebUI sessions (PR #356).

Covers:
- streaming.py: SessionDB is initialized inside _run_agent_streaming (import present)
- streaming.py: try/except guards SessionDB init so failures are non-fatal
- streaming.py: session_db= kwarg is passed to AIAgent constructor
- streaming.py: SessionDB init failure prints a WARNING (not silently swallowed)
- streaming.py: SessionDB init is placed before AIAgent construction

Also holds the additional sprint-42 checks: runtime route forwarding into
AIAgent, the custom model input (#444), the context indicator (#437),
system-prompt titles (#441) and thinking panel persistence (#427).
|
|
"""
|
|
import ast
|
|
import pathlib
|
|
import re
|
|
import queue
|
|
import sys
|
|
import types
|
|
import unittest
|
|
from unittest import mock
|
|
|
|
# Repository root, taken as the directory two levels above this test file.
REPO_ROOT = pathlib.Path(__file__).parent.parent

# Full text of api/streaming.py, read once at import time.  Decoded explicitly
# as UTF-8 so the result does not depend on the platform's locale encoding
# (the other readers in this file already pass encoding='utf-8').
STREAMING_PY = (REPO_ROOT / "api" / "streaming.py").read_text(encoding="utf-8")


# ── Shared helpers for sprint-42 additional tests ────────────────────────────

REPO = REPO_ROOT  # alias used by #427 tests
_SESSIONS_JS = REPO_ROOT / 'static' / 'sessions.js'
_STREAMING_PY = REPO_ROOT / 'api' / 'streaming.py'
_MESSAGES_JS = REPO_ROOT / 'static' / 'messages.js'
_UI_JS = REPO_ROOT / 'static' / 'ui.js'
|
|
|
|
def _read_sessions_js():
    """Return the whole of static/sessions.js as text, decoded as UTF-8."""
    with _SESSIONS_JS.open(encoding='utf-8') as handle:
        return handle.read()
|
|
|
|
# ─────────────────────────────────────────────────────────────────────────────
|
|
|
|
class TestSessionDBInjection(unittest.TestCase):
    """Verify SessionDB is initialized and passed to AIAgent in streaming.py.

    Every check here is a static text/regex match against the source text held
    in ``STREAMING_PY``; nothing from streaming.py is executed.
    """

    def test_hermes_state_import_present(self):
        """The ``from hermes_state import SessionDB`` import must appear in streaming.py."""
        self.assertIn(
            "from hermes_state import SessionDB",
            STREAMING_PY,
            "SessionDB import missing from streaming.py (PR #356)",
        )

    def test_session_db_kwarg_passed_to_agent(self):
        """The ``session_db=_session_db`` keyword argument must appear in streaming.py."""
        self.assertIn(
            "session_db=_session_db",
            STREAMING_PY,
            "session_db kwarg not passed to AIAgent (PR #356)",
        )

    def test_sessiondb_init_in_try_except(self):
        """SessionDB() init must be wrapped in a try block for non-fatal failure handling."""
        # Matches ``try:`` directly followed by the import and the constructor call.
        pattern = r"try:\s*\n\s*from hermes_state import SessionDB\s*\n\s*_session_db\s*=\s*SessionDB\(\)"
        self.assertRegex(
            STREAMING_PY,
            pattern,
            "SessionDB() init must be inside a try block for non-fatal error handling (PR #356)",
        )

    def test_sessiondb_failure_logs_warning(self):
        """A failure initializing SessionDB must emit a WARNING message, not be dropped silently."""
        self.assertIn(
            "WARNING: SessionDB init failed",
            STREAMING_PY,
            "SessionDB init failure must log a WARNING message (PR #356)",
        )

    def test_session_db_initialized_before_agent_construction(self):
        """The SessionDB import must appear earlier in the file than ``session_db=_session_db``."""
        db_pos = STREAMING_PY.find("from hermes_state import SessionDB")
        agent_pos = STREAMING_PY.find("session_db=_session_db")
        # str.find returns -1 on a miss.  Without these guards a missing import
        # (-1) would compare as "before" any found kwarg and pass vacuously.
        self.assertNotEqual(
            db_pos,
            -1,
            "SessionDB import missing from streaming.py (PR #356)",
        )
        self.assertNotEqual(
            agent_pos,
            -1,
            "session_db kwarg not passed to AIAgent (PR #356)",
        )
        self.assertGreater(
            agent_pos,
            db_pos,
            "SessionDB init must appear before AIAgent construction (PR #356)",
        )

    def test_session_db_default_is_none(self):
        """``_session_db = None`` must sit directly before a ``try:`` line (safe default)."""
        # Pattern: the None assignment, a newline, then the opening of a try block.
        pattern = r"_session_db\s*=\s*None\s*\n\s*try:"
        self.assertRegex(
            STREAMING_PY,
            pattern,
            "_session_db must default to None before try/except block (PR #356)",
        )
|
|
|
|
|
|
class TestRuntimeRouteInjection(unittest.TestCase):
    """Verify WebUI forwards the resolved runtime route into AIAgent."""

    def test_runtime_provider_keys_are_forwarded_to_agent(self):
        """streaming.py must contain each runtime-route kwarg forwarding expression."""
        for snippet in (
            "api_mode=_rt.get('api_mode')",
            "acp_command=_rt.get('command')",
            "acp_args=_rt.get('args')",
            "credential_pool=_rt.get('credential_pool')",
        ):
            self.assertIn(
                snippet,
                STREAMING_PY,
                f"Missing runtime route forwarding in AIAgent constructor: {snippet}",
            )

    def test_runtime_route_is_forwarded_from_resolver_into_agent_init(self):
        """The resolved ACP route should be passed through to AIAgent kwargs.

        Runs ``streaming._run_agent_streaming`` with the session lookup, the
        agent class, the model/provider resolution, the config accessors and
        the ``hermes_cli`` / ``hermes_state`` modules replaced by fakes, then
        inspects the keyword arguments the fake agent was constructed with.
        """
        import api.streaming as streaming

        captured = {}
        fake_session_db = object()
        resolve_runtime_provider = mock.Mock(
            return_value={
                "provider": "openai-codex",
                "base_url": "https://api.openai.com/v1",
                "api_key": "rt-key",
                "api_mode": "codex_responses",
                "command": "codex",
                "args": ["exec", "--json"],
                "credential_pool": "openai-codex",
            }
        )

        class FakeSession:
            """Minimal stand-in for the session object returned by get_session."""

            def __init__(self):
                self.session_id = "sess-runtime-route"
                self.title = "Existing title"
                self.workspace = "/tmp"
                self.model = "gpt-5.4"
                self.messages = []
                self.personality = None
                self.input_tokens = 0
                self.output_tokens = 0
                self.estimated_cost = None
                self.tool_calls = []
                self.active_stream_id = None
                self.pending_user_message = None
                self.pending_attachments = []
                self.pending_started_at = None

            def save(self, touch_updated_at=True):
                # Only records that a save was requested; nothing is written.
                self._saved = True

            def compact(self):
                return {
                    "session_id": self.session_id,
                    "title": self.title,
                    "workspace": self.workspace,
                    "model": self.model,
                    "created_at": 0,
                    "updated_at": 0,
                    "pinned": False,
                    "archived": False,
                    "project_id": None,
                    "profile": None,
                    "input_tokens": self.input_tokens,
                    "output_tokens": self.output_tokens,
                    "estimated_cost": self.estimated_cost,
                    "personality": self.personality,
                }

        class CapturingAgent:
            """Fake agent class that records its constructor and run kwargs in ``captured``."""

            def __init__(self, **kwargs):
                captured["init_kwargs"] = kwargs
                self.session_id = kwargs["session_id"]
                self.context_compressor = None
                self.session_prompt_tokens = 0
                self.session_completion_tokens = 0
                self.session_estimated_cost_usd = None
                self.reasoning_config = None
                self.ephemeral_system_prompt = None
                self._last_error = None

            def run_conversation(self, **kwargs):
                captured["run_kwargs"] = kwargs
                return {
                    "messages": [
                        {"role": "user", "content": kwargs["persist_user_message"]},
                        {"role": "assistant", "content": "ok"},
                    ]
                }

            def interrupt(self, _message):
                captured["interrupted"] = True

        fake_session = FakeSession()
        fake_stream_id = "stream-runtime-route"
        fake_queue = queue.Queue()

        # Stub modules installed into sys.modules so imports of hermes_cli /
        # hermes_state during the call resolve to these fakes.
        fake_runtime_module = types.ModuleType("hermes_cli.runtime_provider")
        fake_runtime_module.resolve_runtime_provider = resolve_runtime_provider
        fake_hermes_cli = types.ModuleType("hermes_cli")
        fake_hermes_cli.runtime_provider = fake_runtime_module
        fake_hermes_state = types.ModuleType("hermes_state")
        fake_hermes_state.SessionDB = mock.Mock(return_value=fake_session_db)

        with mock.patch.object(streaming, "get_session", return_value=fake_session), \
                mock.patch.object(streaming, "_get_ai_agent", return_value=CapturingAgent), \
                mock.patch.object(streaming, "resolve_model_provider", return_value=("gpt-5.4", "openai-codex", None)), \
                mock.patch("api.config.get_config", return_value={}), \
                mock.patch("api.config._resolve_cli_toolsets", return_value=[]), \
                mock.patch.dict(
                    sys.modules,
                    {
                        "hermes_cli": fake_hermes_cli,
                        "hermes_cli.runtime_provider": fake_runtime_module,
                        "hermes_state": fake_hermes_state,
                    },
                ):
            streaming.STREAMS[fake_stream_id] = fake_queue
            # STREAMS is module-global state: make sure this test's entry is
            # gone afterwards even if the call below raises, so it cannot leak
            # into other tests.  pop(..., None) is a no-op if already removed.
            self.addCleanup(streaming.STREAMS.pop, fake_stream_id, None)
            streaming._run_agent_streaming(
                session_id=fake_session.session_id,
                msg_text="hello from webui",
                model="gpt-5.4",
                workspace="/tmp",
                stream_id=fake_stream_id,
            )

        resolve_runtime_provider.assert_called_once_with(requested="openai-codex")
        init_kwargs = captured["init_kwargs"]
        self.assertEqual(init_kwargs["api_mode"], "codex_responses")
        self.assertEqual(init_kwargs["acp_command"], "codex")
        self.assertEqual(init_kwargs["acp_args"], ["exec", "--json"])
        self.assertEqual(init_kwargs["credential_pool"], "openai-codex")
        self.assertEqual(init_kwargs["api_key"], "rt-key")
        self.assertIs(init_kwargs["session_db"], fake_session_db)
|
|
|
|
|
|
class TestSessionDBAST(unittest.TestCase):
    """AST-level checks: verify the try/except is not inside _ENV_LOCK (deadlock guard)."""

    def setUp(self):
        """Parse the streaming.py source text into an AST before each test."""
        self.tree = ast.parse(STREAMING_PY)

    def test_sessiondb_try_not_inside_env_lock(self):
        """The try block that wraps SessionDB init must NOT be inside a 'with _ENV_LOCK:' block.

        Putting a try/except inside _ENV_LOCK is the deadlock pattern caught by test_sprint34.
        The check covers try statements at any nesting depth inside the lock
        body (for example under an ``if`` or a nested ``with``), not only the
        statements directly in the ``with`` body.
        """
        for node in ast.walk(self.tree):
            if not isinstance(node, ast.With):
                continue
            # Only bare-name context managers are matched (``with _ENV_LOCK:``).
            names = [getattr(item.context_expr, "id", "") for item in node.items]
            if "_ENV_LOCK" not in names:
                continue
            for stmt in node.body:
                # ast.walk yields stmt itself plus every descendant, so nested
                # try statements are inspected as well.
                for inner in ast.walk(stmt):
                    if not isinstance(inner, ast.Try):
                        continue
                    # Any mention of hermes_state in the try's source marks it
                    # as the SessionDB initialisation block.
                    self.assertNotIn(
                        "hermes_state",
                        ast.unparse(inner),
                        "SessionDB try/except must NOT be inside _ENV_LOCK body (deadlock risk)",
                    )
|
|
|
|
|
|
class TestModelCustomInput(unittest.TestCase):
    """Tests for issue #444 — custom model ID input in model dropdown."""

    # Directory holding the front-end assets, resolved relative to this file.
    STATIC = pathlib.Path(__file__).parent.parent / 'static'

    def _read(self, filename):
        """Return the UTF-8 decoded text of ``filename`` inside ``STATIC``."""
        return (self.STATIC / filename).read_text(encoding='utf-8')

    def _renderModelDropdown_body(self):
        """Return the part of ui.js that starts at ``function renderModelDropdown()``.

        The slice ends just before the next line that begins with
        ``async function selectModelFromDropdown``.  If that end marker is
        absent the slice runs to the end of the file.  The test fails with an
        explicit message when the start marker itself is missing.
        """
        src = self._read('ui.js')
        start = src.find('function renderModelDropdown()')
        if start == -1:
            # str.find signals a miss with -1; slicing from -1 would yield a
            # meaningless fragment and a confusing downstream failure.
            self.fail('function renderModelDropdown() not found in ui.js')
        end = src.find('\nasync function selectModelFromDropdown', start)
        if end == -1:
            # Using -1 as a slice end would silently drop the last character.
            end = len(src)
        return src[start:end]

    def test_model_custom_input_in_dropdown(self):
        """The dropdown renderer must reference the model-custom-input class."""
        body = self._renderModelDropdown_body()
        self.assertIn('model-custom-input', body,
                      'model-custom-input class must be in renderModelDropdown')

    def test_model_custom_enter_handler(self):
        """The dropdown renderer must reference the _applyCustom handler."""
        body = self._renderModelDropdown_body()
        self.assertIn('_applyCustom', body,
                      '_applyCustom function must be defined in renderModelDropdown')

    def test_model_custom_css_defined(self):
        """style.css must mention both custom-model selectors."""
        css = self._read('style.css')
        self.assertIn('.model-custom-row', css,
                      '.model-custom-row must be defined in style.css')
        self.assertIn('.model-custom-input', css,
                      '.model-custom-input must be defined in style.css')

    def test_model_custom_i18n_keys(self):
        """Both custom-model i18n keys must appear between the 'en' and 'es' markers."""
        i18n = self._read('i18n.js')
        # The en locale block is taken to run from the first 'en' marker up to
        # the next 'es' marker after it (or end of file when there is none).
        en_block_start = i18n.find("'en'")
        self.assertNotEqual(en_block_start, -1,
                            "'en' locale marker not found in i18n.js")
        es_block_start = i18n.find("'es'", en_block_start)
        if es_block_start == -1:
            es_block_start = len(i18n)
        en_block = i18n[en_block_start:es_block_start]
        self.assertIn('model_custom_label', en_block,
                      'model_custom_label must be in en locale')
        self.assertIn('model_custom_placeholder', en_block,
                      'model_custom_placeholder must be in en locale')
|
|
|
|
|
|
# ── Sprint 42 additional tests: context indicator (#437) ─────────────────
|
|
def test_context_indicator_uses_pick_helper():
    """static/sessions.js must still contain the ``_pick`` helper name."""
    sessions_src = _read_sessions_js()
    has_pick_helper = '_pick' in sessions_src
    assert has_pick_helper, "_pick helper not found in static/sessions.js"
|
|
|
|
|
|
def test_context_indicator_old_pattern_removed():
    """The old ``||`` expression that read session data first must no longer be in sessions.js."""
    stale_pattern_present = '_s.input_tokens||u.input_tokens' in _read_sessions_js()
    assert not stale_pattern_present, \
        "Old stale-data-first pattern '_s.input_tokens||u.input_tokens' still present in static/sessions.js"
|
|
|
|
|
|
def test_context_indicator_all_six_fields():
    """Each of the six token/cost field names must occur somewhere in sessions.js."""
    sessions_src = _read_sessions_js()
    expected_fields = (
        'input_tokens',
        'output_tokens',
        'estimated_cost',
        'context_length',
        'last_prompt_tokens',
        'threshold_tokens',
    )
    # Checked in order; the first absent name fails the test.
    for field in expected_fields:
        found = field in sessions_src
        assert found, \
            f"Field '{field}' not found in static/sessions.js _syncCtxIndicator call"
|
|
|
|
|
|
# ── Sprint 42 additional tests: system prompt title (#441) ──────────────
|
|
def test_system_prompt_title_guard_exists():
    """sessions.js must contain the ``[SYSTEM:`` marker and the startsWith guard expression."""
    sessions_src = _read_sessions_js()
    marker_present = '[SYSTEM:' in sessions_src
    assert marker_present, \
        "sessions.js must contain the [SYSTEM: guard to intercept system-prompt titles"
    # The bare marker could sit in a comment, so also require the actual
    # guard expression.
    guard_expression = "cleanTitle.startsWith('[SYSTEM:')"
    assert guard_expression in sessions_src, \
        "sessions.js must have: cleanTitle.startsWith('[SYSTEM:') guard expression"
|
|
|
|
|
|
def test_cleanTitle_is_let_not_const():
    """sessions.js must declare cleanTitle with ``let`` and no longer with the old ``const`` form."""
    sessions_src = _read_sessions_js()
    declared_with_let = 'let cleanTitle' in sessions_src
    assert declared_with_let, \
        "cleanTitle must be declared with 'let' (not 'const') to allow reassignment"
    # Only the specific old assignment line is rejected, not every
    # ``const cleanTitle`` spelling.
    old_const_form_present = "const cleanTitle=tags.length" in sessions_src
    assert not old_const_form_present, \
        "Old 'const cleanTitle=tags.length...' must be replaced by 'let cleanTitle=...'"
|
|
|
|
|
|
# ── Sprint 42 additional tests: thinking panel persistence (#427) ────────
|
|
def test_streaming_persists_reasoning_in_session():
    """streaming.py must accumulate reasoning text and write it onto a message.

    Static text checks against api/streaming.py: the ``_reasoning_text``
    initialisation, its accumulation, the persistence comment and assignment,
    and that the persistence comment precedes ``raw_session = s.compact()``.
    """
    # Decode explicitly as UTF-8 so the result does not depend on the locale.
    src = (REPO / 'api' / 'streaming.py').read_text(encoding='utf-8')

    # _reasoning_text must be initialised
    assert "_reasoning_text = ''" in src, \
        "_reasoning_text variable not initialised in streaming.py"

    # on_reasoning must accumulate into _reasoning_text
    assert '_reasoning_text += str(text)' in src, \
        "on_reasoning callback does not accumulate into _reasoning_text"

    # Persistence block must exist before raw_session is built
    assert "Persist reasoning trace in the session so it survives reload" in src, \
        "Reasoning persistence comment not found in streaming.py"

    assert "_rm['reasoning'] = _reasoning_text" in src, \
        "Code to set _rm['reasoning'] not found in streaming.py"

    # Guard the marker used by the ordering check so a missing marker fails
    # with a descriptive assertion instead of a bare ValueError from index().
    assert "raw_session = s.compact()" in src, \
        "raw_session = s.compact() assignment not found in streaming.py"

    # Persistence block must come BEFORE raw_session assignment
    persist_idx = src.index("Persist reasoning trace in the session")
    raw_session_idx = src.index("raw_session = s.compact()")
    assert persist_idx < raw_session_idx, \
        "Reasoning persistence block must appear before raw_session assignment"
|
|
|
|
|
|
def test_done_handler_patches_reasoning_field():
    """messages.js must patch reasoningText onto the last assistant message.

    Static text checks against static/messages.js: the persistence comment,
    the ``reasoningText`` guard and assignment, that the comment appears after
    the ``done`` listener registration, and the ``!lastAsst.reasoning`` guard.
    """
    # Decode explicitly as UTF-8 so the result does not depend on the locale.
    src = (REPO / 'static' / 'messages.js').read_text(encoding='utf-8')

    # The persistence comment must be present
    assert "Persist reasoning trace so thinking card survives page reload" in src, \
        "Reasoning persistence comment not found in messages.js done handler"

    # The guard and assignment must be present
    assert "if(reasoningText){" in src, \
        "reasoningText guard not found in messages.js"

    assert "lastAsst.reasoning=reasoningText" in src, \
        "lastAsst.reasoning assignment not found in messages.js"

    # Guard the marker used by the ordering check so a missing registration
    # fails with a descriptive assertion instead of a bare ValueError.
    assert "source.addEventListener('done'" in src, \
        "done SSE handler registration not found in messages.js"

    # The patch must come after the 'done' listener registration.  This is a
    # position check only; it does not prove the code is inside that handler.
    done_handler_idx = src.index("source.addEventListener('done'")
    persist_idx = src.index("Persist reasoning trace so thinking card survives page reload")
    assert done_handler_idx < persist_idx, \
        "Reasoning persistence patch must be inside the done SSE handler"

    # The guard must also check !lastAsst.reasoning to avoid overwriting server value
    assert "!lastAsst.reasoning" in src, \
        "Guard '!lastAsst.reasoning' missing — would overwrite server-persisted reasoning"
|
|
|
|
|
|
def test_rendermessages_reads_reasoning_from_messages():
    """ui.js must reference m.reasoning and the thinking card.

    Static text checks against static/ui.js; the last check ignores spaces so
    ``thinkingText = m.reasoning`` and ``thinkingText=m.reasoning`` both match.
    """
    # Decode explicitly as UTF-8 so the result does not depend on the locale.
    src = (REPO / 'static' / 'ui.js').read_text(encoding='utf-8')

    # m.reasoning must be read in the render path
    assert 'm.reasoning' in src, \
        "m.reasoning not referenced in ui.js — thinking card won't render on reload"

    # The thinking card rendering block must also be present
    assert 'thinking-card' in src, \
        "thinking-card CSS class not found in ui.js"

    # Specifically, the fallback that reads from top-level m.reasoning field
    assert 'thinkingText=m.reasoning' in src.replace(' ', ''), \
        "thinkingText=m.reasoning assignment not found in ui.js renderMessages"
|
|
|
|
|
|
def test_streaming_restores_prior_reasoning_metadata_after_followup():
    """Previous-turn thinking must survive later turns.

    The provider-facing history strips WebUI-only `reasoning` fields, so the
    streaming path must merge that metadata back onto the returned message
    history before saving the session, including reinserting dropped
    reasoning-only assistant segments.

    Implemented as static text checks against api/streaming.py.
    """
    # Decode explicitly as UTF-8 so the result does not depend on the locale.
    src = (REPO / 'api' / 'streaming.py').read_text(encoding='utf-8')
    assert "def _restore_reasoning_metadata(" in src, \
        "streaming.py must define a helper to restore prior reasoning metadata"
    assert "s.messages = _restore_reasoning_metadata(" in src, \
        "streaming.py must merge prior reasoning metadata back after run_conversation()"
    assert "updated_messages.insert(safe_pos, copy.deepcopy(prev_msg))" in src, \
        "streaming.py must reinsert dropped reasoning-only assistant messages"
|
|
|
|
|
|
def test_routes_restores_prior_reasoning_metadata_after_followup():
    """The non-streaming route path must preserve prior reasoning metadata too.

    Implemented as static text checks against api/routes.py.
    """
    # Decode explicitly as UTF-8 so the result does not depend on the locale.
    src = (REPO / 'api' / 'routes.py').read_text(encoding='utf-8')
    assert "_restore_reasoning_metadata" in src, \
        "routes.py must import reasoning metadata restoration helper"
    assert 's.messages = _restore_reasoning_metadata(' in src, \
        "routes.py must merge prior reasoning metadata back after run_conversation()"
|