fix(history): block compact during active runs (#2635)
This commit is contained in:
@@ -10,7 +10,12 @@ from fastapi import APIRouter, Request, HTTPException
|
||||
from core.models import ChatMessage
|
||||
from core.database import SessionLocal, ChatMessage as DbChatMessage, Session as DbSession
|
||||
from src.topic_analyzer import analyze_topics
|
||||
from routes.session_routes import _verify_session_owner
|
||||
from routes.session_routes import (
|
||||
_message_role,
|
||||
_message_text,
|
||||
_reject_compact_during_active_run,
|
||||
_verify_session_owner,
|
||||
)
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
@@ -521,6 +526,7 @@ def setup_history_routes(session_manager) -> APIRouter:
|
||||
session = session_manager.get_session(session_id)
|
||||
except KeyError:
|
||||
raise HTTPException(404, "Session not found")
|
||||
_reject_compact_during_active_run(session_id)
|
||||
|
||||
try:
|
||||
from src.model_context import estimate_tokens, get_context_length
|
||||
@@ -543,8 +549,8 @@ def setup_history_routes(session_manager) -> APIRouter:
|
||||
|
||||
# Build text to summarize
|
||||
convo_text = "\n".join(
|
||||
f"{(m.role if isinstance(m, ChatMessage) else m.get('role', '')).upper()}: "
|
||||
f"{((m.content if isinstance(m, ChatMessage) else m.get('content')) or '')[:2000]}"
|
||||
f"{_message_role(m).upper()}: "
|
||||
f"{_message_text(m)[:2000]}"
|
||||
for m in older
|
||||
)
|
||||
|
||||
|
||||
@@ -57,6 +57,40 @@ def _content_to_text(content) -> str:
|
||||
return ""
|
||||
|
||||
|
||||
def _message_role(message) -> str:
|
||||
if isinstance(message, ChatMessage):
|
||||
return message.role or ""
|
||||
if isinstance(message, dict):
|
||||
return message.get("role", "") or ""
|
||||
return getattr(message, "role", "") or ""
|
||||
|
||||
|
||||
def _message_text(message) -> str:
|
||||
if isinstance(message, ChatMessage):
|
||||
content = message.content
|
||||
elif isinstance(message, dict):
|
||||
content = message.get("content")
|
||||
else:
|
||||
content = getattr(message, "content", None)
|
||||
return _content_to_text(content)
|
||||
|
||||
|
||||
def _message_metadata(message) -> dict:
|
||||
if isinstance(message, ChatMessage):
|
||||
metadata = message.metadata
|
||||
elif isinstance(message, dict):
|
||||
metadata = message.get("metadata")
|
||||
else:
|
||||
metadata = getattr(message, "metadata", None)
|
||||
return metadata if isinstance(metadata, dict) else {}
|
||||
|
||||
|
||||
def _reject_compact_during_active_run(session_id: str) -> None:
|
||||
from src import agent_runs
|
||||
if agent_runs.is_active(session_id):
|
||||
raise HTTPException(409, "Session has an active run; try compacting after it finishes")
|
||||
|
||||
|
||||
def _verify_session_owner(request: Request, session_id: str, session_manager=None):
|
||||
"""Verify the current user owns the session. Raises 404 if not.
|
||||
|
||||
@@ -872,6 +906,7 @@ def setup_session_routes(session_manager: SessionManager, config: dict, webhook_
|
||||
session = session_manager.get_session(session_id)
|
||||
except KeyError:
|
||||
raise HTTPException(404, f"Session {session_id} not found")
|
||||
_reject_compact_during_active_run(session_id)
|
||||
|
||||
history = list(session.history or [])
|
||||
if len(history) < 6:
|
||||
@@ -897,7 +932,7 @@ def setup_session_routes(session_manager: SessionManager, config: dict, webhook_
|
||||
|
||||
prior_compactions = sum(
|
||||
1 for m in history
|
||||
if (m.metadata or {}).get("compacted") or "[Conversation summary" in (m.content or "")
|
||||
if _message_metadata(m).get("compacted") or "[Conversation summary" in _message_text(m)
|
||||
)
|
||||
prompt = SELF_SUMMARY_SYSTEM_PROMPT.replace(
|
||||
"{count}", str(len(older))
|
||||
@@ -905,7 +940,7 @@ def setup_session_routes(session_manager: SessionManager, config: dict, webhook_
|
||||
"{n}", str(prior_compactions + 1)
|
||||
)
|
||||
convo_text = "\n".join(
|
||||
f"{m.role.upper()}: {(m.content or '')[:2000]}"
|
||||
f"{_message_role(m).upper()}: {_message_text(m)[:2000]}"
|
||||
for m in older
|
||||
)
|
||||
try:
|
||||
|
||||
@@ -1,10 +1,11 @@
|
||||
from types import SimpleNamespace
|
||||
|
||||
from fastapi import FastAPI
|
||||
from fastapi import APIRouter, FastAPI
|
||||
from fastapi.testclient import TestClient
|
||||
|
||||
from core.models import ChatMessage
|
||||
import routes.history_routes as history_routes
|
||||
import routes.session_routes as session_routes
|
||||
|
||||
|
||||
class _FakeQuery:
|
||||
@@ -53,6 +54,7 @@ class _FakeSessionManager:
|
||||
def __init__(self, session):
|
||||
self.session = session
|
||||
self.saved = False
|
||||
self.replaced_messages = None
|
||||
|
||||
def get_session(self, session_id):
|
||||
if session_id != self.session.id:
|
||||
@@ -62,6 +64,14 @@ class _FakeSessionManager:
|
||||
def save_sessions(self):
|
||||
self.saved = True
|
||||
|
||||
def replace_messages(self, session_id, messages):
|
||||
if session_id != self.session.id:
|
||||
return False
|
||||
self.replaced_messages = list(messages)
|
||||
self.session.history = list(messages)
|
||||
self.session.message_count = len(messages)
|
||||
return True
|
||||
|
||||
|
||||
class _FakeSession:
|
||||
id = "session-1"
|
||||
@@ -91,11 +101,13 @@ def _compact_prompt_for(monkeypatch, history):
|
||||
monkeypatch.setattr(history_routes, "_verify_session_owner", lambda request, session_id: None)
|
||||
monkeypatch.setattr(history_routes, "SessionLocal", lambda: _FakeDb())
|
||||
|
||||
import src.agent_runs as agent_runs
|
||||
import src.endpoint_resolver as endpoint_resolver
|
||||
import src.llm_core as llm_core
|
||||
import src.model_context as model_context
|
||||
|
||||
monkeypatch.setattr(endpoint_resolver, "resolve_endpoint", lambda kind: (None, None, {}))
|
||||
monkeypatch.setattr(agent_runs, "is_active", lambda session_id: False)
|
||||
monkeypatch.setattr(endpoint_resolver, "resolve_endpoint", lambda kind, owner=None: (None, None, {}))
|
||||
monkeypatch.setattr(llm_core, "llm_call_async", fake_llm_call_async)
|
||||
monkeypatch.setattr(model_context, "estimate_tokens", lambda messages: 100)
|
||||
monkeypatch.setattr(model_context, "get_context_length", lambda endpoint_url, model: 1000)
|
||||
@@ -113,6 +125,40 @@ def _compact_prompt_for(monkeypatch, history):
|
||||
return captured["messages"][1]["content"]
|
||||
|
||||
|
||||
def _registered_compact_response(monkeypatch, history, active_run=False):
|
||||
captured = {}
|
||||
|
||||
async def fake_llm_call_async(endpoint_url, model, messages, **kwargs):
|
||||
captured["messages"] = messages
|
||||
return "Summary text"
|
||||
|
||||
monkeypatch.setattr(
|
||||
session_routes,
|
||||
"router",
|
||||
APIRouter(prefix="/api", tags=["sessions"]),
|
||||
)
|
||||
monkeypatch.setattr(session_routes, "_verify_session_owner", lambda request, session_id: None)
|
||||
monkeypatch.setattr(history_routes, "_verify_session_owner", lambda request, session_id: None)
|
||||
monkeypatch.setattr(history_routes, "SessionLocal", lambda: _FakeDb())
|
||||
|
||||
import src.agent_runs as agent_runs
|
||||
import src.endpoint_resolver as endpoint_resolver
|
||||
import src.llm_core as llm_core
|
||||
|
||||
monkeypatch.setattr(agent_runs, "is_active", lambda session_id: active_run)
|
||||
monkeypatch.setattr(endpoint_resolver, "resolve_endpoint", lambda kind, owner=None: (None, None, {}))
|
||||
monkeypatch.setattr(llm_core, "llm_call_async", fake_llm_call_async)
|
||||
|
||||
session = _FakeSession(history)
|
||||
manager = _FakeSessionManager(session)
|
||||
app = FastAPI()
|
||||
app.include_router(session_routes.setup_session_routes(manager, {}))
|
||||
app.include_router(history_routes.setup_history_routes(manager))
|
||||
|
||||
response = TestClient(app).post("/api/session/session-1/compact")
|
||||
return response, captured, manager
|
||||
|
||||
|
||||
def test_manual_compact_tolerates_chatmessage_with_none_content(monkeypatch):
|
||||
compact_prompt = _compact_prompt_for(
|
||||
monkeypatch,
|
||||
@@ -143,3 +189,44 @@ def test_manual_compact_tolerates_dict_message_with_none_content(monkeypatch):
|
||||
)
|
||||
assert "ASSISTANT: None" not in compact_prompt
|
||||
assert "ASSISTANT: " in compact_prompt
|
||||
|
||||
|
||||
def test_registered_manual_compact_route_tolerates_none_content(monkeypatch):
|
||||
response, captured, manager = _registered_compact_response(
|
||||
monkeypatch,
|
||||
[
|
||||
ChatMessage(role="user", content="start"),
|
||||
ChatMessage(role="assistant", content=None),
|
||||
ChatMessage(role="tool", content="tool result"),
|
||||
ChatMessage(role="assistant", content="done"),
|
||||
ChatMessage(role="user", content="next"),
|
||||
ChatMessage(role="assistant", content="final"),
|
||||
],
|
||||
)
|
||||
|
||||
assert response.status_code == 200
|
||||
assert response.json()["ok"] is True
|
||||
compact_prompt = captured["messages"][1]["content"]
|
||||
assert "ASSISTANT: None" not in compact_prompt
|
||||
assert "ASSISTANT: " in compact_prompt
|
||||
assert manager.replaced_messages is not None
|
||||
|
||||
|
||||
def test_registered_manual_compact_route_rejects_active_agent_run(monkeypatch):
|
||||
response, captured, manager = _registered_compact_response(
|
||||
monkeypatch,
|
||||
[
|
||||
ChatMessage(role="user", content="start"),
|
||||
ChatMessage(role="assistant", content="tool call"),
|
||||
ChatMessage(role="tool", content="tool result"),
|
||||
ChatMessage(role="assistant", content="done"),
|
||||
ChatMessage(role="user", content="next"),
|
||||
ChatMessage(role="assistant", content="final"),
|
||||
],
|
||||
active_run=True,
|
||||
)
|
||||
|
||||
assert response.status_code == 409
|
||||
assert "active run" in response.text
|
||||
assert captured == {}
|
||||
assert manager.replaced_messages is None
|
||||
|
||||
Reference in New Issue
Block a user