fixed chat history context
This commit is contained in:
parent
6154eb2553
commit
f3de454b66
4 changed files with 93 additions and 3 deletions
|
|
@ -9,7 +9,7 @@ and Playground into a single agent-driven workspace.
|
|||
import logging
|
||||
import json
|
||||
import asyncio
|
||||
from typing import Optional, List
|
||||
from typing import Dict, Optional, List
|
||||
|
||||
from fastapi import APIRouter, HTTPException, Depends, Body, Path, Query, Request, UploadFile, File
|
||||
from fastapi.responses import StreamingResponse, JSONResponse
|
||||
|
|
@ -146,6 +146,37 @@ def _buildDataSourceContext(chatService, dataSourceIds: List[str]) -> str:
|
|||
return "\n".join(parts) if found else ""
|
||||
|
||||
|
||||
def _loadConversationHistory(chatInterface, workflowId: str, currentPrompt: str) -> List[Dict[str, str]]:
|
||||
"""Load prior messages from DB for follow-up context, excluding the current prompt."""
|
||||
try:
|
||||
rawMessages = chatInterface.getMessages(workflowId) or []
|
||||
except Exception as e:
|
||||
logger.warning(f"Failed to load conversation history: {e}")
|
||||
return []
|
||||
|
||||
history = []
|
||||
for msg in rawMessages:
|
||||
if isinstance(msg, dict):
|
||||
role = msg.get("role", "")
|
||||
content = msg.get("message", "") or msg.get("content", "")
|
||||
else:
|
||||
role = getattr(msg, "role", "")
|
||||
content = getattr(msg, "message", "") or getattr(msg, "content", "")
|
||||
if role in ("user", "assistant") and content:
|
||||
history.append({"role": role, "content": content})
|
||||
|
||||
if not history:
|
||||
return []
|
||||
|
||||
# Drop the last user message if it matches the current prompt (already added by the agent loop)
|
||||
if history[-1]["role"] == "user" and history[-1]["content"].strip() == currentPrompt.strip():
|
||||
history = history[:-1]
|
||||
|
||||
if history:
|
||||
logger.info(f"Loaded {len(history)} prior messages for workflow {workflowId}")
|
||||
return history
|
||||
|
||||
|
||||
async def _deriveWorkflowName(prompt: str, aiService) -> str:
|
||||
"""Use AI to generate a concise workflow title from the user prompt."""
|
||||
from modules.datamodels.datamodelAi import AiCallRequest, AiCallOptions, OperationTypeEnum, PriorityEnum
|
||||
|
|
@ -320,16 +351,25 @@ async def _runWorkspaceAgent(
|
|||
if dsInfo:
|
||||
enrichedPrompt = f"{prompt}\n\n[Active Data Sources]\n{dsInfo}"
|
||||
|
||||
conversationHistory = _loadConversationHistory(chatInterface, workflowId, prompt)
|
||||
|
||||
accumulatedText = ""
|
||||
messagePersisted = False
|
||||
|
||||
async for event in agentService.runAgent(
|
||||
prompt=enrichedPrompt,
|
||||
fileIds=fileIds,
|
||||
workflowId=workflowId,
|
||||
userLanguage=userLanguage,
|
||||
conversationHistory=conversationHistory,
|
||||
):
|
||||
if eventManager.is_cancelled(queueId):
|
||||
logger.info(f"Agent cancelled by user for workflow {workflowId}")
|
||||
break
|
||||
|
||||
if event.type == AgentEventTypeEnum.CHUNK and event.content:
|
||||
accumulatedText += event.content
|
||||
|
||||
sseEvent = {
|
||||
"type": event.type.value if hasattr(event.type, "value") else event.type,
|
||||
"workflowId": workflowId,
|
||||
|
|
@ -337,6 +377,7 @@ async def _runWorkspaceAgent(
|
|||
if event.content:
|
||||
sseEvent["content"] = event.content
|
||||
if event.type == AgentEventTypeEnum.MESSAGE:
|
||||
accumulatedText += event.content
|
||||
sseEvent["item"] = {
|
||||
"id": f"msg-{workflowId}-{id(event)}",
|
||||
"role": "assistant",
|
||||
|
|
@ -349,16 +390,30 @@ async def _runWorkspaceAgent(
|
|||
await eventManager.emit_event(queueId, sseEvent["type"], sseEvent)
|
||||
|
||||
if event.type in (AgentEventTypeEnum.FINAL, AgentEventTypeEnum.ERROR):
|
||||
if event.content:
|
||||
finalContent = event.content or accumulatedText
|
||||
if finalContent:
|
||||
try:
|
||||
chatInterface.createMessage({
|
||||
"workflowId": workflowId,
|
||||
"role": "assistant",
|
||||
"message": event.content,
|
||||
"message": finalContent,
|
||||
})
|
||||
messagePersisted = True
|
||||
except Exception as msgErr:
|
||||
logger.error(f"Failed to persist assistant message: {msgErr}")
|
||||
|
||||
# Persist any streamed content that wasn't saved via FINAL (e.g. cancellation)
|
||||
if not messagePersisted and accumulatedText.strip():
|
||||
try:
|
||||
chatInterface.createMessage({
|
||||
"workflowId": workflowId,
|
||||
"role": "assistant",
|
||||
"message": accumulatedText,
|
||||
})
|
||||
logger.info(f"Persisted partial assistant response ({len(accumulatedText)} chars) for workflow {workflowId}")
|
||||
except Exception as msgErr:
|
||||
logger.error(f"Failed to persist partial assistant message: {msgErr}")
|
||||
|
||||
logger.info(f"Agent loop completed for workflow {workflowId}, sending 'complete' event")
|
||||
await eventManager.emit_event(queueId, "complete", {
|
||||
"type": "complete",
|
||||
|
|
|
|||
|
|
@ -41,6 +41,7 @@ async def runAgentLoop(
|
|||
mandateId: str = "",
|
||||
aiCallStreamFn: Callable = None,
|
||||
userLanguage: str = "",
|
||||
conversationHistory: List[Dict[str, Any]] = None,
|
||||
) -> AsyncGenerator[AgentEvent, None]:
|
||||
"""Run the agent loop. Yields AgentEvent for each step (SSE-ready).
|
||||
|
||||
|
|
@ -56,6 +57,7 @@ async def runAgentLoop(
|
|||
buildRagContextFn: Optional async function to build RAG context before each round
|
||||
mandateId: Mandate ID for RAG scoping
|
||||
userLanguage: ISO 639-1 language code for agent responses
|
||||
conversationHistory: Prior messages [{role, content/message}] for follow-up context
|
||||
"""
|
||||
state = AgentState(workflowId=workflowId, maxRounds=config.maxRounds)
|
||||
trace = AgentTrace(
|
||||
|
|
@ -69,6 +71,8 @@ async def runAgentLoop(
|
|||
|
||||
systemPrompt = buildSystemPrompt(tools, toolsText, userLanguage=userLanguage)
|
||||
conversation = ConversationManager(systemPrompt)
|
||||
if conversationHistory:
|
||||
conversation.loadHistory(conversationHistory)
|
||||
conversation.addUserMessage(prompt)
|
||||
|
||||
while state.status == AgentStatusEnum.RUNNING and state.currentRound < state.maxRounds:
|
||||
|
|
|
|||
|
|
@ -14,6 +14,8 @@ FIRST_SUMMARY_ROUND = 4
|
|||
META_SUMMARY_ROUND = 7
|
||||
KEEP_RECENT_MESSAGES = 4
|
||||
MAX_ESTIMATED_TOKENS = 60000
|
||||
_MAX_HISTORY_MESSAGES = 40
|
||||
_MAX_HISTORY_MSG_CHARS = 12000
|
||||
|
||||
|
||||
class ConversationManager:
|
||||
|
|
@ -33,6 +35,32 @@ class ConversationManager:
|
|||
self._lastSummarizedRound: int = 0
|
||||
self._ragContextInjected: bool = False
|
||||
|
||||
def loadHistory(self, messages: List[Dict[str, Any]]):
    """Load prior conversation messages for follow-up context.

    Accepts messages with {role, content/message} format (as stored in DB).
    Only user/assistant turns with non-blank content are kept; oversized
    messages are clipped and only the most recent entries are retained so
    the context window stays bounded. Must be called BEFORE addUserMessage
    with the current prompt.
    """
    if not messages:
        return

    count = 0
    for entry in messages[-_MAX_HISTORY_MESSAGES:]:
        role = entry.get("role", "")
        text = entry.get("content", "") or entry.get("message", "") or ""
        if role in ("user", "assistant") and text.strip():
            if len(text) > _MAX_HISTORY_MSG_CHARS:
                text = text[:_MAX_HISTORY_MSG_CHARS] + "…"
            self._messages.append({"role": role, "content": text})
            count += 1

    if count:
        logger.info(f"Loaded {count} history messages into conversation context")
|
||||
|
||||
@property
|
||||
def messages(self) -> List[Dict[str, Any]]:
|
||||
"""Current messages for the next AI call (internal markers stripped)."""
|
||||
|
|
|
|||
|
|
@ -109,6 +109,7 @@ class AgentService:
|
|||
workflowId: str = None,
|
||||
additionalTools: List[Dict[str, Any]] = None,
|
||||
userLanguage: str = "",
|
||||
conversationHistory: List[Dict[str, Any]] = None,
|
||||
) -> AsyncGenerator[AgentEvent, None]:
|
||||
"""Run an agent with the given prompt and tools.
|
||||
|
||||
|
|
@ -120,6 +121,7 @@ class AgentService:
|
|||
workflowId: Workflow ID for tracking and billing
|
||||
additionalTools: Extra tool definitions to register dynamically
|
||||
userLanguage: ISO 639-1 language code; falls back to user.language from profile
|
||||
conversationHistory: Prior messages for follow-up context
|
||||
|
||||
Yields:
|
||||
AgentEvent for each step (SSE-ready)
|
||||
|
|
@ -154,6 +156,7 @@ class AgentService:
|
|||
mandateId=self.services.mandateId or "",
|
||||
aiCallStreamFn=aiCallStreamFn,
|
||||
userLanguage=resolvedLanguage,
|
||||
conversationHistory=conversationHistory,
|
||||
):
|
||||
if event.type == AgentEventTypeEnum.AGENT_SUMMARY:
|
||||
await self._persistTrace(workflowId, event.data or {})
|
||||
|
|
|
|||
Loading…
Reference in a new issue