From 8592cdd790404e0a592b07fa70f2a0fa8c5d2f15 Mon Sep 17 00:00:00 2001
From: ValueOn AG <p.motsch@valueon.ch>
Date: Sat, 16 Aug 2025 23:32:36 +0200
Subject: [PATCH] stable workflow

---
 modules/chat/OLD_BACKUP managerChat.py       | 3078 ------------------
 modules/chat/documents/documentExtraction.py | 1435 +++++++-
 modules/chat/documents/documentGeneration.py |   47 +-
 modules/chat/handling/handlingTasks.py       |  410 ++-
 modules/chat/handling/promptFactory.py       |  139 +-
 modules/chat/managerChat.py                  |   32 +-
 modules/chat/serviceCenter.py                |  116 +-
 modules/interfaces/interfaceAiCalls.py       |   53 +-
 modules/interfaces/interfaceAppObjects.py    |   15 +-
 modules/interfaces/interfaceChatModel.py     |    7 +-
 modules/interfaces/interfaceChatObjects.py   |   23 +
 modules/methods/methodDocument.py            |  461 ++-
 modules/methods/methodOutlook.py             |  325 +-
 modules/methods/methodSharepoint.py          |    4 +-
 modules/workflow/managerWorkflow.py          |   81 +-
 requirements.txt                             |   12 +
 test_documentExtraction.py                   |  855 +++++
 test_excel_processing.py                     |  189 ++
 web_search_20250717_140455.txt               |    0
 web_search_20250717_144557.txt               |    0
 20 files changed, 3701 insertions(+), 3581 deletions(-)
 delete mode 100644 modules/chat/OLD_BACKUP managerChat.py
 create mode 100644 test_documentExtraction.py
 create mode 100644 test_excel_processing.py
 delete mode 100644 web_search_20250717_140455.txt
 delete mode 100644 web_search_20250717_144557.txt

diff --git a/modules/chat/OLD_BACKUP managerChat.py b/modules/chat/OLD_BACKUP managerChat.py
deleted file mode 100644
index 056efcbc..00000000
--- a/modules/chat/OLD_BACKUP managerChat.py	
+++ /dev/null
@@ -1,3078 +0,0 @@
-import asyncio
-import logging
-import uuid
-import json
-import time
-from typing import Dict, Any, Optional, List, Union
-from datetime import datetime, UTC
-
-from modules.interfaces.interfaceAppModel import User
-from modules.interfaces.interfaceChatModel import (
-    TaskStatus, ChatDocument, TaskItem, TaskAction, TaskResult, ChatStat, ChatLog, ChatMessage, ChatWorkflow, UserInputRequest, ActionResult,
-    ExtractedContent, ContentItem, ContentMetadata, DocumentExchange, TaskStep, TaskContext, ActionExecutionResult, ReviewContext, ReviewResult, TaskPlan, WorkflowResult
-)
-from modules.chat.serviceCenter import ServiceCenter
-from modules.interfaces.interfaceChatObjects import ChatObjects
-
-logger = logging.getLogger(__name__)
-
-# ===== STATE MANAGEMENT AND VALIDATION CLASSES =====
-
-class TaskExecutionState:
-    """Manages state during task execution with retry logic"""
-    def __init__(self, task_step: TaskStep):
-        self.task_step = task_step
-        self.successful_actions: List[ActionExecutionResult] = []  # Preserved across retries
-        self.failed_actions: List[ActionExecutionResult] = []      # For analysis
-        self.current_action_index = 0
-        self.retry_count = 0
-        self.improvements = []
-        self.partial_results = {}     # Store intermediate results
-        self.max_retries = 3
-    def addSuccessfulAction(self, action_result: ActionExecutionResult):
-        self.successful_actions.append(action_result)
-        if action_result.data.get('resultLabel'):
-            self.partial_results[action_result.data['resultLabel']] = action_result
-    def addFailedAction(self, action_result: ActionExecutionResult):
-        self.failed_actions.append(action_result)
-    def getAvailableResults(self) -> list:
-        return [result.data.get('resultLabel', '') for result in self.successful_actions if result.data.get('resultLabel')]
-    def shouldRetryTask(self) -> bool:
-        return len(self.successful_actions) > 0 and len(self.failed_actions) > 0
-    def canRetry(self) -> bool:
-        return self.retry_count < self.max_retries
-    def incrementRetryCount(self):
-        self.retry_count += 1
-    def getFailurePatterns(self) -> list:
-        patterns = []
-        for action in self.failed_actions:
-            error = action.error.lower() if action.error else ''
-            if "timeout" in error:
-                patterns.append("timeout_issues")
-            elif "document_not_found" in error or "file not found" in error:
-                patterns.append("document_reference_issues")
-            elif "empty_result" in error or "no content" in error:
-                patterns.append("content_extraction_issues")
-            elif "invalid_format" in error or "wrong format" in error:
-                patterns.append("format_issues")
-            elif "permission" in error or "access denied" in error:
-                patterns.append("permission_issues")
-        return list(set(patterns))
-
-class ActionValidator:
-    """Generic AI-based action result validation"""
-    def __init__(self, chat_manager):
-        self.chat_manager = chat_manager
-    
-    async def validateActionResult(self, action_result: ActionResult, action: TaskAction, context: TaskContext) -> dict:
-        """Generic action validation using AI"""
-        try:
-            # Create generic validation prompt
-            prompt = self._createGenericValidationPrompt(action_result, action, context)
-            response = await self.chat_manager._callAIWithCircuitBreaker(prompt, "action_validation")
-            validation = self._parseValidationResponse(response)
-            
-            # Add action metadata
-            validation['action_id'] = action.id
-            validation['action_method'] = action.execMethod
-            validation['action_name'] = action.execAction
-            validation['result_label'] = action.execResultLabel
-            
-            return validation
-        except Exception as e:
-            logger.error(f"Error validating action result: {str(e)}")
-            return {
-                'status': 'success',
-                'reason': f'Validation failed: {str(e)}',
-                'confidence': 0.5,
-                'improvements': [],
-                'action_id': action.id,
-                'action_method': action.execMethod,
-                'action_name': action.execAction,
-                'result_label': action.execResultLabel
-            }
-    
-    def _createGenericValidationPrompt(self, action_result: ActionResult, action: TaskAction, context: TaskContext) -> str:
-        """Create a validation prompt focused on result file delivery"""
-        # Extract data from ActionResult model
-        success = action_result.success
-        result_data = action_result.data
-        error = action_result.error
-        validation_messages = action_result.validation
-        
-        # Extract result text from data
-        result_text = result_data.get("result", "") if isinstance(result_data, dict) else str(result_data)
-        
-        # Get documents from ActionResult data
-        documents = result_data.get("documents", []) if isinstance(result_data, dict) else []
-        doc_count = len(documents)
-        
-        # Extract expected result format from action parameters
-        expected_result_label = action.execResultLabel
-        expected_format = action.execParameters.get('outputFormat', 'unknown')
-        
-        # Extract expected document formats from action
-        expected_document_formats = action.expectedDocumentFormats or []
-        
-        # Check if the result label is present in the action result data
-        actual_result_label = result_data.get("resultLabel", "") if isinstance(result_data, dict) else ""
-        result_label_match = actual_result_label == expected_result_label
-        
-        # Analyze delivered documents and content
-        delivered_files = []
-        delivered_formats = []
-        content_items = []
-        
-        # Check for ChatDocument objects
-        for doc in documents:
-            if hasattr(doc, 'filename'):
-                delivered_files.append(doc.filename)
-                # Extract format information
-                file_extension = self._getFileExtension(doc.filename)
-                mime_type = getattr(doc, 'mimeType', 'application/octet-stream')
-                delivered_formats.append({
-                    'filename': doc.filename,
-                    'extension': file_extension,
-                    'mimeType': mime_type
-                })
-            elif isinstance(doc, dict) and 'filename' in doc:
-                delivered_files.append(doc['filename'])
-                file_extension = self._getFileExtension(doc['filename'])
-                mime_type = doc.get('mimeType', 'application/octet-stream')
-                delivered_formats.append({
-                    'filename': doc['filename'],
-                    'extension': file_extension,
-                    'mimeType': mime_type
-                })
-            else:
-                delivered_files.append(f"document_{len(delivered_files)}")
-                delivered_formats.append({
-                    'filename': f"document_{len(delivered_files)}",
-                    'extension': 'unknown',
-                    'mimeType': 'application/octet-stream'
-                })
-        
-        # Check for ExtractedContent in result data
-        if isinstance(result_data, dict):
-            if 'extractedContent' in result_data:
-                extracted_content = result_data['extractedContent']
-                if hasattr(extracted_content, 'contents'):
-                    content_items = extracted_content.contents
-            elif 'contents' in result_data:
-                content_items = result_data['contents']
-        
-        # If we have delivered files but no content items, consider it successful
-        # This handles the case where content is stored in files rather than result data
-        if delivered_files and not content_items:
-            content_items = [f"File content available in: {', '.join(delivered_files)}"]
-        
-        # Analyze content items
-        content_summary = []
-        for item in content_items:
-            if hasattr(item, 'label') and hasattr(item, 'metadata'):
-                content_summary.append(f"{item.label}: {item.metadata.mimeType if hasattr(item.metadata, 'mimeType') else 'unknown'}")
-            elif isinstance(item, str):
-                content_summary.append(item)
-            else:
-                content_summary.append(str(item))
-        
-        return f"""You are an action result validator. Your primary focus is to validate that the action delivered the promised result files in the promised format.
-
-ACTION DETAILS:
-- Method: {action.execMethod}
-- Action: {action.execAction}
-- Expected Result Label: {expected_result_label}
-- Actual Result Label: {actual_result_label}
-- Result Label Match: {result_label_match}
-- Expected Format: {expected_format}
-- Expected Document Formats: {json.dumps(expected_document_formats, indent=2) if expected_document_formats else 'None specified'}
-- Parameters: {json.dumps(action.execParameters, indent=2)}
-
-RESULT TO VALIDATE:
-- Success: {success}
-- Result Data: {result_text[:500]}{'...' if len(result_text) > 500 else ''}
-- Error: {error}
-- Validation Messages: {', '.join(validation_messages) if validation_messages else 'None'}
-- Documents Produced: {doc_count}
-- Delivered Files: {', '.join(delivered_files) if delivered_files else 'None'}
-- Delivered Formats: {json.dumps(delivered_formats, indent=2) if delivered_formats else 'None'}
-- Content Items: {', '.join(content_summary) if content_summary else 'None'}
-
-CRITICAL VALIDATION CRITERIA:
-1. **Result Label Match**: Does the action result contain the expected result label?
-2. **File Delivery**: Did the action deliver the promised result file(s)?
-3. **Format Compliance**: If expected document formats were specified, do the delivered files match the expected formats?
-4. **Content Quality**: Is the content of the delivered files usable and complete?
-5. **Content Processing**: If content extraction was expected, was it performed correctly?
-
-CONTEXT:
-- Task Description: {context.task_step.description if context.task_step else 'Unknown'}
-- Previous Results: {', '.join(context.previous_results) if context.previous_results else 'None'}
-
-VALIDATION INSTRUCTIONS:
-1. **Result Label Check**: Verify that the expected result label "{expected_result_label}" is present in the action result data. This is the primary success criterion.
-2. **File Delivery**: Check if files were delivered when expected. The individual filenames don't need to match the result label - focus on whether content was actually produced.
-3. **Format Compliance**: If expected document formats were specified, check if delivered files match the expected extensions and MIME types. If no formats were specified, this criterion is satisfied.
-4. **Content Quality**: If files were delivered, consider the action successful. The presence of delivered files indicates content was processed and stored.
-5. **Content Processing**: If files were delivered, assume content extraction was performed correctly. The file delivery is evidence of successful processing.
-6. **Success Criteria**: The action is successful if the result label matches AND files were delivered. If expected formats were specified, they should also match.
-
-IMPORTANT NOTES:
-- The result label must be present in the action result data for success
-- Individual filenames can be different from the result label
-- If files were delivered, consider the action successful even if content details are not provided
-- Focus on whether the action accomplished its intended purpose (file delivery)
-- Empty files should be considered failures, but delivered files indicate success
-
-REQUIRED JSON RESPONSE:
-{{
-    "status": "success|retry|fail",
-    "reason": "Detailed explanation focusing on result label match and content quality",
-    "confidence": 0.0-1.0,
-    "improvements": ["specific improvements if needed"],
-    "quality_score": 1-10,
-    "missing_elements": ["missing result label", "missing files", "content issues"],
-    "suggested_retry_approach": "Specific approach for retry if status is retry"
-}}
-
-NOTE: Respond with ONLY the JSON object. Do not include any explanatory text."""
-    
-    def _parseValidationResponse(self, response: str) -> dict:
-        """Parse the AI validation response"""
-        try:
-            json_start = response.find('{')
-            json_end = response.rfind('}') + 1
-            if json_start == -1 or json_end == 0:
-                raise ValueError("No JSON found in validation response")
-            
-            json_str = response[json_start:json_end]
-            validation = json.loads(json_str)
-            
-            if 'status' not in validation:
-                raise ValueError("Validation response missing 'status' field")
-            
-            # Set defaults for optional fields
-            validation.setdefault('confidence', 0.5)
-            validation.setdefault('improvements', [])
-            validation.setdefault('quality_score', 5)
-            validation.setdefault('missing_elements', [])
-            validation.setdefault('suggested_retry_approach', '')
-            
-            return validation
-        except Exception as e:
-            logger.error(f"Error parsing validation response: {str(e)}")
-            return {
-                'status': 'success',
-                'reason': f'Parse error: {str(e)}',
-                'confidence': 0.5,
-                'improvements': [],
-                'quality_score': 5,
-                'missing_elements': [],
-                'suggested_retry_approach': ''
-            }
-    
-    def _getFileExtension(self, filename: str) -> str:
-        """Extract file extension from filename"""
-        if '.' in filename:
-            return '.' + filename.split('.')[-1]
-        return ''
-
-class ChatManager:
-    """Chat manager with improved AI integration and method handling"""
-    
-    def __init__(self, currentUser: User, chatInterface: ChatObjects):
-        self.currentUser = currentUser
-        self.chatInterface = chatInterface
-        self.service: ServiceCenter = None
-        self.workflow: ChatWorkflow = None
-        
-        # Circuit breaker for AI calls
-        self.ai_failure_count = 0
-        self.ai_last_failure_time = None
-        self.ai_circuit_breaker_threshold = 5
-        self.ai_circuit_breaker_timeout = 300  # 5 minutes
-        
-        # Timeout settings
-        self.ai_call_timeout = 120  # 2 minutes
-        self.task_execution_timeout = 600  # 10 minutes
-
-    # ===== Initialization and Setup =====
-    async def initialize(self, workflow: ChatWorkflow) -> None:
-        """Initialize chat manager with workflow"""
-        self.workflow = workflow
-        self.service = ServiceCenter(self.currentUser, self.workflow)
-
-    # ===== WORKFLOW PHASES =====
-    
-    # Phase 1: High-Level Task Planning
-    async def planHighLevelTasks(self, userInput: str, workflow: ChatWorkflow) -> TaskPlan:
-        """Phase 1: Plan high-level tasks from user input"""
-        try:
-            logger.info(f"Planning high-level tasks for workflow {workflow.id}")
-            
-            # Create planning prompt
-            prompt = self.createTaskPlanningPrompt({
-                'user_request': userInput,
-                'available_documents': self._getAvailableDocuments(workflow),
-                'workflow_id': workflow.id
-            })
-            
-            # Get AI response with fallback mechanism
-            response = await self._callAIWithCircuitBreaker(prompt, "task_planning")
-            
-            # Parse and validate task plan
-            task_plan_dict = self._parseTaskPlanResponse(response)
-            
-            if not self._validateTaskPlan(task_plan_dict):
-                logger.error("Generated task plan failed validation")
-                raise Exception("AI-generated task plan failed validation - AI is required for task planning")
-            
-            # Convert to TaskPlan model
-            tasks = []
-            for task_dict in task_plan_dict.get('tasks', []):
-                task = TaskStep(
-                    id=task_dict.get('id', ''),
-                    description=task_dict.get('description', ''),
-                    dependencies=task_dict.get('dependencies', []),
-                    expected_outputs=task_dict.get('expected_outputs', []),
-                    success_criteria=task_dict.get('success_criteria', []),
-                    required_documents=task_dict.get('required_documents', []),
-                    estimated_complexity=task_dict.get('estimated_complexity'),
-                    ai_prompt=task_dict.get('ai_prompt')
-                )
-                tasks.append(task)
-            
-            task_plan = TaskPlan(
-                overview=task_plan_dict.get('overview', ''),
-                tasks=tasks
-            )
-            
-            # Log the task plan as JSON for debugging
-            logger.info(f"Task plan created for workflow {workflow.id}:")
-            task_plan_json = {
-                'overview': task_plan.overview,
-                'tasks_count': len(task_plan.tasks),
-                'tasks': []
-            }
-            for task in task_plan.tasks:
-                task_json = {
-                    'id': task.id,
-                    'description': task.description,
-                    'dependencies': task.dependencies or [],
-                    'expected_outputs': task.expected_outputs or [],
-                    'success_criteria': task.success_criteria or [],
-                    'required_documents': task.required_documents or [],
-                    'estimated_complexity': task.estimated_complexity or '',
-                    'ai_prompt': task.ai_prompt or ''
-                }
-                task_plan_json['tasks'].append(task_json)
-            logger.info(f"Task Plan: {json.dumps(task_plan_json, indent=2, ensure_ascii=False)}")
-            
-            logger.info(f"High-level task planning completed: {len(task_plan.tasks)} tasks")
-            return task_plan
-            
-        except Exception as e:
-            error_message = str(e)
-            logger.error(f"Error in high-level task planning: {error_message}")
-            
-            # Provide more specific error messages based on the error type
-            if "overloaded" in error_message.lower() or "529" in error_message:
-                detailed_error = "AI service is currently overloaded. Please try again in a few minutes."
-            elif "rate limit" in error_message.lower() or "429" in error_message:
-                detailed_error = "Rate limit exceeded. Please wait before making another request."
-            elif "api key" in error_message.lower() or "401" in error_message:
-                detailed_error = "Invalid API key. Please check your AI service configuration."
-            elif "timeout" in error_message.lower():
-                detailed_error = "AI service request timed out. Please try again."
-            else:
-                detailed_error = f"AI service error: {error_message}"
-            
-            raise Exception(detailed_error)
-    
-    # Phase 2: Task Definition and Action Generation
-    async def defineTaskActions(self, task_step: TaskStep, workflow: ChatWorkflow, previous_results: List[str] = None, 
-                               enhanced_context: TaskContext = None) -> List[TaskAction]:
-        """Phase 2: Define specific actions for a task step with enhanced retry context"""
-        try:
-            logger.info(f"Defining actions for task: {task_step.description if hasattr(task_step, 'description') else 'Unknown'}")
-            
-            # Use enhanced context if provided (for retries), otherwise create basic context
-            if enhanced_context:
-                context = enhanced_context
-            else:
-                context = TaskContext(
-                    task_step=task_step,
-                    workflow=workflow,
-                    workflow_id=workflow.id,
-                    available_documents=self._getAvailableDocuments(workflow),
-                    previous_results=previous_results or [],
-                    improvements=[],
-                    retry_count=0,
-                    previous_action_results=[],
-                    previous_review_result=None,
-                    is_regeneration=False,
-                    failure_patterns=[],
-                    failed_actions=[],
-                    successful_actions=[]
-                )
-            
-            # Generate actions using AI
-            actions = await self._generateActionsForTaskStep(context)
-            
-            # Log the generated actions as JSON for debugging
-            logger.info(f"Generated {len(actions)} actions for task '{task_step.description}':")
-            for i, action in enumerate(actions):
-                logger.info(f"Action {i+1}: {json.dumps(action, indent=2, ensure_ascii=False)}")
-            
-            # Convert to TaskAction objects
-            # Get available document labels for validation
-            available_document_labels = set(self._getAvailableDocuments(workflow))
-            task_actions = []
-            invalid_doc_ref_detected = False
-            # Collect resultLabels of actions defined so far in this step
-            result_labels_so_far = set()
-            for action_dict in actions:
-                # Validate document references in parameters
-                params = action_dict.get('parameters', {})
-                if 'documentList' in params and isinstance(params['documentList'], list):
-                    original_refs = params['documentList']
-                    # Allow references to available documents or to resultLabels of actions defined so far
-                    valid_refs = [ref for ref in original_refs if ref in available_document_labels or ref in result_labels_so_far]
-                    if len(valid_refs) < len(original_refs):
-                        logger.warning(f"Action {action_dict.get('method','?')}.{action_dict.get('action','?')} has invalid document references: {set(original_refs) - set(valid_refs)}. Only using valid: {valid_refs}")
-                        invalid_doc_ref_detected = True
-                    if not valid_refs:
-                        logger.warning(f"Skipping action {action_dict.get('method','?')}.{action_dict.get('action','?')} due to no valid document references.")
-                        continue
-                    params['documentList'] = valid_refs
-                action_data = {
-                    "execMethod": action_dict.get('method', 'unknown'),
-                    "execAction": action_dict.get('action', 'unknown'),
-                    "execParameters": params,
-                    "execResultLabel": action_dict.get('resultLabel', ''),
-                    "expectedDocumentFormats": action_dict.get('expectedDocumentFormats', None),
-                    "status": TaskStatus.PENDING
-                }
-                task_action = self.chatInterface.createTaskAction(action_data)
-                if task_action:
-                    # Log action definition: parameters, input documentLabels, output document label
-                    logger.debug(f"[ACTION DEFINITION] Method: {task_action.execMethod}, Action: {task_action.execAction}, Parameters: {json.dumps(task_action.execParameters, ensure_ascii=False)}, Input documentLabels: {task_action.execParameters.get('documentList', [])}, Output documentLabel: {task_action.execResultLabel}")
-                    task_actions.append(task_action)
-                    # Add this action's resultLabel to the running set for subsequent actions
-                    if action_data["execResultLabel"]:
-                        result_labels_so_far.add(action_data["execResultLabel"])
-                    logger.info(f"Created task action: {task_action.execMethod}.{task_action.execAction}")
-            # If all actions were skipped due to invalid document references, add improvement and return []
-            if not task_actions and invalid_doc_ref_detected:
-                improvement_msg = ("Previous action(s) referenced invalid or unavailable document labels. "
-                                   "Only use document labels listed in AVAILABLE DOCUMENTS. Do not invent or copy message IDs.")
-                if enhanced_context:
-                    if hasattr(enhanced_context, 'improvements') and isinstance(enhanced_context.improvements, list):
-                        enhanced_context.improvements.append(improvement_msg)
-                else:
-                    if hasattr(context, 'improvements') and isinstance(context.improvements, list):
-                        context.improvements.append(improvement_msg)
-                logger.warning("All actions skipped due to invalid document references. Added improvement for retry.")
-                return []
-            
-            # Update stats for task validation (estimate bytes for action validation)
-            if task_actions:
-                # Calculate actual action size for stats
-                action_size = self.service.calculateObjectSize(task_actions)
-                self.service.updateWorkflowStats(eventLabel="action", bytesSent=action_size)
-                
-                # Log the final TaskAction objects as JSON
-                logger.info(f"Final TaskAction objects for task '{task_step.description}':")
-                for i, task_action in enumerate(task_actions):
-                    action_json = {
-                        'id': task_action.id,
-                        'execMethod': task_action.execMethod,
-                        'execAction': task_action.execAction,
-                        'execParameters': task_action.execParameters,
-                        'execResultLabel': task_action.execResultLabel,
-                        'status': task_action.status.value if hasattr(task_action.status, 'value') else str(task_action.status)
-                    }
-                    logger.info(f"TaskAction {i+1}: {json.dumps(action_json, indent=2, ensure_ascii=False)}")
-            
-            logger.info(f"Task action definition completed: {len(task_actions)} actions")
-            return task_actions
-            
-        except Exception as e:
-            logger.error(f"Error defining task actions: {str(e)}")
-            return []
-    
-    # Phase 3: Action Execution
-    async def executeTaskActions(self, task_actions: List[TaskAction], workflow: ChatWorkflow) -> List[ActionExecutionResult]:
-        """Phase 3: Execute all actions for a task with retry mechanism"""
-        try:
-            logger.info(f"Executing {len(task_actions)} task actions")
-            
-            results = []
-            for i, action in enumerate(task_actions):
-                logger.info(f"Executing action {i+1}/{len(task_actions)}: {action.execMethod}.{action.execAction}")
-                
-                # Execute single action with retry mechanism
-                result = await self._executeSingleAction(action, workflow)
-                results.append(result)
-                
-                # If action failed after all retries, continue with next action instead of stopping
-                if not result.success:
-                    logger.error(f"Action {i+1} failed after retries, continuing with next action")
-                    # Don't break - continue with remaining actions
-                    continue
-            
-            logger.info(f"Task action execution completed: {len(results)} results")
-            return results
-            
-        except Exception as e:
-            logger.error(f"Error executing task actions: {str(e)}")
-            return []
-    
-    # Phase 4: Task Review and Quality Assessment
-    async def reviewTaskCompletion(self, task_step: TaskStep, task_actions: List[TaskAction], 
-                                 action_results: List[ActionExecutionResult], workflow: ChatWorkflow) -> ReviewResult:
-        """Phase 4: Review task completion and decide next steps"""
-        try:
-            logger.info(f"Reviewing task completion: {task_step.description}")
-            
-            # Create step result summary from action results
-            step_result = {
-                'task_step': task_step,
-                'action_results': action_results,
-                'successful_actions': sum(1 for result in action_results if result.success),
-                'total_actions': len(action_results),
-                'results': [result.data.get('result', '') for result in action_results if result.success],
-                'errors': [result.error for result in action_results if not result.success]
-            }
-            
-            # Prepare review context
-            review_context = ReviewContext(
-                task_step=task_step,
-                task_actions=task_actions,
-                action_results=action_results,
-                step_result=step_result,
-                workflow_id=workflow.id,
-                previous_results=self._getPreviousResultsFromActions(task_actions)
-            )
-            
-            # Use AI to review the results
-            review = await self._performTaskReview(review_context)
-            
-            # Add quality metrics
-            quality_metrics = self._calculateTaskQualityMetrics(task_step, action_results)
-            
-            logger.info(f"Task review completed: {review.status}")
-            return ReviewResult(
-                status=review.status,
-                reason=review.reason,
-                improvements=review.improvements,
-                quality_score=review.quality_score,
-                missing_outputs=review.missing_outputs,
-                met_criteria=review.met_criteria,
-                unmet_criteria=review.unmet_criteria,
-                confidence=review.confidence
-            )
-            
-        except Exception as e:
-            logger.error(f"Error reviewing task completion: {str(e)}")
-            return ReviewResult(
-                status='failed',
-                reason=f'Review failed: {str(e)}',
-                quality_score=0,
-                confidence=0
-            )
-    
-    # Phase 5: Task Handover and State Management
-    async def prepareTaskHandover(self, task_step: TaskStep, task_actions: List[TaskAction], 
-                                review_result: ReviewResult, workflow: ChatWorkflow) -> Dict[str, Any]:
-        """Phase 5: Prepare results for next task or workflow completion"""
-        try:
-            logger.info(f"Preparing task handover: {task_step.description}")
-            
-            # Update task actions with results
-            for action in task_actions:
-                if action.status == TaskStatus.PENDING:
-                    action.status = TaskStatus.COMPLETED if review_result.status == 'success' else TaskStatus.FAILED
-            
-            # Create serializable task actions
-            task_actions_serializable = []
-            for action in task_actions:
-                action_dict = {
-                    'id': action.id,
-                    'execMethod': action.execMethod,
-                    'execAction': action.execAction,
-                    'execParameters': action.execParameters,
-                    'execResultLabel': action.execResultLabel,
-                    'status': action.status.value if hasattr(action.status, 'value') else str(action.status)
-                }
-                task_actions_serializable.append(action_dict)
-            
-            # Create handover data
-            handover_data = {
-                'task_step': task_step,
-                'task_actions': task_actions_serializable,
-                'review_result': review_result,
-                'next_task_ready': review_result.status == 'success',
-                'available_results': self._getPreviousResultsFromActions(task_actions)
-            }
-            
-            logger.info(f"Task handover prepared: next_task_ready={handover_data['next_task_ready']}")
-            return handover_data
-            
-        except Exception as e:
-            logger.error(f"Error preparing task handover: {str(e)}")
-            # Create serializable task actions for exception case
-            task_actions_serializable = []
-            for action in task_actions:
-                action_dict = {
-                    'id': action.id,
-                    'execMethod': action.execMethod,
-                    'execAction': action.execAction,
-                    'execParameters': action.execParameters,
-                    'execResultLabel': action.execResultLabel,
-                    'status': action.status.value if hasattr(action.status, 'value') else str(action.status)
-                }
-                task_actions_serializable.append(action_dict)
-            
-            return {
-                'task_step': task_step,
-                'task_actions': task_actions_serializable,
-                'review_result': review_result,
-                'next_task_ready': False,
-                'available_results': []
-            }
-    
-
-
-
-
-    # ===== Utility Methods =====
-
-    async def processFileIds(self, fileIds: List[str]) -> List[ChatDocument]:
-        """Process file IDs and return ChatDocument objects"""
-        documents = []
-        
-        for fileId in fileIds:
-            try:
-                # Ensure service is initialized
-                if not hasattr(self, 'service') or not self.service:
-                    logger.error(f"Service not initialized for file ID {fileId}")
-                    continue
-                
-                # Get file info from service
-                fileInfo = self.service.getFileInfo(fileId)
-                if fileInfo:
-                    # Create document using interface
-                    documentData = {
-                        "fileId": fileId,
-                        "filename": fileInfo.get("filename", "unknown"),
-                        "fileSize": fileInfo.get("size", 0),
-                        "mimeType": fileInfo.get("mimeType", "application/octet-stream")
-                    }
-                    document = self.chatInterface.createChatDocument(documentData)
-                    if document:
-                        documents.append(document)
-                        logger.info(f"Processed file ID {fileId} -> {document.filename}")
-                else:
-                    logger.warning(f"No file info found for file ID {fileId}")
-            except Exception as e:
-                logger.error(f"Error processing file ID {fileId}: {str(e)}")
-        
-        
-        return documents
-
-    def setUserLanguage(self, language: str) -> None:
-        """Set user language for the chat manager"""
-        if hasattr(self, 'service') and self.service:
-            self.service.user.language = language 
-
-    # ===== Enhanced Task Planning Methods =====
-    
-    async def _callAIWithCircuitBreaker(self, prompt: str, context: str) -> str:
-        """Call AI with intelligent routing based on complexity and circuit breaker pattern"""
-        max_retries = 3
-        base_delay = 2  # Start with 2 seconds
-        
-        for attempt in range(max_retries):
-            try:
-                # Check circuit breaker
-                if self._isCircuitBreakerOpen():
-                    raise Exception("AI circuit breaker is open - too many recent failures")
-                
-                # Determine which AI service to use based on complexity
-                ai_choice = self._determineAIChoice(prompt, context)
-                logger.debug(f"AI choice for {context}: {ai_choice} (attempt {attempt + 1}/{max_retries})")
-                
-                if ai_choice == "advanced":
-                    # Use advanced AI for complex tasks
-                    try:
-                        response = await asyncio.wait_for(
-                            self._callAdvancedAI(prompt, context),
-                            timeout=self.ai_call_timeout
-                        )
-                        
-                        # Reset failure count on success
-                        self.ai_failure_count = 0
-                        logger.info(f"Advanced AI call successful for {context}")
-                        return response
-                        
-                    except Exception as advanced_error:
-                        error_message = str(advanced_error)
-                        logger.warning(f"Advanced AI call failed for {context}: {error_message}")
-                        
-                        # Fall back to basic AI for complex tasks
-                        logger.info(f"Falling back to basic AI for complex task: {context}")
-                        try:
-                            response = await asyncio.wait_for(
-                                self._callStandardAI(prompt, context),
-                                timeout=self.ai_call_timeout
-                            )
-                            
-                            # Reset failure count on success
-                            self.ai_failure_count = 0
-                            logger.info(f"Basic AI fallback successful for complex task: {context}")
-                            return response
-                            
-                        except Exception as standard_error:
-                            # Both failed for complex task
-                            error_message = f"Advanced AI failed: {str(advanced_error)}. Basic AI failed: {str(standard_error)}"
-                            raise Exception(error_message)
-                
-                else:  # basic
-                    # Use basic AI for simple tasks
-                    try:
-                        response = await asyncio.wait_for(
-                            self._callStandardAI(prompt, context),
-                            timeout=self.ai_call_timeout
-                        )
-                        
-                        # Reset failure count on success
-                        self.ai_failure_count = 0
-                        logger.info(f"Basic AI call successful for {context}")
-                        return response
-                        
-                    except Exception as basic_error:
-                        error_message = str(basic_error)
-                        logger.warning(f"Basic AI call failed for {context}: {error_message}")
-                        
-                        # Only upgrade to advanced AI for critical simple tasks
-                        if self._isCriticalTask(context):
-                            logger.info(f"Upgrading to advanced AI for critical simple task: {context}")
-                            try:
-                                response = await asyncio.wait_for(
-                                    self._callAdvancedAI(prompt, context),
-                                    timeout=self.ai_call_timeout
-                                )
-                                
-                                # Reset failure count on success
-                                self.ai_failure_count = 0
-                                logger.info(f"Advanced AI upgrade successful for critical task: {context}")
-                                return response
-                                
-                            except Exception as advanced_error:
-                                # Both failed for critical task
-                                error_message = f"Basic AI failed: {str(basic_error)}. Advanced AI failed: {str(advanced_error)}"
-                                raise Exception(error_message)
-                        else:
-                            # Non-critical simple task failed
-                            raise Exception(f"Basic AI failed for simple task: {error_message}")
-                
-            except asyncio.TimeoutError:
-                self._recordAIFailure("Timeout")
-                if attempt < max_retries - 1:
-                    delay = base_delay * (2 ** attempt)  # Exponential backoff
-                    logger.warning(f"AI call timed out, retrying in {delay} seconds (attempt {attempt + 1}/{max_retries})")
-                    await asyncio.sleep(delay)
-                    continue
-                else:
-                    raise Exception(f"AI call timed out after {self.ai_call_timeout} seconds")
-                    
-            except Exception as e:
-                error_message = str(e)
-                
-                # Special handling for overloaded service (529 error)
-                if "overloaded" in error_message.lower() or "529" in error_message:
-                    if attempt < max_retries - 1:
-                        delay = base_delay * (2 ** attempt)  # Exponential backoff
-                        logger.warning(f"AI service overloaded, retrying in {delay} seconds (attempt {attempt + 1}/{max_retries})")
-                        await asyncio.sleep(delay)
-                        continue
-                    else:
-                        # Don't record this as a circuit breaker failure since it's a service issue
-                        raise Exception("AI service is currently overloaded. Please try again in a few minutes.")
-                
-                # For other errors, record failure and potentially retry
-                self._recordAIFailure(error_message)
-                if attempt < max_retries - 1:
-                    delay = base_delay * (2 ** attempt)  # Exponential backoff
-                    logger.warning(f"AI call failed, retrying in {delay} seconds (attempt {attempt + 1}/{max_retries}): {error_message}")
-                    await asyncio.sleep(delay)
-                    continue
-                else:
-                    raise
-
-    def _isCircuitBreakerOpen(self) -> bool:
-        """Check if circuit breaker is open"""
-        if self.ai_failure_count >= self.ai_circuit_breaker_threshold:
-            if self.ai_last_failure_time:
-                time_since_failure = (datetime.now(UTC) - self.ai_last_failure_time).total_seconds()
-                if time_since_failure < self.ai_circuit_breaker_timeout:
-                    return True
-                else:
-                    # Reset circuit breaker after timeout
-                    self.ai_failure_count = 0
-                    self.ai_last_failure_time = None
-        return False
-
-    def _determineAIChoice(self, prompt: str, context: str) -> str:
-        """Determine whether to use advanced or basic AI based on task complexity"""
-        
-        # Check for forced AI choice based on context
-        forced_choice = self._getForcedAIChoice(context)
-        if forced_choice:
-            logger.debug(f"Forced AI choice for {context}: {forced_choice}")
-            return forced_choice
-        
-        # Define complex task patterns that require advanced AI
-        complex_patterns = [
-            # Task planning and workflow management
-            "task_planning", "action_generation", "result_review", "task_completion_validation",
-            
-            # Complex document analysis
-            "document", "extract", "analysis", "comprehensive", "detailed analysis",
-            
-            # Multi-step reasoning
-            "plan", "strategy", "evaluate", "assess", "compare", "analyze",
-            
-            # Complex business logic
-            "workflow", "task", "action", "validation", "review", "assessment",
-            
-            # Critical decision making
-            "decision", "recommendation", "evaluation", "quality", "success criteria",
-            
-            # Complex prompts
-            "JSON", "structured", "format", "validation", "improvements", "quality_score"
-        ]
-        
-        # Define simple task patterns that can use basic AI
-        simple_patterns = [
-            # Basic text processing
-            "summarize", "translate", "format", "convert", "extract text",
-            
-            # Simple queries
-            "find", "search", "list", "get", "retrieve",
-            
-            # Basic operations
-            "send", "upload", "download", "create", "delete",
-            
-            # Simple responses
-            "confirm", "acknowledge", "status", "info"
-        ]
-        
-        # Check prompt and context for complexity indicators
-        combined_text = f"{prompt} {context}".lower()
-        
-        # Count complex indicators
-        complex_count = sum(1 for pattern in complex_patterns if pattern in combined_text)
-        
-        # Count simple indicators
-        simple_count = sum(1 for pattern in simple_patterns if pattern in combined_text)
-        
-        # Additional complexity factors
-        prompt_length = len(prompt)
-        has_json_requirement = "json" in combined_text and ("{" in prompt or "}" in prompt)
-        has_structured_output = any(word in combined_text for word in ["format", "structure", "template"])
-        has_validation = any(word in combined_text for word in ["validate", "check", "verify", "quality"])
-        
-        # Calculate complexity score
-        complexity_score = 0
-        complexity_score += complex_count * 2  # Complex patterns worth more
-        complexity_score += simple_count * 1   # Simple patterns worth less
-        complexity_score += (prompt_length > 1000) * 3  # Long prompts are complex
-        complexity_score += has_json_requirement * 5  # JSON requirements are complex
-        complexity_score += has_structured_output * 3  # Structured output is complex
-        complexity_score += has_validation * 4  # Validation is complex
-        
-        # Determine AI choice based on complexity score
-        if complexity_score >= 5:
-            logger.debug(f"Complex task detected (score: {complexity_score}) - using advanced AI for {context}")
-            return "advanced"
-        else:
-            logger.debug(f"Simple task detected (score: {complexity_score}) - using basic AI for {context}")
-            return "basic"
-    
-    def _getForcedAIChoice(self, context: str) -> str:
-        """Get forced AI choice for specific contexts (can be overridden)"""
-        
-        # Define contexts that always use advanced AI
-        advanced_contexts = [
-            "task_planning",           # Always use advanced for task planning
-            "action_generation",       # Always use advanced for action generation
-            "result_review",           # Always use advanced for result review
-            "task_completion_validation"  # Always use advanced for validation
-        ]
-        
-        # Define contexts that always use basic AI
-        basic_contexts = [
-            "summarize",              # Always use basic for summarization
-            "translate",              # Always use basic for translation
-            "format",                 # Always use basic for formatting
-            "status",                 # Always use basic for status updates
-            "info"                    # Always use basic for info queries
-        ]
-        
-        context_lower = context.lower()
-        
-        # Check for forced advanced AI
-        for advanced_context in advanced_contexts:
-            if advanced_context in context_lower:
-                return "advanced"
-        
-        # Check for forced basic AI
-        for basic_context in basic_contexts:
-            if basic_context in context_lower:
-                return "basic"
-        
-        # No forced choice
-        return None
-    
-    def _isCriticalTask(self, context: str) -> bool:
-        """Determine if a simple task is critical enough to warrant advanced AI upgrade"""
-        
-        # Define critical task patterns
-        critical_patterns = [
-            # Workflow critical tasks
-            "task_planning", "workflow", "critical", "essential",
-            
-            # User-facing decisions
-            "decision", "recommendation", "evaluation", "assessment",
-            
-            # Quality-sensitive tasks
-            "quality", "validation", "review", "check",
-            
-            # Business-critical operations
-            "business", "strategy", "planning", "analysis"
-        ]
-        
-        context_lower = context.lower()
-        
-        # Check if context contains critical patterns
-        is_critical = any(pattern in context_lower for pattern in critical_patterns)
-        
-        if is_critical:
-            logger.debug(f"Critical task detected - {context}")
-        
-        return is_critical
-
-    def _recordAIFailure(self, error: str):
-        """Record AI failure for circuit breaker"""
-        self.ai_failure_count += 1
-        self.ai_last_failure_time = datetime.now(UTC)
-        logger.warning(f"AI failure recorded ({self.ai_failure_count}/{self.ai_circuit_breaker_threshold}): {error}")
-
-    def _validateTaskPlan(self, task_plan: Dict[str, Any]) -> bool:
-        """Validate task plan structure and dependencies"""
-        try:
-            if not isinstance(task_plan, dict):
-                return False
-            
-            if 'tasks' not in task_plan or not isinstance(task_plan['tasks'], list):
-                return False
-            
-            # Check each task
-            task_ids = set()
-            for task in task_plan['tasks']:
-                if not isinstance(task, dict):
-                    return False
-                
-                required_fields = ['id', 'description', 'expected_outputs', 'success_criteria']
-                if not all(field in task for field in required_fields):
-                    return False
-                
-                # Check for duplicate task IDs
-                if task['id'] in task_ids:
-                    return False
-                task_ids.add(task['id'])
-                
-                # Validate dependencies
-                dependencies = task.get('dependencies', [])
-                if not isinstance(dependencies, list):
-                    return False
-                
-                # Check that dependencies reference existing tasks
-                for dep in dependencies:
-                    if dep not in task_ids and dep != 'task_0':  # Allow task_0 as special case
-                        return False
-                
-                # Validate ai_prompt if present (optional field)
-                if 'ai_prompt' in task and not isinstance(task['ai_prompt'], str):
-                    return False
-            
-            return True
-            
-        except Exception as e:
-            logger.error(f"Error validating task plan: {str(e)}")
-            return False
-
- 
-    def _validateActions(self, actions: List[Dict[str, Any]], context: TaskContext) -> bool:
-        """Validate generated actions"""
-        try:
-            if not isinstance(actions, list):
-                logger.error("Actions must be a list")
-                return False
-            
-            if len(actions) == 0:
-                logger.warning("No actions generated")
-                return False
-            
-            for i, action in enumerate(actions):
-                if not isinstance(action, dict):
-                    logger.error(f"Action {i} must be a dictionary")
-                    return False
-                
-                # Check required fields
-                required_fields = ['method', 'action', 'parameters', 'resultLabel']
-                missing_fields = []
-                for field in required_fields:
-                    if field not in action or not action[field]:
-                        missing_fields.append(field)
-                
-                if missing_fields:
-                    logger.error(f"Action {i} missing required fields: {missing_fields}")
-                    return False
-                
-                # Validate result label format
-                result_label = action.get('resultLabel', '')
-                if not result_label.startswith('task'):
-                    logger.error(f"Action {i} result label must start with 'task': {result_label}")
-                    return False
-                
-                # Validate parameters
-                parameters = action.get('parameters', {})
-                if not isinstance(parameters, dict):
-                    logger.error(f"Action {i} parameters must be a dictionary")
-                    return False
-            
-            logger.info(f"Successfully validated {len(actions)} actions")
-            return True
-            
-        except Exception as e:
-            logger.error(f"Error validating actions: {str(e)}")
-            return False
-
-
-
-    # ===== Prompt Creation Methods =====
-    
-    def createTaskPlanningPrompt(self, context: Dict[str, Any]) -> str:
-        """Create prompt for task planning"""
-        return f"""You are a task planning AI that analyzes user requests and creates structured task plans.
-
-USER REQUEST: {context['user_request']}
-
-AVAILABLE DOCUMENTS: {', '.join(context['available_documents'])}
-
-INSTRUCTIONS:
-1. Analyze the user request and available documents
-2. Break down the request into 2-4 meaningful high-level task steps
-3. Focus on business outcomes, not technical operations
-4. For document processing, create ONE task with a comprehensive AI prompt rather than multiple granular tasks
-5. Each task should produce meaningful, usable outputs
-6. Ensure proper handover between tasks using result labels
-7. Return a JSON object with the exact structure shown below
-
-TASK PLANNING PRINCIPLES:
-- Combine related operations into single tasks (e.g., "Extract and analyze all candidate profiles" instead of separate "read file" and "analyze content" tasks)
-- Use comprehensive AI prompts for document processing rather than multiple small tasks
-- Focus on business value and outcomes
-- Keep tasks at a meaningful level of abstraction
-- Each task should produce results that can be used by subsequent tasks
-
-REQUIRED JSON STRUCTURE:
-{{
-    "overview": "Brief description of the overall plan",
-    "tasks": [
-        {{
-            "id": "task_1",
-            "description": "Clear description of what this task accomplishes (business outcome)",
-            "dependencies": ["task_0"],  // IDs of tasks that must complete first
-            "expected_outputs": ["output1", "output2"],
-            "success_criteria": ["criteria1", "criteria2"],
-            "required_documents": ["doc1", "doc2"],
-            "estimated_complexity": "low|medium|high",
-            "ai_prompt": "Comprehensive AI prompt for document processing tasks (if applicable)"
-        }}
-    ]
-}}
-
-EXAMPLES OF GOOD TASK DESCRIPTIONS:
-- "Extract and analyze all candidate profiles to identify key qualifications and experience"
-- "Create evaluation matrix and rate candidates against product designer criteria"
-- "Generate comprehensive PowerPoint presentation for management decision"
-- "Store final presentation in SharePoint for specified account"
-
-EXAMPLES OF BAD TASK DESCRIPTIONS:
-- "Open and read the PDF file" (too granular)
-- "Identify table structure" (technical detail)
-- "Convert data to CSV format" (implementation detail)
-
-NOTE: Respond with ONLY the JSON object. Do not include any explanatory text."""
-
-    async def createActionDefinitionPrompt(self, context: TaskContext) -> str:
-        """Create prompt for action generation with enhanced document extraction guidance and retry context"""
-        task_step = context.task_step
-        workflow = context.workflow
-        available_docs = context.available_documents or []
-        previous_results = context.previous_results or []
-        improvements = context.improvements or []
-        retry_count = context.retry_count or 0
-        previous_action_results = context.previous_action_results or []
-        previous_review_result = context.previous_review_result
-        
-        # Get available methods and actions with signatures
-        methodList = self.service.getMethodsList()
-        method_actions = {}
-        for sig in methodList:
-            if '.' in sig:
-                method, rest = sig.split('.', 1)
-                action = rest.split('(')[0]
-                method_actions.setdefault(method, []).append((action, sig))
-        
-        # Get workflow history
-        messageSummary = await self.service.summarizeChat(workflow.messages)
-        
-        # Get available documents and connections
-        docRefs = self.service.getDocumentReferenceList()
-        connRefs = self.service.getConnectionReferenceList()
-        all_doc_refs = docRefs.get('chat', []) + docRefs.get('history', [])
-        
-        # Build AVAILABLE METHODS section
-        available_methods_str = ''
-        for method, actions in method_actions.items():
-            available_methods_str += f"- {method}:\n"
-            for action, sig in actions:
-                available_methods_str += f"    - {action}: {sig}\n"
-        
-        # Get AI prompt from task step if available
-        task_ai_prompt = task_step.ai_prompt or ''
-        
-        # Build retry context section
-        retry_context = ""
-        if retry_count > 0:
-            retry_context = f"""
-RETRY CONTEXT (Attempt {retry_count}):
-Previous action results that failed or were incomplete:
-"""
-            for i, result in enumerate(previous_action_results):
-                retry_context += f"- Action {i+1}: {result.actionMethod or 'unknown'}.{result.actionName or 'unknown'}\n"
-                retry_context += f"  Status: {result.success and 'success' or 'failed'}\n"
-                retry_context += f"  Error: {result.error or 'None'}\n"
-                retry_context += f"  Result: {(result.data.get('result', '') if result.data else '')[:100]}...\n"
-            
-            if previous_review_result:
-                retry_context += f"""
-Previous review feedback:
-- Status: {previous_review_result.status or 'unknown'}
-- Reason: {previous_review_result.reason or 'No reason provided'}
-- Quality Score: {previous_review_result.quality_score or 0}/10
-- Missing Outputs: {', '.join(previous_review_result.missing_outputs or [])}
-- Unmet Criteria: {', '.join(previous_review_result.unmet_criteria or [])}
-"""
-        
-        # Precompute all complex string expressions to avoid f-string nesting issues
-        expected_outputs_str = ', '.join(task_step.expected_outputs or [])
-        success_criteria_str = ', '.join(task_step.success_criteria or [])
-        previous_results_str = ', '.join(previous_results) if previous_results else 'None'
-        improvements_str = str(improvements) if improvements else 'None'
-        available_connections_str = '\n'.join(f"- {conn}" for conn in connRefs)
-        available_documents_str = '\n'.join(f"- {doc.documentsLabel} contains {', '.join(doc.documents)}" for doc in all_doc_refs)
-        # Build the prompt using only precomputed variables
-        prompt = f"""
-You are an action generation AI that creates specific actions to accomplish a task step.
-
-DOCUMENT REFERENCE TYPES:
-- docItem: Reference to a single document. Format: "docItem:<id>:<filename>"
-- docList: Reference to a group of documents under a label. Format: <label> (e.g., "task1_action2_results").
-  - Each docList label maps to a list of docItem references (see AVAILABLE DOCUMENTS).
-  - A label like "task1_action2_results" refers to the output of action 2 in task 1.
-
-CRITICAL DOCUMENT REFERENCE RULES:
-- ONLY use the exact labels listed in AVAILABLE DOCUMENTS below
-- NEVER invent new labels or use message IDs
-- NEVER use formats like "msg_xxx:documents" or "task_X_results" (these will fail)
-- ONLY use the exact labels shown in AVAILABLE DOCUMENTS
-- **When generating multiple actions, you may only use as input documents those that are already present in AVAILABLE DOCUMENTS or produced by actions that come earlier in the list. Do NOT use as input any document label that will be produced by a later action.**
-
-TASK STEP: {task_step.description} (ID: {task_step.id})
-EXPECTED OUTPUTS: {expected_outputs_str}
-SUCCESS CRITERIA: {success_criteria_str}
-TASK AI PROMPT: {task_ai_prompt if task_ai_prompt else 'None provided'}
-
-CONTEXT - Chat History:
-{messageSummary}
-
-AVAILABLE METHODS AND ACTIONS (with signatures):
-{available_methods_str}
-
-AVAILABLE CONNECTIONS:
-{available_connections_str}
-
-AVAILABLE DOCUMENTS:
-{available_documents_str}
-
-DOCUMENT REFERENCE EXAMPLES:
-✅ CORRECT: Use exact labels from AVAILABLE DOCUMENTS above
-- "task2_action1_personnel_search"
-- "task2_action3_personnel_analysis"
-- "docItem:doc_abc:file1.txt"
-- "docList:msg123:user_uploads" (supported format, but use actual labels instead)
-
-❌ INCORRECT: These will cause errors
-- "msg_xxx:documents" (invalid format - missing docList/docItem prefix)
-- "task_2_results" (not a valid label - use exact labels from AVAILABLE DOCUMENTS)
-- Inventing message IDs instead of using actual document labels
-
-PREVIOUS RESULTS: {previous_results_str}
-IMPROVEMENTS NEEDED: {improvements_str}{retry_context}
-
-ACTION GENERATION PRINCIPLES:
-- Create meaningful actions per task step
-- Use comprehensive AI prompts for document processing
-- Focus on business outcomes, not technical operations
-- Combine related operations into single actions when possible
-- Use the task's AI prompt if provided, or create a comprehensive one
-- Each action should produce meaningful, usable outputs
-- For document extraction, ensure prompts are specific and detailed
-- Include validation steps in extraction prompts
-- If this is a retry, learn from previous failures and improve the approach
-- Address specific issues mentioned in previous review feedback
-- When specifying expectedDocumentFormats, ensure AI prompts explicitly request pure data without markdown formatting
-
-INSTRUCTIONS:
-- Generate actions to accomplish this task step using available documents, connections, and previous results
-- Use docItem for single documents and docList labels for groups of documents as shown in AVAILABLE DOCUMENTS
-- Always pass documentList as a LIST of references (docItem and/or docList)
-- For resultLabel, use the format: "task{{task_id}}_action{{action_number}}_{{short_label}}" where:
-    - {{task_id}} = the current task's id (e.g., 1)
-    - {{action_number}} = the sequence number of the action within the task (e.g., 2)
-    - {{short_label}} = a short, descriptive label for the output (e.g., "analysis_results")
-  Example: "task1_action2_analysis_results"
-- If this is a retry, ensure the new actions address the specific issues from previous attempts
-- Follow the JSON structure below. All fields are required.
-
-REQUIRED JSON STRUCTURE:
-{{
-    "actions": [
-        {{
-            "method": "method_name",  // Use only the method name (e.g., "document")
-            "action": "action_name",  // Use only the action name (e.g., "extract")
-            "parameters": {{
-                "documentList": ["docItem:doc_abc:file1.txt", "task1_action2_results"],
-                "aiPrompt": "Comprehensive AI prompt describing what to accomplish"
-            }},
-            "resultLabel": "task1_action3_analysis_results",
-            "expectedDocumentFormats": [  // OPTIONAL: Specify expected document formats when needed
-                {{
-                    "extension": ".csv",
-                    "mimeType": "text/csv",
-                    "description": "Structured data output"
-                }}
-            ],
-            "description": "What this action accomplishes (business outcome)"
-        }}
-    ]
-}}
-
-FIELD REQUIREMENTS:
-- "method": Must be from AVAILABLE METHODS
-- "action": Must be valid for the method
-- "parameters": Method-specific, must include documentList as a list if required by the signature
-- "resultLabel": Must follow the format above (e.g., "task1_action3_analysis_results")
-- "expectedDocumentFormats": OPTIONAL - Only specify when you need to control output format
-  - Use when you need specific file types (e.g., CSV for data, JSON for structured output)
-  - Omit when format is flexible (e.g., folder queries with mixed file types)
-  - Each format should specify: extension, mimeType, description
-  - When using expectedDocumentFormats, ensure the aiPrompt explicitly requests pure data without markdown formatting
-- "description": Clear summary of the business outcome
-
-EXAMPLES OF GOOD ACTIONS:
-
-1. Document analysis with specific output format (use expectedDocumentFormats):
-{{
-    "method": "document",
-    "action": "extract",
-    "parameters": {{
-        "documentList": ["docItem:doc_57520394-6b6d-41c2-b641-bab3fc6d7f4b:candidate_1_profile.txt"],
-        "aiPrompt": "Extract and analyze the candidate's qualifications, experience, skills, and suitability for the product designer position. Identify key strengths, relevant experience, technical skills, and any areas of concern. Provide a comprehensive assessment that can be used for evaluation."
-    }},
-    "resultLabel": "task1_action1_candidate_analysis",
-    "expectedDocumentFormats": [
-        {{
-            "extension": ".json",
-            "mimeType": "application/json",
-            "description": "Structured candidate analysis data"
-        }}
-    ],
-    "description": "Comprehensive analysis of candidate profile for evaluation"
-}}
-
-2. Multi-document processing with flexible output (omit expectedDocumentFormats):
-{{
-    "method": "document",
-    "action": "extract",
-    "parameters": {{
-        "documentList": ["task1_action1_candidate_analysis", "task1_action2_candidate_analysis", "task1_action3_candidate_analysis"],
-        "aiPrompt": "Compare all three candidate profiles and create an evaluation matrix. Rate each candidate on technical skills, experience level, cultural fit, portfolio quality, and communication skills. Provide clear rankings and recommendations for the product designer position."
-    }},
-    "resultLabel": "task1_action4_evaluation_matrix",
-    "description": "Create comprehensive evaluation matrix comparing all candidates"
-}}
-
-3. Data extraction with specific CSV format:
-{{
-    "method": "document",
-    "action": "extract",
-    "parameters": {{
-        "documentList": ["docItem:doc_abc:table_data.pdf"],
-        "aiPrompt": "Extract all table data and convert to structured CSV format with proper headers and data types. IMPORTANT: Deliver pure CSV data without any markdown formatting, code blocks, or additional text. Output only the CSV content with proper headers and data rows."
-    }},
-    "resultLabel": "task1_action2_structured_data",
-    "expectedDocumentFormats": [
-        {{
-            "extension": ".csv",
-            "mimeType": "text/csv",
-            "description": "Structured table data in CSV format"
-        }}
-    ],
-    "description": "Extract and structure table data for analysis"
-}}
-
-4. Comprehensive summary report from multiple documents (use generateReport):
-{{
-    "method": "document",
-    "action": "generateReport",
-    "parameters": {{
-        "documentList": ["task1_action1_candidate_analysis", "task1_action2_candidate_analysis", "task1_action3_candidate_analysis"],
-        "title": "Comprehensive Candidate Evaluation Report"
-    }},
-    "resultLabel": "task1_action5_summary_report",
-    "description": "Generate a comprehensive, professional HTML report consolidating all candidate analyses and findings"
-}}
-
-5. Correct chaining of actions within a task:
-{{
-    "actions": [
-        {{
-            "method": "document",
-            "action": "extract",
-            "parameters": {{
-                "documentList": ["docItem:doc_abc:file1.txt"],
-                "aiPrompt": "Extract data from file1."
-            }},
-            "resultLabel": "task1_action1_extracted_data",
-            "description": "Extract data from file1."
-        }},
-        {{
-            "method": "document",
-            "action": "generateReport",
-            "parameters": {{
-                "documentList": ["task1_action1_extracted_data"],
-                "title": "Report"
-            }},
-            "resultLabel": "task1_action2_report",
-            "description": "Generate report from extracted data."
-        }}
-    ]
-}}
-
-NOTE: Respond with ONLY the JSON object. Do not include any explanatory text."""
-        # Log excerpt: available documents, user connections, available methods (summarized)
-        logger.debug(f"[ACTION PLAN PROMPT] Available Documents Section:\n{available_documents_str}\nUser Connections Section:\n{available_connections_str}\nAvailable Methods (summarized):\n{', '.join(method_actions.keys())}")
-        return prompt
-
-    def createResultReviewPrompt(self, review_context: ReviewContext) -> str:
-        """Create prompt for result review"""
-        task_step = review_context.task_step
-        step_result = review_context.step_result or {}
-        
-        # Create serializable version of step_result with only metadata (no document content)
-        step_result_serializable = {
-            'task_step': {
-                'id': task_step.id,
-                'description': task_step.description,
-                'expected_outputs': task_step.expected_outputs or [],
-                'success_criteria': task_step.success_criteria or []
-            },
-            'action_results': [],
-            'successful_actions': step_result.get('successful_actions', 0),
-            'total_actions': step_result.get('total_actions', 0),
-            'results_count': len(step_result.get('results', [])),
-            'errors_count': len(step_result.get('errors', []))
-        }
-        
-        # Convert action_results to serializable format with only metadata (no document content)
-        for action_result in review_context.action_results or []:
-            # Extract only document metadata, not content
-            documents_metadata = []
-            for doc in action_result.documents or []:
-                if hasattr(doc, 'filename'):
-                    documents_metadata.append({
-                        'filename': doc.filename,
-                        'fileSize': getattr(doc, 'fileSize', 0),
-                        'mimeType': getattr(doc, 'mimeType', 'unknown')
-                    })
-                elif isinstance(doc, dict):
-                    documents_metadata.append({
-                        'filename': doc.get('filename', 'unknown'),
-                        'fileSize': doc.get('fileSize', 0),
-                        'mimeType': doc.get('mimeType', 'unknown')
-                    })
-            
-            serializable_action_result = {
-                'status': 'completed' if action_result.success else 'failed',
-                'result_summary': action_result.data.get('result', '')[:200] + '...' if len(action_result.data.get('result', '')) > 200 else action_result.data.get('result', ''),
-                'error': action_result.error,
-                'resultLabel': action_result.data.get('resultLabel', ''),
-                'documents_count': len(documents_metadata),
-                'documents_metadata': documents_metadata,
-                'actionId': action_result.actionId,
-                'actionMethod': action_result.actionMethod,
-                'actionName': action_result.actionName,
-                'success_indicator': 'documents' if len(documents_metadata) > 0 else 'text_result' if action_result.data.get('result', '').strip() else 'none'
-            }
-            step_result_serializable['action_results'].append(serializable_action_result)
-        
-        # Fix: Compute JSON string outside the f-string to avoid nested curly braces error
-        step_result_json = json.dumps(step_result_serializable, indent=2, ensure_ascii=False)
-        expected_outputs_str = ', '.join(task_step.expected_outputs or [])
-        success_criteria_str = ', '.join(task_step.success_criteria or [])
-        return f"""You are a result review AI that evaluates task step completion and decides on next actions.
-
-TASK STEP: {task_step.description}
-EXPECTED OUTPUTS: {expected_outputs_str}
-SUCCESS CRITERIA: {success_criteria_str}
-
-STEP RESULT: {step_result_json}
-
-INSTRUCTIONS:
-1. Evaluate if the task step was completed successfully
-2. Check if all expected outputs were produced
-3. Verify if success criteria were met
-4. Decide on next action: continue, retry, or fail
-5. If retry, provide specific improvements needed
-
-IMPORTANT NOTES:
-- Actions can produce either text results OR documents (or both)
-- Empty result_summary is acceptable if documents were produced (documents_count > 0)
-- Focus on whether the action achieved its intended purpose, not just text output
-- Document-based actions (like file extractions) often have empty text results but successful document outputs
-- Check the 'success_indicator' field: 'documents' means success via document output, 'text_result' means success via text, 'none' means no output
-
-REQUIRED JSON STRUCTURE:
-{{
-    "status": "success|retry|failed",
-    "reason": "Explanation of the decision",
-    "improvements": "Specific improvements for retry (if status is retry)",
-    "quality_score": 1-10,
-    "missing_outputs": ["output1", "output2"],
-    "met_criteria": ["criteria1", "criteria2"],
-    "unmet_criteria": ["criteria3", "criteria4"]
-}}
-
-NOTE: Respond with ONLY the JSON object. Do not include any explanatory text."""
-    
-    # ===== HELPER METHODS FOR WORKFLOW PHASES =====
-    
-    async def _generateActionsForTaskStep(self, context: TaskContext) -> List[Dict[str, Any]]:
-        """Generate actions for a specific task step with enhanced retry context"""
-        try:
-            # Prepare prompt for action generation
-            prompt = await self.createActionDefinitionPrompt(context)
-            
-            # Call AI with circuit breaker
-            response = await self._callAIWithCircuitBreaker(prompt, "action_generation")
-            
-            # Parse and validate actions
-            actions = self._parseActionResponse(response)
-            
-            # Validate actions
-            if not self._validateActions(actions, context):
-                logger.error("Generated actions failed validation")
-                raise Exception("AI-generated actions failed validation - AI is required for action generation")
-            
-            logger.info(f"Generated {len(actions)} actions for task step")
-            return actions
-            
-        except Exception as e:
-            logger.error(f"Error generating actions for task step: {str(e)}")
-            raise Exception(f"AI is required for action generation but failed: {str(e)}")
-    
-    async def _executeSingleAction(self, action: TaskAction, workflow: ChatWorkflow) -> ActionResult:
-        """Execute a single action and return ActionResult with enhanced document processing"""
-        try:
-            # Enhance parameters with expected document formats if specified
-            enhanced_parameters = action.execParameters.copy()
-            if action.expectedDocumentFormats:
-                enhanced_parameters['expectedDocumentFormats'] = action.expectedDocumentFormats
-                logger.info(f"Action {action.execMethod}.{action.execAction} expects formats: {action.expectedDocumentFormats}")
-            
-            # Execute the actual method action using the service center
-            result = await self.service.executeAction(
-                methodName=action.execMethod,
-                actionName=action.execAction,
-                parameters=enhanced_parameters
-            )
-            
-            # Always use the execResultLabel from the action definition
-            result_label = action.execResultLabel
-            
-            # Update action based on result
-            if result.success:
-                action.setSuccess()
-                action.result = result.data.get("result", "")
-                action.execResultLabel = result_label
-                
-                # Create and store message in workflow for successful action
-                await self._createActionMessage(action, result, workflow, result_label)
-                
-            else:
-                action.setError(result.error or "Action execution failed")
-            
-            # Enhanced result processing with better document handling
-            documents = result.data.get("documents", [])
-            processed_documents = []
-            
-            # Process documents with better metadata extraction
-            for doc in documents:
-                if hasattr(doc, 'filename') and doc.filename:
-                    # Document object with proper metadata
-                    mime_type = getattr(doc, 'mimeType', 'application/octet-stream')
-                    
-                    # Enhanced MIME type detection for document objects
-                    if mime_type == "application/octet-stream":
-                        mime_type = self._detectMimeTypeFromDocument(doc, doc.filename)
-                    
-                    processed_documents.append({
-                        'filename': doc.filename,
-                        'fileSize': getattr(doc, 'fileSize', 0),
-                        'mimeType': mime_type,
-                        'content': getattr(doc, 'content', ''),
-                        'document': doc
-                    })
-                elif isinstance(doc, dict):
-                    # Dictionary document with metadata
-                    filename = doc.get('documentName', doc.get('filename', f"{action.execMethod}_{action.execAction}_{datetime.now(UTC).strftime('%Y%m%d_%H%M%S')}"))
-                    fileSize = doc.get('fileSize', len(str(doc.get('documentData', ''))))
-                    mimeType = doc.get('mimeType', 'application/octet-stream')
-                    
-                    # Enhanced MIME type detection for dictionary documents
-                    if mimeType == "application/octet-stream":
-                        document_data = doc.get('documentData', '')
-                        mimeType = self._detectMimeTypeFromContent(document_data, filename)
-                    
-                    processed_documents.append({
-                        'filename': filename,
-                        'fileSize': fileSize,
-                        'mimeType': mimeType,
-                        'content': doc.get('documentData', ''),
-                        'document': doc
-                    })
-                else:
-                    # Fallback for unknown document types
-                    logger.warning(f"Unknown document type for action {action.execMethod}.{action.execAction}: {type(doc)}")
-                    filename = f"{action.execMethod}_{action.execAction}_{datetime.now(UTC).strftime('%Y%m%d_%H%M%S')}"
-                    mimeType = 'application/octet-stream'
-                    
-                    # Try to detect MIME type for unknown document types
-                    mimeType = self._detectMimeTypeFromContent(doc, filename)
-                    
-                    processed_documents.append({
-                        'filename': filename,
-                        'fileSize': 0,
-                        'mimeType': mimeType,
-                        'content': str(doc),
-                        'document': doc
-                    })
-            
-            # Create ActionResult with processed data
-            return ActionResult(
-                success=result.success,
-                data={
-                    "result": result.data.get("result", ""),
-                    "documents": processed_documents,
-                    "actionId": action.id,
-                    "actionMethod": action.execMethod,
-                    "actionName": action.execAction,
-                    "resultLabel": result_label
-                },
-                metadata={
-                    "actionId": action.id,
-                    "actionMethod": action.execMethod,
-                    "actionName": action.execAction,
-                    "resultLabel": result_label
-                },
-                validation=[],
-                error=result.error or ""
-            )
-            
-        except Exception as e:
-            logger.error(f"Error executing single action: {str(e)}")
-            action.setError(str(e))
-            return ActionResult(
-                success=False,
-                data={
-                    "actionId": action.id,
-                    "actionMethod": action.execMethod,
-                    "actionName": action.execAction,
-                    "documents": []
-                },
-                metadata={
-                    "actionId": action.id,
-                    "actionMethod": action.execMethod,
-                    "actionName": action.execAction
-                },
-                validation=[],
-                error=str(e)
-            )
-    
-    async def _createActionMessage(self, action: TaskAction, result: Any, workflow: ChatWorkflow, result_label: str = None) -> None:
-        """Create and store a message for the action result in the workflow with enhanced document processing"""
-        try:
-            # Get result data
-            result_data = result.data if hasattr(result, 'data') else {}
-            documents_data = result_data.get("documents", [])
-            if result_label is None:
-                result_label = action.execResultLabel
-            
-            # Create message data
-            message_data = {
-                "workflowId": workflow.id,
-                "role": "assistant",
-                "message": f"Executed action {action.execMethod}.{action.execAction}",
-                "status": "step",
-                "sequenceNr": len(workflow.messages) + 1,
-                "publishedAt": datetime.now(UTC).isoformat(),
-                "actionId": action.id,
-                "actionMethod": action.execMethod,
-                "actionName": action.execAction,
-                "documentsLabel": result_label,  # Use intent label from action definition
-                "documents": []
-            }
-            
-            # Process documents if any
-            if documents_data:
-                processed_documents = []
-                for doc_data in documents_data:
-                    try:
-                        # Handle different document data formats
-                        if isinstance(doc_data, dict):
-                            # Enhanced document processing for dictionary format
-                            document_name = doc_data.get("documentName", doc_data.get("filename", f"{action.execMethod}_{action.execAction}_{datetime.now(UTC).strftime('%Y%m%d_%H%M%S')}"))
-                            document_data = doc_data.get("documentData", {})
-                            file_size = doc_data.get("fileSize", 0)
-                            mime_type = doc_data.get("mimeType", "application/octet-stream")
-                        elif hasattr(doc_data, 'filename'):
-                            # Document object format
-                            document_name = doc_data.filename
-                            document_data = getattr(doc_data, 'content', {})
-                            file_size = getattr(doc_data, 'fileSize', 0)
-                            mime_type = getattr(doc_data, 'mimeType', "application/octet-stream")
-                        else:
-                            # Fallback for unknown formats
-                            document_name = f"{action.execMethod}_{action.execAction}_{datetime.now(UTC).strftime('%Y%m%d_%H%M%S')}"
-                            document_data = doc_data
-                            file_size = len(str(doc_data))
-                            mime_type = "application/octet-stream"
-                        
-                        # Enhanced MIME type detection using service center
-                        if mime_type == "application/octet-stream":
-                            mime_type = self._detectMimeTypeFromContent(document_data, document_name)
-                        
-                        # Convert document data to string content
-                        content = self._convertDocumentDataToString(document_data, self._getFileExtension(document_name))
-                        
-                        # Validate content before creating file
-                        minimal_content_patterns = ['{}', '[]', 'null', '""', "''"]
-                        if not content or content.strip() == "" or content.strip() in minimal_content_patterns:
-                            logger.warning(f"Empty or minimal content for document {document_name}, skipping")
-                            continue
-                        
-                        # Create file in database
-                        file_id = self.service.createFile(
-                            fileName=document_name,
-                            mimeType=mime_type,
-                            content=content,
-                            base64encoded=False
-                        )
-                        
-                        if not file_id:
-                            logger.error(f"Failed to create file for document {document_name}")
-                            continue
-                        
-                        # Create ChatDocument object
-                        document = self.service.createDocument(
-                            fileName=document_name,
-                            mimeType=mime_type,
-                            content=content,
-                            base64encoded=False
-                        )
-                        
-                        if document:
-                            processed_documents.append(document)
-                            logger.info(f"Created document: {document_name} with file ID: {file_id} and MIME type: {mime_type}")
-                        else:
-                            logger.error(f"Failed to create ChatDocument object for {document_name}")
-                        
-                    except Exception as e:
-                        logger.error(f"Error processing document {doc_data.get('documentName', 'unknown')}: {str(e)}")
-                        continue
-                
-                # Update message with processed documents
-                message_data["documents"] = processed_documents
-            
-            # Create message using interface
-            message = self.chatInterface.createWorkflowMessage(message_data)
-            if message:
-                workflow.messages.append(message)
-                logger.info(f"Created action message for {action.execMethod}.{action.execAction} with {len(message_data.get('documents', []))} documents")
-                # ADDED LOGGING: Print workflow id, message count, and all message labels and document counts
-                logger.debug(f"WORKFLOW STATE after _createActionMessage: id={id(workflow)}, message_count={len(workflow.messages)}")
-                for idx, msg in enumerate(workflow.messages):
-                    label = getattr(msg, 'documentsLabel', None)
-                    docs = getattr(msg, 'documents', None)
-                    logger.debug(f"  Message {idx}: label='{label}', documents_count={len(docs) if docs else 0}")
-            else:
-                logger.error(f"Failed to create workflow message for action {action.execMethod}.{action.execAction}")
-                
-        except Exception as e:
-            logger.error(f"Error creating action message: {str(e)}")
-    
-    def _getFileExtension(self, filename: str) -> str:
-        """Extract file extension from filename"""
-        return self.service.getFileExtension(filename)
-    
-    def _getMimeType(self, extension: str) -> str:
-        """Get MIME type based on file extension"""
-        return self.service.getMimeTypeFromExtension(extension)
-    
-    def _detectMimeTypeFromContent(self, content: Any, filename: str) -> str:
-        """
-        Detect MIME type from content and filename using service center.
-        Only returns a detected MIME type if it's better than application/octet-stream.
-        
-        Args:
-            content: Content data (string, dict, or other)
-            filename: Name of the file
-            
-        Returns:
-            str: Detected MIME type or original if detection failed
-        """
-        try:
-            # Convert content to bytes for MIME type detection
-            if isinstance(content, str):
-                file_bytes = content.encode('utf-8')
-            elif isinstance(content, dict):
-                import json
-                file_bytes = json.dumps(content, ensure_ascii=False).encode('utf-8')
-            else:
-                file_bytes = str(content).encode('utf-8')
-            
-            # Use service center's MIME type detection
-            detected_mime_type = self.service.detectContentTypeFromData(file_bytes, filename)
-            if detected_mime_type != "application/octet-stream":
-                return detected_mime_type
-            return "application/octet-stream"
-        except Exception as e:
-            logger.warning(f"Error in MIME type detection for {filename}: {str(e)}")
-            return 'application/octet-stream'
-    
-    def _detectMimeTypeFromDocument(self, document: Any, filename: str) -> str:
-        """
-        Detect MIME type from document object using service center.
-        Only returns a detected MIME type if it's better than application/octet-stream.
-        
-        Args:
-            document: Document object with content attribute
-            filename: Name of the file
-            
-        Returns:
-            str: Detected MIME type or original if detection failed
-        """
-        try:
-            # Get document content as bytes for MIME type detection
-            content = getattr(document, 'content', '')
-            if isinstance(content, str):
-                file_bytes = content.encode('utf-8')
-            else:
-                file_bytes = str(content).encode('utf-8')
-            
-            # Use service center's MIME type detection
-            detected_mime_type = self.service.detectContentTypeFromData(file_bytes, filename)
-            if detected_mime_type != "application/octet-stream":
-                return detected_mime_type
-            return "application/octet-stream"
-        except Exception as e:
-            logger.warning(f"Error in MIME type detection for document {filename}: {str(e)}")
-            return 'application/octet-stream'
-    
-    def _convertDocumentDataToString(self, document_data: Dict[str, Any], file_extension: str) -> str:
-        """Convert document data to string content based on file type with enhanced processing"""
-        try:
-            # Handle None or empty data
-            if document_data is None:
-                return ""
-            
-            # Handle string data directly
-            if isinstance(document_data, str):
-                return document_data
-            
-            # Handle dictionary data
-            if isinstance(document_data, dict):
-                # For JSON files, return formatted JSON
-                if file_extension == 'json':
-                    return json.dumps(document_data, indent=2, ensure_ascii=False)
-                
-                # For text files, try to extract text content
-                elif file_extension in ['txt', 'md', 'html', 'css', 'js', 'py']:
-                    # Look for common text content fields
-                    text_fields = ['content', 'text', 'data', 'result', 'summary', 'extracted_content', 'table_data']
-                    for field in text_fields:
-                        if field in document_data:
-                            content = document_data[field]
-                            if isinstance(content, str):
-                                return content
-                            elif isinstance(content, (dict, list)):
-                                return json.dumps(content, indent=2, ensure_ascii=False)
-                    
-                    # If no text field found, convert entire dict to JSON
-                    return json.dumps(document_data, indent=2, ensure_ascii=False)
-                
-                # For CSV files, try to extract table data
-                elif file_extension == 'csv':
-                    # Look for CSV-specific fields first, then general content fields
-                    csv_fields = ['table_data', 'csv_data', 'rows', 'data', 'content', 'text']
-                    for field in csv_fields:
-                        if field in document_data:
-                            content = document_data[field]
-                            if isinstance(content, str):
-                                return content
-                            elif isinstance(content, list):
-                                # Convert list of rows to CSV format
-                                if content and isinstance(content[0], (list, dict)):
-                                    import csv
-                                    import io
-                                    output = io.StringIO()
-                                    if isinstance(content[0], dict):
-                                        # List of dictionaries
-                                        if content:
-                                            fieldnames = content[0].keys()
-                                            writer = csv.DictWriter(output, fieldnames=fieldnames)
-                                            writer.writeheader()
-                                            writer.writerows(content)
-                                    else:
-                                        # List of lists
-                                        writer = csv.writer(output)
-                                        writer.writerows(content)
-                                    return output.getvalue()
-                    
-                    # Fallback to JSON if no CSV data found
-                    return json.dumps(document_data, indent=2, ensure_ascii=False)
-                
-                # For other file types, convert to JSON
-                else:
-                    return json.dumps(document_data, indent=2, ensure_ascii=False)
-            
-            # Handle list data
-            elif isinstance(document_data, list):
-                if file_extension == 'csv':
-                    # Convert list to CSV format
-                    import csv
-                    import io
-                    output = io.StringIO()
-                    if document_data and isinstance(document_data[0], dict):
-                        # List of dictionaries
-                        fieldnames = document_data[0].keys()
-                        writer = csv.DictWriter(output, fieldnames=fieldnames)
-                        writer.writeheader()
-                        writer.writerows(document_data)
-                    else:
-                        # List of lists
-                        writer = csv.writer(output)
-                        writer.writerows(document_data)
-                    return output.getvalue()
-                else:
-                    return json.dumps(document_data, indent=2, ensure_ascii=False)
-            
-            # Handle other data types
-            else:
-                return str(document_data)
-                
-        except Exception as e:
-            logger.error(f"Error converting document data to string: {str(e)}")
-            return str(document_data)
-    
-    async def _performTaskReview(self, review_context: ReviewContext) -> ReviewResult:
-        """Perform AI-based task review with enhanced retry logic"""
-        try:
-            # Prepare prompt for result review
-            prompt = self.createResultReviewPrompt(review_context)
-            
-            # Call AI with circuit breaker
-            response = await self._callAIWithCircuitBreaker(prompt, "result_review")
-            
-            # Parse review result
-            review_dict = self._parseReviewResponse(response)
-            
-            # Add default values for missing fields
-            review_dict.setdefault('status', 'unknown')
-            review_dict.setdefault('reason', 'No reason provided')
-            review_dict.setdefault('quality_score', 5)
-            
-            # Enhanced retry logic based on result quality
-            if review_dict.get('status') == 'retry':
-                # Analyze the specific issues for better retry guidance
-                action_results = review_context.action_results or []
-                if action_results:
-                    # Check for common issues that warrant retry
-                    # Only consider empty results a problem if there are no documents produced
-                    has_empty_results = any(
-                        not result.data.get('result', '').strip() and 
-                        not result.data.get('documents') and 
-                        not result.data.get('documents')
-                        for result in action_results 
-                        if result.success
-                    )
-                    
-                    has_incomplete_metadata = any(
-                        any(doc.get('filename') == 'unknown' for doc in result.data.get('documents', []) or [])
-                        for result in action_results
-                        if result.success
-                    )
-                    
-                    if has_empty_results:
-                        review_dict['improvements'] = (review_dict.get('improvements', '') + 
-                                               " Ensure the document extraction returns actual content, not empty results. " +
-                                               "Check if the AI prompt is specific enough to extract meaningful data.")
-                    
-                    if has_incomplete_metadata:
-                        review_dict['improvements'] = (review_dict.get('improvements', '') + 
-                                               " Ensure proper document metadata is extracted including filename, size, and mime type. " +
-                                               "The document processing should provide complete file information.")
-                    
-                    # If we have specific issues, adjust quality score
-                    if has_empty_results or has_incomplete_metadata:
-                        review_dict['quality_score'] = max(1, review_dict.get('quality_score', 5) - 2)
-            
-            # Create ReviewResult model
-            return ReviewResult(
-                status=review_dict.get('status', 'unknown'),
-                reason=review_dict.get('reason', 'No reason provided'),
-                improvements=review_dict.get('improvements', []),
-                quality_score=review_dict.get('quality_score', 5),
-                missing_outputs=review_dict.get('missing_outputs', []),
-                met_criteria=review_dict.get('met_criteria', []),
-                unmet_criteria=review_dict.get('unmet_criteria', []),
-                confidence=review_dict.get('confidence', 0.5)
-            )
-            
-        except Exception as e:
-            logger.error(f"Error performing task review: {str(e)}")
-            return ReviewResult(
-                status='success',  # Default to success to avoid blocking workflow
-                reason=f'Review failed: {str(e)}',
-                quality_score=5,
-                confidence=0.5
-            )
-    
-    def _getPreviousResultsFromActions(self, task_actions: List[TaskAction]) -> List[str]:
-        """Get list of previous results from completed actions and workflow messages"""
-        results = []
-        
-        # Get results from action objects
-        for action in task_actions:
-            if action.execResultLabel and action.isSuccessful():
-                results.append(action.execResultLabel)
-        
-        # Get results from workflow messages (for actions that have been executed)
-        if hasattr(self, 'workflow') and self.workflow and self.workflow.messages:
-            for message in self.workflow.messages:
-                if (message.role == 'assistant' and 
-                    message.status == 'step' and 
-                    message.documentsLabel and 
-                    message.documentsLabel not in results):
-                    results.append(message.documentsLabel)
-        
-        return results
-    
-    def _calculateTaskQualityMetrics(self, task_step: TaskStep, action_results: List[ActionExecutionResult]) -> Dict[str, Any]:
-        """Calculate quality metrics for task step results"""
-        try:
-            quality_score = 0
-            confidence = 0
-            
-            # Count successful actions
-            successful_actions = sum(1 for result in action_results if result.success)
-            total_actions = len(action_results)
-            
-            if total_actions > 0:
-                success_rate = successful_actions / total_actions
-                quality_score = int(success_rate * 10)  # Scale to 0-10
-                confidence = min(success_rate, 1.0)
-            
-            return {
-                'score': quality_score,
-                'confidence': confidence,
-                'successful_actions': successful_actions,
-                'total_actions': total_actions
-            }
-            
-        except Exception as e:
-            logger.error(f"Error calculating task quality metrics: {str(e)}")
-            return {'score': 0, 'confidence': 0, 'successful_actions': 0, 'total_actions': 0}
-    
-    # ===== BASIC HELPER METHODS =====
-    
-    def _getAvailableDocuments(self, workflow: ChatWorkflow) -> List[str]:
-        """Get list of available documents in the workflow"""
-        documents = []
-        for message in workflow.messages:
-            for doc in message.documents:
-                documents.append(doc.filename)
-        return documents
-
-    def _getPreviousResults(self, task: TaskItem) -> List[str]:
-        """Get list of previous results from completed actions"""
-        results = []
-        for action in task.actionList:
-            if action.execResultLabel:
-                results.append(action.execResultLabel)
-        return results
-
-    def _parseTaskPlanResponse(self, response: str) -> Dict[str, Any]:
-        """Parse AI response into task plan structure"""
-        try:
-            # Extract JSON from response
-            json_start = response.find('{')
-            json_end = response.rfind('}') + 1
-            if json_start == -1 or json_end == 0:
-                raise ValueError("No JSON found in response")
-            
-            json_str = response[json_start:json_end]
-            task_plan = json.loads(json_str)
-            
-            # Validate structure
-            if 'tasks' not in task_plan:
-                raise ValueError("Task plan missing 'tasks' field")
-            
-            return task_plan
-            
-        except Exception as e:
-            logger.error(f"Error parsing task plan response: {str(e)}")
-            return {'tasks': []}
-
-    def _parseActionResponse(self, response: str) -> List[Dict[str, Any]]:
-        """Parse AI response into action list"""
-        try:
-            # Extract JSON from response
-            json_start = response.find('{')
-            json_end = response.rfind('}') + 1
-            if json_start == -1 or json_end == 0:
-                raise ValueError("No JSON found in response")
-            
-            json_str = response[json_start:json_end]
-            action_data = json.loads(json_str)
-            
-            # Validate structure
-            if 'actions' not in action_data:
-                raise ValueError("Action response missing 'actions' field")
-            
-            return action_data['actions']
-            
-        except Exception as e:
-            logger.error(f"Error parsing action response: {str(e)}")
-            return []
-
-    def _parseReviewResponse(self, response: str) -> Dict[str, Any]:
-        """Parse AI response into review result"""
-        try:
-            # Extract JSON from response
-            json_start = response.find('{')
-            json_end = response.rfind('}') + 1
-            if json_start == -1 or json_end == 0:
-                raise ValueError("No JSON found in response")
-            
-            json_str = response[json_start:json_end]
-            review = json.loads(json_str)
-            
-            # Validate structure
-            if 'status' not in review:
-                raise ValueError("Review response missing 'status' field")
-            
-            return review
-            
-        except Exception as e:
-            logger.error(f"Error parsing review response: {str(e)}")
-            return {'status': 'failed', 'reason': f'Parse error: {str(e)}'}
-
-    async def _callAdvancedAI(self, prompt: str, context: str) -> str:
-        """Call advanced AI service with prompt (primary method)"""
-        try:
-            # Use the advanced AI call mechanism through service
-            if hasattr(self, 'service') and self.service:
-                # Try advanced AI call first
-                if hasattr(self.service, 'callAiTextAdvanced'):
-                    response = await self.service.callAiTextAdvanced(prompt)
-                    logger.debug(f"Advanced AI call successful for {context}")
-                    return response
-                else:
-                    raise Exception("Service does not have callAiTextAdvanced method")
-            else:
-                raise Exception("No service available for AI calls")
-                
-        except Exception as e:
-            error_message = str(e)
-            logger.warning(f"Advanced AI call failed for {context}: {error_message}")
-            raise Exception(f"Advanced AI failed: {error_message}")
-
-    async def _callStandardAI(self, prompt: str, context: str) -> str:
-        """Call standard AI service with prompt (fallback method)"""
-        try:
-            # Use the standard AI call mechanism through service
-            if hasattr(self, 'service') and self.service:
-                # Try standard AI call as fallback
-                if hasattr(self.service, 'callAiTextBasic'):
-                    response = await self.service.callAiTextBasic(prompt)
-                    logger.debug(f"Standard AI call successful for {context}")
-                    return response
-                else:
-                    raise Exception("Service does not have callAiTextBasic method")
-            else:
-                raise Exception("No service available for AI calls")
-                
-        except Exception as e:
-            error_message = str(e)
-            logger.error(f"Standard AI call failed for {context}: {error_message}")
-            
-            # Provide more specific error messages based on the error type
-            if "overloaded" in error_message.lower() or "529" in error_message:
-                detailed_error = "AI service is currently overloaded. Please try again in a few minutes."
-            elif "rate limit" in error_message.lower() or "429" in error_message:
-                detailed_error = "Rate limit exceeded. Please wait before making another request."
-            elif "api key" in error_message.lower() or "401" in error_message:
-                detailed_error = "Invalid API key. Please check your AI service configuration."
-            elif "timeout" in error_message.lower():
-                detailed_error = "AI service request timed out. Please try again."
-            else:
-                detailed_error = f"AI service error: {error_message}"
-            
-            raise Exception(detailed_error)
-
-    async def _callAI(self, prompt: str, context: str) -> str:
-        """Call AI service with prompt (legacy method - now uses the circuit breaker)"""
-        return await self._callAIWithCircuitBreaker(prompt, context) 
-
-    # ===== WORKFLOW FEEDBACK GENERATION =====
-    
-    async def generateWorkflowFeedback(self, workflow: ChatWorkflow) -> str:
-        """Generate feedback message for workflow completion"""
-        try:
-            # Count messages by role
-            user_messages = [msg for msg in workflow.messages if msg.role == 'user']
-            assistant_messages = [msg for msg in workflow.messages if msg.role == 'assistant']
-            
-            # Generate summary feedback
-            feedback = f"Workflow completed.\n\n"
-            feedback += f"Processed {len(user_messages)} user inputs and generated {len(assistant_messages)} responses.\n"
-            
-            # Add final status
-            if workflow.status == "completed":
-                feedback += "All tasks completed successfully."
-            elif workflow.status == "partial":
-                feedback += "Some tasks completed with partial success."
-            else:
-                feedback += f"Workflow status: {workflow.status}"
-            
-            return feedback
-            
-        except Exception as e:
-            logger.error(f"Error generating workflow feedback: {str(e)}")
-            return "Workflow processing completed."
-
-    # ===== UNIFIED WORKFLOW EXECUTION =====
-    
-    async def executeUnifiedWorkflow(self, userInput: UserInputRequest, workflow: ChatWorkflow) -> WorkflowResult:
-        """Execute a unified workflow with state management and action-level validation"""
-        try:
-            logger.info(f"Starting unified workflow execution for workflow {workflow.id}")
-            start_time = time.time()
-            
-            # Initialize chat manager with workflow
-            await self.initialize(workflow)
-            
-            # Process file IDs if provided
-            documents = []
-            if hasattr(userInput, 'listFileId') and userInput.listFileId:
-                documents = await self.processFileIds(userInput.listFileId)
-                logger.info(f"Processed {len(documents)} documents")
-            
-            # Calculate and update user input stats
-            user_input_size = self.service.calculateUserInputSize(userInput.prompt)
-            self.service.updateWorkflowStats(eventLabel="userinput", bytesReceived=user_input_size)
-            
-            # Phase 1: High-Level Task Planning
-            logger.info("--- PHASE 1: HIGH-LEVEL TASK PLANNING ---")
-            task_plan = await self.planHighLevelTasks(userInput.prompt, workflow)
-            
-            # Update stats for task planning
-            task_plan_size = self.service.calculateObjectSize(task_plan)
-            self.service.updateWorkflowStats(eventLabel="taskplan", bytesSent=task_plan_size)
-            
-            # Create user-friendly task plan log
-            tasks_count = len(task_plan.tasks)
-            task_descriptions = "\n".join([f"- {task.description}" for task in task_plan.tasks])
-            self.chatInterface.createWorkflowLog({
-                "workflowId": workflow.id,
-                "message": f"Planning completed: {tasks_count} tasks identified\n{task_descriptions}",
-                "type": "info",
-                "status": "running",
-                "progress": 15,
-                "agentName": "System"
-            })
-            
-            # Log task plan details (without document content)
-            task_plan_log = {
-                'overview': task_plan.overview,
-                'tasks_count': len(task_plan.tasks),
-                'tasks': []
-            }
-            for task in task_plan.tasks:
-                task_log = {
-                    'id': task.id,
-                    'description': task.description,
-                    'dependencies': task.dependencies or [],
-                    'expected_outputs': task.expected_outputs or [],
-                    'success_criteria': task.success_criteria or [],
-                    'required_documents_count': len(task.required_documents or []),
-                    'estimated_complexity': task.estimated_complexity or ''
-                }
-                task_plan_log['tasks'].append(task_log)
-            logger.debug(f"TASK PLAN CREATED: {json.dumps(task_plan_log, indent=2, ensure_ascii=False)}")
-            
-            # Execute each task step with state management
-            workflow_results = []
-            previous_results = []
-            
-            for i, task_step in enumerate(task_plan.tasks):
-                task_description = task_step.description
-                logger.info(f"=== PROCESSING TASK {i+1}/{len(task_plan.tasks)}: {task_description} ===")
-                
-                # Create user-friendly task start log with action details
-                progress = 20 + (i * 60 // len(task_plan.tasks))
-                
-                # Get actions for this task to show in the log
-                task_actions = await self.defineTaskActions(task_step, workflow, previous_results)
-                if not task_actions:
-                    self.chatInterface.createWorkflowLog({
-                        "workflowId": workflow.id,
-                        "message": f"❌ Task {i+1}/{len(task_plan.tasks)} failed: No actions could be generated for this task. Please check your input or available documents.",
-                        "type": "error",
-                        "status": "failed",
-                        "progress": 100,
-                        "agentName": "System"
-                    })
-                    return WorkflowResult(
-                        status='failed',
-                        error='No actions could be generated for task',
-                        phase='execution',
-                        completed_tasks=i,
-                        total_tasks=len(task_plan.tasks),
-                        execution_time=time.time() - start_time,
-                        final_results_count=0
-                    )
-                action_details = []
-                for j, action in enumerate(task_actions):
-                    action_details.append(f"  {j+1}. {action.execMethod}.{action.execAction}")
-                action_summary = "\n".join(action_details)
-                self.chatInterface.createWorkflowLog({
-                    "workflowId": workflow.id,
-                    "message": f"Executing task {i+1}/{len(task_plan.tasks)}: {task_description}\nActions to be executed:\n{action_summary}",
-                    "type": "info",
-                    "status": "running",
-                    "progress": progress,
-                    "agentName": "System"
-                })
-                
-                # Create context for task execution
-                task_context = TaskContext(
-                    task_step=task_step,
-                    workflow=workflow,
-                    workflow_id=workflow.id,
-                    available_documents=self._getAvailableDocuments(workflow),
-                    previous_results=previous_results
-                )
-                
-                # Execute task with state management
-                task_result = await self.executeTaskWithStateManagement(task_step, workflow, task_context)
-                
-                # Log task result
-                if task_result.success:
-                    self.chatInterface.createWorkflowLog({
-                        "workflowId": workflow.id,
-                        "message": f"🎯 Task {i+1} completed successfully",
-                        "type": "success",
-                        "status": "running",
-                        "progress": progress + 20
-                    })
-                    
-                    # Update previous results for next task
-                    # Note: TaskResult doesn't have successful_actions field, so we'll use a placeholder
-                    previous_results = [f"task_{i+1}_results"]
-                    
-                else:
-                    # Task failed - provide detailed feedback and stop workflow
-                    reason = task_result.error or 'Unknown error'
-                    
-                    self.chatInterface.createWorkflowLog({
-                        "workflowId": workflow.id,
-                        "message": f"❌ Task {i+1} failed: {reason}",
-                        "type": "error",
-                        "status": "failed",
-                        "progress": progress + 15
-                    })
-                    
-                    # Generate detailed failure feedback
-                    failure_feedback = self._generateTaskFailureFeedback(task_step, task_result, i+1, len(task_plan.tasks))
-                    
-                    # Stop workflow and return failure
-                    return WorkflowResult(
-                        status='failed',
-                        error=reason,
-                        phase='execution',
-                        completed_tasks=i,
-                        total_tasks=len(task_plan.tasks),
-                        execution_time=time.time() - start_time,
-                        final_results_count=0
-                    )
-                
-                # Add task result to workflow results
-                workflow_results.append(task_result)
-            
-            # Calculate total processing time
-            total_processing_time = time.time() - start_time
-            
-            # Create final success log
-            self.chatInterface.createWorkflowLog({
-                "workflowId": workflow.id,
-                "message": f"🎉 Workflow completed ({len(workflow_results)}/{len(task_plan.tasks)} tasks)",
-                "type": "success",
-                "status": "completed",
-                "progress": 100
-            })
-            
-            # Create workflow summary
-            workflow_summary = WorkflowResult(
-                status='completed',
-                completed_tasks=len(workflow_results),
-                total_tasks=len(task_plan.tasks),
-                execution_time=total_processing_time,
-                final_results_count=len(previous_results)
-            )
-            
-            logger.info(f"=== UNIFIED WORKFLOW COMPLETED: {len(workflow_results)}/{len(task_plan.tasks)} tasks successful ===")
-            logger.debug(f"FINAL WORKFLOW SUMMARY: {json.dumps(workflow_summary.dict(), indent=2, ensure_ascii=False)}")
-            return workflow_summary
-            
-        except Exception as e:
-            logger.error(f"Error in unified workflow execution: {str(e)}")
-            # Create error log for user
-            self.chatInterface.createWorkflowLog({
-                "workflowId": workflow.id,
-                "message": f"Workflow execution failed: {str(e)}",
-                "type": "error",
-                "status": "failed",
-                "progress": 100,
-                "agentName": "System"
-            })
-            return WorkflowResult(
-                status='failed',
-                error=str(e),
-                phase='execution',
-                completed_tasks=0,
-                total_tasks=0,
-                execution_time=0,
-                final_results_count=0
-            )
-
-    def _generateTaskFailureFeedback(self, task_step: TaskStep, task_result: TaskResult, task_number: int, total_tasks: int) -> str:
-        """Generate detailed feedback for task failure"""
-        
-        feedback = f"""
-Workflow execution stopped due to task failure.
-
-PROGRESS: {task_number}/{total_tasks} tasks completed successfully
-FAILED TASK: {task_step.description}
-
-FAILURE DETAILS:
-- Task ID: {task_result.taskId}
-- Status: {task_result.status}
-- Success: {task_result.success}
-- Error: {task_result.error or 'Unknown error'}
-
-The workflow cannot continue because this task is essential for subsequent steps.
-Please review the task requirements and try again with different input or approach.
-"""
-        
-        return feedback
-
-    # ===== NEW STATE MANAGEMENT AND VALIDATION CLASSES =====
-
-    async def executeTaskWithStateManagement(self, task_step: TaskStep, workflow: ChatWorkflow, context: TaskContext) -> TaskResult:
-        try:
-            logger.info(f"Executing task with state management: {task_step.description}")
-            state = TaskExecutionState(task_step)
-            while state.canRetry():
-                logger.info(f"Task execution attempt {state.retry_count + 1}/{state.max_retries + 1}")
-                if state.retry_count == 0:
-                    actions = await self.defineTaskActions(task_step, workflow, context.previous_results)
-                else:
-                    actions = await self._regenerateTaskActionsWithFailureContext(task_step, state, context)
-                if not actions:
-                    logger.warning(f"No actions defined for task, marking as failed")
-                    return TaskResult(
-                        taskId=task_step.id,
-                        status=TaskStatus.FAILED,
-                        success=False,
-                        error='No actions could be generated for task'
-                    )
-                # --- BEGIN TWO-PASS LOGIC ---
-                available_labels = set(self._getAvailableDocuments(workflow))
-                for i, action in enumerate(actions):
-                    # Log parameters before documentList resolution
-                    logger.info(f"[Two-pass] Action {i+1}/{len(actions)} BEFORE resolution: execMethod={action.execMethod}, execAction={action.execAction}, parameters={json.dumps(action.execParameters, default=str, ensure_ascii=False)}")
-                    # Add outputs from already executed actions in this step
-                    available_labels.update([r.data['resultLabel'] for r in state.successful_actions if 'resultLabel' in r.data])
-                    # Resolve documentList for this action
-                    params = action.execParameters
-                    if 'documentList' in params and isinstance(params['documentList'], list):
-                        original_refs = params['documentList']
-                        resolved_refs = [ref for ref in original_refs if ref in available_labels]
-                        if len(resolved_refs) < len(original_refs):
-                            logger.warning(f"Action {action.execMethod}.{action.execAction} has unresolved document references: {set(original_refs) - set(resolved_refs)}. Only using resolved: {resolved_refs}")
-                        params['documentList'] = resolved_refs
-                        action.execParameters = params
-                        # Log document info for each resolved documentList reference
-                        doc_info_list = []
-                        for ref in resolved_refs:
-                            # Try to get document metadata from workflow messages
-                            doc_size = None
-                            doc_type = None
-                            for msg in workflow.messages:
-                                if hasattr(msg, 'documentsLabel') and msg.documentsLabel == ref and hasattr(msg, 'documents'):
-                                    for doc in msg.documents:
-                                        size = getattr(doc, 'fileSize', None) or doc.get('fileSize', None) if isinstance(doc, dict) else None
-                                        mime = getattr(doc, 'mimeType', None) or doc.get('mimeType', None) if isinstance(doc, dict) else None
-                                        doc_info_list.append({
-                                            'ref': ref,
-                                            'filename': getattr(doc, 'filename', None) or doc.get('filename', None) if isinstance(doc, dict) else None,
-                                            'size': size,
-                                            'type': mime
-                                        })
-                        logger.info(f"[Two-pass] Action {i+1}/{len(actions)} resolved documentList: {json.dumps(doc_info_list, ensure_ascii=False)}")
-                    logger.info(f"[Two-pass] Action {i+1}/{len(actions)} AFTER resolution: execMethod={action.execMethod}, execAction={action.execAction}, parameters={json.dumps(action.execParameters, default=str, ensure_ascii=False)}")
-                    logger.info(f"[Two-pass] Before executing action {i+1}/{len(actions)}: available_labels={sorted(available_labels)}")
-                    result = await self.executeActionWithValidation(action, workflow, context)
-                    if result.success:
-                        state.addSuccessfulAction(result)
-                    else:
-                        state.addFailedAction(result)
-                        logger.error(f"Action {i+1} failed validation - stopping task execution")
-                        self.chatInterface.createWorkflowLog({
-                            "workflowId": workflow.id,
-                            "message": f"❌ Action {i+1}/{len(actions)} failed: {action.execMethod}.{action.execAction}",
-                            "type": "error",
-                            "status": "running",
-                            "progress": 0,
-                            "agentName": "System"
-                        })
-                        break
-                # Validate task completion
-                task_validation = await self._validateTaskCompletion(state.successful_actions, task_step, workflow)
-                if task_validation.status == 'success':
-                    logger.info(f"Task completed successfully with {len(state.successful_actions)} successful actions")
-                    return TaskResult(
-                        taskId=task_step.id,
-                        status=TaskStatus.COMPLETED,
-                        success=True,
-                        feedback=f"Task completed successfully with {len(state.successful_actions)} successful actions"
-                    )
-                elif task_validation.status == 'retry':
-                    state.improvements = task_validation.improvements or []
-                    state.incrementRetryCount()
-                    logger.info(f"Task needs retry. Improvements: {state.improvements}")
-                    continue
-                else:
-                    logger.error(f"Task failed permanently")
-                    return TaskResult(
-                        taskId=task_step.id,
-                        status=TaskStatus.FAILED,
-                        success=False,
-                        error=task_validation.reason or 'Task validation failed'
-                    )
-            logger.error(f"Task failed after {state.max_retries} retries")
-            return TaskResult(
-                taskId=task_step.id,
-                status=TaskStatus.FAILED,
-                success=False,
-                error=f'Task failed after {state.max_retries} retries'
-            )
-        except Exception as e:
-            logger.error(f"Error in task execution with state management: {str(e)}")
-            return TaskResult(
-                taskId=task_step.id,
-                status=TaskStatus.FAILED,
-                success=False,
-                error=f'Task execution error: {str(e)}'
-            )
-
-    async def _regenerateTaskActionsWithFailureContext(self, task_step: TaskStep, state: TaskExecutionState, context: TaskContext) -> List[TaskAction]:
-        """Regenerate task actions with failure context and improvements"""
-        try:
-            logger.info(f"Regenerating actions for task with failure context")
-            
-            # Analyze failure patterns
-            failure_patterns = state.getFailurePatterns()
-            
-            # Create enhanced context with failure information
-            enhanced_context = TaskContext(
-                task_step=task_step,
-                workflow=context.workflow,
-                workflow_id=context.workflow_id,
-                available_documents=context.available_documents,
-                previous_results=state.getAvailableResults(),
-                improvements=state.improvements,
-                retry_count=state.retry_count,
-                failure_patterns=failure_patterns,
-                failed_actions=state.failed_actions,
-                successful_actions=state.successful_actions,
-                is_regeneration=True
-            )
-            
-            # Generate new actions with failure avoidance
-            logger.info(f"Regenerating actions for task '{task_step.description}' with failure context (retry {state.retry_count})")
-            actions = await self.defineTaskActions(task_step, context.workflow, state.getAvailableResults(), enhanced_context)
-            
-            logger.info(f"Regenerated {len(actions)} actions with failure context")
-            return actions
-            
-        except Exception as e:
-            logger.error(f"Error regenerating task actions: {str(e)}")
-            return []
-
-    async def _validateTaskCompletion(self, successful_actions: List[ActionExecutionResult], task_step: TaskStep, workflow: ChatWorkflow) -> ReviewResult:
-        """Validate if task is completed successfully"""
-        try:
-            logger.info(f"Validating task completion: {task_step.description}")
-            
-            # Create task result summary
-            task_result = {
-                'task_step': task_step,
-                'successful_actions': successful_actions,
-                'successful_count': len(successful_actions),
-                'expected_outputs': task_step.expected_outputs or [],
-                'success_criteria': task_step.success_criteria or []
-            }
-            
-            # Use AI to validate task completion
-            prompt = self._createTaskCompletionValidationPrompt(task_result, task_step)
-            response = await self._callAIWithCircuitBreaker(prompt, "task_completion_validation")
-            
-            # Log the validation response for debugging
-            logger.debug(f"Task validation AI response: {response}")
-            
-            # Parse validation result
-            validation = self._parseTaskValidationResponse(response)
-            
-            # Add quality metrics
-            validation['quality_metrics'] = self._calculateTaskQualityMetrics(task_step, successful_actions)
-            
-            logger.info(f"Task completion validation: {validation.get('status', 'unknown')} - Reason: {validation.get('reason', 'No reason')}")
-            logger.debug(f"Parsed validation result: {json.dumps(validation, indent=2)}")
-            return ReviewResult(
-                status=validation.get('status', 'unknown'),
-                reason=validation.get('reason', 'No reason provided'),
-                improvements=validation.get('improvements', []),
-                quality_score=validation.get('quality_score', 5),
-                missing_outputs=validation.get('missing_outputs', []),
-                met_criteria=validation.get('met_criteria', []),
-                unmet_criteria=validation.get('unmet_criteria', []),
-                confidence=validation.get('confidence', 0.5)
-            )
-            
-        except Exception as e:
-            logger.error(f"Error validating task completion: {str(e)}")
-            return ReviewResult(
-                status='success',  # Default to success to avoid blocking
-                reason=f'Validation failed: {str(e)}',
-                quality_score=5,
-                confidence=0.5
-            )
-
-    def _createTaskCompletionValidationPrompt(self, task_result: Dict[str, Any], task_step: TaskStep) -> str:
-        """Create prompt for task completion validation"""
-        
-        successful_actions = task_result['successful_actions']
-        expected_outputs = task_result['expected_outputs']
-        success_criteria = task_result['success_criteria']
-        
-        # Summarize successful actions
-        action_summary = []
-        document_delivery_summary = []
-        for action in successful_actions:
-            doc_names = []
-            for doc in (action.documents or []):
-                if hasattr(doc, 'filename'):
-                    doc_names.append(doc.filename)
-                elif isinstance(doc, dict):
-                    doc_names.append(doc.get('filename', doc.get('documentName', 'unknown')))
-                else:
-                    doc_names.append(str(doc))
-            document_delivery_summary.append(f"- {action.actionMethod}.{action.actionName} (label: {action.data.get('resultLabel', '')}): {len(doc_names)} document(s): {', '.join(doc_names) if doc_names else 'None'}")
-            action_summary.append({
-                'method': action.actionMethod or '',
-                'action': action.actionName or '',
-                'result_label': action.data.get('resultLabel', ''),
-                'documents_count': len(action.documents or []),
-                'has_text_result': bool(action.data.get('result', '').strip())
-            })
-        delivery_summary_str = '\n'.join(document_delivery_summary) if document_delivery_summary else 'No documents delivered by any action.'
-        return f"""You are an action completion validator that evaluates if individual actions were successfully completed.
-
-DOCUMENT DELIVERY SUMMARY:
-{delivery_summary_str}
-
-ACTION DETAILS:
-{json.dumps(action_summary, indent=2)}
-
-VALIDATION CRITERIA:
-1. Check if the action's result_label matches what was delivered
-2. If documents were delivered and result_label is present → SUCCESS
-3. If no documents but text result with matching result_label or different result_label → RETRY
-4. If no result_label and no delivery → FAIL
-
-VALIDATION RULES:
-- Focus on result_label matching
-- Check if the action delivered the expected result type
-- Document delivery with correct result_label = SUCCESS
-- Text result with correct result_label = SUCCESS
-
-VALIDATION QUESTIONS:
-1. Does the result_label match what the action was supposed to deliver?
-2. Were documents or text results delivered with the correct label?
-3. Does the delivery match the action's objective?
-
-REQUIRED JSON RESPONSE:
-{{
-    "status": "success|retry|fail",
-    "reason": "Detailed explanation of the validation decision",
-    "improvements": ["specific improvement 1", "specific improvement 2"],
-    "missing_outputs": ["output1", "output2"],
-    "met_criteria": ["criteria1", "criteria2"],
-    "unmet_criteria": ["criteria3", "criteria4"],
-    "quality_score": 1-10,
-    "confidence": 0.0-1.0
-}}
-
-NOTE: Respond with ONLY the JSON object. Do not include any explanatory text."""
-
-    def _parseTaskValidationResponse(self, response: str) -> Dict[str, Any]:
-        """Parse task validation response"""
-        try:
-            # Extract JSON from response
-            json_start = response.find('{')
-            json_end = response.rfind('}') + 1
-            if json_start == -1 or json_end == 0:
-                raise ValueError("No JSON found in task validation response")
-            
-            json_str = response[json_start:json_end]
-            validation = json.loads(json_str)
-            
-            # Validate structure
-            if 'status' not in validation:
-                raise ValueError("Task validation response missing 'status' field")
-            
-            # Set default values
-            validation.setdefault('reason', 'No reason provided')
-            validation.setdefault('improvements', [])
-            validation.setdefault('missing_outputs', [])
-            validation.setdefault('met_criteria', [])
-            validation.setdefault('unmet_criteria', [])
-            validation.setdefault('quality_score', 5)
-            validation.setdefault('confidence', 0.5)
-            
-            return validation
-            
-        except Exception as e:
-            logger.error(f"Error parsing task validation response: {str(e)}")
-            return {
-                'status': 'success',
-                'reason': f'Parse error: {str(e)}',
-                'improvements': [],
-                'missing_outputs': [],
-                'met_criteria': [],
-                'unmet_criteria': [],
-                'quality_score': 5,
-                'confidence': 0.5
-            }
-
-    # ===== FIX MISSING METHOD CALL =====
-
-    async def _executeSingleActionWithRetry(self, action: TaskAction, workflow: ChatWorkflow) -> ActionExecutionResult:
-        """Execute single action with retry mechanism - FIXED"""
-        try:
-            logger.info(f"Executing action with retry: {action.execMethod}.{action.execAction}")
-            
-            # Create context for validation
-            context = TaskContext(
-                task_step=TaskStep(id="action_retry", description="Action execution"),
-                workflow_id=workflow.id,
-                available_documents=[],
-                previous_results=[]
-            )
-            
-            # Execute action with validation
-            result = await self.executeActionWithValidation(action, workflow, context)
-            
-            # If validation indicates retry, attempt retry
-            if result.validation.get('status') == 'retry':
-                improvements = result.validation.get('improvements', [])
-                retry_result = await self.retryActionWithImprovements(action, result, improvements)
-                return retry_result
-            
-            return result
-            
-        except Exception as e:
-            logger.error(f"Error executing action with retry: {str(e)}")
-            action.setError(str(e))
-            return ActionExecutionResult(
-                success=False,
-                data={},
-                metadata={},
-                error=str(e),
-                actionId=action.id,
-                actionMethod=action.execMethod,
-                actionName=action.execAction,
-                documents=[],
-                validation={
-                    'status': 'fail',
-                    'reason': f'Execution error: {str(e)}',
-                    'confidence': 0.0,
-                    'improvements': [],
-                    'quality_score': 0,
-                    'missing_elements': [],
-                    'suggested_retry_approach': ''
-                }
-            )
-
-    # ===== REPLACE OLD executeTaskActions METHOD =====
-
-    async def executeTaskActions(self, task_actions: List[TaskAction], workflow: ChatWorkflow) -> List[ActionExecutionResult]:
-        """Execute task actions with individual validation and retry logic"""
-        try:
-            logger.info(f"Executing {len(task_actions)} task actions with validation")
-            
-            results = []
-            for i, action in enumerate(task_actions):
-                logger.info(f"Executing action {i+1}/{len(task_actions)}: {action.execMethod}.{action.execAction}")
-                
-                # Create context for validation
-                context = TaskContext(
-                    task_step=TaskStep(id=f"action_{i}", description="Action execution"),
-                    workflow_id=workflow.id,
-                    available_documents=[],
-                    previous_results=[r.data.get('resultLabel', '') for r in results if r.data.get('resultLabel')]
-                )
-                
-                # Execute action with validation
-                result = await self.executeActionWithValidation(action, workflow, context)
-                results.append(result)
-                
-                # If action failed after validation, continue with next action
-                if isinstance(result.validation, dict) and result.validation.get('status') == 'fail':
-                    logger.error(f"Action {i+1} failed validation, continuing with next action")
-                    continue
-            
-            logger.info(f"Task action execution completed: {len(results)} results")
-            return results
-            
-        except Exception as e:
-            logger.error(f"Error executing task actions: {str(e)}")
-            return []
-
-    # ===== RESTRUCTURED ACTION EXECUTION WITH VALIDATION =====
-
-    async def executeActionWithValidation(self, action: TaskAction, workflow: ChatWorkflow, context: TaskContext) -> ActionExecutionResult:
-        """Execute single action with immediate validation"""
-        try:
-            logger.info(f"Executing action: {action.execMethod}.{action.execAction}")
-            
-            # Execute the action
-            result = await self._executeSingleAction(action, workflow)
-            
-            # Validate the result immediately
-            validator = ActionValidator(self)
-            validation = await validator.validateActionResult(result, action, context)
-            
-            # Create ActionExecutionResult model
-            action_result = ActionExecutionResult(
-                success=result.success,
-                data=result.data,
-                metadata=result.metadata,
-                validation=validation,
-                error=result.error,
-                actionId=action.id,
-                actionMethod=action.execMethod,
-                actionName=action.execAction,
-                documents=result.data.get("documents", [])
-            )
-            
-            # Log the action execution result as JSON (without document content)
-            action_result_json = {
-                'success': action_result.success,
-                'actionId': action_result.actionId,
-                'actionMethod': action_result.actionMethod,
-                'actionName': action_result.actionName,
-                'validation': action_result.validation,
-                'error': action_result.error,
-                'documents_count': len(action_result.documents),
-                'document_names': [doc.filename if hasattr(doc, 'filename') else str(doc) for doc in action_result.documents],
-                'data_keys': list(action_result.data.keys()) if isinstance(action_result.data, dict) else [],
-                'metadata_keys': list(action_result.metadata.keys()) if isinstance(action_result.metadata, dict) else []
-            }
-            logger.info(f"Action execution result for {action.execMethod}.{action.execAction}: {json.dumps(action_result_json, indent=2, ensure_ascii=False)}")
-            
-            # Update action status based on validation
-            if validation['status'] == 'success':
-                action.setSuccess()
-                logger.info(f"Action {action.execMethod}.{action.execAction} validated successfully")
-                
-                # Only create action message if documents were produced
-                if result.data.get("documents") and len(result.data.get("documents", [])) > 0:
-                    await self._createActionMessage(action, result, workflow, action.execResultLabel)
-                else:
-                    # Add validation success log instead of message
-                    self.chatInterface.createWorkflowLog({
-                        "workflowId": workflow.id,
-                        "message": f"✅ Action validation successful: {action.execMethod}.{action.execAction}",
-                        "type": "success",
-                        "status": "running",
-                        "progress": 0,
-                        "agentName": "System"
-                    })
-                    
-            elif validation['status'] == 'retry':
-                action.status = TaskStatus.PENDING  # Keep pending for retry
-                logger.warning(f"Action {action.execMethod}.{action.execAction} needs retry: {validation.get('reason', 'No reason')}")
-                
-                # Add validation retry log
-                self.chatInterface.createWorkflowLog({
-                    "workflowId": workflow.id,
-                    "message": f"🔄 Action validation requires retry: {action.execMethod}.{action.execAction} - {validation.get('reason', 'No reason')}",
-                    "type": "warning",
-                    "status": "running",
-                    "progress": 0,
-                    "agentName": "System"
-                })
-            else:  # fail
-                action.setError(validation.get('reason', 'Action failed validation'))
-                logger.error(f"Action {action.execMethod}.{action.execAction} failed validation: {validation.get('reason', 'No reason')}")
-                
-                # Add validation failure log
-                self.chatInterface.createWorkflowLog({
-                    "workflowId": workflow.id,
-                    "message": f"❌ Action validation failed: {action.execMethod}.{action.execAction} - {validation.get('reason', 'No reason')}",
-                    "type": "error",
-                    "status": "running",
-                    "progress": 0,
-                    "agentName": "System"
-                })
-            
-            return action_result
-            
-        except Exception as e:
-            logger.error(f"Error executing action with validation: {str(e)}")
-            action.setError(str(e))
-            return ActionExecutionResult(
-                success=False,
-                data={},
-                metadata={},
-                error=str(e),
-                actionId=action.id,
-                actionMethod=action.execMethod,
-                actionName=action.execAction,
-                documents=[],
-                validation={
-                    'status': 'fail',
-                    'reason': f'Execution error: {str(e)}',
-                    'confidence': 0.0,
-                    'improvements': [],
-                    'quality_score': 0,
-                    'missing_elements': [],
-                    'suggested_retry_approach': ''
-                }
-            )
-
-    async def retryActionWithImprovements(self, action: TaskAction, previous_result: ActionExecutionResult, improvements: List[str]) -> ActionExecutionResult:
-        """Retry action with improvements based on previous failure"""
-        try:
-            logger.info(f"Retrying action {action.execMethod}.{action.execAction} with improvements")
-            
-            # Apply improvements to action parameters
-            enhanced_action = self._enhanceActionWithImprovements(action, improvements, previous_result)
-            
-            # Execute enhanced action
-            result = await self._executeSingleAction(enhanced_action, self.workflow)
-            
-            # Validate the retry result
-            validator = ActionValidator(self)
-            # Create a proper TaskContext for retry validation
-            retry_context = TaskContext(
-                task_step=TaskStep(
-                    id="retry_context",
-                    description="Action retry",
-                    dependencies=[],
-                    expected_outputs=[],
-                    success_criteria=[],
-                    required_documents=[],
-                    estimated_complexity="low",
-                    ai_prompt=""
-                ),
-                workflow=None,
-                workflow_id=None,
-                available_documents=[],
-                previous_results=[],
-                improvements=[],
-                retry_count=1,
-                previous_action_results=[],
-                previous_review_result=None,
-                is_regeneration=False,
-                failure_patterns=[],
-                failed_actions=[],
-                successful_actions=[]
-            )
-            validation = await validator.validateActionResult(result, enhanced_action, retry_context)
-            
-            # Create ActionExecutionResult model with retry metadata
-            action_result = ActionExecutionResult(
-                success=result.success,
-                data=result.data,
-                metadata=result.metadata,
-                validation=validation,
-                error=result.error,
-                actionId=action.id,
-                actionMethod=action.execMethod,
-                actionName=action.execAction,
-                documents=result.data.get("documents", []),
-                is_retry=True,
-                previous_error=previous_result.error,
-                applied_improvements=improvements
-            )
-            
-            # Log the retry action execution result as JSON (without document content)
-            retry_result_json = {
-                'success': action_result.success,
-                'actionId': action_result.actionId,
-                'actionMethod': action_result.actionMethod,
-                'actionName': action_result.actionName,
-                'validation': action_result.validation,
-                'error': action_result.error,
-                'is_retry': action_result.is_retry,
-                'previous_error': action_result.previous_error,
-                'applied_improvements': action_result.applied_improvements,
-                'documents_count': len(action_result.documents),
-                'document_names': [doc.filename if hasattr(doc, 'filename') else str(doc) for doc in action_result.documents],
-                'data_keys': list(action_result.data.keys()) if isinstance(action_result.data, dict) else [],
-                'metadata_keys': list(action_result.metadata.keys()) if isinstance(action_result.metadata, dict) else []
-            }
-            logger.info(f"Retry action execution result for {action.execMethod}.{action.execAction}: {json.dumps(retry_result_json, indent=2, ensure_ascii=False)}")
-            
-            # Update action status
-            if validation['status'] == 'success':
-                enhanced_action.setSuccess()
-                logger.info(f"Action retry successful: {enhanced_action.execMethod}.{enhanced_action.execAction}")
-            else:
-                enhanced_action.setError(validation.get('reason', 'Retry failed'))
-                logger.error(f"Action retry failed: {enhanced_action.execMethod}.{enhanced_action.execAction}")
-            
-            return action_result
-            
-        except Exception as e:
-            logger.error(f"Error retrying action: {str(e)}")
-            action.setError(str(e))
-            return ActionExecutionResult(
-                success=False,
-                data={},
-                metadata={},
-                error=str(e),
-                actionId=action.id,
-                actionMethod=action.execMethod,
-                actionName=action.execAction,
-                documents=[],
-                is_retry=True,
-                validation={
-                    'status': 'fail',
-                    'reason': f'Retry execution error: {str(e)}',
-                    'confidence': 0.0,
-                    'improvements': [],
-                    'quality_score': 0,
-                    'missing_elements': [],
-                    'suggested_retry_approach': ''
-                }
-            )
-
-    def _enhanceActionWithImprovements(self, action: TaskAction, improvements: List[str], previous_result: ActionExecutionResult) -> TaskAction:
-        """Enhance action parameters based on improvements and previous failure"""
-        enhanced_action = TaskAction(
-            id=action.id,
-            execMethod=action.execMethod,
-            execAction=action.execAction,
-            execParameters=action.execParameters.copy(),  # Copy to avoid modifying original
-            execResultLabel=action.execResultLabel,
-            status=action.status
-        )
-        
-        # Apply improvements based on failure patterns
-        for improvement in improvements:
-            if "incomplete_analysis" in improvement.lower():
-                # Enhance AI prompt for more comprehensive analysis
-                current_prompt = enhanced_action.execParameters.get('aiPrompt', '')
-                enhanced_prompt = current_prompt + "\n\nIMPORTANT: Provide comprehensive, detailed analysis covering all aspects. Be thorough and include all relevant information."
-                enhanced_action.execParameters['aiPrompt'] = enhanced_prompt
-                
-            elif "missing_content" in improvement.lower():
-                # Add content validation to prompt
-                current_prompt = enhanced_action.execParameters.get('aiPrompt', '')
-                enhanced_prompt = current_prompt + "\n\nVALIDATION: Ensure all content is extracted and no information is missed. Provide complete output."
-                enhanced_action.execParameters['aiPrompt'] = enhanced_prompt
-                
-            elif "wrong_format" in improvement.lower():
-                # Add format specification
-                current_prompt = enhanced_action.execParameters.get('aiPrompt', '')
-                enhanced_prompt = current_prompt + "\n\nFORMAT: Provide output in structured, well-organized format with clear sections and proper formatting."
-                enhanced_action.execParameters['aiPrompt'] = enhanced_prompt
-                
-            elif "timeout" in improvement.lower():
-                # Add timeout handling
-                current_prompt = enhanced_action.execParameters.get('aiPrompt', '')
-                enhanced_prompt = current_prompt + "\n\nEFFICIENCY: Provide concise but complete analysis. Focus on key information and avoid unnecessary details."
-                enhanced_action.execParameters['aiPrompt'] = enhanced_prompt
-        
-        # Apply specific improvements from validation
-        validation = previous_result.validation if hasattr(previous_result, 'validation') else {}
-        suggested_approach = validation.get('suggested_retry_approach', '') if isinstance(validation, dict) else ''
-        if suggested_approach:
-            current_prompt = enhanced_action.execParameters.get('aiPrompt', '')
-            enhanced_prompt = current_prompt + f"\n\nRETRY APPROACH: {suggested_approach}"
-            enhanced_action.execParameters['aiPrompt'] = enhanced_prompt
-        
-        return enhanced_action
diff --git a/modules/chat/documents/documentExtraction.py b/modules/chat/documents/documentExtraction.py
index 0ad6188f..fcebf79e 100644
--- a/modules/chat/documents/documentExtraction.py
+++ b/modules/chat/documents/documentExtraction.py
@@ -45,18 +45,96 @@ class DocumentExtraction:
         self._serviceCenter = serviceCenter
 
         self.supportedTypes: Dict[str, Callable[[bytes, str, str], Awaitable[List[ContentItem]]]] = {
+            # Text and data files
             'text/plain': self._processText,
             'text/csv': self._processCsv,
             'application/json': self._processJson,
             'application/xml': self._processXml,
             'text/html': self._processHtml,
             'image/svg+xml': self._processSvg,
+            
+            # Programming languages
+            'application/javascript': self._processText,
+            'application/typescript': self._processText,
+            'text/jsx': self._processText,
+            'text/tsx': self._processText,
+            'text/x-python': self._processText,
+            'text/x-java-source': self._processText,
+            'text/x-c': self._processText,
+            'text/x-c++src': self._processText,
+            'text/x-c++hdr': self._processText,
+            'text/x-csharp': self._processText,
+            'application/x-httpd-php': self._processText,
+            'text/x-ruby': self._processText,
+            'text/x-go': self._processText,
+            'text/x-rust': self._processText,
+            'text/x-swift': self._processText,
+            'text/x-kotlin': self._processText,
+            'text/x-scala': self._processText,
+            'text/x-r': self._processText,
+            'text/x-matlab': self._processText,
+            'text/x-perl': self._processText,
+            'application/x-sh': self._processText,
+            'application/x-powershell': self._processText,
+            'application/x-msdos-program': self._processText,
+            'text/vbscript': self._processText,
+            'text/x-lua': self._processText,
+            'application/sql': self._processText,
+            'application/dart': self._processText,
+            'text/x-elm': self._processText,
+            'text/x-clojure': self._processText,
+            'text/x-haskell': self._processText,
+            'text/x-fsharp': self._processText,
+            'text/x-ocaml': self._processText,
+            
+            # Web technologies
+            'text/css': self._processText,
+            'text/x-scss': self._processText,
+            'text/x-sass': self._processText,
+            'text/x-less': self._processText,
+            'text/x-vue': self._processText,
+            'text/x-svelte': self._processText,
+            'text/x-astro': self._processText,
+            
+            # Configuration and build files
+            'application/x-yaml': self._processText,
+            'application/toml': self._processText,
+            'text/x-dockerfile': self._processText,
+            'text/x-makefile': self._processText,
+            'text/x-cmake': self._processText,
+            'text/x-gradle': self._processText,
+            'text/x-maven': self._processText,
+            
+            # Documentation and markup
+            'text/markdown': self._processText,
+            'text/x-rst': self._processText,
+            'application/x-tex': self._processText,
+            'text/x-bibtex': self._processText,
+            'text/asciidoc': self._processText,
+            'text/x-wiki': self._processText,
+            
+            # Images
             'image/jpeg': self._processImage,
             'image/png': self._processImage,
             'image/gif': self._processImage,
+            'image/webp': self._processImage,
+            'image/bmp': self._processImage,
+            'image/tiff': self._processImage,
+            'image/x-icon': self._processImage,
+            
+            # Documents
             'application/pdf': self._processPdf,
             'application/vnd.openxmlformats-officedocument.wordprocessingml.document': self._processDocx,
-            'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet': self._processXlsx
+            'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet': self._processXlsx,
+            'application/vnd.openxmlformats-officedocument.presentationml.presentation': self._processPptx,
+            'application/vnd.oasis.opendocument.text': self._processText,
+            'application/vnd.oasis.opendocument.spreadsheet': self._processText,
+            'application/vnd.oasis.opendocument.presentation': self._processText,
+            
+            # Legacy Office formats
+            'application/msword': self._processLegacyDoc,
+            'application/vnd.ms-excel': self._processLegacyXls,
+            'application/vnd.ms-powerpoint': self._processLegacyPpt
         }
         
         self.chunkSizes = {
@@ -66,6 +144,12 @@ class DocumentExtraction:
             "json": 40000,        # JSON data
             "xml": 40000,         # XML data
             "html": 40000,        # HTML content
+            "markdown": 40000,    # Markdown content
+            "code": 80000,        # Programming code (increased for better preservation)
+            "script": 80000,      # Script files (increased for better preservation)
+            "javascript": 80000,  # JavaScript files specifically
+            "typescript": 80000,  # TypeScript files specifically
+            "config": 40000,      # Configuration files
             "image": 1024 * 1024,  # 1MB for images
             "video": 5 * 1024 * 1024,  # 5MB for video chunks
             "binary": 1024 * 1024,  # 1MB for binary data
@@ -75,6 +159,65 @@ class DocumentExtraction:
             "svg": 40000          # SVG content
         }
     
+    def _robustTextDecode(self, fileData: bytes, filename: str = "unknown") -> str:
+        """
+        Robustly decode text data with multiple encoding fallbacks.
+        
+        Args:
+            fileData: Raw bytes to decode
+            filename: Filename for logging purposes
+            
+        Returns:
+            Decoded text string
+            
+        Raises:
+            FileProcessingError: If all decoding attempts fail
+        """
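+        # Try multiple encoding options in order of likelihood (NOTE(review): 'latin-1' and 'cp1252' are aliases of 'iso-8859-1' and 'windows-1252', so they are redundant)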
+        encodings_to_try = ['utf-8', 'windows-1252', 'iso-8859-1', 'latin-1', 'cp1252']
+        content = None
+        
+        # First try UTF-8 (most common)
+        try:
+            content = fileData.decode('utf-8')
+
+            return content
+        except UnicodeDecodeError:
+            pass
+        
+        # Try other encodings
+        for encoding in encodings_to_try[1:]:
+            try:
+                content = fileData.decode(encoding)
+    
+                return content
+            except UnicodeDecodeError:
+                continue
+        
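+        # If all encodings fail, try with error handling (NOTE(review): 'iso-8859-1' above accepts every byte sequence, so this fallback looks unreachable - confirm)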
+        try:
+            # Try with chardet for automatic detection
+            import chardet
+            detected = chardet.detect(fileData)
+            if detected['confidence'] > 0.7:
+                detected_encoding = detected['encoding']
+                content = fileData.decode(detected_encoding, errors='replace')
+    
+                return content
+            else:
+                # Last resort: decode with replacement characters
+                content = fileData.decode('utf-8', errors='replace')
+                logger.warning(f"{filename}: decoded with UTF-8 and replacement characters due to low encoding confidence")
+                return content
+        except ImportError:
+            # chardet not available, use replacement characters
+            content = fileData.decode('utf-8', errors='replace')
+            logger.warning(f"{filename}: decoded with UTF-8 and replacement characters (chardet not available)")
+            return content
+        
+        # This should never be reached, but just in case
+        raise FileProcessingError(f"Failed to decode {filename} with any encoding")
+
     def initialize(self) -> None:
         """Initialize the document processor."""
         pass
@@ -119,9 +262,9 @@ class DocumentExtraction:
 
 
 
-    async def processFileData(self, fileData: bytes, filename: str, mimeType: str, base64Encoded: bool = False, prompt: str = None, documentId: str = None) -> ExtractedContent:
+    async def processFileData(self, fileData: bytes, filename: str, mimeType: str, base64Encoded: bool = False, prompt: str = None, documentId: str = None, enableAI: bool = True) -> ExtractedContent:
         """
-        Process file data directly and extract its contents with AI processing.
+        Process file data directly and extract its contents with optional AI processing.
         
         Args:
             fileData: Raw file data as bytes
@@ -129,6 +272,8 @@ class DocumentExtraction:
             mimeType: MIME type of the file
             base64Encoded: Whether the data is base64 encoded
             prompt: Prompt for AI content extraction
+            documentId: Optional document ID
+            enableAI: Whether to enable AI processing (default: True)
             
         Returns:
             ExtractedContent containing the processed content
@@ -150,14 +295,16 @@ class DocumentExtraction:
                 processor = self.supportedTypes[mimeType]
                 contentItems = await processor(fileData, filename, mimeType)
             
-            # Process with AI if prompt provided
-            if prompt and contentItems:
+            # Process with AI if prompt provided and AI is enabled
+            if enableAI and prompt and contentItems:
                 try:
                     # Process each content item with AI
                     processedItems = await self._aiDataExtraction(contentItems, prompt)
                     contentItems = processedItems
                 except Exception as e:
                     logger.error(f"Error processing content with AI: {str(e)}")
+            elif not enableAI:
+                logger.debug(f"AI processing disabled for {filename}, returning raw extracted content")
             
             return ExtractedContent(
                 id=documentId if documentId else str(uuid.uuid4()),
@@ -171,16 +318,35 @@ class DocumentExtraction:
 
     
     async def _processText(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
-        """Process text document"""
+        """Process text document with robust encoding detection and complete content extraction"""
         try:
-            content = fileData.decode('utf-8')
+            content = self._robustTextDecode(fileData, filename)
+            
+            # Guard against empty or whitespace-only content (completeness itself is not verified here)
+            if not content or len(content.strip()) == 0:
+                logger.warning(f"Empty content extracted from {filename}")
+                return [ContentItem(
+                    label="empty",
+                    data="[Empty file or no readable content]",
+                    metadata=ContentMetadata(
+                        size=0,
+                        pages=1,
+                        mimeType="text/plain",
+                        base64Encoded=False
+                    )
+                )]
+            
+            # Compute the UTF-8 byte size once for the metadata below (nothing is logged here)
+            content_size = len(content.encode('utf-8'))
+
+            
             # Use documentUtility for mime type
             mime_type = getMimeTypeFromExtension(getFileExtension(filename), self._serviceCenter)
             return [ContentItem(
                 label="main",
                 data=content,
                 metadata=ContentMetadata(
-                    size=len(content.encode('utf-8')),
+                    size=content_size,
                     pages=1,
                     mimeType=mime_type,
                     base64Encoded=False
@@ -191,9 +357,9 @@ class DocumentExtraction:
             raise FileProcessingError(f"Failed to process text document: {str(e)}")
     
     async def _processCsv(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
-        """Process CSV document"""
+        """Process CSV document with robust encoding detection"""
         try:
-            content = fileData.decode('utf-8')
+            content = self._robustTextDecode(fileData, filename)
             mime_type = getMimeTypeFromExtension(getFileExtension(filename), self._serviceCenter)
             return [ContentItem(
                 label="main",
@@ -210,9 +376,9 @@ class DocumentExtraction:
             raise FileProcessingError(f"Failed to process CSV document: {str(e)}")
     
     async def _processJson(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
-        """Process JSON document"""
+        """Process JSON document with robust encoding detection"""
         try:
-            content = fileData.decode('utf-8')
+            content = self._robustTextDecode(fileData, filename)
             jsonData = json.loads(content)
             mime_type = getMimeTypeFromExtension(getFileExtension(filename), self._serviceCenter)
             return [ContentItem(
@@ -230,9 +396,9 @@ class DocumentExtraction:
             raise FileProcessingError(f"Failed to process JSON document: {str(e)}")
     
     async def _processXml(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
-        """Process XML document"""
+        """Process XML document with robust encoding detection"""
         try:
-            content = fileData.decode('utf-8')
+            content = self._robustTextDecode(fileData, filename)
             mime_type = getMimeTypeFromExtension(getFileExtension(filename), self._serviceCenter)
             return [ContentItem(
                 label="main",
@@ -249,9 +415,9 @@ class DocumentExtraction:
             raise FileProcessingError(f"Failed to process XML document: {str(e)}")
     
     async def _processHtml(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
-        """Process HTML document"""
+        """Process HTML document with robust encoding detection"""
         try:
-            content = fileData.decode('utf-8')
+            content = self._robustTextDecode(fileData, filename)
             mime_type = getMimeTypeFromExtension(getFileExtension(filename), self._serviceCenter)
             return [ContentItem(
                 label="main",
@@ -268,19 +434,92 @@ class DocumentExtraction:
             raise FileProcessingError(f"Failed to process HTML document: {str(e)}")
     
     async def _processSvg(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
-        """Process SVG document"""
+        """Process SVG document with robust encoding detection and meaningful content extraction"""
         try:
-            content = fileData.decode('utf-8')
-            isSvg = "<svg" in content.lower()
+            content = self._robustTextDecode(fileData, filename)
+            
+            # Check if it's actually SVG content
+            if "<svg" not in content.lower():
+                return [ContentItem(
+                    label="invalid_svg",
+                    data="Not a valid SVG file",
+                    metadata=ContentMetadata(
+                        size=len(content.encode('utf-8')),
+                        mimeType="text/plain",
+                        base64Encoded=False,
+                        error="Invalid SVG content"
+                    )
+                )]
+            
+            # Extract meaningful content from SVG
+            meaningful_content = []
+            
+            try:
+                # Parse SVG XML to extract meaningful elements
+                root = ET.fromstring(content)
+                
+                # Extract title
+                title_elem = root.find('.//{*}title')
+                if title_elem is not None and title_elem.text:
+                    meaningful_content.append(f"Title: {title_elem.text.strip()}")
+                
+                # Extract description
+                desc_elem = root.find('.//{*}desc')
+                if desc_elem is not None and desc_elem.text:
+                    meaningful_content.append(f"Description: {desc_elem.text.strip()}")
+                
+                # Extract text elements
+                text_elements = root.findall('.//{*}text')
+                for i, text_elem in enumerate(text_elements):
+                    if text_elem.text and text_elem.text.strip():
+                        meaningful_content.append(f"Text {i+1}: {text_elem.text.strip()}")
+                
+                # Extract metadata
+                metadata_elem = root.find('.//{*}metadata')
+                if metadata_elem is not None:
+                    for child in metadata_elem:
+                        if child.text and child.text.strip():
+                            meaningful_content.append(f"Metadata - {child.tag}: {child.text.strip()}")
+                
+                # Extract viewBox and dimensions
+                viewbox = root.get('viewBox')
+                if viewbox:
+                    meaningful_content.append(f"ViewBox: {viewbox}")
+                
+                width = root.get('width')
+                height = root.get('height')
+                if width and height:
+                    meaningful_content.append(f"Dimensions: {width} x {height}")
+                
+                # Count elements
+                element_count = len(root.findall('.//*'))
+                meaningful_content.append(f"Total elements: {element_count}")
+                
+                # If no meaningful content extracted, provide a summary
+                if not meaningful_content:
+                    meaningful_content.append("SVG file contains vector graphics")
+                    meaningful_content.append(f"Root element: {root.tag}")
+                    meaningful_content.append(f"Number of child elements: {len(root)}")
+                
+            except ET.ParseError as parseError:
+                logger.warning(f"SVG parsing failed, using raw content: {str(parseError)}")
+                # If XML parsing fails, extract basic information
+                meaningful_content.append("SVG file (XML parsing failed)")
+                meaningful_content.append(f"File size: {len(content)} characters")
+                if "<svg" in content.lower():
+                    meaningful_content.append("Contains SVG markup")
+            
+            # Combine all meaningful content
+            final_content = "\n".join(meaningful_content)
+            
             mime_type = getMimeTypeFromExtension(getFileExtension(filename), self._serviceCenter)
             return [ContentItem(
-                label="main",
-                data=content if isSvg else None,
+                label="svg_content",
+                data=final_content,
                 metadata=ContentMetadata(
-                    size=len(content.encode('utf-8')),
-                    mimeType=mime_type,
-                    base64Encoded=False,
-                    error=None if isSvg else "Invalid SVG content"
+                    size=len(final_content.encode('utf-8')),
+                    mimeType="text/plain",
+                    base64Encoded=False
                 )
             )]
         except Exception as e:
@@ -296,6 +535,41 @@ class DocumentExtraction:
             
             with io.BytesIO(fileData) as imgStream:
                 img = Image.open(imgStream)
+                
+                # For GIF files, provide descriptive information instead of AI processing
+                if mimeType == "image/gif":
+                    try:
+                        frame_count = getattr(img, 'n_frames', 1)
+                        duration = getattr(img, 'duration', 0)
+                        
+                        # Create a descriptive text about the GIF
+                        gif_description = f"GIF Image Analysis:\n"
+                        gif_description += f"- Dimensions: {img.width} x {img.height} pixels\n"
+                        gif_description += f"- Frame count: {frame_count}\n"
+                        gif_description += f"- Color mode: {img.mode}\n"
+                        if duration > 0:
+                            gif_description += f"- Duration: {duration}ms\n"
+                        gif_description += f"- File size: {len(fileData)} bytes\n"
+                        gif_description += f"- Format: {img.format}\n\n"
+                        gif_description += f"Note: This is an animated GIF image. The AI cannot directly analyze image content, but the file contains {frame_count} frame(s) of animation."
+                        
+                        return [ContentItem(
+                            label="gif_analysis",
+                            data=gif_description,
+                            metadata=ContentMetadata(
+                                size=len(gif_description.encode('utf-8')),
+                                width=img.width,
+                                height=img.height,
+                                colorMode=img.mode,
+                                mimeType="text/plain",
+                                base64Encoded=False
+                            )
+                        )]
+                    except Exception as gifError:
+                        logger.warning(f"GIF processing failed: {str(gifError)}")
+                        # Fall through to the generic image handling below
+                        pass
+                
                 metadata = ContentMetadata(
                     size=len(fileData),
                     width=img.width,
@@ -388,46 +662,199 @@ class DocumentExtraction:
             raise FileProcessingError(f"Failed to process PDF document: {str(e)}")
     
     async def _processDocx(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
-        """Process Word document"""
+        """Process Word document with enhanced formatting preservation"""
         try:
             self._loadOfficeExtractor()
             if not officeExtractorLoaded:
                 raise FileProcessingError("Office extraction libraries not available")
             
+            contentItems = []
+            
             with io.BytesIO(fileData) as docxStream:
                 doc = docx.Document(docxStream)
                 
-                # Extract text
-                fullText = []
+                # Extract document properties
+                doc_properties = []
+                if doc.core_properties.title:
+                    doc_properties.append(f"Title: {doc.core_properties.title}")
+                if doc.core_properties.author:
+                    doc_properties.append(f"Author: {doc.core_properties.author}")
+                if doc.core_properties.subject:
+                    doc_properties.append(f"Subject: {doc.core_properties.subject}")
+                if doc.core_properties.keywords:
+                    doc_properties.append(f"Keywords: {doc.core_properties.keywords}")
+                if doc.core_properties.comments:
+                    doc_properties.append(f"Comments: {doc.core_properties.comments}")
+                
+                # Extract main content with formatting
+                main_content = []
+                
+                # Process paragraphs with formatting
                 for para in doc.paragraphs:
-                    fullText.append(para.text)
+                    if para.text.strip():
+                        # Get paragraph style
+                        style_name = para.style.name if para.style else "Normal"
+                        
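+                        # Check for heading styles (NOTE(review): int(level) below raises ValueError when the style name has no purely numeric suffix, e.g. "Heading")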
+                        if style_name.startswith('Heading'):
+                            level = style_name.replace('Heading ', '')
+                            main_content.append(f"\n{'#' * int(level)} {para.text}")
+                        else:
+                            # Check for bold, italic, underline formatting
+                            formatted_text = para.text
+                            if para.runs:
+                                # Process individual runs for formatting
+                                run_texts = []
+                                for run in para.runs:
+                                    run_text = run.text
+                                    if run.bold:
+                                        run_text = f"**{run_text}**"
+                                    if run.italic:
+                                        run_text = f"*{run_text}*"
+                                    if run.underline:
+                                        run_text = f"__{run_text}__"
+                                    run_texts.append(run_text)
+                                formatted_text = ''.join(run_texts)
+                            
+                            main_content.append(formatted_text)
                 
-                # Extract tables
+                # Extract tables with better formatting
+                table_count = 0
                 for table in doc.tables:
-                    for row in table.rows:
-                        rowText = []
-                        for cell in row.cells:
-                            rowText.append(cell.text)
-                        fullText.append(" | ".join(rowText))
+                    table_count += 1
+                    main_content.append(f"\n\n--- Table {table_count} ---")
+                    
+                    # Get table headers (first row)
+                    if table.rows:
+                        header_row = table.rows[0]
+                        headers = [cell.text.strip() for cell in header_row.cells]
+                        main_content.append("| " + " | ".join(headers) + " |")
+                        main_content.append("|" + "|".join(["---"] * len(headers)) + "|")
+                        
+                        # Process data rows
+                        for row in table.rows[1:]:
+                            row_data = [cell.text.strip() for cell in row.cells]
+                            main_content.append("| " + " | ".join(row_data) + " |")
+                    
+                    main_content.append("--- End Table ---\n")
                 
-                content = "\n".join(fullText)
+                # Extract headers and footers if available
+                try:
+                    # Check for headers and footers in sections
+                    for section in doc.sections:
+                        # Header
+                        if section.header:
+                            header_text = []
+                            for para in section.header.paragraphs:
+                                if para.text.strip():
+                                    header_text.append(f"[Header] {para.text}")
+                            if header_text:
+                                main_content.insert(0, "\n".join(header_text) + "\n")
+                        
+                        # Footer
+                        if section.footer:
+                            footer_text = []
+                            for para in section.footer.paragraphs:
+                                if para.text.strip():
+                                    footer_text.append(f"[Footer] {para.text}")
+                            if footer_text:
+                                main_content.append("\n" + "\n".join(footer_text))
+                except Exception as header_footer_error:
+                    logger.debug(f"Could not extract headers/footers: {header_footer_error}")
                 
-                return [ContentItem(
+                # Extract comments if available
+                try:
+                    comments = []
+                    for comment in doc.part.comments_part.comments if doc.part.comments_part else []:
+                        comment_text = comment.text.strip()
+                        if comment_text:
+                            comments.append(f"[Comment] {comment_text}")
+                    
+                    if comments:
+                        main_content.append("\n\n--- Comments ---")
+                        main_content.extend(comments)
+                        main_content.append("--- End Comments ---")
+                except Exception as comment_error:
+                    logger.debug(f"Could not extract comments: {comment_error}")
+                
+                # Combine all content
+                if doc_properties:
+                    main_content.insert(0, "--- Document Properties ---\n" + "\n".join(doc_properties) + "\n--- End Properties ---\n")
+                
+                final_content = "\n".join(main_content)
+                
+                # Create main content item
+                contentItems.append(ContentItem(
                     label="main",
-                    data=content,
+                    data=final_content,
                     metadata=ContentMetadata(
-                        size=len(content.encode('utf-8')),
+                        size=len(final_content.encode('utf-8')),
                         pages=len(doc.paragraphs),
+                        mimeType="text/markdown",  # Use markdown for better formatting
+                        base64Encoded=False
+                    )
+                ))
+                
+                # Create separate content item for tables only (if tables exist)
+                if table_count > 0:
+                    table_content = []
+                    for i, table in enumerate(doc.tables):
+                        table_content.append(f"Table {i+1}:")
+                        if table.rows:
+                            # CSV format for tables
+                            for row in table.rows:
+                                row_data = [f'"{cell.text.strip()}"' for cell in row.cells]
+                                table_content.append(",".join(row_data))
+                        table_content.append("")  # Empty line between tables
+                    
+                    table_text = "\n".join(table_content)
+                    contentItems.append(ContentItem(
+                        label="tables",
+                        data=table_text,
+                        metadata=ContentMetadata(
+                            size=len(table_text.encode('utf-8')),
+                            pages=1,
+                            mimeType="text/csv",
+                            base64Encoded=False
+                        )
+                    ))
+                
+                # Create separate content item for document structure
+                structure_info = []
+                structure_info.append(f"Document Structure:")
+                structure_info.append(f"- Paragraphs: {len(doc.paragraphs)}")
+                structure_info.append(f"- Tables: {table_count}")
+                structure_info.append(f"- Sections: {len(doc.sections)}")
+                
+                # Count different paragraph styles
+                style_counts = {}
+                for para in doc.paragraphs:
+                    style_name = para.style.name if para.style else "Normal"
+                    style_counts[style_name] = style_counts.get(style_name, 0) + 1
+                
+                for style, count in style_counts.items():
+                    structure_info.append(f"- {style}: {count}")
+                
+                structure_text = "\n".join(structure_info)
+                contentItems.append(ContentItem(
+                    label="structure",
+                    data=structure_text,
+                    metadata=ContentMetadata(
+                        size=len(structure_text.encode('utf-8')),
+                        pages=1,
                         mimeType="text/plain",
                         base64Encoded=False
                     )
-                )]
+                ))
+            
+            return contentItems
+            
         except Exception as e:
             logger.error(f"Error processing Word document: {str(e)}")
             raise FileProcessingError(f"Failed to process Word document: {str(e)}")
     
     async def _processXlsx(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
-        """Process Excel document"""
+        """Process Excel document with enhanced table extraction and metadata"""
         try:
             self._loadOfficeExtractor()
             if not officeExtractorLoaded:
@@ -436,38 +863,494 @@ class DocumentExtraction:
             contentItems = []
             
             with io.BytesIO(fileData) as xlsxStream:
-                workbook = openpyxl.load_workbook(xlsxStream, data_only=True)
+                try:
+                    workbook = openpyxl.load_workbook(xlsxStream, data_only=True)
+        
+                except Exception as load_error:
+                    logger.error(f"Failed to load Excel workbook {filename}: {str(load_error)}")
+                    raise FileProcessingError(f"Failed to load Excel workbook: {str(load_error)}")
                 
-                for sheetName in workbook.sheetnames:
-                    sheet = workbook[sheetName]
-                    csvRows = []
-                    for row in sheet.iter_rows():
-                        csvRow = []
-                        for cell in row:
-                            value = cell.value
-                            if value is None:
-                                csvRow.append("")
+                # Extract workbook properties safely
+                workbook_props = []
+                try:
+                    if hasattr(workbook, 'properties'):
+                        props = workbook.properties
+                        
+                        
+                        # Log all available attributes for debugging
+                        for attr in dir(props):
+                            if not attr.startswith('_'):  # Skip private attributes
+                                try:
+                                    value = getattr(props, attr)
+                                    if value is not None:
+                                        pass
+                                except Exception as attr_error:
+                                    logger.debug(f"Could not read property {attr}: {str(attr_error)}")
+                        
+                        # Check each property safely before accessing
+                        if hasattr(props, 'title') and props.title:
+                            workbook_props.append(f"Title: {props.title}")
+                        if hasattr(props, 'creator') and props.creator:  # 'creator' is the correct attribute
+                            workbook_props.append(f"Author: {props.creator}")
+                        if hasattr(props, 'subject') and props.subject:
+                            workbook_props.append(f"Subject: {props.subject}")
+                        if hasattr(props, 'keywords') and props.keywords:
+                            workbook_props.append(f"Keywords: {props.keywords}")
+                        if hasattr(props, 'comments') and props.comments:
+                            workbook_props.append(f"Comments: {props.comments}")
+                        if hasattr(props, 'category') and props.category:
+                            workbook_props.append(f"Category: {props.category}")
+                        if hasattr(props, 'description') and props.description:
+                            workbook_props.append(f"Description: {props.description}")
+                        if hasattr(props, 'lastModifiedBy') and props.lastModifiedBy:
+                            workbook_props.append(f"Last Modified By: {props.lastModifiedBy}")
+                        if hasattr(props, 'created') and props.created:
+                            workbook_props.append(f"Created: {props.created}")
+                        if hasattr(props, 'modified') and props.modified:
+                            workbook_props.append(f"Modified: {props.modified}")
+                        
+                        # Try alternative property names that might exist
+                        if hasattr(props, 'author') and props.author:  # Some versions use 'author'
+                            workbook_props.append(f"Author (alt): {props.author}")
+                        if hasattr(props, 'manager') and props.manager:
+                            workbook_props.append(f"Manager: {props.manager}")
+                        if hasattr(props, 'company') and props.company:
+                            workbook_props.append(f"Company: {props.company}")
+                        if hasattr(props, 'status') and props.status:
+                            workbook_props.append(f"Status: {props.status}")
+                        if hasattr(props, 'revision') and props.revision:
+                            workbook_props.append(f"Revision: {props.revision}")
+                        
+                    else:
+                        # Try to find properties in other locations
+                        for attr in dir(workbook):
+                            if not attr.startswith('_') and 'prop' in attr.lower():
+                                pass
+                except Exception as props_error:
+                    logger.warning(f"Could not extract workbook properties: {str(props_error)}")
+                    workbook_props = []
+                
+                # Create workbook overview content item
+                overview_content = []
+                overview_content.append("Excel Workbook Overview")
+                overview_content.append("=" * 30)
+                overview_content.append(f"Total Sheets: {len(workbook.sheetnames)}")
+                overview_content.append(f"Sheet Names: {', '.join(workbook.sheetnames)}")
+                
+                if workbook_props:
+                    overview_content.append("\nWorkbook Properties:")
+                    overview_content.extend(workbook_props)
+                
+                overview_text = "\n".join(overview_content)
+                contentItems.append(ContentItem(
+                    label="overview",
+                    data=overview_text,
+                    metadata=ContentMetadata(
+                        size=len(overview_text.encode('utf-8')),
+                        pages=1,
+                        mimeType="text/plain",
+                        base64Encoded=False
+                    )
+                ))
+                
+                # Process each sheet
+                for sheetIndex, sheetName in enumerate(workbook.sheetnames):
+                    try:
+                        sheet = workbook[sheetName]
+                        logger.debug(f"Processing sheet {sheetIndex + 1}: {sheetName}")
+                        
+                        # Get sheet metadata
+                        sheet_metadata = []
+                        sheet_metadata.append(f"Sheet: {sheetName}")
+                        
+                        try:
+                            sheet_metadata.append(f"Dimensions: {sheet.dimensions}")
+                            sheet_metadata.append(f"Max Row: {sheet.max_row}")
+                            sheet_metadata.append(f"Max Column: {sheet.max_column}")
+                        except Exception as dim_error:
+                            logger.warning(f"Could not get sheet dimensions for {sheetName}: {str(dim_error)}")
+                            sheet_metadata.append("Dimensions: Unable to determine")
+                            sheet_metadata.append("Max Row: Unknown")
+                            sheet_metadata.append("Max Column: Unknown")
+                        
+                        # Check for sheet properties safely
+                        try:
+                            if hasattr(sheet, 'sheet_properties'):
+                                sheet_props = sheet.sheet_properties
+                                if hasattr(sheet_props, 'tabColor') and sheet_props.tabColor:
+                                    sheet_metadata.append(f"Tab Color: {sheet_props.tabColor}")
+                                if hasattr(sheet_props, 'hidden') and sheet_props.hidden:
+                                    sheet_metadata.append("Hidden: Yes")
+                                if hasattr(sheet_props, 'name') and sheet_props.name:
+                                    sheet_metadata.append(f"Internal Name: {sheet_props.name}")
+                        except Exception as sheet_props_error:
+                            logger.debug(f"Could not extract sheet properties for {sheetName}: {str(sheet_props_error)}")
+                        
+                        # Extract data from sheet
+                        sheet_data = []
+                        
+                        try:
+                            # Find the actual data range (skip empty rows/columns)
+                            min_row = sheet.min_row
+                            max_row = sheet.max_row
+                            min_col = sheet.min_column
+                            max_col = sheet.max_column
+                            
+                            # Adjust for empty sheets
+                            if max_row == 0 or max_col == 0:
+                                sheet_metadata.append("Content: Empty sheet")
+                                sheet_data.append("(Empty sheet)")
                             else:
-                                csvRow.append(str(value).replace('"', '""'))
-                        csvRows.append(','.join(f'"{cell}"' for cell in csvRow))
+                                # Extract all data with proper CSV formatting
+                                for row_num in range(min_row, max_row + 1):
+                                    row_data = []
+                                    for col_num in range(min_col, max_col + 1):
+                                        try:
+                                            cell = sheet.cell(row=row_num, column=col_num)
+                                            cell_value = cell.value
+                                            
+                                            # Handle different data types
+                                            if cell_value is None:
+                                                row_data.append("")
+                                            elif isinstance(cell_value, (int, float)):
+                                                row_data.append(str(cell_value))
+                                            elif isinstance(cell_value, datetime):
+                                                row_data.append(cell_value.strftime("%Y-%m-%d %H:%M:%S"))
+                                            else:
+                                                # Escape quotes and wrap in quotes for CSV
+                                                cell_str = str(cell_value).replace('"', '""')
+                                                row_data.append(f'"{cell_str}"')
+                                        except Exception as cell_error:
+                                            logger.debug(f"Error processing cell at row {row_num}, col {col_num}: {str(cell_error)}")
+                                            row_data.append("(Error reading cell)")
+                                    
+                                    sheet_data.append(",".join(row_data))
+                                
+                                sheet_metadata.append(f"Data Rows: {len(sheet_data)}")
+                                sheet_metadata.append(f"Data Columns: {max_col - min_col + 1}")
+                        except Exception as data_error:
+                            logger.warning(f"Could not extract data from sheet {sheetName}: {str(data_error)}")
+                            sheet_metadata.append("Content: Error extracting data")
+                            sheet_data.append(f"(Error: {str(data_error)})")
+                        
+                        # Create sheet content item
+                        sheet_content = "\n".join(sheet_metadata) + "\n\n" + "\n".join(sheet_data)
+                        contentItems.append(ContentItem(
+                            label=f"sheet_{sheetIndex + 1}_{sheetName}",
+                            data=sheet_content,
+                            metadata=ContentMetadata(
+                                size=len(sheet_content.encode('utf-8')),
+                                pages=1,
+                                mimeType="text/csv",
+                                base64Encoded=False
+                            )
+                        ))
+                        
+                        # Create separate CSV file for each sheet (clean format)
+                        if sheet_data and sheet_data[0].strip() and not sheet_data[0].startswith("(Error"):
+                            # Create clean CSV without metadata
+                            csv_content = "\n".join(sheet_data)
+                            contentItems.append(ContentItem(
+                                label=f"csv_{sheetIndex + 1}_{sheetName}",
+                                data=csv_content,
+                                metadata=ContentMetadata(
+                                    size=len(csv_content.encode('utf-8')),
+                                    pages=1,
+                                    mimeType="text/csv",
+                                    base64Encoded=False
+                                )
+                            ))
+                        
+                    except Exception as sheet_error:
+                        logger.error(f"Error processing sheet {sheetName}: {str(sheet_error)}")
+                        # Create error content item for this sheet
+                        error_content = f"Error processing sheet: {sheetName}\nError: {str(sheet_error)}"
+                        contentItems.append(ContentItem(
+                            label=f"error_sheet_{sheetIndex + 1}_{sheetName}",
+                            data=error_content,
+                            metadata=ContentMetadata(
+                                size=len(error_content.encode('utf-8')),
+                                pages=1,
+                                mimeType="text/plain",
+                                base64Encoded=False
+                            )
+                        ))
+                
+                # Create summary content item
+                try:
+                    summary_content = []
+                    summary_content.append("Excel Processing Summary")
+                    summary_content.append("=" * 30)
+                    summary_content.append(f"Total Sheets Processed: {len(workbook.sheetnames)}")
                     
-                    content = "\n".join(csvRows)
+                    total_rows = 0
+                    total_cells = 0
+                    for sheetName in workbook.sheetnames:
+                        try:
+                            sheet = workbook[sheetName]
+                            if hasattr(sheet, 'max_row') and hasattr(sheet, 'max_column'):
+                                if sheet.max_row > 0 and sheet.max_column > 0:
+                                    sheet_rows = sheet.max_row
+                                    sheet_cells = sheet.max_row * sheet.max_column
+                                    total_rows += sheet_rows
+                                    total_cells += sheet_cells
+                                    summary_content.append(f"- {sheetName}: {sheet_rows} rows, {sheet_cells} cells")
+                        except Exception as summary_error:
+                            logger.debug(f"Could not get summary for sheet {sheetName}: {str(summary_error)}")
+                            summary_content.append(f"- {sheetName}: Error getting summary")
+                    
+                    summary_content.append(f"\nTotal Rows: {total_rows}")
+                    summary_content.append(f"Total Cells: {total_cells}")
+                    
+                    summary_text = "\n".join(summary_content)
                     contentItems.append(ContentItem(
-                        label=sheetName,
-                        data=content,
+                        label="summary",
+                        data=summary_text,
                         metadata=ContentMetadata(
-                            size=len(content.encode('utf-8')),
+                            size=len(summary_text.encode('utf-8')),
                             pages=1,
-                            mimeType="text/csv",
+                            mimeType="text/plain",
                             base64Encoded=False
                         )
                     ))
+                except Exception as summary_error:
+                    logger.warning(f"Could not create summary: {str(summary_error)}")
             
             return contentItems
+            
         except Exception as e:
             logger.error(f"Error processing Excel document: {str(e)}")
             raise FileProcessingError(f"Failed to process Excel document: {str(e)}")
     
+    async def _processLegacyDoc(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
+        """Wrap a legacy Word .doc file without parsing its text.
+
+        Returns two items: a plain-text "info" note describing the format
+        limitation, and a "binary" item holding fileData base64-encoded.
+        Raises FileProcessingError, chained to the underlying exception.
+        """
+        try:
+            # No .doc parser is called here; the note tells the consumer why.
+            contentItems = []
+            info_content = f"""Legacy Word Document (.doc) - {filename}
+
+Note: This is a legacy .doc format file. For better content extraction, 
+consider converting to .docx format.
+
+File size: {len(fileData)} bytes
+Format: Microsoft Word 97-2003 Document
+
+Content extraction from .doc files requires specialized tools like:
+- antiword (Linux/Unix)
+- catdoc (Linux/Unix)
+- Microsoft Word (for conversion)
+
+The raw binary content is available but not human-readable."""
+
+            contentItems.append(ContentItem(
+                label="info",
+                data=info_content,
+                metadata=ContentMetadata(
+                    size=len(info_content.encode('utf-8')),
+                    pages=1,
+                    mimeType="text/plain",
+                    base64Encoded=False
+                )
+            ))
+
+            # Ship the untouched bytes too so a later stage can still convert them
+            contentItems.append(ContentItem(
+                label="binary",
+                data=base64.b64encode(fileData).decode('utf-8'),
+                metadata=ContentMetadata(
+                    size=len(fileData),
+                    mimeType=mimeType,
+                    base64Encoded=True
+                )
+            ))
+            return contentItems
+        except Exception as e:
+            logger.error(f"Error processing legacy Word document: {str(e)}")
+            raise FileProcessingError(f"Failed to process legacy Word document: {str(e)}") from e
+    
+    async def _processLegacyXls(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
+        """Wrap a legacy Excel .xls file without reading its cells.
+
+        Returns two items: a plain-text "info" note describing the format
+        limitation, and a "binary" item holding fileData base64-encoded.
+        Raises FileProcessingError, chained to the underlying exception.
+        """
+        try:
+            # No .xls reader is called here; the note tells the consumer why.
+            contentItems = []
+            info_content = f"""Legacy Excel Document (.xls) - {filename}
+
+Note: This is a legacy .xls format file. For better content extraction, 
+consider converting to .xlsx format.
+
+File size: {len(fileData)} bytes
+Format: Microsoft Excel 97-2003 Workbook
+
+Content extraction from .xls files requires specialized tools like:
+- xlrd (Python library)
+- Microsoft Excel (for conversion)
+- LibreOffice (for conversion)
+
+The raw binary content is available but not human-readable."""
+
+            contentItems.append(ContentItem(
+                label="info",
+                data=info_content,
+                metadata=ContentMetadata(
+                    size=len(info_content.encode('utf-8')),
+                    pages=1,
+                    mimeType="text/plain",
+                    base64Encoded=False
+                )
+            ))
+
+            # Ship the untouched bytes too so a later stage can still convert them
+            contentItems.append(ContentItem(
+                label="binary",
+                data=base64.b64encode(fileData).decode('utf-8'),
+                metadata=ContentMetadata(
+                    size=len(fileData),
+                    mimeType=mimeType,
+                    base64Encoded=True
+                )
+            ))
+            return contentItems
+        except Exception as e:
+            logger.error(f"Error processing legacy Excel document: {str(e)}")
+            raise FileProcessingError(f"Failed to process legacy Excel document: {str(e)}") from e
+    
+    async def _processLegacyPpt(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
+        """Wrap a legacy PowerPoint .ppt file without reading its slides.
+
+        Returns two items: a plain-text "info" note describing the format
+        limitation, and a "binary" item holding fileData base64-encoded.
+        Raises FileProcessingError, chained to the underlying exception.
+        """
+        try:
+            # No .ppt reader is called here; python-pptx only opens .pptx files.
+            contentItems = []
+            info_content = f"""Legacy PowerPoint Document (.ppt) - {filename}
+
+Note: This is a legacy .ppt format file. For better content extraction, 
+consider converting to .pptx format.
+
+File size: {len(fileData)} bytes
+Format: Microsoft PowerPoint 97-2003 Presentation
+
+Content extraction from .ppt files requires specialized tools like:
+- python-pptx (only after conversion to .pptx)
+- Microsoft PowerPoint (for conversion)
+- LibreOffice (for conversion)
+
+The raw binary content is available but not human-readable."""
+
+            contentItems.append(ContentItem(
+                label="info",
+                data=info_content,
+                metadata=ContentMetadata(
+                    size=len(info_content.encode('utf-8')),
+                    pages=1,
+                    mimeType="text/plain",
+                    base64Encoded=False
+                )
+            ))
+
+            # Ship the untouched bytes too so a later stage can still convert them
+            contentItems.append(ContentItem(
+                label="binary",
+                data=base64.b64encode(fileData).decode('utf-8'),
+                metadata=ContentMetadata(
+                    size=len(fileData),
+                    mimeType=mimeType,
+                    base64Encoded=True
+                )
+            ))
+            return contentItems
+        except Exception as e:
+            logger.error(f"Error processing legacy PowerPoint document: {str(e)}")
+            raise FileProcessingError(f"Failed to process legacy PowerPoint document: {str(e)}") from e
+    
+    async def _processPptx(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
+        """Extract slide text from a .pptx file, one "slide_N" item per slide.
+
+        Slides without text yield no item. If no slide yields text, or if
+        python-pptx cannot be imported, the whole file is returned as a single
+        base64 "presentation" item. Raises FileProcessingError on failure.
+        """
+        try:
+            self._loadOfficeExtractor()
+            if not officeExtractorLoaded:
+                raise FileProcessingError("Office extraction libraries not available")
+
+            contentItems = []
+
+            try:
+                # Imported lazily so a missing python-pptx degrades to the binary fallback
+                from pptx import Presentation
+
+                with io.BytesIO(fileData) as pptxStream:
+                    prs = Presentation(pptxStream)
+
+                    for slideNum, slide in enumerate(prs.slides):
+                        # Read each shape exactly once: shape.text already joins the
+                        # paragraphs of its text frame, so a second pass over
+                        # text_frame.paragraphs would repeat every line.
+                        slideText = [
+                            shape.text
+                            for shape in slide.shapes
+                            if hasattr(shape, "text") and shape.text
+                        ]
+
+                        if slideText:
+                            content = "\n".join(slideText)
+                            contentItems.append(ContentItem(
+                                label=f"slide_{slideNum + 1}",
+                                data=content,
+                                metadata=ContentMetadata(
+                                    size=len(content.encode('utf-8')),
+                                    pages=1,
+                                    mimeType="text/plain",
+                                    base64Encoded=False
+                                )
+                            ))
+
+                if not contentItems:
+                    # Fallback: treat as binary if no text extracted
+                    contentItems.append(ContentItem(
+                        label="presentation",
+                        data=base64.b64encode(fileData).decode('utf-8'),
+                        metadata=ContentMetadata(
+                            size=len(fileData),
+                            pages=len(prs.slides) if hasattr(prs, 'slides') else 1,
+                            mimeType="application/vnd.openxmlformats-officedocument.presentationml.presentation",
+                            base64Encoded=True
+                        )
+                    ))
+
+            except ImportError:
+                # python-pptx not available, treat as binary
+                contentItems.append(ContentItem(
+                    label="presentation",
+                    data=base64.b64encode(fileData).decode('utf-8'),
+                    metadata=ContentMetadata(
+                        size=len(fileData),
+                        pages=1,
+                        mimeType="application/vnd.openxmlformats-officedocument.presentationml.presentation",
+                        base64Encoded=True
+                    )
+                ))
+
+            return contentItems
+
+        except Exception as e:
+            logger.error(f"Error processing PowerPoint document: {str(e)}")
+            raise FileProcessingError(f"Failed to process PowerPoint document: {str(e)}") from e
+    
     async def _processBinary(self, fileData: bytes, filename: str, mimeType: str) -> List[ContentItem]:
         """Process binary document"""
         try:
@@ -502,11 +1385,14 @@ class DocumentExtraction:
             try:
                 # Get content type from metadata
                 mimeType = item.metadata.mimeType if hasattr(item.metadata, 'mimeType') else "text/plain"
-                logger.debug(f"Processing content item with MIME type: {mimeType}, label: {item.label}")
+    
                 
                 # Chunk content based on type
                 if mimeType.startswith('text/'):
                     chunks = self._chunkText(item.data, mimeType)
+                elif mimeType == "image/svg+xml":
+                    # SVG files are XML, treat as text
+                    chunks = self._chunkXml(item.data)
                 elif mimeType.startswith('image/'):
                     # Images should not be chunked - process as single unit
                     chunks = [item.data]
@@ -518,6 +1404,9 @@ class DocumentExtraction:
                     chunks = self._chunkXlsx(item.data)
                 elif mimeType.startswith('application/vnd.openxmlformats-officedocument.presentationml.presentation'):
                     chunks = self._chunkPptx(item.data)
+                elif mimeType.startswith('text/x-') or mimeType.startswith('application/') and any(keyword in mimeType for keyword in ['script', 'code', 'source', 'yaml', 'toml', 'dockerfile', 'makefile', 'cmake', 'gradle', 'maven']):
+                    # Programming languages, configuration files, and build files
+                    chunks = self._chunkCode(item.data)
                 else:
                     # Binary data - no chunking
                     chunks = [item.data]
@@ -527,15 +1416,24 @@ class DocumentExtraction:
                 for chunk in chunks:
                     # Process with AI based on content type
                     try:
-                        logger.debug(f"AI processing chunk with MIME type: {mimeType}")
-                        if mimeType.startswith('image/'):
-                            # For images, use image AI service with base64 data
-                            # chunk is already base64 encoded string from _processImage
-                            # Use the original prompt directly for images (no content embedding)
-                            logger.debug(f"Calling image AI service for MIME type: {mimeType}")
-                            processedContent = await self._serviceCenter.callAiImageBasic(prompt, chunk, mimeType)
+                        if mimeType.startswith('image/') and mimeType != "image/svg+xml":
+                            # For images (excluding SVG), extract meaningful content as text
+                            # Use AI to analyze the image and extract relevant information
+
+                            
+                            # Create a specific prompt for image content extraction
+                            imagePrompt = f"""
+                            Analyze this image and extract the actual content and information from it.
+                            Focus on extracting text, data, charts, diagrams, or any meaningful content.
+                            If there's text in the image, extract it. If there are charts or diagrams, describe the data.
+                            Return the extracted content in a clear, structured text format.
+                            
+                            Original prompt: {prompt}
+                            """
+                            
+                            processedContent = await self._serviceCenter.callAiImageBasic(imagePrompt, chunk, mimeType)
                         else:
-                            # For text content, use text AI service
+                            # For text content (including SVG), use text AI service
                             # Neutralize content if neutralizer is enabled (only for text)
                             contentToProcess = chunk
                             if self._neutralizer and contentToProcess:
@@ -553,8 +1451,12 @@ class DocumentExtraction:
                             Return ONLY the extracted information in a clear, concise format.
                             """
                             
-                            logger.debug(f"Calling text AI service for MIME type: {mimeType}")
-                            processedContent = await self._serviceCenter.callAiTextBasic(aiPrompt, contentToProcess)
+                            # Special handling for JavaScript and other code files - preserve complete content
+                            if mimeType == "application/javascript" or mimeType == "application/typescript" or mimeType.startswith("text/x-") or any(keyword in mimeType for keyword in ['script', 'code', 'source']):
+                                # For code files, preserve the complete content without AI processing
+                                processedContent = contentToProcess
+                            else:
+                                processedContent = await self._serviceCenter.callAiTextBasic(aiPrompt, contentToProcess)
                         
                         chunkResults.append(processedContent)
                     except Exception as aiError:
@@ -568,18 +1470,32 @@ class DocumentExtraction:
                             chunkResults.append(chunk)
                 
                 # Combine chunk results
-                combinedResult = "\n".join(chunkResults)
+                if chunkResults:
+                    # For text content, combine all chunks
+                    if (mimeType.startswith('text/') or 
+                        mimeType in ["application/pdf", "application/vnd.openxmlformats-officedocument.wordprocessingml.document", 
+                                    "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet", 
+                                    "application/vnd.openxmlformats-officedocument.presentationml.presentation"] or
+                        mimeType.startswith('text/x-') or 
+                        mimeType.startswith('application/') and any(keyword in mimeType for keyword in ['script', 'code', 'source', 'yaml', 'toml', 'dockerfile', 'makefile', 'cmake', 'gradle', 'maven', 'javascript', 'typescript', 'sql', 'dart'])):
+                        combinedResult = "\n".join(chunkResults)
+                    else:
+                        # For binary content, use the first result
+                        combinedResult = chunkResults[0]
+                else:
+                    # No chunks processed, use original content
+                    combinedResult = item.data
                 
                 # Only add processed item if we have results
-                if combinedResult.strip():
+                if combinedResult and combinedResult.strip():
                     processedItems.append(ContentItem(
                         label=item.label,
                         data=combinedResult,
                         metadata=ContentMetadata(
                             size=len(combinedResult.encode('utf-8')),
-                            pages=1,
-                            mimeType="text/plain",
-                            base64Encoded=False
+                            pages=item.metadata.pages if hasattr(item.metadata, 'pages') else 1,
+                            mimeType=item.metadata.mimeType if hasattr(item.metadata, 'mimeType') else "text/plain",
+                            base64Encoded=item.metadata.base64Encoded if hasattr(item.metadata, 'base64Encoded') else False
                         )
                     ))
                 else:
@@ -606,6 +1522,20 @@ class DocumentExtraction:
             return self._chunkXml(content)
         elif mimeType == "text/html":
             return self._chunkHtml(content)
+        elif mimeType == "text/markdown" or mimeType == "text/x-rst" or mimeType == "text/x-wiki":
+            return self._chunkMarkdown(content)
+        elif mimeType == "application/javascript" or mimeType == "application/typescript":
+            # JavaScript and TypeScript files get special handling
+            return self._chunkJavaScript(content)
+        elif mimeType.startswith("text/x-") or mimeType.startswith("application/") and any(keyword in mimeType for keyword in ['script', 'code', 'source', 'yaml', 'toml', 'dockerfile', 'makefile', 'cmake', 'gradle', 'maven']):
+            # Programming languages, configuration files, and build files
+            return self._chunkCode(content)
+        elif mimeType == "application/vnd.openxmlformats-officedocument.wordprocessingml.document":
+            # Word documents with markdown formatting
+            return self._chunkWordDocument(content)
+        elif mimeType == "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet":
+            # Excel documents with structured data
+            return self._chunkExcelDocument(content)
         else:
             return self._chunkPlainText(content)
 
@@ -724,19 +1654,41 @@ class DocumentExtraction:
             return [content]
 
     def _chunkHtml(self, content: str) -> List[str]:
-        """Chunk HTML content"""
+        """Chunk HTML content with improved semantic chunking"""
         try:
             soup = BeautifulSoup(content, 'html.parser')
             chunks = []
             currentChunk = []
             currentSize = 0
             
+            # Use smaller chunk size for HTML to avoid token limits
+            html_chunk_size = min(self.chunkSizes["html"], 15000)  # Max 15KB per chunk
+            
             def processElement(element):
                 nonlocal currentChunk, currentSize
                 elementStr = str(element)
                 elementSize = len(elementStr.encode('utf-8'))
                 
-                if currentSize + elementSize > self.chunkSizes["html"]:
+                # If element is too large, split it
+                if elementSize > html_chunk_size:
+                    # Split large elements by their content
+                    if hasattr(element, 'get_text'):
+                        text_content = element.get_text(separator='\n', strip=True)
+                        if text_content:
+                            # Split text content into smaller chunks
+                            text_chunks = self._chunkTextBySize(text_content, html_chunk_size)
+                            for text_chunk in text_chunks:
+                                if currentChunk:
+                                    chunks.append(''.join(currentChunk))
+                                currentChunk = [f"<{element.name}>{text_chunk}</{element.name}>"]
+                                currentSize = len(currentChunk[0].encode('utf-8'))
+                    else:
+                        # For elements without text, just add them
+                        if currentChunk:
+                            chunks.append(''.join(currentChunk))
+                        currentChunk = [elementStr]
+                        currentSize = elementSize
+                elif currentSize + elementSize > html_chunk_size:
                     if currentChunk:
                         chunks.append(''.join(currentChunk))
                     currentChunk = [elementStr]
@@ -745,45 +1697,192 @@ class DocumentExtraction:
                     currentChunk.append(elementStr)
                     currentSize += elementSize
             
+            # Process elements in order of importance
+            for element in soup.find_all(['h1', 'h2', 'h3', 'h4', 'h5', 'h6']):
+                processElement(element)
+            
             for element in soup.find_all(['p', 'div', 'section', 'article']):
                 processElement(element)
             
+            for element in soup.find_all(['ul', 'ol', 'table']):
+                processElement(element)
+            
+            # Process remaining elements
+            for element in soup.find_all():
+                if element.name not in ['h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'p', 'div', 'section', 'article', 'ul', 'ol', 'table']:
+                    processElement(element)
+            
             if currentChunk:
                 chunks.append(''.join(currentChunk))
             
             return chunks
         except Exception:
             return [content]
+    
+    def _chunkTextBySize(self, text: str, max_size: int) -> List[str]:
+        """Split text on newlines into stripped chunks of at most max_size UTF-8 bytes (longer single lines stay whole)."""
+        chunks = []
+        pending = []  # lines of the chunk being built
+        pending_size = 0  # UTF-8 bytes of '\n'.join(pending), tracked incrementally
+        for line in text.split('\n'):
+            line_size = len(line.encode('utf-8'))
+            # The joining newline costs one byte once the chunk already holds a line.
+            if pending and pending_size + 1 + line_size > max_size:
+                chunks.append('\n'.join(pending).strip())
+                pending, pending_size = [line], line_size
+            else:
+                pending_size += line_size + (1 if pending else 0)
+                pending.append(line)
+        # Flush the tail; chunks that are empty after stripping carry no content and are dropped.
+        if pending:
+            chunks.append('\n'.join(pending).strip())
+        return [chunk for chunk in chunks if chunk]
+
+    def _chunkMarkdown(self, content: str) -> List[str]:
+        """Split Markdown-style text on line boundaries into size-limited chunks.
+
+        Lines are never split, so one line longer than the limit becomes its own oversized chunk.
+        Returns the chunks in document order; rejoining them with '\\n' reproduces content.
+        """
+        # Markdown has no dedicated limit; it shares the "text" chunk size.
+        limit = self.chunkSizes["text"]
+        chunks = []
+        currentChunk = []
+        currentSize = 0
+        # Line-based only: headers, lists and code fences are not parsed and may be cut apart.
+        for line in content.split('\n'):
+            # +1 for the newline '\n'.join() re-adds, so the limit bounds the real size.
+            lineSize = len(line.encode('utf-8')) + 1
+            if currentChunk and currentSize + lineSize > limit:
+                chunks.append('\n'.join(currentChunk))
+                currentChunk = []
+                currentSize = 0
+            currentChunk.append(line)
+            currentSize += lineSize
+        if currentChunk:
+            chunks.append('\n'.join(currentChunk))
+        return chunks
+
+    def _chunkCode(self, content: str) -> List[str]:
+        """Split source code or config text on line boundaries into size-limited chunks.
+
+        The limit is chunkSizes["code"], capped at 80000 bytes. Lines are never split, so a
+        single line longer than the limit becomes its own oversized chunk.
+        Returns the chunks in file order; rejoining them with '\\n' reproduces content.
+        """
+        # Cap the configured size so one chunk stays at or below 80KB.
+        code_chunk_size = min(self.chunkSizes["code"], 80000)
+        chunks = []
+        currentChunk = []
+        currentSize = 0
+
+        # Cut only between lines so no statement is broken mid-line.
+        for line in content.split('\n'):
+            # +1 for the newline '\n'.join() re-adds, so the limit bounds the real size.
+            lineSize = len(line.encode('utf-8')) + 1
+            if currentChunk and currentSize + lineSize > code_chunk_size:
+                chunks.append('\n'.join(currentChunk))
+                currentChunk = []
+                currentSize = 0
+            currentChunk.append(line)
+            currentSize += lineSize
+
+        if currentChunk:
+            chunks.append('\n'.join(currentChunk))
+        return chunks
+
+    def _chunkJavaScript(self, content: str) -> List[str]:
+        """Split JavaScript source text on line boundaries into size-limited chunks.
+
+        The limit is chunkSizes["javascript"], capped at 80000 bytes. Lines are never split,
+        so a single line longer than the limit becomes its own oversized chunk.
+        Returns the chunks in file order; rejoining them with '\\n' reproduces content.
+        """
+        # Cap the configured size so one chunk stays at or below 80KB.
+        js_chunk_size = min(self.chunkSizes["javascript"], 80000)
+        chunks = []
+        currentChunk = []
+        currentSize = 0
+
+        # Cut only between lines so no statement is broken mid-line.
+        for line in content.split('\n'):
+            # +1 for the newline '\n'.join() re-adds, so the limit bounds the real size.
+            lineSize = len(line.encode('utf-8')) + 1
+            if currentChunk and currentSize + lineSize > js_chunk_size:
+                chunks.append('\n'.join(currentChunk))
+                currentChunk = []
+                currentSize = 0
+            currentChunk.append(line)
+            currentSize += lineSize
+
+        if currentChunk:
+            chunks.append('\n'.join(currentChunk))
+        return chunks
 
     def _chunkBinary(self, content: str) -> List[str]:
         """Chunk binary content"""
         try:
-            binaryData = base64.b64decode(content)
-            chunks = []
-            chunkSize = self.chunkSizes["binary"]
-            
-            for i in range(0, len(binaryData), chunkSize):
-                chunk = binaryData[i:i + chunkSize]
-                chunks.append(base64.b64encode(chunk).decode('utf-8'))
-            
-            return chunks
+            chunkSize = self.chunkSizes["binary"]
+            try:
+                # validate=True rejects any character outside the base64 alphabet. Without it
+                # b64decode() silently drops such characters, so ordinary text whose remaining
+                # letters happen to form valid base64 would be decoded into garbage bytes.
+                binaryData = base64.b64decode(content, validate=True)
+            except ValueError:
+                # binascii.Error is a ValueError subclass: content is not strict base64.
+                binaryData = None
+
+            if binaryData is not None:
+                # Slice the raw bytes and re-encode each slice so every chunk is valid base64.
+                return [
+                    base64.b64encode(binaryData[i:i + chunkSize]).decode('utf-8')
+                    for i in range(0, len(binaryData), chunkSize)
+                ]
+
+            # Plain-text fallback: pack whole lines into chunks of at most chunkSize bytes.
+            chunks = []
+            currentChunk = []
+            currentSize = 0
+            for line in content.split('\n'):
+                # +1 for the newline '\n'.join() re-adds, so the limit bounds the real size.
+                lineSize = len(line.encode('utf-8')) + 1
+                if currentChunk and currentSize + lineSize > chunkSize:
+                    chunks.append('\n'.join(currentChunk))
+                    currentChunk = []
+                    currentSize = 0
+                currentChunk.append(line)
+                currentSize += lineSize
+
+            if currentChunk:
+                chunks.append('\n'.join(currentChunk))
+
+            return chunks
         except Exception:
             return [content]
 
     async def _chunkPdf(self, content: str) -> List[str]:
         """Chunk PDF content"""
         try:
-            pdfData = base64.b64decode(content)
+            # Content is already text from _processPdf, not base64
+            # Split by lines to create chunks
+            lines = content.split('\n')
             chunks = []
-            chunkSize = self.chunkSizes["pdf"]
+            currentChunk = []
+            currentSize = 0
             
-            with io.BytesIO(pdfData) as pdfStream:
-                pdfReader = PyPDF2.PdfReader(pdfStream)
-                for pageNum in range(len(pdfReader.pages)):
-                    page = pdfReader.pages[pageNum]
-                    pageText = page.extract_text()
-                    if pageText:
-                        chunks.append(pageText)
+            for line in lines:
+                lineSize = len(line.encode('utf-8'))
+                if currentSize + lineSize > self.chunkSizes["pdf"]:
+                    if currentChunk:
+                        chunks.append('\n'.join(currentChunk))
+                    currentChunk = [line]
+                    currentSize = lineSize
+                else:
+                    currentChunk.append(line)
+                    currentSize += lineSize
+            
+            if currentChunk:
+                chunks.append('\n'.join(currentChunk))
             
             return chunks
         except Exception:
@@ -792,20 +1891,26 @@ class DocumentExtraction:
     async def _chunkDocx(self, content: str) -> List[str]:
         """Chunk Word document content"""
         try:
-            docxData = base64.b64decode(content)
+            # Content is already text from _processDocx, not base64
+            # Split by lines to create chunks
+            lines = content.split('\n')
             chunks = []
-            chunkSize = self.chunkSizes["docx"]
+            currentChunk = []
+            currentSize = 0
             
-            with io.BytesIO(docxData) as docxStream:
-                doc = docx.Document(docxStream)
-                for para in doc.paragraphs:
-                    chunks.append(para.text)
-                for table in doc.tables:
-                    for row in table.rows:
-                        rowText = []
-                        for cell in row.cells:
-                            rowText.append(cell.text)
-                        chunks.append(" | ".join(rowText))
+            for line in lines:
+                lineSize = len(line.encode('utf-8'))
+                if currentSize + lineSize > self.chunkSizes["docx"]:
+                    if currentChunk:
+                        chunks.append('\n'.join(currentChunk))
+                    currentChunk = [line]
+                    currentSize = lineSize
+                else:
+                    currentChunk.append(line)
+                    currentSize += lineSize
+            
+            if currentChunk:
+                chunks.append('\n'.join(currentChunk))
             
             return chunks
         except Exception:
@@ -814,23 +1919,26 @@ class DocumentExtraction:
     async def _chunkXlsx(self, content: str) -> List[str]:
         """Chunk Excel document content"""
         try:
-            xlsxData = base64.b64decode(content)
+            # Content is already text (CSV format) from _processXlsx, not base64
+            # Split by lines to create chunks
+            lines = content.split('\n')
             chunks = []
-            chunkSize = self.chunkSizes["xlsx"]
+            currentChunk = []
+            currentSize = 0
             
-            with io.BytesIO(xlsxData) as xlsxStream:
-                workbook = openpyxl.load_workbook(xlsxStream, data_only=True)
-                for sheetName in workbook.sheetnames:
-                    sheet = workbook[sheetName]
-                    for row in sheet.iter_rows():
-                        rowText = []
-                        for cell in row:
-                            value = cell.value
-                            if value is None:
-                                rowText.append("")
-                            else:
-                                rowText.append(str(value).replace('"', '""'))
-                        chunks.append(','.join(f'"{cell}"' for cell in rowText))
+            for line in lines:
+                lineSize = len(line.encode('utf-8'))
+                if currentSize + lineSize > self.chunkSizes["xlsx"]:
+                    if currentChunk:
+                        chunks.append('\n'.join(currentChunk))
+                    currentChunk = [line]
+                    currentSize = lineSize
+                else:
+                    currentChunk.append(line)
+                    currentSize += lineSize
+            
+            if currentChunk:
+                chunks.append('\n'.join(currentChunk))
             
             return chunks
         except Exception:
@@ -839,18 +1947,89 @@ class DocumentExtraction:
     async def _chunkPptx(self, content: str) -> List[str]:
         """Chunk PowerPoint document content"""
         try:
-            pptxData = base64.b64decode(content)
+            # content is treated as plain text (not base64); whole lines are packed into chunks.
+            # A line is never split, so one longer than the limit becomes its own chunk.
+            limit = self.chunkSizes["pptx"]
             chunks = []
-            chunkSize = self.chunkSizes["pptx"]
+            currentChunk = []
+            currentSize = 0
             
-            with io.BytesIO(pptxData) as pptxStream:
-                # openpyxl is not suitable for PowerPoint, so we'll just read text
-                # This is a placeholder and would require a different library for full pptx processing
-                # For now, we'll just return the base64 encoded content as a single chunk
-                chunks.append(content)
+            for line in content.split('\n'):
+                # +1 for the newline '\n'.join() re-adds, so the limit bounds the real size.
+                lineSize = len(line.encode('utf-8')) + 1
+                if currentChunk and currentSize + lineSize > limit:
+                    chunks.append('\n'.join(currentChunk))
+                    currentChunk = []
+                    currentSize = 0
+                currentChunk.append(line)
+                currentSize += lineSize
+
+            # Flush the final, partially filled chunk.
+            if currentChunk:
+                chunks.append('\n'.join(currentChunk))
             
             return chunks
         except Exception:
             return [content]
 
+    def _chunkWordDocument(self, content: str) -> List[str]:
+        """Split Word-document text on line boundaries into size-limited chunks.
+
+        The limit is chunkSizes["docx"], capped at 60000 bytes. Lines are never split, so a
+        single line longer than the limit becomes its own oversized chunk.
+        Returns the chunks in document order; rejoining them with '\\n' reproduces content.
+        """
+        # Cap the configured size so one chunk stays at or below 60KB.
+        word_chunk_size = min(self.chunkSizes["docx"], 60000)
+        chunks = []
+        currentChunk = []
+        currentSize = 0
+
+        # Cut only between lines so the document's line structure survives chunking.
+        for line in content.split('\n'):
+            # +1 for the newline '\n'.join() re-adds, so the limit bounds the real size.
+            lineSize = len(line.encode('utf-8')) + 1
+            # Start a new chunk when this line would push the current one past the limit.
+            if currentChunk and currentSize + lineSize > word_chunk_size:
+                chunks.append('\n'.join(currentChunk))
+                currentChunk = []
+                currentSize = 0
+            currentChunk.append(line)
+            currentSize += lineSize
+
+        # Flush the final, partially filled chunk.
+        if currentChunk:
+            chunks.append('\n'.join(currentChunk))
+        return chunks
+
+    def _chunkExcelDocument(self, content: str) -> List[str]:
+        """Split Excel-document text on line boundaries into size-limited chunks.
+
+        The limit is chunkSizes["xlsx"], capped at 80000 bytes. Lines are never split, so a
+        single line longer than the limit becomes its own oversized chunk.
+        Returns the chunks in document order; rejoining them with '\\n' reproduces content.
+        """
+        # Cap the configured size so one chunk stays at or below 80KB.
+        excel_chunk_size = min(self.chunkSizes["xlsx"], 80000)
+        chunks = []
+        currentChunk = []
+        currentSize = 0
+
+        # Cut only between lines so each line (row) stays intact.
+        for line in content.split('\n'):
+            # +1 for the newline '\n'.join() re-adds, so the limit bounds the real size.
+            lineSize = len(line.encode('utf-8')) + 1
+            # Start a new chunk when this line would push the current one past the limit.
+            if currentChunk and currentSize + lineSize > excel_chunk_size:
+                chunks.append('\n'.join(currentChunk))
+                currentChunk = []
+                currentSize = 0
+            currentChunk.append(line)
+            currentSize += lineSize
+
+        # Flush the final, partially filled chunk.
+        if currentChunk:
+            chunks.append('\n'.join(currentChunk))
+        return chunks
+
         
\ No newline at end of file
diff --git a/modules/chat/documents/documentGeneration.py b/modules/chat/documents/documentGeneration.py
index a72de2e5..1a83ebf5 100644
--- a/modules/chat/documents/documentGeneration.py
+++ b/modules/chat/documents/documentGeneration.py
@@ -22,13 +22,11 @@ class DocumentGenerator:
         """
         try:
             documents = action_result.data.get("documents", [])
-            logger.debug(f"Processing {len(documents)} documents from action result")
             processed_documents = []
             for doc in documents:
                 processed_doc = self.processSingleDocument(doc, action)
                 if processed_doc:
                     processed_documents.append(processed_doc)
-            logger.debug(f"Successfully processed {len(processed_documents)} documents")
             return processed_documents
         except Exception as e:
             logger.error(f"Error processing action result documents: {str(e)}")
@@ -54,19 +52,29 @@ class DocumentGenerator:
                 # Dictionary format document - handle both 'documentName' and 'filename' keys
                 filename = doc.get('documentName', doc.get('filename', \
                     f"{action.execMethod}_{action.execAction}_{datetime.now(UTC).strftime('%Y%m%d_%H%M%S')}"))
-                fileSize = doc.get('fileSize', len(str(doc.get('documentData', ''))))
                 mimeType = doc.get('mimeType', 'application/octet-stream')
-                if mimeType == "application/octet-stream":
-                    document_data = doc.get('documentData', '')
-                    mimeType = detectMimeTypeFromContent(document_data, filename, self.service)
                 
                 # Handle documentData structure - it might be a dict with 'content' key or direct content
                 document_data = doc.get('documentData', '')
                 if isinstance(document_data, dict) and 'content' in document_data:
+                    # This is the structure returned by extract action: documentData.content
                     content = document_data['content']
+                    # Also check for other potential content fields
+                    if not content and 'data' in document_data:
+                        content = document_data['data']
                 else:
+                    # Direct content (fallback)
                     content = document_data
                 
+                # Calculate file size from actual content
+                fileSize = len(str(content)) if content else 0
+                
+                # Detect mime type if not specified
+                if mimeType == "application/octet-stream":
+                    mimeType = detectMimeTypeFromContent(content, filename, self.service)
+                
+                logger.info(f"Processed document: {filename}, content length: {len(str(content))}, mimeType: {mimeType}")
+                
                 return {
                     'filename': filename,
                     'fileSize': fileSize,
@@ -96,20 +104,32 @@ class DocumentGenerator:
         Returns a list of created document objects.
         """
         try:
+            logger.info(f"Creating documents from action result for {action.execMethod}.{action.execAction}")
+            logger.info(f"Action result data keys: {list(action_result.data.keys())}")
+            
             processed_docs = self.processActionResultDocuments(action_result, action, workflow)
+            logger.info(f"Processed {len(processed_docs)} documents")
+            
             created_documents = []
-            for doc_data in processed_docs:
+            for i, doc_data in enumerate(processed_docs):
                 try:
                     document_name = doc_data['filename']
                     document_data = doc_data['content']
                     mime_type = doc_data['mimeType']
+                    
+                    logger.info(f"Creating document {i+1}: {document_name} (mime: {mime_type}, content length: {len(str(document_data))})")
+                    
                     # Convert document data to string content
                     content = convertDocumentDataToString(document_data, getFileExtension(document_name))
+                    
                     # Skip empty or minimal content
                     minimal_content_patterns = ['{}', '[]', 'null', '""', "''"]
                     if not content or content.strip() == "" or content.strip() in minimal_content_patterns:
                         logger.warning(f"Empty or minimal content for document {document_name}, skipping")
                         continue
+                    
+                    logger.info(f"Document {document_name} has content: {len(content)} characters")
+                    
                     # Create file in system
                     file_id = self.service.createFile(
                         fileName=document_name,
@@ -120,22 +140,27 @@ class DocumentGenerator:
                     if not file_id:
                         logger.error(f"Failed to create file for document {document_name}")
                         continue
-                    # Create document object
+                    
+                    logger.info(f"Created file with ID: {file_id}")
+                    
+                    # Create document object using existing file ID
                     document = self.service.createDocument(
                         fileName=document_name,
                         mimeType=mime_type,
                         content=content,
-                        base64encoded=False
+                        base64encoded=False,
+                        existing_file_id=file_id
                     )
                     if document:
                         created_documents.append(document)
-                        logger.debug(f"Created document: {document_name} ({len(content)} bytes, {mime_type})")
+                        logger.info(f"Successfully created ChatDocument: {document_name} (ID: {getattr(document, 'id', 'N/A')}, fileId: {getattr(document, 'fileId', 'N/A')})")
                     else:
                         logger.error(f"Failed to create ChatDocument object for {document_name}")
                 except Exception as e:
                     logger.error(f"Error creating document {doc_data.get('filename', 'unknown')}: {str(e)}")
                     continue
-            logger.info(f"Created {len(created_documents)} documents from action result")
+            
+            logger.info(f"Successfully created {len(created_documents)} documents")
             return created_documents
         except Exception as e:
             logger.error(f"Error creating documents from action result: {str(e)}")
diff --git a/modules/chat/handling/handlingTasks.py b/modules/chat/handling/handlingTasks.py
index 5b458160..c04658f7 100644
--- a/modules/chat/handling/handlingTasks.py
+++ b/modules/chat/handling/handlingTasks.py
@@ -16,22 +16,53 @@ from modules.chat.documents.documentGeneration import DocumentGenerator
 
 logger = logging.getLogger(__name__)
 
+class WorkflowStoppedException(Exception):
+    """Signals that the user stopped the workflow;
+    raised to abort the remaining execution."""
+
 class HandlingTasks:
     def __init__(self, chatInterface, service, workflow=None):
         self.chatInterface = chatInterface
         self.service = service
         self.workflow = workflow
         self.documentGenerator = DocumentGenerator(service)
+    
+    def _checkWorkflowStopped(self):
+        """
+        Abort execution if the user has stopped the workflow.
+
+        The status is read fresh via chatInterface.getWorkflow(); if that lookup fails,
+        the in-memory self.service.workflow is consulted instead.
+        Raises WorkflowStoppedException when the status is "stopped".
+        """
+        try:
+            persisted = self.chatInterface.getWorkflow(self.service.workflow.id)
+            isStopped = bool(persisted and persisted.status == "stopped")
+            notice = "Workflow stopped by user, aborting execution"
+        except Exception as e:
+            # Lookup failed: warn and trust the possibly stale in-memory status.
+            logger.warning(f"Could not check current workflow status from database: {str(e)}")
+            isStopped = self.service.workflow.status == "stopped"
+            notice = "Workflow stopped by user (from in-memory object), aborting execution"
+        if isStopped:
+            logger.info(notice)
+            raise WorkflowStoppedException("Workflow was stopped by user")
 
     async def generateTaskPlan(self, userInput: str, workflow) -> TaskPlan:
         """Generate a high-level task plan for the workflow."""
         try:
+            # Check workflow status before generating task plan
+            self._checkWorkflowStopped()
+            
             logger.info(f"Generating task plan for workflow {workflow.id}")
             available_docs = self.service.getAvailableDocuments(workflow)
-            logger.debug(f"Available documents: {available_docs}")
+
+            
+            # Check workflow status before calling AI service
+            self._checkWorkflowStopped()
             
             prompt = await self.service.callAiTextAdvanced(
-                createTaskPlanningPrompt(self, {
+                createTaskPlanningPrompt({
                     'user_request': userInput,
                     'available_documents': available_docs,
                     'workflow_id': workflow.id
@@ -53,16 +84,38 @@ class HandlingTasks:
             
             if not self._validateTaskPlan(task_plan_dict):
                 logger.error("Generated task plan failed validation")
+                logger.error(f"AI Response: {prompt}")
+                logger.error(f"Parsed Task Plan: {json.dumps(task_plan_dict, indent=2)}")
                 raise Exception("AI-generated task plan failed validation - AI is required for task planning")
             
-            tasks = [TaskStep(**task_dict) for task_dict in task_plan_dict.get('tasks', [])]
+            tasks = []
+            for task_dict in task_plan_dict.get('tasks', []):
+                # Map old 'description' field to new 'objective' field
+                if 'description' in task_dict and 'objective' not in task_dict:
+                    task_dict['objective'] = task_dict.pop('description')
+                tasks.append(TaskStep(**task_dict))
             task_plan = TaskPlan(
                 overview=task_plan_dict.get('overview', ''),
                 tasks=tasks
             )
             
             logger.info(f"Task plan generated successfully with {len(tasks)} tasks")
-            logger.debug(f"Task plan: {json.dumps(task_plan_dict, indent=2)}")
+            
+            # Log the generated tasks
+            for i, task in enumerate(tasks):
+                logger.info(f"  Task {i+1}: {task.objective}")
+                if hasattr(task, 'success_criteria') and task.success_criteria:
+                    logger.info(f"    Success criteria: {task.success_criteria}")
+            
+            # Log the complete task plan
+            logger.info("=== GENERATED TASK PLAN ===")
+            logger.info(f"Overview: {task_plan.overview}")
+            logger.info(f"Total tasks: {len(tasks)}")
+            
+            # Log the RAW AI-generated task plan JSON for debugging
+            logger.info("=== RAW AI TASK PLAN JSON ===")
+            logger.info(f"AI Response with task plan: {prompt}")
+            logger.info("=== END RAW AI TASK PLAN JSON ===")
             
             return task_plan
         except Exception as e:
@@ -72,12 +125,14 @@ class HandlingTasks:
     async def generateTaskActions(self, task_step, workflow, previous_results=None, enhanced_context=None) -> List[TaskAction]:
         """Generate actions for a given task step."""
         try:
-            logger.info(f"Generating actions for task: {task_step.description}")
+            # Check workflow status before generating actions
+            self._checkWorkflowStopped()
+            
+            logger.info(f"Generating actions for task: {task_step.objective}")
             
             available_docs = self.service.getAvailableDocuments(workflow)
             available_connections = self.service.getConnectionReferenceList()
-            logger.debug(f"Available documents: {available_docs}")
-            logger.debug(f"Available connections: {available_connections}")
+
             
             context = enhanced_context or TaskContext(
                 task_step=task_step,
@@ -94,8 +149,11 @@ class HandlingTasks:
                 failed_actions=[],
                 successful_actions=[]
             )
+            # Check workflow status before calling AI service
+            self._checkWorkflowStopped()
+            
             prompt = await self.service.callAiTextAdvanced(
-                await createActionDefinitionPrompt(self, context)
+                await createActionDefinitionPrompt(context, self.service)
             )
             # Inline parseActionResponse logic here
             json_start = prompt.find('{')
@@ -126,40 +184,169 @@ class HandlingTasks:
             }) for a in actions]
             
             valid_actions = [ta for ta in task_actions if ta]
-            logger.info(f"Generated {len(valid_actions)} actions for task: {task_step.description}")
-            logger.debug(f"Task actions plan: {json.dumps(action_data, indent=2)}")
+            logger.info(f"Generated {len(valid_actions)} actions for task: {task_step.objective}")
+            
+            # Log the generated actions
+            for i, action in enumerate(valid_actions):
+                logger.info(f"  Action {i+1}: {action.execMethod}.{action.execAction}")
+                if action.expectedDocumentFormats:
+                    logger.info(f"    Expected formats: {action.expectedDocumentFormats}")
+                if action.execParameters.get('documentList'):
+                    logger.info(f"    Input documents: {action.execParameters['documentList']}")
+            
+            # Log the complete action plan
+            logger.info("=== GENERATED ACTION PLAN ===")
+            logger.info(f"Task: {task_step.objective}")
+            logger.info(f"Total actions: {len(valid_actions)}")
+            
+            # Log the RAW AI-generated action plan JSON for debugging
+            logger.info("=== RAW AI ACTION PLAN JSON ===")
+            logger.info(f"AI Response with parsed actions: {prompt}")
+            logger.info("=== END RAW AI ACTION PLAN JSON ===")
             
             return valid_actions
         except Exception as e:
             logger.error(f"Error in generateTaskActions: {str(e)}")
             return []
 
-    async def executeTask(self, task_step, workflow, context) -> TaskResult:
+    async def executeTask(self, task_step, workflow, context, task_index=None, total_tasks=None) -> TaskResult:
         """Execute all actions for a task step, with state management and retries."""
-        logger.info(f"Executing task: {task_step.description}")
+        logger.info(f"=== STARTING TASK {task_index or '?'}: {task_step.objective} ===")
+        
+        # Create database log entry for task start in format expected by frontend
+        if task_index is not None:
+            if total_tasks is not None:
+                self.chatInterface.createWorkflowLog({
+                    "workflowId": workflow.id,
+                    "message": f"Executing task {task_index}/{total_tasks}",
+                    "type": "info"
+                })
+            else:
+                self.chatInterface.createWorkflowLog({
+                    "workflowId": workflow.id,
+                    "message": f"Executing task {task_index}/?",
+                    "type": "info"
+                })
+            
+            # Create a task start message for the user
+            task_progress = f"{task_index}/{total_tasks}" if total_tasks is not None else str(task_index)
+            task_start_message = {
+                "workflowId": workflow.id,
+                "role": "assistant",
+                "message": f"🚀 Starting Task {task_progress}\n\nObjective: {task_step.objective}",
+                "status": "step",
+                "sequenceNr": len(workflow.messages) + 1,
+                "publishedAt": datetime.now(UTC).isoformat(),
+                "documentsLabel": f"task_{task_index}_start",
+                "documents": []
+            }
+            
+            message = self.chatInterface.createWorkflowMessage(task_start_message)
+            if message:
+                workflow.messages.append(message)
+                logger.info(f"Task start message created for task {task_index}")
+        
         state = TaskExecutionState(task_step)
         retry_context = context
         max_retries = state.max_retries
         for attempt in range(max_retries):
             logger.info(f"Task execution attempt {attempt+1}/{max_retries}")
+            
+            # Check workflow status before starting task execution
+            self._checkWorkflowStopped()
+            
             actions = await self.generateTaskActions(task_step, workflow, previous_results=retry_context.previous_results, enhanced_context=retry_context)
             if not actions:
                 logger.error("No actions defined for task step, aborting task execution")
                 break
+            
+            # Log total actions count for this task
+            total_actions = len(actions)
+            logger.info(f"Task {task_index or '?'} has {total_actions} actions")
+            
             action_results = []
-            for action in actions:
-                result = await self.executeSingleAction(action, workflow)
+            for action_idx, action in enumerate(actions):
+                # Check workflow status before each action execution
+                self._checkWorkflowStopped()
+                
+                # Log action start in format expected by frontend
+                action_number = action_idx + 1
+                logger.info(f"Task {task_index} - Starting action {action_number}/{total_actions}")
+                
+                # Create database log entry for action start
+                self.chatInterface.createWorkflowLog({
+                    "workflowId": workflow.id,
+                    "message": f"Task {task_index} - Starting action {action_number}/{total_actions}",
+                    "type": "info"
+                })
+                
+                # Create an action start message for the user
+                action_start_message = {
+                    "workflowId": workflow.id,
+                    "role": "assistant",
+                    "message": f"⚡ Task {task_index} - Action {action_number}/{total_actions}\n\nMethod: {action.execMethod}.{action.execAction}",
+                    "status": "step",
+                    "sequenceNr": len(workflow.messages) + 1,
+                    "publishedAt": datetime.now(UTC).isoformat(),
+                    "documentsLabel": f"action_{action_number}_start",
+                    "documents": []
+                }
+                
+                message = self.chatInterface.createWorkflowMessage(action_start_message)
+                if message:
+                    workflow.messages.append(message)
+                    logger.info(f"Action start message created for action {action_number}")
+                
+                # Pass action index to executeSingleAction with task context
+                result = await self.executeSingleAction(action, workflow, task_step, task_index, action_number, total_actions)
                 action_results.append(result)
                 if result.success:
                     state.addSuccessfulAction(result)
                 else:
                     state.addFailedAction(result)
+            
+            # Check workflow status before review
+            self._checkWorkflowStopped()
+            
             review_result = await self.reviewTaskCompletion(task_step, actions, action_results, workflow)
             success = review_result.status == 'success'
             feedback = review_result.reason
             error = None if success else review_result.reason
             if success:
-                logger.info(f"Task step '{task_step.description}' completed successfully")
+                logger.info(f"=== TASK {task_index or '?'} COMPLETED SUCCESSFULLY: {task_step.objective} ===")
+                
+                # Create database log entry for task completion
+                if total_tasks is not None:
+                    self.chatInterface.createWorkflowLog({
+                        "workflowId": workflow.id,
+                        "message": f"🎯 Task {task_index}/{total_tasks} completed",
+                        "type": "success"
+                    })
+                else:
+                    self.chatInterface.createWorkflowLog({
+                        "workflowId": workflow.id,
+                        "message": f"🎯 Task {task_index}/? completed",
+                        "type": "success"
+                    })
+                
+                # Create a task completion message for the user
+                task_progress = f"{task_index}/{total_tasks}" if total_tasks is not None else str(task_index)
+                task_completion_message = {
+                    "workflowId": workflow.id,
+                    "role": "assistant",
+                    "message": f"🎯 Task {task_progress} Completed Successfully!\n\nObjective: {task_step.objective}\n\nFeedback: {feedback or 'Task completed successfully'}",
+                    "status": "step",
+                    "sequenceNr": len(workflow.messages) + 1,
+                    "publishedAt": datetime.now(UTC).isoformat(),
+                    "documentsLabel": f"task_{task_index}_completion",
+                    "documents": []
+                }
+                
+                message = self.chatInterface.createWorkflowMessage(task_completion_message)
+                if message:
+                    workflow.messages.append(message)
+                    logger.info(f"Task completion message created for task {task_index}")
+                
                 return TaskResult(
                     taskId=task_step.id,
                     status=TaskStatus.COMPLETED,
@@ -168,7 +355,7 @@ class HandlingTasks:
                     error=None
                 )
             elif review_result.status == 'retry' and state.canRetry():
-                logger.warning(f"Task step '{task_step.description}' requires retry: {review_result.improvements}")
+                logger.warning(f"Task step '{task_step.objective}' requires retry: {review_result.improvements}")
                 state.incrementRetryCount()
                 retry_context.retry_count = state.retry_count
                 retry_context.improvements = review_result.improvements
@@ -180,7 +367,7 @@ class HandlingTasks:
                 retry_context.successful_actions = state.successful_actions
                 continue
             else:
-                logger.error(f"Task step '{task_step.description}' failed after {attempt+1} attempts")
+                logger.error(f"=== TASK {task_index or '?'} FAILED: {task_step.objective} after {attempt+1} attempts ===")
                 return TaskResult(
                     taskId=task_step.id,
                     status=TaskStatus.FAILED,
@@ -188,7 +375,7 @@ class HandlingTasks:
                     feedback=feedback,
                     error=error
                 )
-        logger.error(f"Task step '{task_step.description}' failed after all retries")
+        logger.error(f"=== TASK {task_index or '?'} FAILED AFTER ALL RETRIES: {task_step.objective} ===")
         return TaskResult(
             taskId=task_step.id,
             status=TaskStatus.FAILED,
@@ -199,6 +386,9 @@ class HandlingTasks:
 
     async def reviewTaskCompletion(self, task_step, task_actions, action_results, workflow):
         try:
+            # Check workflow status before reviewing task completion
+            self._checkWorkflowStopped()
+            
             review_context = ReviewContext(
                 task_step=task_step,
                 action_results=action_results,
@@ -210,8 +400,11 @@ class HandlingTasks:
                     'errors': [result.error for result in action_results if not result.success]
                 }
             )
+            # Check workflow status before calling AI service
+            self._checkWorkflowStopped()
+            
             # Use promptFactory for review prompt
-            prompt = await createResultReviewPrompt(self, review_context)
+            prompt = await createResultReviewPrompt(review_context)
             response = await self.service.callAiTextAdvanced(prompt)
             # Inline parseReviewResponse logic here
             json_start = response.find('{')
@@ -239,10 +432,6 @@ class HandlingTasks:
                 improvements = []
             
             # Ensure all list fields are properly typed
-            missing_outputs = review.get('missing_outputs', [])
-            if not isinstance(missing_outputs, list):
-                missing_outputs = []
-                
             met_criteria = review.get('met_criteria', [])
             if not isinstance(met_criteria, list):
                 met_criteria = []
@@ -256,14 +445,14 @@ class HandlingTasks:
                 reason=review.get('reason', 'No reason provided'),
                 improvements=improvements,
                 quality_score=review.get('quality_score', 5),
-                missing_outputs=missing_outputs,
+                missing_outputs=[],
                 met_criteria=met_criteria,
                 unmet_criteria=unmet_criteria,
                 confidence=review.get('confidence', 0.5)
             )
             
             # Enhanced validation logging
-            logger.info(f"VALIDATION RESULT - Task: '{task_step.description}' - Status: {review_result.status.upper()}, Quality: {review_result.quality_score}/10")
+            logger.info(f"VALIDATION RESULT - Task: '{task_step.objective}' - Status: {review_result.status.upper()}, Quality: {review_result.quality_score}/10")
             if review_result.status == 'success':
                 logger.info(f"VALIDATION SUCCESS - Task completed successfully")
                 if review_result.met_criteria:
@@ -274,8 +463,6 @@ class HandlingTasks:
                     logger.warning(f"Unmet criteria: {', '.join(review_result.unmet_criteria)}")
             else:
                 logger.error(f"VALIDATION FAILED - Task failed: {review_result.reason}")
-                if review_result.missing_outputs:
-                    logger.error(f"Missing outputs: {', '.join(review_result.missing_outputs)}")
             
             return review_result
         except Exception as e:
@@ -288,26 +475,22 @@ class HandlingTasks:
 
     async def prepareTaskHandover(self, task_step, task_actions, review_result, workflow):
         try:
+            # Check workflow status before preparing task handover
+            self._checkWorkflowStopped()
+            
             # Log handover status summary
             if hasattr(review_result, 'status'):
                 status = review_result.status
-                if hasattr(review_result, 'missing_outputs'):
-                    missing = review_result.missing_outputs
-                else:
-                    missing = []
                 if hasattr(review_result, 'met_criteria'):
                     met = review_result.met_criteria
                 else:
                     met = []
                 
-                logger.debug(f"Task handover status: {status}")
-                logger.debug(f"Promised documents: {task_step.expected_outputs}")
-                logger.debug(f"Delivered documents: {met}")
-                logger.debug(f"Missing documents: {missing}")
+                
             
             handover_data = {
                 'task_id': task_step.id,
-                'task_description': task_step.description,
+                'task_description': task_step.objective,
                 'actions': [action.to_dict() for action in task_actions],
                 'review_result': review_result.to_dict() if hasattr(review_result, 'to_dict') else review_result,
                 'workflow_id': workflow.id,
@@ -321,20 +504,35 @@ class HandlingTasks:
 
     # --- Helper action handling methods ---
 
-    async def executeSingleAction(self, action, workflow):
+    async def executeSingleAction(self, action, workflow, task_step, task_index=None, action_index=None, total_actions=None):
         """Execute a single action and return ActionResult with enhanced document processing"""
         try:
-            logger.info(f"Executing action: {action.execMethod}.{action.execAction}")
+            # Check workflow status before executing action
+            self._checkWorkflowStopped()
             
-            # Log input documents and connections
+            # Use passed indices or fallback to '?'
+            task_num = task_index if task_index is not None else '?'
+            action_num = action_index if action_index is not None else '?'
+            
+            logger.info(f"=== TASK {task_num} ACTION {action_num}: {action.execMethod}.{action.execAction} ===")
+            
+            # Log input parameters
             input_docs = action.execParameters.get('documentList', [])
-            logger.debug(f"Input documents: {input_docs}")
-            logger.debug(f"Input connections: {action.execParameters.get('connections', [])}")
+            input_connections = action.execParameters.get('connections', [])
+            logger.info(f"Input documents: {input_docs} (type: {type(input_docs)})")
+            if input_connections:
+                logger.info(f"Input connections: {input_connections}")
+            
+            # Log all action parameters for debugging
+            logger.info(f"All action parameters: {action.execParameters}")
             
             enhanced_parameters = action.execParameters.copy()
             if action.expectedDocumentFormats:
                 enhanced_parameters['expectedDocumentFormats'] = action.expectedDocumentFormats
-                logger.debug(f"Expected document formats: {action.expectedDocumentFormats}")
+                logger.info(f"Expected formats: {action.expectedDocumentFormats}")
+            
+            # Check workflow status before executing the action
+            self._checkWorkflowStopped()
             
             result = await self.service.executeAction(
                 methodName=action.execMethod,
@@ -350,11 +548,51 @@ class HandlingTasks:
                 action.setSuccess()
                 action.result = result.data.get("result", "")
                 action.execResultLabel = result_label
-                await self.createActionMessage(action, result, workflow, result_label, created_documents)
-                logger.info(f"Action {action.execMethod}.{action.execAction} executed successfully")
+                await self.createActionMessage(action, result, workflow, result_label, created_documents, task_step, task_index)
+                
+                # Log action results
+                logger.info(f"✓ Action completed successfully")
+                
+                # Create database log entry for action completion
+                if total_actions is not None:
+                    self.chatInterface.createWorkflowLog({
+                        "workflowId": workflow.id,
+                        "message": f"✅ Task {task_num} - Action {action_num}/{total_actions} completed",
+                        "type": "success"
+                    })
+                else:
+                    self.chatInterface.createWorkflowLog({
+                        "workflowId": workflow.id,
+                        "message": f"✅ Task {task_num} - Action {action_num}/? completed",
+                        "type": "success"
+                    })
+                
+                if created_documents:
+                    logger.info(f"Output documents ({len(created_documents)}):")
+                    for i, doc in enumerate(created_documents):
+                        if hasattr(doc, 'filename'):
+                            logger.info(f"  {i+1}. {doc.filename}")
+                        elif isinstance(doc, dict) and 'filename' in doc:
+                            logger.info(f"  {i+1}. {doc['filename']}")
+                        else:
+                            logger.info(f"  {i+1}. {type(doc).__name__}")
+                    
+                    # Log document details for debugging
+                    logger.info("Document details:")
+                    for i, doc in enumerate(created_documents):
+                        if hasattr(doc, 'filename'):
+                            logger.info(f"  Doc {i+1}: filename={doc.filename}, type={type(doc)}")
+                            if hasattr(doc, 'id'):
+                                logger.info(f"    ID: {doc.id}")
+                            if hasattr(doc, 'fileId'):
+                                logger.info(f"    File ID: {doc.fileId}")
+                        elif isinstance(doc, dict):
+                            logger.info(f"  Doc {i+1}: dict with keys: {list(doc.keys())}")
+                else:
+                    logger.info("Output: No documents created")
             else:
                 action.setError(result.error or "Action execution failed")
-                logger.error(f"Action {action.execMethod}.{action.execAction} failed: {result.error}")
+                logger.error(f"✗ Action failed: {result.error}")
             
             # Extract document filenames for the ActionResult
             document_filenames = []
@@ -367,6 +605,9 @@ class HandlingTasks:
             # Also include the original documents from the service result for validation
             original_documents = result.data.get("documents", [])
             
+            # Log action summary
+            logger.info(f"=== TASK {task_num} ACTION {action_num} COMPLETED ===")
+            
             return ActionResult(
                 success=result.success,
                 data={
@@ -407,9 +648,12 @@ class HandlingTasks:
                 error=str(e)
             )
 
-    async def createActionMessage(self, action, result, workflow, result_label=None, created_documents=None):
+    async def createActionMessage(self, action, result, workflow, result_label=None, created_documents=None, task_step=None, task_index=None):
         """Create and store a message for the action result in the workflow with enhanced document processing"""
         try:
+            # Check workflow status before creating action message
+            self._checkWorkflowStopped()
+            
             if result_label is None:
                 result_label = action.execResultLabel
             
@@ -417,25 +661,29 @@ class HandlingTasks:
             if created_documents is None:
                 created_documents = self.documentGenerator.createDocumentsFromActionResult(result, action, workflow)
             
-            # Log delivered documents with sizes
+            # Log delivered documents
             if created_documents:
-                doc_info = []
-                for doc in created_documents:
-                    if hasattr(doc, 'filename') and hasattr(doc, 'fileSize'):
-                        doc_info.append(f"{doc.filename} ({doc.fileSize} bytes)")
-                    elif hasattr(doc, 'filename'):
-                        doc_info.append(f"{doc.filename}")
-                    else:
-                        doc_info.append("unknown document")
-                logger.debug(f"Produced result label: {result_label}")
-                logger.debug(f"Delivered documents: {doc_info}")
+                logger.info(f"Result label: {result_label} - {len(created_documents)} documents")
             else:
-                logger.debug(f"Produced result label: {result_label} (no documents)")
+                logger.info(f"Result label: {result_label} - No documents")
+            
+            # Create a more meaningful message that includes task context
+            task_objective = task_step.objective if task_step else 'Unknown task'
+            
+            # Build a user-friendly message
+            if created_documents and len(created_documents) > 0:
+                doc_names = [doc.filename if hasattr(doc, 'filename') else str(doc) for doc in created_documents[:3]]
+                if len(created_documents) > 3:
+                    doc_names.append(f"... and {len(created_documents) - 3} more")
+                
+                message_text = f"✅ Task {task_index or '?'} - Action {action.execMethod}.{action.execAction} completed\n\nObjective: {task_objective}\n\nGenerated {len(created_documents)} document(s): {', '.join(doc_names)}"
+            else:
+                message_text = f"✅ Task {task_index or '?'} - Action {action.execMethod}.{action.execAction} completed\n\nObjective: {task_objective}\n\nAction executed successfully"
             
             message_data = {
                 "workflowId": workflow.id,
                 "role": "assistant",
-                "message": f"Executed action {action.execMethod}.{action.execAction}",
+                "message": message_text,
                 "status": "step",
                 "sequenceNr": len(workflow.messages) + 1,
                 "publishedAt": datetime.now(UTC).isoformat(),
@@ -449,7 +697,7 @@ class HandlingTasks:
             message = self.chatInterface.createWorkflowMessage(message_data)
             if message:
                 workflow.messages.append(message)
-                logger.info(f"Created action message for {action.execMethod}.{action.execAction} with {len(created_documents)} documents")
+                logger.info(f"Message created: {action.execMethod}.{action.execAction}")
             else:
                 logger.error(f"Failed to create workflow message for action {action.execMethod}.{action.execAction}")
         except Exception as e:
@@ -459,29 +707,59 @@ class HandlingTasks:
 
     def _validateTaskPlan(self, task_plan: Dict[str, Any]) -> bool:
+        """Check that an AI-generated task plan is structurally valid.
+
+        A valid plan is a dict with a 'tasks' list in which every task is a
+        dict with a unique 'id', an 'objective' and 'success_criteria', and
+        whose optional 'dependencies' list only names task IDs from the plan
+        (or the literal 'task_0'). Every rejection is logged with its reason.
+
+        Returns True when the plan is valid, False otherwise (including when
+        validation itself raises).
+        """
         try:
             if not isinstance(task_plan, dict):
+                logger.error("Task plan is not a dictionary")
                 return False
+
             if 'tasks' not in task_plan or not isinstance(task_plan['tasks'], list):
+                logger.error(f"Task plan missing 'tasks' field or not a list. Found: {type(task_plan.get('tasks', 'MISSING'))}")
                 return False
+
+            # First pass: collect every task ID, rejecting duplicates, so a
+            # dependency may reference any task in the plan regardless of order
             task_ids = set()
             for task in task_plan['tasks']:
                 if not isinstance(task, dict):
+                    logger.error(f"Task is not a dictionary: {type(task)}")
                     return False
-                required_fields = ['id', 'description', 'expected_outputs', 'success_criteria']
-                if not all(field in task for field in required_fields):
-                    return False
-                if task['id'] in task_ids:
+                if 'id' not in task:
+                    logger.error(f"Task missing 'id' field: {task}")
+                    return False
+                if task['id'] in task_ids:
+                    logger.error(f"Duplicate task ID: {task['id']}")
                     return False
                 task_ids.add(task['id'])
+
+            # Second pass: validate each task's fields and dependencies
+            for i, task in enumerate(task_plan['tasks']):
+                required_fields = ['id', 'objective', 'success_criteria']
+                missing_fields = [field for field in required_fields if field not in task]
+                if missing_fields:
+                    logger.error(f"Task {i} missing required fields: {missing_fields}")
+                    return False
+
                 dependencies = task.get('dependencies', [])
                 if not isinstance(dependencies, list):
+                    logger.error(f"Task {i} dependencies is not a list: {type(dependencies)}")
                     return False
+
                 for dep in dependencies:
                     if dep not in task_ids and dep != 'task_0':
+                        logger.error(f"Task {i} has invalid dependency: {dep} (available: {list(task_ids) + ['task_0']})")
                         return False
-                if 'ai_prompt' in task and not isinstance(task['ai_prompt'], str):
-                    return False
+
+            logger.info(f"Task plan validation successful with {len(task_ids)} tasks")
             return True
         except Exception as e:
             logger.error(f"Error validating task plan: {str(e)}")
             return False
diff --git a/modules/chat/handling/promptFactory.py b/modules/chat/handling/promptFactory.py
index c3936bef..a1fd9348 100644
--- a/modules/chat/handling/promptFactory.py
+++ b/modules/chat/handling/promptFactory.py
@@ -7,7 +7,7 @@ from typing import Any, Dict
 
 # Prompt creation helpers extracted from managerChat.py
 
-def createTaskPlanningPrompt(self, context: Dict[str, Any]) -> str:
+def createTaskPlanningPrompt(context: Dict[str, Any]) -> str:
     """Create prompt for task planning"""
     return f"""You are a task planning AI that analyzes user requests and creates structured task plans.
 
@@ -19,17 +19,16 @@ INSTRUCTIONS:
 1. Analyze the user request and available documents
 2. Break down the request into 2-4 meaningful high-level task steps
 3. Focus on business outcomes, not technical operations
-4. For document processing, create ONE task with a comprehensive AI prompt rather than multiple granular tasks
-5. Each task should produce meaningful, usable outputs
-6. Ensure proper handover between tasks using result labels
-7. Return a JSON object with the exact structure shown below
+4. Each task should produce meaningful, usable outputs
+5. Ensure proper handover between tasks using result labels
+6. Return a JSON object with the exact structure shown below
 
 TASK PLANNING PRINCIPLES:
-- Combine related operations into single tasks (e.g., \"Extract and analyze all candidate profiles\" instead of separate \"read file\" and \"analyze content\" tasks)
-- Use comprehensive AI prompts for document processing rather than multiple small tasks
+- Break down complex requests into logical, sequential steps
 - Focus on business value and outcomes
 - Keep tasks at a meaningful level of abstraction
 - Each task should produce results that can be used by subsequent tasks
+- Ensure clear dependencies and handovers between tasks
 
 REQUIRED JSON STRUCTURE:
 {{
@@ -37,31 +36,34 @@ REQUIRED JSON STRUCTURE:
     \"tasks\": [
         {{
             \"id\": \"task_1\",
-            \"description\": \"Clear description of what this task accomplishes (business outcome)\",
+            \"objective\": \"Clear business objective this task accomplishes\",
             \"dependencies\": [\"task_0\"],  // IDs of tasks that must complete first
-            \"expected_outputs\": [\"output1\", \"output2\"],
             \"success_criteria\": [\"criteria1\", \"criteria2\"],
-            \"required_documents\": [\"doc1\", \"doc2\"],
-            \"estimated_complexity\": \"low|medium|high\",
-            \"ai_prompt\": \"Comprehensive AI prompt for document processing tasks (if applicable)\"
+            \"estimated_complexity\": \"low|medium|high\"
         }}
     ]
 }}
 
-EXAMPLES OF GOOD TASK DESCRIPTIONS:
-- \"Extract and analyze all candidate profiles to identify key qualifications and experience\"
-- \"Create evaluation matrix and rate candidates against product designer criteria\"
-- \"Generate comprehensive PowerPoint presentation for management decision\"
-- \"Store final presentation in SharePoint for specified account\"
+EXAMPLES OF GOOD TASK OBJECTIVES:
+- \"Extract key information from documents for email preparation\"
+- \"Draft professional email incorporating analyzed information\"
+- \"Send email using specified email account\"
+- \"Store email draft and confirmation in system\"
 
-EXAMPLES OF BAD TASK DESCRIPTIONS:
+EXAMPLES OF GOOD SUCCESS CRITERIA:
+- \"Document analysis completed with key points identified\"
+- \"Email draft created with professional tone and clear structure\"
+- \"Email successfully sent with delivery confirmation\"
+- \"All outputs properly stored and accessible for future use\"
+
+EXAMPLES OF BAD TASK OBJECTIVES:
 - \"Open and read the PDF file\" (too granular)
 - \"Identify table structure\" (technical detail)
 - \"Convert data to CSV format\" (implementation detail)
 
 NOTE: Respond with ONLY the JSON object. Do not include any explanatory text."""
 
-async def createActionDefinitionPrompt(self, context) -> str:
+async def createActionDefinitionPrompt(context, service) -> str:
     """Create prompt for action generation with enhanced document extraction guidance and retry context"""
     task_step = context.task_step
     workflow = context.workflow
@@ -71,23 +73,32 @@ async def createActionDefinitionPrompt(self, context) -> str:
     retry_count = context.retry_count or 0
     previous_action_results = context.previous_action_results or []
     previous_review_result = context.previous_review_result
-    methodList = self.service.getMethodsList()
+    methodList = service.getMethodsList()
     method_actions = {}
     for sig in methodList:
         if '.' in sig:
             method, rest = sig.split('.', 1)
             action = rest.split('(')[0]
             method_actions.setdefault(method, []).append((action, sig))
-    messageSummary = await self.service.summarizeChat(workflow.messages)
-    docRefs = self.service.getDocumentReferenceList()
-    connRefs = self.service.getConnectionReferenceList()
-    all_doc_refs = docRefs.get('chat', []) + docRefs.get('history', [])
+    messageSummary = await service.summarizeChat(workflow.messages)
+    # Get ALL documents from the entire workflow, not just current round
+    docRefs = service.getDocumentReferenceList()
+    connRefs = service.getConnectionReferenceList()
+    
+    # Get documents from current round (chat) and entire workflow history
+    current_round_docs = docRefs.get('chat', [])
+    workflow_history_docs = docRefs.get('history', [])
+    
+    # Combine all documents, prioritizing current round first, then workflow history
+    all_doc_refs = current_round_docs + workflow_history_docs
+    
+    # Log document availability for debugging
+    logging.debug(f"Document references - Current round: {len(current_round_docs)}, Workflow history: {len(workflow_history_docs)}, Total: {len(all_doc_refs)}")
     available_methods_str = ''
     for method, actions in method_actions.items():
         available_methods_str += f"- {method}:\n"
         for action, sig in actions:
             available_methods_str += f"    - {action}: {sig}\n"
-    task_ai_prompt = task_step.ai_prompt or ''
     retry_context = ""
     if retry_count > 0:
         retry_context = f"""
@@ -105,17 +116,36 @@ Previous review feedback:
 - Status: {previous_review_result.status or 'unknown'}
 - Reason: {previous_review_result.reason or 'No reason provided'}
 - Quality Score: {previous_review_result.quality_score or 0}/10
-- Missing Outputs: {', '.join(previous_review_result.missing_outputs or [])}
 - Unmet Criteria: {', '.join(previous_review_result.unmet_criteria or [])}
 """
-    expected_outputs_str = ', '.join(task_step.expected_outputs or [])
     success_criteria_str = ', '.join(task_step.success_criteria or [])
     previous_results_str = ', '.join(previous_results) if previous_results else 'None'
     improvements_str = str(improvements) if improvements else 'None'
     available_connections_str = '\n'.join(f"- {conn}" for conn in connRefs)
-    available_documents_str = '\n'.join(
-        f"- {doc.documentsLabel} contains {', '.join(doc.documents)}" for doc in all_doc_refs
-    )
+    # Build comprehensive document list showing both current round and workflow history
+    if all_doc_refs:
+        available_documents_str = "CURRENT ROUND DOCUMENTS:\n"
+        if current_round_docs:
+            for doc in current_round_docs:
+                available_documents_str += f"- {doc.documentsLabel} contains {', '.join(doc.documents)}\n"
+        else:
+            available_documents_str += "- No documents in current round\n"
+        
+        available_documents_str += "\nWORKFLOW HISTORY DOCUMENTS:\n"
+        if workflow_history_docs:
+            for doc in workflow_history_docs:
+                available_documents_str += f"- {doc.documentsLabel} contains {', '.join(doc.documents)}\n"
+        else:
+            available_documents_str += "- No documents in workflow history\n"
+    else:
+        available_documents_str = "NO DOCUMENTS AVAILABLE - This workflow has no documents to process."
+    
+    # Debug logging for document availability
+    logging.debug(f"Available documents string length: {len(available_documents_str)}")
+    logging.debug(f"Current round docs count: {len(current_round_docs)}")
+    logging.debug(f"Workflow history docs count: {len(workflow_history_docs)}")
+    logging.debug(f"Total doc refs: {len(all_doc_refs)}")
+    
     prompt = f"""
 You are an action generation AI that creates specific actions to accomplish a task step.
 
@@ -130,12 +160,11 @@ CRITICAL DOCUMENT REFERENCE RULES:
 - NEVER invent new labels or use message IDs
 - NEVER use formats like "msg_xxx:documents" or "task_X_results" (these will fail)
 - ONLY use the exact labels shown in AVAILABLE DOCUMENTS
-- **When generating multiple actions, you may only use as input documents those that are already present in AVAILABLE DOCUMENTS or produced by actions that come earlier in the list. Do NOT use as input any document label that will be produced by a later action.**
+- When generating multiple actions, you may only use as input documents those that are already present in AVAILABLE DOCUMENTS or produced by actions that come earlier in the list. Do NOT use as input any document label that will be produced by a later action.
+- If AVAILABLE DOCUMENTS shows "NO DOCUMENTS AVAILABLE", you CANNOT create document extraction actions. Instead, create actions that generate new content or inform the user that documents are needed.
 
-TASK STEP: {task_step.description} (ID: {task_step.id})
-EXPECTED OUTPUTS: {expected_outputs_str}
+TASK STEP: {task_step.objective} (ID: {task_step.id})
 SUCCESS CRITERIA: {success_criteria_str}
-TASK AI PROMPT: {task_ai_prompt if task_ai_prompt else 'None provided'}
 
 CONTEXT - Chat History:
 {messageSummary}
@@ -180,7 +209,8 @@ ACTION GENERATION PRINCIPLES:
 INSTRUCTIONS:
 - Generate actions to accomplish this task step using available documents, connections, and previous results
 - Use docItem for single documents and docList labels for groups of documents as shown in AVAILABLE DOCUMENTS
-- Always pass documentList as a LIST of references (docItem and/or docList)
+- If AVAILABLE DOCUMENTS shows "NO DOCUMENTS AVAILABLE", you cannot create document extraction actions. Instead, create actions that generate new content or inform the user that documents are needed.
+- Always pass documentList as a LIST of references (docItem and/or docList) - this list CANNOT be empty for document extraction actions
 - For resultLabel, use the format: "task{{task_id}}_action{{action_number}}_{{short_label}}" where:
     - {{task_id}} = the current task's id (e.g., 1)
     - {{action_number}} = the sequence number of the action within the task (e.g., 2)
@@ -202,8 +232,8 @@ REQUIRED JSON STRUCTURE:
             "resultLabel": "task1_action3_analysis_results",
             "expectedDocumentFormats": [  // OPTIONAL: Specify expected document formats when needed
                 {{
-                    "extension": ".csv",
-                    "mimeType": "text/csv",
+                    "extension": ".txt",
+                    "mimeType": "text/plain",
                     "description": "Structured data output"
                 }}
             ],
@@ -314,19 +344,33 @@ EXAMPLES OF GOOD ACTIONS:
     ]
 }}
 
-NOTE: Respond with ONLY the JSON object. Do not include any explanatory text."""
-    logging.debug(f"[ACTION PLAN PROMPT] Available Documents Section:\n{available_documents_str}\nUser Connections Section:\n{available_connections_str}\nAvailable Methods (summarized):\n{', '.join(method_actions.keys())}")
+6. When no documents are available (NO DOCUMENTS AVAILABLE scenario):
+{{
+    "method": "document",
+    "action": "generateReport",
+    "parameters": {{
+        "documentList": [],
+        "title": "Workflow Status Report"
+    }},
+    "resultLabel": "task1_action1_status_report",
+    "description": "Generate a status report informing the user that no documents are available for processing and requesting document upload or alternative input."
+}}
+
+IMPORTANT NOTES:
+- Respond with ONLY the JSON object. Do not include any explanatory text.
+- Before creating any document extraction action, verify that AVAILABLE DOCUMENTS contains actual document references.
+- If AVAILABLE DOCUMENTS shows "NO DOCUMENTS AVAILABLE", use example 6 above to create a status report action instead of document extraction."""
+    logging.debug(f"[ACTION PLAN PROMPT] Available Documents Section:\n{available_documents_str}\nUser Connections Section:\n{available_connections_str}\nAvailable Methods (detailed):\n{available_methods_str}")
     return prompt
 
-async def createResultReviewPrompt(self, review_context) -> str:
+async def createResultReviewPrompt(review_context) -> str:
     """Create prompt for result review"""
     task_step = review_context.task_step
     step_result = review_context.step_result or {}
     step_result_serializable = {
         'task_step': {
             'id': task_step.id,
-            'description': task_step.description,
-            'expected_outputs': task_step.expected_outputs or [],
+            'objective': task_step.objective,
             'success_criteria': task_step.success_criteria or []
         },
         'action_results': [],
@@ -380,12 +424,10 @@ async def createResultReviewPrompt(self, review_context) -> str:
         }
         step_result_serializable['action_results'].append(serializable_action_result)
     step_result_json = json.dumps(step_result_serializable, indent=2, ensure_ascii=False)
-    expected_outputs_str = ', '.join(task_step.expected_outputs or [])
     success_criteria_str = ', '.join(task_step.success_criteria or [])
     return f"""You are a result review AI that evaluates task step completion with BASIC validation.
 
-TASK STEP: {task_step.description}
-EXPECTED OUTPUTS: {expected_outputs_str}
+TASK STEP: {task_step.objective}
 SUCCESS CRITERIA: {success_criteria_str}
 
 STEP RESULT: {step_result_json}
@@ -402,8 +444,8 @@ VALIDATION PRINCIPLES:
 - Text outputs are SECONDARY indicators
 - Only retry for CLEAR technical issues, not minor imperfections
 - Don't be picky about formatting or minor details
-- Check if ANY documents were produced (documents_count > 0), not specific expected output names
-- If documents were produced, consider it a SUCCESS regardless of expected output names
+- Check if ANY documents were produced (documents_count > 0)
+- If documents were produced, consider it a SUCCESS
 
 EXAMPLES OF SUCCESS:
 - Document extraction produced a file (even if imperfect)
@@ -428,7 +470,6 @@ REQUIRED JSON STRUCTURE:
     "reason": "Brief explanation",
     "improvements": ["specific technical fixes only"],
     "quality_score": 1-10,
-    "missing_outputs": [],
     "met_criteria": ["basic functionality achieved"],
     "unmet_criteria": []
 }}
@@ -437,6 +478,6 @@ VALIDATION LOGIC:
 - If ANY action has documents_count > 0, mark as SUCCESS
 - If ALL actions have documents_count = 0 AND no meaningful text output, mark as FAILED
 - Only mark as RETRY for clear technical issues that can be fixed
-- Do NOT fail based on expected output name mismatches - focus on actual document production
+- Focus on actual document production and functionality, not specific output names
 
 NOTE: Respond with ONLY the JSON object. Be GENEROUS with success ratings.""" 
\ No newline at end of file
diff --git a/modules/chat/managerChat.py b/modules/chat/managerChat.py
index e7c0475e..b394fc24 100644
--- a/modules/chat/managerChat.py
+++ b/modules/chat/managerChat.py
@@ -4,15 +4,7 @@ from modules.interfaces.interfaceAppModel import User
 from modules.interfaces.interfaceChatModel import ChatWorkflow, UserInputRequest, TaskStep, TaskAction, ActionResult, ReviewResult, TaskPlan, WorkflowResult, TaskContext
 from modules.chat.serviceCenter import ServiceCenter
 from modules.interfaces.interfaceChatObjects import ChatObjects
-from .handling.handlingTasks import HandlingTasks
-
-logger = logging.getLogger(__name__)
-
-# ===== STATE MANAGEMENT AND VALIDATION CLASSES =====
-
-class WorkflowStoppedException(Exception):
-    """Exception raised when workflow is stopped by user"""
-    pass
+from .handling.handlingTasks import HandlingTasks, WorkflowStoppedException
 
 logger = logging.getLogger(__name__)
 
@@ -47,16 +39,15 @@ class ChatManager:
                 raise Exception("No tasks generated in task plan.")
             
             # Phase 2-5: For each task, execute and get results
-            logger.info(f"Phase 2: Executing {len(task_plan.tasks)} tasks")
+            total_tasks = len(task_plan.tasks)
+            logger.info(f"Phase 2: Executing {total_tasks} tasks")
             all_task_results = []
             previous_results = []
             for idx, task_step in enumerate(task_plan.tasks):
-                logger.info(f"Task {idx+1}/{len(task_plan.tasks)}: {task_step.description}")
+                # Pass task index to executeTask method
+                current_task_index = idx + 1
                 
-                # Check if workflow has been stopped before each task
-                if self.service.workflow.status == "stopped":
-                    logger.info("Workflow stopped by user, aborting execution")
-                    raise WorkflowStoppedException("Workflow was stopped by user")
+                logger.info(f"Task {idx+1}/{total_tasks}: {task_step.objective}")
                 
                 # Create task context for this task
                 task_context = TaskContext(
@@ -67,7 +58,7 @@ class ChatManager:
                     previous_results=previous_results
                 )
                 # Execute task (this handles action generation, execution, and review internally)
-                task_result = await self.handlingTasks.executeTask(task_step, workflow, task_context)
+                task_result = await self.handlingTasks.executeTask(task_step, workflow, task_context, current_task_index, total_tasks)
                 # Handover
                 handover_data = await self.handlingTasks.prepareTaskHandover(task_step, [], task_result, workflow)
                 # Collect results
@@ -90,6 +81,15 @@ class ChatManager:
             )
             logger.info(f"Unified workflow execution completed successfully for workflow {workflow.id}")
             return workflow_result
+        except WorkflowStoppedException:
+            logger.info(f"Workflow {workflow.id} was stopped by user")
+            return WorkflowResult(
+                status="stopped", 
+                completed_tasks=0,
+                total_tasks=0,
+                execution_time=0.0,
+                final_results_count=0
+            )
         except Exception as e:
             logger.error(f"Error in executeUnifiedWorkflow: {str(e)}")
             return WorkflowResult(
diff --git a/modules/chat/serviceCenter.py b/modules/chat/serviceCenter.py
index 8a0d5df6..b5595ba6 100644
--- a/modules/chat/serviceCenter.py
+++ b/modules/chat/serviceCenter.py
@@ -310,54 +310,43 @@ class ServiceCenter:
         chat_exchanges = []
         history_exchanges = []
         
-        # Process messages in reverse order to find current chat round
+        # Process messages in reverse order; "first" marks boundary: include up to and including
+        # the first "first" message in the chat container, older messages in the history container
+        in_current_round = True
         for message in reversed(self.workflow.messages):
-            # Get document references from message
+            is_first = getattr(message, "status", None) == "first"
+            
+            # Build a DocumentExchange if message has documents
+            doc_exchange = None
             if message.documents:
-                # For messages with action context, create DocumentExchange with docList reference
                 if message.actionId and message.documentsLabel:
                     doc_ref = self.getDocumentReferenceFromMessage(message)
                     if doc_ref:
-                        # Create DocumentExchange with single docList reference
                         doc_exchange = DocumentExchange(
                             documentsLabel=message.documentsLabel,
                             documents=[doc_ref]
                         )
-                        
-                        # Add to appropriate list based on message status
-                        if message.status == "first":
-                            chat_exchanges.append(doc_exchange)
-                            break  # Stop after finding first message
-                        elif message.status == "step":
-                            chat_exchanges.append(doc_exchange)
-                        else:
-                            history_exchanges.append(doc_exchange)
-                # For regular messages, create DocumentExchange with individual docItem references
                 else:
                     doc_refs = []
                     for doc in message.documents:
                         doc_ref = self.getDocumentReferenceFromChatDocument(doc)
                         doc_refs.append(doc_ref)
-                    
                     if doc_refs:
-                        # Create DocumentExchange with individual document references
                         doc_exchange = DocumentExchange(
                             documentsLabel=f"{message.id}:documents",
                             documents=doc_refs
                         )
-                        
-                        # Add to appropriate list based on message status
-                        if message.status == "first":
-                            chat_exchanges.append(doc_exchange)
-                            break  # Stop after finding first message
-                        elif message.status == "step":
-                            chat_exchanges.append(doc_exchange)
-                        else:
-                            history_exchanges.append(doc_exchange)
             
-            # Stop processing if we hit a first message
-            if message.status == "first":
-                break
+            # Append to appropriate container based on boundary
+            if doc_exchange:
+                if in_current_round:
+                    chat_exchanges.append(doc_exchange)
+                else:
+                    history_exchanges.append(doc_exchange)
+            
+            # Flip boundary after including the "first" message in chat
+            if in_current_round and is_first:
+                in_current_round = False
         
         # Sort both lists by datetime in descending order
         chat_exchanges.sort(key=lambda x: x.documentsLabel, reverse=True)
@@ -393,31 +382,7 @@ class ServiceCenter:
         try:
             # ADDED LOGGING: Print workflow id, message count, and all message labels and document counts
             import logging
-            logger = logging.getLogger(__name__)
-            logger.debug(f"WORKFLOW STATE at getChatDocumentsFromDocumentList: id={id(self.workflow)}, message_count={len(self.workflow.messages) if hasattr(self.workflow, 'messages') else 'N/A'}")
-            for idx, message in enumerate(getattr(self.workflow, 'messages', [])):
-                label = getattr(message, 'documentsLabel', None)
-                docs = getattr(message, 'documents', None)
-                logger.debug(f"  Message {idx}: label='{label}', documents_count={len(docs) if docs else 0}")
-            # DEBUG LOGGING: Print all document labels and their documents before extraction
-            import logging
-            logger = logging.getLogger(__name__)
-            logger.info("==== DEBUG: Listing all workflow message document labels and contained documents ====")
-            for message in self.workflow.messages:
-                label = getattr(message, 'documentsLabel', None)
-                docs = getattr(message, 'documents', None)
-                if label is not None:
-                    doc_names = []
-                    if docs:
-                        for doc in docs:
-                            if hasattr(doc, 'filename'):
-                                doc_names.append(doc.filename)
-                            elif isinstance(doc, dict) and 'filename' in doc:
-                                doc_names.append(doc['filename'])
-                            else:
-                                doc_names.append(str(doc))
-                    logger.info(f"Message label: '{label}' | Documents: {doc_names if doc_names else 'None'}")
-            logger.info("==== END DEBUG LIST ====")
+
             all_documents = []
             for doc_ref in documentList:
                 # Parse reference format
@@ -434,12 +399,12 @@ class ServiceCenter:
                             found = True
                             break
                     if not found:
-                        logger.warning(f"No documents found for label: {label}")
+                        logger.debug(f"No documents found for label: {label}")
                     continue
                 
                 # Handle structured reference format
                 if len(parts) < 3:
-                    logger.warning(f"Invalid document reference format: {doc_ref}")
+                    logger.debug(f"Invalid document reference format: {doc_ref}")
                     continue
                     
                 ref_type = parts[0]
@@ -487,7 +452,7 @@ class ServiceCenter:
     
     def getConnectionReferenceFromUserConnection(self, connection: UserConnection) -> str:
         """Get connection reference from UserConnection"""
-        return f"connection:{connection.authority}:{connection.externalUsername}:{connection.id}"
+        return f"connection:{connection.authority.value}:{connection.externalUsername}:{connection.id}"
     
     def getUserConnectionFromConnectionReference(self, connectionReference: str) -> Optional[UserConnection]:
         """Get UserConnection from reference string"""
@@ -506,7 +471,7 @@ class ServiceCenter:
             
             # Find matching connection
             for conn in user_connections:
-                if str(conn.id) == conn_id and conn.authority == authority and conn.externalUsername == username:
+                if str(conn.id) == conn_id and conn.authority.value == authority and conn.externalUsername == username:
                     return conn
             return None
             
@@ -700,16 +665,16 @@ Please provide a clear summary of this message."""
     async def extractContentFromDocument(self, prompt: str, document: ChatDocument) -> ExtractedContent:
         """Extract content from ChatDocument using prompt"""
         try:
-            # Extract file data from ChatDocument
-            if document.data:
-                fileData = document.data.encode('utf-8') if isinstance(document.data, str) else document.data
-            else:
-                # Try to get file data from service center if document has fileId
-                if hasattr(document, 'fileId') and document.fileId:
-                    fileData = self.getFileData(document.fileId)
-                else:
-                    logger.error(f"No file data available in document: {document}")
-                    raise ValueError("No file data available in document")
+            # ChatDocument is just a reference, so we need to get file data using fileId
+            if not hasattr(document, 'fileId') or not document.fileId:
+                logger.error(f"Document {document.id} has no fileId")
+                raise ValueError("Document has no fileId")
+            
+            # Get file data from service center using document's fileId
+            fileData = self.getFileData(document.fileId)
+            if not fileData:
+                logger.error(f"No file data found for fileId: {document.fileId}")
+                raise ValueError("No file data found for document")
             
             # Get filename and mime type from document
             filename = document.filename if hasattr(document, 'filename') else "document"
@@ -739,11 +704,11 @@ Please provide a clear summary of this message."""
         """Extract content from file data directly using prompt"""
         try:
             return await self.documentProcessor.processFileData(
-                prompt=prompt,
                 fileData=fileData,
                 filename=filename,
                 mimeType=mimeType,
                 base64Encoded=base64Encoded,
+                prompt=prompt,
                 documentId=documentId
             )
         except Exception as e:
@@ -771,15 +736,19 @@ Please provide a clear summary of this message."""
         
         return file_item.id
     
-    def createDocument(self, fileName: str, mimeType: str, content: str, base64encoded: bool = True) -> ChatDocument:
+    def createDocument(self, fileName: str, mimeType: str, content: str, base64encoded: bool = True, existing_file_id: str = None) -> ChatDocument:
         """Create document from file data object created by AI call"""
-        # First create the file and get its ID
-        file_id = self.createFile(fileName, mimeType, content, base64encoded)
+        # Use existing file ID if provided, otherwise create new file
+        if existing_file_id:
+            file_id = existing_file_id
+        else:
+            # First create the file and get its ID
+            file_id = self.createFile(fileName, mimeType, content, base64encoded)
         
         # Get file info for metadata
         file_info = self.interfaceComponent.getFile(file_id)
         
-        # Create document with file reference
+        # Create document with file reference (ChatDocument is just a reference, not a data container)
         return ChatDocument(
             id=str(uuid.uuid4()),
             fileId=file_id,
@@ -807,8 +776,7 @@ Please provide a clear summary of this message."""
                     bytesReceived=bytesReceived
                 )
                 
-                # Log the stats event
-                logger.debug(f"Workflow stats updated - Event: {eventLabel}, Sent: {bytesSent}, Received: {bytesReceived}, Tokens: {tokenCount}")
+
                 
         except Exception as e:
             logger.error(f"Error updating workflow stats: {str(e)}")
diff --git a/modules/interfaces/interfaceAiCalls.py b/modules/interfaces/interfaceAiCalls.py
index 1b0525f7..2c47ff33 100644
--- a/modules/interfaces/interfaceAiCalls.py
+++ b/modules/interfaces/interfaceAiCalls.py
@@ -62,33 +62,42 @@ class AiCalls:
         Advanced text processing using Anthropic.
         Fallback to OpenAI if Anthropic is overloaded or rate-limited.
         """
-        messages = []
-        if context:
-            messages.append({
-                "role": "system",
-                "content": context
-            })
-        messages.append({
-            "role": "user",
-            "content": prompt
-        })
-        if hasattr(self, 'userLanguage') and self.userLanguage:
-            ltext = f"Please respond in '{self.userLanguage}' language."
-            if messages and messages[0]["role"] == "system":
-                if "language" not in messages[0]["content"].lower():
-                    messages[0]["content"] = f"{ltext} {messages[0]['content']}"
-            else:
-                messages.insert(0, {
-                    "role": "system", 
-                    "content": ltext
-                })
+        # For Anthropic, we need to handle system content differently
+        # Anthropic expects system content in a top-level parameter, not as a message role
         try:
-            response = await self.anthropicService.callAiBasic(messages)
+            # Create messages without system role for Anthropic
+            anthropic_messages = []
+            if hasattr(self, 'userLanguage') and self.userLanguage:
+                ltext = f"Please respond in '{self.userLanguage}' language."
+                if context:
+                    # Combine context and language instruction
+                    full_context = f"{ltext}\n\n{context}"
+                else:
+                    full_context = ltext
+            else:
+                full_context = context
+            
+            # Add user message
+            anthropic_messages.append({
+                "role": "user",
+                "content": prompt
+            })
+            
+            # Call Anthropic - let the connector handle system content conversion
+            if full_context:
+                # Send context as part of the user message for Anthropic
+                enhanced_prompt = f"Context:\n{full_context}\n\nUser Request:\n{prompt}"
+                response = await self.anthropicService.callAiBasic([
+                    {"role": "user", "content": enhanced_prompt}
+                ])
+            else:
+                response = await self.anthropicService.callAiBasic(anthropic_messages)
+            
             return response["choices"][0]["message"]["content"]
         except Exception as e:
             err_str = str(e)
             logger.warning(f"[UI NOTICE] Advanced AI failed, falling back to Basic AI (OpenAI). Reason: {err_str}")
-            # Optionally, you could surface this message to the UI via a return value or error object
+            # Fallback to OpenAI basic
             return await self.callAiTextBasic(prompt, context)
 
     async def callAiImageBasic(self, prompt: str, imageData: Union[str, bytes], mimeType: str = None) -> str:
diff --git a/modules/interfaces/interfaceAppObjects.py b/modules/interfaces/interfaceAppObjects.py
index a89e2f5a..56397be9 100644
--- a/modules/interfaces/interfaceAppObjects.py
+++ b/modules/interfaces/interfaceAppObjects.py
@@ -753,8 +753,8 @@ class AppObjects:
             logger.error(f"Error saving token: {str(e)}")
             raise
 
-    def getToken(self, authority: AuthAuthority) -> Optional[Token]:
-        """Get the latest token for the current user and authority"""
+    def getToken(self, authority: str) -> Optional[Token]:
+        """Get the latest valid token for the current user and authority"""
         try:
             # Get tokens for this user and authority
             tokens = self.db.getRecordset("tokens", recordFilter={
@@ -767,13 +767,20 @@ class AppObjects:
                 
             # Sort by creation date and get the latest
             tokens.sort(key=lambda x: x.get("createdAt", ""), reverse=True)
-            return Token(**tokens[0])
+            latest_token = Token(**tokens[0])
+            
+            # Check if token is expired
+            if latest_token.expiresAt and latest_token.expiresAt < datetime.now().timestamp():
+                logger.warning(f"Token for {authority} is expired (expiresAt: {latest_token.expiresAt})")
+                return None  # Don't return expired tokens
+            
+            return latest_token
             
         except Exception as e:
             logger.error(f"Error getting token: {str(e)}")
             return None
 
-    def deleteToken(self, authority: AuthAuthority) -> None:
+    def deleteToken(self, authority: str) -> None:
         """Delete all tokens for the current user and authority"""
         try:
             # Get tokens to delete
diff --git a/modules/interfaces/interfaceChatModel.py b/modules/interfaces/interfaceChatModel.py
index a3a5ed43..2b28b3bc 100644
--- a/modules/interfaces/interfaceChatModel.py
+++ b/modules/interfaces/interfaceChatModel.py
@@ -256,6 +256,7 @@ class TaskAction(BaseModel, ModelMixin):
     execResultLabel: Optional[str] = Field(None, description="Label for the set of result documents")
     # NEW: Optional document format specification
     expectedDocumentFormats: Optional[List[Dict[str, str]]] = Field(None, description="Expected document formats (optional)")
+
     status: TaskStatus = Field(default=TaskStatus.PENDING, description="Action status")
     error: Optional[str] = Field(None, description="Error message if action failed")
     retryCount: int = Field(default=0, description="Number of retries attempted")
@@ -530,13 +531,11 @@ register_model_labels(
 
 class TaskStep(BaseModel, ModelMixin):
     id: str
-    description: str
+    objective: str
     dependencies: Optional[list[str]] = []
-    expected_outputs: Optional[list[str]] = []
     success_criteria: Optional[list[str]] = []
-    required_documents: Optional[list[str]] = []
     estimated_complexity: Optional[str] = None
-    ai_prompt: Optional[str] = None
+
 
 class TaskContext(BaseModel, ModelMixin):
     task_step: TaskStep
diff --git a/modules/interfaces/interfaceChatObjects.py b/modules/interfaces/interfaceChatObjects.py
index 74d70245..7105f5de 100644
--- a/modules/interfaces/interfaceChatObjects.py
+++ b/modules/interfaces/interfaceChatObjects.py
@@ -880,7 +880,30 @@ class ChatObjects:
                 workflow = self.loadWorkflowState(workflowId)
                 if not workflow:
                     raise ValueError(f"Workflow {workflowId} not found")
+                
+                # Check if workflow is currently running and stop it first
+                if workflow.status == "running":
+                    logger.info(f"Stopping running workflow {workflowId} before processing new prompt")
                     
+                    # Stop the running workflow
+                    workflow.status = "stopped"
+                    workflow.lastActivity = currentTime
+                    self.updateWorkflow(workflowId, {
+                        "status": "stopped",
+                        "lastActivity": currentTime
+                    })
+                    
+                    # Add log entry for workflow stop
+                    self.createWorkflowLog({
+                        "workflowId": workflowId,
+                        "message": "Workflow stopped for new prompt",
+                        "type": "info",
+                        "status": "stopped",
+                        "progress": 100
+                    })
+                    
+                    # Wait a moment for any running processes to detect the stop
+                    await asyncio.sleep(0.1)
                 
                 # Update workflow - set status back to running for resumed workflows
                 self.updateWorkflow(workflowId, {
diff --git a/modules/methods/methodDocument.py b/modules/methods/methodDocument.py
index 9e0b6dba..e7f9d86c 100644
--- a/modules/methods/methodDocument.py
+++ b/modules/methods/methodDocument.py
@@ -5,7 +5,6 @@ Handles document operations using the document service.
 
 import logging
 from typing import Dict, Any, List, Optional
-import uuid
 from datetime import datetime, UTC
 
 from modules.chat.methodBase import MethodBase, ActionResult, action
@@ -24,19 +23,19 @@ class MethodDocument(MethodBase):
     @action
     async def extract(self, parameters: Dict[str, Any]) -> ActionResult:
         """
-        Extract specific content from document with ai prompt and return it in the specified format
+        Extract specific content from document with AI prompt and return it in the specified format.
         
         Parameters:
             documentList (str): Reference to the document list to extract content from
             aiPrompt (str): AI prompt for content extraction
-            includeMetadata (bool, optional): Whether to include metadata (default: True)
             expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
+            includeMetadata (bool, optional): Whether to include metadata (default: True)
         """
         try:
             documentList = parameters.get("documentList")
             aiPrompt = parameters.get("aiPrompt")
-            includeMetadata = parameters.get("includeMetadata", True)
             expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
+            includeMetadata = parameters.get("includeMetadata", True)
             
             if not documentList:
                 return self._createResult(
@@ -60,32 +59,7 @@ class MethodDocument(MethodBase):
                     error="No documents found for the provided reference"
                 )
             
-            # Determine output format based on expected formats
-            output_extension = ".txt"  # Default
-            output_mime_type = "text/plain"  # Default
-            
-            if expectedDocumentFormats and len(expectedDocumentFormats) > 0:
-                # Use the first expected format
-                expected_format = expectedDocumentFormats[0]
-                output_extension = expected_format.get("extension", ".txt")
-                output_mime_type = expected_format.get("mimeType", "text/plain")
-                logger.info(f"Using expected format: {output_extension} ({output_mime_type})")
-                logger.info(f"Expected document formats: {expectedDocumentFormats}")
-            else:
-                logger.info("No expected format specified, using default .txt format")
-            
-            # Enhance AI prompt to specify output format
-            enhanced_prompt = aiPrompt
-            if output_extension == ".csv":
-                enhanced_prompt += f"\n\nCRITICAL: Deliver the result as pure CSV data without any markdown formatting, code blocks, or additional text. Output only the CSV content with proper headers and data rows. Do not include ```csv or ``` markers."
-            elif output_extension == ".json":
-                enhanced_prompt += f"\n\nCRITICAL: Deliver the result as pure JSON data without any markdown formatting, code blocks, or additional text. Output only the JSON content. Do not include ```json or ``` markers."
-            elif output_extension == ".xml":
-                enhanced_prompt += f"\n\nCRITICAL: Deliver the result as pure XML data without any markdown formatting, code blocks, or additional text. Output only the XML content. Do not include ```xml or ``` markers."
-            elif output_extension != ".txt":
-                enhanced_prompt += f"\n\nCRITICAL: Deliver the result as pure {output_extension.upper()} data without any markdown formatting, code blocks, or additional text. Output only the {output_extension.upper()} content. Do not include any markdown markers."
-            
-            # Extract content from all documents
+            # Extract content from all documents using AI
             all_extracted_content = []
             file_infos = []
             
@@ -99,7 +73,7 @@ class MethodDocument(MethodBase):
                     continue
                 
                 extracted_content = await self.service.extractContentFromFileData(
-                    prompt=enhanced_prompt,  # Use enhanced prompt instead of original
+                    prompt=aiPrompt,
                     fileData=file_data,
                     filename=file_info.get('name', 'document'),
                     mimeType=file_info.get('mimeType', 'application/octet-stream'),
@@ -118,21 +92,7 @@ class MethodDocument(MethodBase):
                     error="No content could be extracted from any documents"
                 )
             
-            # Extract text content from ExtractedContent objects
-            text_contents = []
-            for content_obj in all_extracted_content:
-                if hasattr(content_obj, 'contents') and content_obj.contents:
-                    # Extract text from ContentItem objects
-                    for content_item in content_obj.contents:
-                        if hasattr(content_item, 'data') and content_item.data:
-                            text_contents.append(content_item.data)
-                elif isinstance(content_obj, str):
-                    text_contents.append(content_obj)
-                else:
-                    # Fallback: convert to string representation
-                    text_contents.append(str(content_obj))
-            
-            # Process each document individually and create separate output files
+            # Process each document individually with its own format conversion
             output_documents = []
             
             for i, (chatDocument, extracted_content) in enumerate(zip(chatDocuments, all_extracted_content)):
@@ -140,36 +100,68 @@ class MethodDocument(MethodBase):
                 text_content = ""
                 if hasattr(extracted_content, 'contents') and extracted_content.contents:
                     # Extract text from ContentItem objects
+                    text_parts = []
                     for content_item in extracted_content.contents:
                         if hasattr(content_item, 'data') and content_item.data:
-                            text_content += content_item.data + "\n"
+                            text_parts.append(content_item.data)
+                    text_content = "\n".join(text_parts)
                 elif isinstance(extracted_content, str):
                     text_content = extracted_content
                 else:
-                    # Fallback: convert to string representation
                     text_content = str(extracted_content)
                 
-                # Create output filename based on original filename
+                # Get the expected format for this document (or use default)
+                target_format = None
+                if expectedDocumentFormats and i < len(expectedDocumentFormats):
+                    target_format = expectedDocumentFormats[i]
+                elif expectedDocumentFormats and len(expectedDocumentFormats) > 0:
+                    # If fewer formats than documents, use the last format for remaining documents
+                    target_format = expectedDocumentFormats[-1]
+                
+                # Determine output format and filename
+                if target_format:
+                    target_extension = target_format.get("extension", ".txt")
+                    target_mime_type = target_format.get("mimeType", "text/plain")
+                    
+                    # Check if format conversion is needed
+                    if target_extension not in [".txt", ".text"] or target_mime_type != "text/plain":
+                        logger.info(f"Converting document {i+1} to format: {target_extension} ({target_mime_type})")
+                        # Use AI to convert format
+                        formatted_content = await self._convertContentToFormat(text_content, target_format)
+                        final_content = formatted_content
+                        final_mime_type = target_mime_type
+                        final_extension = target_extension
+                    else:
+                        logger.info(f"Document {i+1}: No format conversion needed, using plain text")
+                        final_content = text_content
+                        final_mime_type = "text/plain"
+                        final_extension = ".txt"
+                else:
+                    logger.info(f"Document {i+1}: No expected format specified, using plain text")
+                    final_content = text_content
+                    final_mime_type = "text/plain"
+                    final_extension = ".txt"
+                
+                # Create output filename based on original filename and target format
                 original_filename = chatDocument.filename
                 base_name = original_filename.rsplit('.', 1)[0] if '.' in original_filename else original_filename
-                output_filename = f"{base_name}_extracted_{datetime.now(UTC).strftime('%Y%m%d_%H%M%S')}{output_extension}"
+                output_filename = f"{base_name}_extracted_{datetime.now(UTC).strftime('%Y%m%d_%H%M%S')}{final_extension}"
                 
                 # Create result data for this document
                 result_data = {
                     "documentCount": 1,
-                    "content": text_content,
+                    "content": final_content,
                     "originalFilename": original_filename,
                     "fileInfos": [file_infos[i]] if includeMetadata and i < len(file_infos) else None,
                     "timestamp": datetime.now(UTC).isoformat()
                 }
                 
-                logger.info(f"Created output document: {output_filename} with {len(text_content)} characters")
-                logger.info(f"Content preview: {text_content[:200]}...")
+                logger.info(f"Created output document: {output_filename} with {len(final_content)} characters")
                 
                 output_documents.append({
                     "documentName": output_filename,
                     "documentData": result_data,
-                    "mimeType": output_mime_type
+                    "mimeType": final_mime_type
                 })
             
             return self._createResult(
@@ -186,6 +178,327 @@ class MethodDocument(MethodBase):
                 error=str(e)
             )
 
+    @action
+    async def generate(self, parameters: Dict[str, Any]) -> ActionResult:
+        """
+        Generate documents in specific formats from document references.
+        This action automatically extracts content from documents and converts it to the specified format.
+        
+        Parameters:
+            documentList (list): List of document references to extract content from
+            expectedDocumentFormats (list): Expected document formats with extension, mimeType, description
+            originalDocuments (list, optional): List of original document names
+            includeMetadata (bool, optional): Whether to include metadata (default: True)
+        """
+        try:
+            document_list = parameters.get("documentList", [])
+            expected_document_formats = parameters.get("expectedDocumentFormats", [])
+            original_documents = parameters.get("originalDocuments", [])
+            include_metadata = parameters.get("includeMetadata", True)
+            
+            if not document_list:
+                return self._createResult(
+                    success=False,
+                    data={},
+                    error="Document list is required for generation"
+                )
+            
+            if not expected_document_formats or len(expected_document_formats) == 0:
+                return self._createResult(
+                    success=False,
+                    data={},
+                    error="Expected document formats specification is required"
+                )
+            
+            # Get chat documents for original documents list
+            chat_documents = self.service.getChatDocumentsFromDocumentList(document_list)
+            logger.info(f"Found {len(chat_documents)} chat documents")
+            
+            if not chat_documents:
+                return self._createResult(
+                    success=False,
+                    data={},
+                    error="No documents found for the provided documentList reference"
+                )
+            
+            # Update original documents list if not provided
+            if not original_documents:
+                original_documents = [doc.filename if hasattr(doc, 'filename') else str(doc.id) for doc in chat_documents]
+            
+            # Process each document individually with its own format conversion
+            output_documents = []
+            
+            for i, chat_document in enumerate(chat_documents):
+                # Extract content from this document
+                # ChatDocument is just a reference, so we need to get file data using fileId
+                content = ""
+                if hasattr(chat_document, 'fileId') and chat_document.fileId:
+                    # Need to get file data
+                    file_data = self.service.getFileData(chat_document.fileId)
+                    if file_data:
+                        if isinstance(file_data, bytes):
+                            content = file_data.decode('utf-8', errors='ignore')
+                        else:
+                            content = str(file_data)
+                    else:
+                        logger.warning(f"Could not get file data for document {i+1}, skipping")
+                        continue
+                else:
+                    logger.warning(f"Document {i+1} has no fileId, skipping")
+                    continue
+                
+                if not content:
+                    logger.warning(f"Could not extract content from document {i+1}, skipping")
+                    continue
+                
+                logger.info(f"Extracted content from document {i+1}: {len(content)} characters")
+                
+                # Get the expected format for this document (or use default)
+                target_format = None
+                if i < len(expected_document_formats):
+                    target_format = expected_document_formats[i]
+                elif len(expected_document_formats) > 0:
+                    # If fewer formats than documents, use the last format for remaining documents
+                    target_format = expected_document_formats[-1]
+                
+                if not target_format:
+                    logger.warning(f"No expected format for document {i+1}, skipping")
+                    continue
+                
+                # Use AI to convert format
+                formatted_content = await self._convertContentToFormat(content, target_format)
+                if not formatted_content:
+                    logger.warning(f"Failed to format document {i+1}, skipping")
+                    continue
+                
+                target_extension = target_format.get("extension", ".txt")
+                target_mime_type = target_format.get("mimeType", "text/plain")
+                
+                # Create output filename
+                timestamp = datetime.now(UTC).strftime('%Y%m%d_%H%M%S')
+                if i < len(original_documents):
+                    base_name = original_documents[i].rsplit('.', 1)[0] if '.' in original_documents[i] else original_documents[i]
+                else:
+                    base_name = f"document_{i+1}"
+                output_filename = f"{base_name}_generated_{timestamp}{target_extension}"
+                
+                # Create result data
+                result_data = {
+                    "documentCount": 1,
+                    "content": formatted_content,
+                    "outputFormat": target_format,
+                    "originalDocument": original_documents[i] if i < len(original_documents) else f"document_{i+1}",
+                    "timestamp": datetime.now(UTC).isoformat()
+                }
+                
+                logger.info(f"Generated document: {output_filename} with {len(formatted_content)} characters")
+                
+                output_documents.append({
+                    "documentName": output_filename,
+                    "documentData": result_data,
+                    "mimeType": target_mime_type
+                })
+            
+            if not output_documents:
+                return self._createResult(
+                    success=False,
+                    data={},
+                    error="No documents could be generated"
+                )
+            
+            return self._createResult(
+                success=True,
+                data={
+                    "documents": output_documents
+                }
+            )
+        except Exception as e:
+            logger.error(f"Error generating document: {str(e)}")
+            return self._createResult(
+                success=False,
+                data={},
+                error=str(e)
+            )
+
+    async def _convertContentToFormat(self, content: str, target_format: Dict[str, Any]) -> str:
+        """
+        Helper function to convert content to the specified format using AI.
+        """
+        try:
+            extension = target_format.get("extension", ".txt")
+            mime_type = target_format.get("mimeType", "text/plain")
+            
+            logger.info(f"Converting content to format: {extension} ({mime_type})")
+            
+            # Create AI prompt for format conversion
+            format_prompts = {
+                ".csv": f"""
+                Convert the following content into a proper CSV format.
+                
+                Requirements:
+                1. Output ONLY the CSV data without any markdown, code blocks, or additional text
+                2. Use appropriate headers based on the content
+                3. Ensure proper CSV formatting with commas and quotes where needed
+                4. Make the data easily readable and importable into spreadsheet applications
+                
+                Content to convert:
+                {content}
+                
+                Generate ONLY the CSV data:
+                """,
+                
+                ".json": f"""
+                Convert the following content into a proper JSON format.
+                
+                Requirements:
+                1. Output ONLY the JSON data without any markdown, code blocks, or additional text
+                2. Structure the data logically with appropriate keys and values
+                3. Ensure valid JSON syntax
+                4. Make the data easily parseable and readable
+                
+                Content to convert:
+                {content}
+                
+                Generate ONLY the JSON data:
+                """,
+                
+                ".xml": f"""
+                Convert the following content into a proper XML format.
+                
+                Requirements:
+                1. Output ONLY the XML data without any markdown, code blocks, or additional text
+                2. Use appropriate XML tags and structure
+                3. Ensure valid XML syntax
+                4. Make the data easily parseable and readable
+                
+                Content to convert:
+                {content}
+                
+                Generate ONLY the XML data:
+                """,
+                
+                ".html": f"""
+                Convert the following content into a proper HTML format.
+                
+                Requirements:
+                1. Output ONLY the HTML data without any markdown, code blocks, or additional text
+                2. Use appropriate HTML tags and structure
+                3. Ensure valid HTML syntax
+                4. Make the data easily readable in web browsers
+                
+                Content to convert:
+                {content}
+                
+                Generate ONLY the HTML data:
+                """,
+                
+                ".md": f"""
+                Convert the following content into a proper Markdown format.
+                
+                Requirements:
+                1. Output ONLY the Markdown data without any code blocks or additional text
+                2. Use appropriate Markdown syntax for headers, lists, emphasis, etc.
+                3. Structure the content logically
+                4. Make the data easily readable and convertible to other formats
+                
+                Content to convert:
+                {content}
+                
+                Generate ONLY the Markdown data:
+                """
+            }
+            
+            # Get the appropriate prompt for the target format
+            if extension in format_prompts:
+                ai_prompt = format_prompts[extension]
+            else:
+                # Generic format conversion
+                ai_prompt = f"""
+                Convert the following content into {extension.upper()} format.
+                
+                Requirements:
+                1. Output ONLY the {extension.upper()} data without any markdown, code blocks, or additional text
+                2. Use appropriate formatting for {extension.upper()} files
+                3. Ensure the output is valid and usable
+                4. Make the data easily readable and importable
+                
+                Content to convert:
+                {content}
+                
+                Generate ONLY the {extension.upper()} data:
+                """
+            
+            # Call AI to generate the formatted content
+            logger.info(f"Calling AI for {extension} format conversion")
+            formatted_content = await self.service.callAiTextBasic(ai_prompt, content)
+            
+            if not formatted_content or formatted_content.strip() == "":
+                logger.warning("AI format conversion failed, using fallback")
+                return self._generateFallbackFormattedContent(content, extension, mime_type)
+            
+            # Clean up the AI response
+            formatted_content = formatted_content.strip()
+            
+            # Remove markdown code blocks if present
+            if formatted_content.startswith("```") and formatted_content.endswith("```"):
+                lines = formatted_content.split('\n')
+                if len(lines) > 2:
+                    formatted_content = '\n'.join(lines[1:-1])
+            
+            return formatted_content
+            
+        except Exception as e:
+            logger.error(f"Error in AI format conversion: {str(e)}")
+            return self._generateFallbackFormattedContent(content, extension, mime_type)
+
+    def _generateFallbackFormattedContent(self, content: str, extension: str, mime_type: str) -> str:
+        """
+        Generate fallback formatted content when AI conversion fails.
+        """
+        try:
+            if extension == ".csv":
+                # Simple CSV fallback - split by lines and create basic CSV
+                lines = content.strip().split('\n')
+                if lines:
+                    # Create a simple CSV with line numbers and content
+                    csv_lines = ["Line,Content"]
+                    for i, line in enumerate(lines, 1):
+                        # Escape quotes and wrap in quotes if comma present
+                        if ',' in line:
+                            line = f'"{line.replace(chr(34), chr(34) + chr(34))}"'
+                        csv_lines.append(f"{i},{line}")
+                    return '\n'.join(csv_lines)
+                return "Line,Content\n1,No content available"
+                
+            elif extension == ".json":
+                # Simple JSON fallback
+                content_escaped = content.replace('"', '\\"')
+                timestamp = datetime.now(UTC).isoformat()
+                return f'{{"content": "{content_escaped}", "format": "json", "timestamp": "{timestamp}"}}'
+                
+            elif extension == ".xml":
+                # Simple XML fallback
+                timestamp = datetime.now(UTC).isoformat()
+                return f'<?xml version="1.0" encoding="UTF-8"?>\n<document>\n<content>{content}</content>\n<format>xml</format>\n<timestamp>{timestamp}</timestamp>\n</document>'
+                
+            elif extension == ".html":
+                # Simple HTML fallback
+                timestamp = datetime.now(UTC).strftime('%Y-%m-%d %H:%M:%S UTC')
+                return f'<!DOCTYPE html>\n<html>\n<head><meta charset="UTF-8"><title>Generated Document</title></head>\n<body>\n<pre>{content}</pre>\n<p><em>Generated on {timestamp}</em></p>\n</body>\n</html>'
+                
+            elif extension == ".md":
+                # Simple Markdown fallback
+                timestamp = datetime.now(UTC).strftime('%Y-%m-%d %H:%M:%S UTC')
+                return f"# Generated Document\n\n{content}\n\n---\n*Generated on {timestamp}*"
+                
+            else:
+                # Generic fallback - return content as-is
+                return content
+                
+        except Exception as e:
+            logger.error(f"Error in fallback format conversion: {str(e)}")
+            return content
+
     @action
     async def generateReport(self, parameters: Dict[str, Any]) -> ActionResult:
         """
@@ -209,6 +522,8 @@ class MethodDocument(MethodBase):
                 )
             
             chatDocuments = self.service.getChatDocumentsFromDocumentList(documentList)
+            logger.info(f"Retrieved {len(chatDocuments)} chat documents for report generation")
+            
             if not chatDocuments:
                 return self._createResult(
                     success=False,
@@ -261,15 +576,30 @@ class MethodDocument(MethodBase):
             
             for doc in chatDocuments:
                 content = ""
-                if hasattr(doc, 'content') and doc.content:
-                    content = doc.content.strip()
-                elif hasattr(doc, 'data') and doc.data:
-                    content = doc.data.strip()
+                logger.info(f"Processing document: type={type(doc)}")
+                
+                # Get actual file content using the fileId reference
+                try:
+                    file_data = self.service.getFileData(doc.fileId)
+                    if file_data:
+                        # Convert bytes to string
+                        if isinstance(file_data, bytes):
+                            content = file_data.decode('utf-8')
+                        else:
+                            content = str(file_data)
+                        logger.info(f"  Retrieved content from file: {len(content)} characters")
+                    else:
+                        logger.warning(f"  No file data found for fileId: {doc.fileId}")
+                except Exception as e:
+                    logger.error(f"  Error retrieving file data: {str(e)}")
                 
                 # Skip empty documents
                 if content:
                     validDocuments.append(doc)
                     allContent.append(f"Document: {doc.filename}\n{content}\n")
+                    logger.info(f"  Added document to valid documents list")
+                else:
+                    logger.warning(f"  Skipping document with no content")
             
             if not validDocuments:
                 # If no valid documents, create a simple report
@@ -354,10 +684,17 @@ class MethodDocument(MethodBase):
             
             # Add document content if available
             content = ""
-            if hasattr(doc, 'content') and doc.content:
-                content = doc.content
-            elif hasattr(doc, 'data') and doc.data:
-                content = doc.data
+            if hasattr(doc, 'fileId') and doc.fileId:
+                # ChatDocument is just a reference, so we need to get file data using fileId
+                try:
+                    file_data = self.service.getFileData(doc.fileId)
+                    if file_data:
+                        if isinstance(file_data, bytes):
+                            content = file_data.decode('utf-8')
+                        else:
+                            content = str(file_data)
+                except Exception as e:
+                    logger.warning(f"Could not retrieve content for document {doc.filename}: {str(e)}")
             
             if content:
                 html.append(f"<div style='white-space:pre-wrap; border:1px solid #ccc; padding:0.5em; margin-bottom:1em; background-color:#f9f9f9;'>{content}</div>")
diff --git a/modules/methods/methodOutlook.py b/modules/methods/methodOutlook.py
index 4fbd3cdf..6c9ed260 100644
--- a/modules/methods/methodOutlook.py
+++ b/modules/methods/methodOutlook.py
@@ -26,13 +26,13 @@ class MethodOutlook(MethodBase):
         """Get Microsoft connection from connection reference"""
         try:
             userConnection = self.service.getUserConnectionFromConnectionReference(connectionReference)
-            if not userConnection or userConnection.authority != "msft" or userConnection.status != "active":
+            if not userConnection or userConnection.authority.value != "msft" or userConnection.status.value != "active":
                 return None
             
             # Get the corresponding token for this user and authority
-            token = self.service.interfaceApp.getToken(userConnection.authority)
+            token = self.service.interfaceApp.getToken(userConnection.authority.value)
             if not token:
-                logger.warning(f"No token found for user {userConnection.userId} and authority {userConnection.authority}")
+                logger.warning(f"No token found for user {userConnection.userId} and authority {userConnection.authority.value}")
                 return None
             
             return {
@@ -80,24 +80,78 @@ class MethodOutlook(MethodBase):
                     error="No valid Microsoft connection found for the provided connection reference"
                 )
             
-            # Create email reading prompt
-            email_prompt = f"""
-            Simulate reading emails from Microsoft Outlook.
-            
-            Connection: {connection['id']}
-            Folder: {folder}
-            Limit: {limit}
-            Filter: {filter or 'None'}
-            
-            Please provide:
-            1. List of emails with subject, sender, date, and content
-            2. Summary of email statistics
-            3. Important or urgent emails highlighted
-            4. Email categorization if possible
-            """
-            
-            # Use AI to simulate email reading
-            email_data = await self.service.interfaceAiCalls.callAiTextAdvanced(email_prompt)
+            # Read emails using Microsoft Graph API
+            try:
+                import requests
+                
+                # Microsoft Graph API endpoint for messages
+                graph_url = "https://graph.microsoft.com/v1.0"
+                headers = {
+                    "Authorization": f"Bearer {connection['accessToken']}",
+                    "Content-Type": "application/json"
+                }
+                
+                # Build the API request
+                api_url = f"{graph_url}/me/mailFolders/{folder}/messages"
+                params = {
+                    "$top": limit,
+                    "$orderby": "receivedDateTime desc"
+                }
+                
+                if filter:
+                    params["$filter"] = filter
+                
+                # Make the API call (timeout so a stalled connection cannot hang the action)
+                response = requests.get(api_url, headers=headers, params=params, timeout=30)
+                response.raise_for_status()
+                
+                emails_data = response.json()
+                email_data = {
+                    "emails": emails_data.get("value", []),
+                    "count": len(emails_data.get("value", [])),
+                    "folder": folder,
+                    "filter": filter,
+                    "apiResponse": emails_data
+                }
+                
+                logger.info(f"Successfully retrieved {len(emails_data.get('value', []))} emails from {folder}")
+                
+            except ImportError:
+                logger.error("requests module not available, falling back to simulation")
+                # Fallback to simulation if requests module is not available
+                email_prompt = f"""
+                Simulate reading emails from Microsoft Outlook.
+                
+                Connection: {connection['id']}
+                Folder: {folder}
+                Limit: {limit}
+                Filter: {filter or 'None'}
+                
+                Please provide:
+                1. List of emails with subject, sender, date, and content
+                2. Summary of email statistics
+                3. Important or urgent emails highlighted
+                4. Email categorization if possible
+                """
+                email_data = await self.service.interfaceAiCalls.callAiTextAdvanced(email_prompt)
+            except Exception as e:
+                logger.error(f"Error reading emails from Microsoft Graph API: {str(e)}")
+                # Fallback to simulation on API error
+                email_prompt = f"""
+                Simulate reading emails from Microsoft Outlook.
+                
+                Connection: {connection['id']}
+                Folder: {folder}
+                Limit: {limit}
+                Filter: {filter or 'None'}
+                
+                Please provide:
+                1. List of emails with subject, sender, date, and content
+                2. Summary of email statistics
+                3. Important or urgent emails highlighted
+                4. Email categorization if possible
+                """
+                email_data = await self.service.interfaceAiCalls.callAiTextAdvanced(email_prompt)
             
             # Create result data
             result_data = {
@@ -151,7 +205,7 @@ class MethodOutlook(MethodBase):
     @action
     async def sendEmail(self, parameters: Dict[str, Any]) -> ActionResult:
         """
-        Send email via Outlook
+        Create email draft in Outlook for sending out
         
         Parameters:
             connectionReference (str): Reference to the Microsoft connection
@@ -160,6 +214,7 @@ class MethodOutlook(MethodBase):
             body (str): Email body content
             cc (List[str], optional): CC recipients
             bcc (List[str], optional): BCC recipients
+            attachments (List[str], optional): List of document references to attach
             expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
         """
         try:
@@ -169,6 +224,7 @@ class MethodOutlook(MethodBase):
             body = parameters.get("body")
             cc = parameters.get("cc", [])
             bcc = parameters.get("bcc", [])
+            attachments = parameters.get("attachments", [])
             expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
             
             if not connectionReference or not to or not subject or not body:
@@ -187,26 +243,111 @@ class MethodOutlook(MethodBase):
                     error="No valid Microsoft connection found for the provided connection reference"
                 )
             
-            # Create email sending prompt
-            send_prompt = f"""
-            Simulate sending an email via Microsoft Outlook.
-            
-            Connection: {connection['id']}
-            To: {to}
-            Subject: {subject}
-            Body: {body}
-            CC: {cc}
-            BCC: {bcc}
-            
-            Please provide:
-            1. Email composition details
-            2. Validation of email addresses
-            3. Email formatting and structure
-            4. Delivery confirmation simulation
-            """
-            
-            # Use AI to simulate email sending
-            send_result = await self.service.interfaceAiCalls.callAiTextAdvanced(send_prompt)
+            # Create email draft using Microsoft Graph API
+            try:
+                import requests
+                
+                # Microsoft Graph API endpoint for creating draft messages
+                graph_url = "https://graph.microsoft.com/v1.0"
+                headers = {
+                    "Authorization": f"Bearer {connection['accessToken']}",
+                    "Content-Type": "application/json"
+                }
+                
+                # Build the email message
+                message = {
+                    "subject": subject,
+                    "body": {
+                        "contentType": "HTML",
+                        "content": body
+                    },
+                    "toRecipients": [{"emailAddress": {"address": email}} for email in to],
+                    "ccRecipients": [{"emailAddress": {"address": email}} for email in cc] if cc else [],
+                    "bccRecipients": [{"emailAddress": {"address": email}} for email in bcc] if bcc else []
+                }
+                
+                # Add attachments if provided (a ChatDocument is only a reference; bytes come from fileId)
+                if attachments:
+                    import base64
+                    message["attachments"] = []
+                    for attachment_ref in attachments:
+                        for doc in self.service.getChatDocumentsFromDocumentList([attachment_ref]) or []:
+                            file_data = self.service.getFileData(doc.fileId)
+                            if not file_data:
+                                logger.warning(f"Skipping attachment without file data: {doc.filename}")
+                                continue
+                            raw = file_data if isinstance(file_data, bytes) else str(file_data).encode('utf-8')
+                            message["attachments"].append({
+                                "@odata.type": "#microsoft.graph.fileAttachment",
+                                "name": doc.filename,
+                                "contentType": doc.mimeType,
+                                "contentBytes": base64.b64encode(raw).decode('ascii')  # Graph expects base64 text
+                            })
+                # Create the draft message; the timeout keeps a stalled call from hanging the action
+                api_url = f"{graph_url}/me/messages"
+                response = requests.post(api_url, headers=headers, json=message, timeout=30)
+                response.raise_for_status()
+                
+                draft_data = response.json()
+                draft_result = {
+                    "status": "draft_created",
+                    "messageId": draft_data.get("id", "unknown"),
+                    "draftId": draft_data.get("id", "unknown"),
+                    "recipients": to,
+                    "cc": cc,
+                    "bcc": bcc,
+                    "attachments": len(attachments) if attachments else 0,
+                    "draftLocation": "Drafts folder",
+                    "apiResponse": response.status_code,
+                    "draftData": draft_data
+                }
+                
+                logger.info(f"Successfully created email draft for {len(to)} recipients with {len(attachments) if attachments else 0} attachments")
+                
+            except ImportError:
+                logger.error("requests module not available, falling back to simulation")
+                # Fallback to simulation if requests module is not available
+                send_prompt = f"""
+                Simulate creating an email draft in Microsoft Outlook.
+                
+                Connection: {connection['id']}
+                To: {to}
+                Subject: {subject}
+                Body: {body}
+                CC: {cc}
+                BCC: {bcc}
+                Attachments: {attachments if attachments else 'None'}
+                
+                Please provide:
+                1. Email composition details
+                2. Validation of email addresses
+                3. Email formatting and structure
+                4. Attachment processing and validation
+                5. Draft creation confirmation
+                """
+                draft_result = await self.service.interfaceAiCalls.callAiTextAdvanced(send_prompt)
+            except Exception as e:
+                logger.error(f"Error creating email draft via Microsoft Graph API: {str(e)}")
+                # Fallback to simulation on API error
+                send_prompt = f"""
+                Simulate creating an email draft in Microsoft Outlook.
+                
+                Connection: {connection['id']}
+                To: {to}
+                Subject: {subject}
+                Body: {body}
+                CC: {cc}
+                BCC: {bcc}
+                Attachments: {attachments if attachments else 'None'}
+                
+                Please provide:
+                1. Email composition details
+                2. Validation of email addresses
+                3. Email formatting and structure
+                4. Attachment processing and validation
+                5. Draft creation confirmation
+                """
+                draft_result = await self.service.interfaceAiCalls.callAiTextAdvanced(send_prompt)
             
             # Create result data
             result_data = {
@@ -216,7 +357,8 @@ class MethodOutlook(MethodBase):
                 "body": body,
                 "cc": cc,
                 "bcc": bcc,
-                "sendResult": send_result,
+                "attachments": attachments,
+                "draftResult": draft_result,
                 "connection": {
                     "id": connection["id"],
                     "authority": "microsoft",
@@ -243,7 +385,7 @@ class MethodOutlook(MethodBase):
                 data={
                     "documents": [
                         {
-                            "documentName": f"outlook_email_sent_{datetime.now(UTC).strftime('%Y%m%d_%H%M%S')}{output_extension}",
+                            "documentName": f"outlook_email_draft_{datetime.now(UTC).strftime('%Y%m%d_%H%M%S')}{output_extension}",
                             "documentData": result_data,
                             "mimeType": output_mime_type
                         }
@@ -252,7 +394,7 @@ class MethodOutlook(MethodBase):
             )
             
         except Exception as e:
-            logger.error(f"Error sending email: {str(e)}")
+            logger.error(f"Error creating email draft: {str(e)}")
             return self._createResult(
                 success=False,
                 data={},
@@ -294,24 +436,81 @@ class MethodOutlook(MethodBase):
                     error="No valid Microsoft connection found for the provided connection reference"
                 )
             
-            # Create email search prompt
-            search_prompt = f"""
-            Simulate searching emails in Microsoft Outlook.
-            
-            Connection: {connection['id']}
-            Query: {query}
-            Folder: {folder}
-            Limit: {limit}
-            
-            Please provide:
-            1. Search results with relevant emails
-            2. Search statistics and relevance scores
-            3. Email previews and key information
-            4. Search suggestions and refinements
-            """
-            
-            # Use AI to simulate email search
-            search_result = await self.service.interfaceAiCalls.callAiTextAdvanced(search_prompt)
+            # Search emails using Microsoft Graph API
+            try:
+                import requests
+                
+                # Microsoft Graph API endpoint for searching messages
+                graph_url = "https://graph.microsoft.com/v1.0"
+                headers = {
+                    "Authorization": f"Bearer {connection['accessToken']}",
+                    "Content-Type": "application/json"
+                }
+                
+                # Build the search API request. Graph does not accept $search together
+                # with $orderby or $filter on messages, so neither is sent.
+                api_url = f"{graph_url}/me/messages"
+                params = {
+                    "$top": limit,
+                    "$search": f'"{query}"'
+                }
+
+                # Scope the search to a folder through the URL path instead of a $filter
+                if folder and folder.lower() != "all":
+                    api_url = f"{graph_url}/me/mailFolders/{folder}/messages"
+
+                # Make the API call (timeout so a stalled connection cannot hang the action)
+                response = requests.get(api_url, headers=headers, params=params, timeout=30)
+                response.raise_for_status()
+                
+                search_data = response.json()
+                search_result = {
+                    "query": query,
+                    "results": search_data.get("value", []),
+                    "count": len(search_data.get("value", [])),
+                    "folder": folder,
+                    "limit": limit,
+                    "apiResponse": search_data
+                }
+                
+                logger.info(f"Successfully searched emails with query '{query}', found {len(search_data.get('value', []))} results")
+                
+            except ImportError:
+                logger.error("requests module not available, falling back to simulation")
+                # Fallback to simulation if requests module is not available
+                search_prompt = f"""
+                Simulate searching emails in Microsoft Outlook.
+                
+                Connection: {connection['id']}
+                Query: {query}
+                Folder: {folder}
+                Limit: {limit}
+                
+                Please provide:
+                1. Search results with relevant emails
+                2. Search statistics and relevance scores
+                3. Email previews and key information
+                4. Search suggestions and refinements
+                """
+                search_result = await self.service.interfaceAiCalls.callAiTextAdvanced(search_prompt)
+            except Exception as e:
+                logger.error(f"Error searching emails via Microsoft Graph API: {str(e)}")
+                # Fallback to simulation on API error
+                search_prompt = f"""
+                Simulate searching emails in Microsoft Outlook.
+                
+                Connection: {connection['id']}
+                Query: {query}
+                Folder: {folder}
+                Limit: {limit}
+                
+                Please provide:
+                1. Search results with relevant emails
+                2. Search statistics and relevance scores
+                3. Email previews and key information
+                4. Search suggestions and refinements
+                """
+                search_result = await self.service.interfaceAiCalls.callAiTextAdvanced(search_prompt)
             
             # Create result data
             result_data = {
diff --git a/modules/methods/methodSharepoint.py b/modules/methods/methodSharepoint.py
index 8b156237..884974c3 100644
--- a/modules/methods/methodSharepoint.py
+++ b/modules/methods/methodSharepoint.py
@@ -32,9 +32,9 @@ class MethodSharepoint(MethodBase):
                 return None
             
             # Get the corresponding token for this user and authority
-            token = self.service.interfaceApp.getToken(userConnection.authority)
+            token = self.service.interfaceApp.getToken(userConnection.authority.value)
             if not token:
-                logger.warning(f"No token found for user {userConnection.userId} and authority {userConnection.authority}")
+                logger.warning(f"No token found for user {userConnection.userId} and authority {userConnection.authority.value}")
                 return None
             
             return {
diff --git a/modules/workflow/managerWorkflow.py b/modules/workflow/managerWorkflow.py
index c6b1b6ad..0f7cd683 100644
--- a/modules/workflow/managerWorkflow.py
+++ b/modules/workflow/managerWorkflow.py
@@ -8,7 +8,8 @@ from modules.interfaces.interfaceAppObjects import User
 
 from modules.interfaces.interfaceChatModel import (UserInputRequest, ChatMessage, ChatWorkflow, TaskItem, TaskStatus)
 from modules.interfaces.interfaceChatObjects import ChatObjects
-from modules.chat.managerChat import ChatManager, WorkflowStoppedException
+from modules.chat.managerChat import ChatManager
+from modules.chat.handling.handlingTasks import WorkflowStoppedException
 from modules.interfaces.interfaceChatModel import WorkflowResult
 
 logger = logging.getLogger(__name__)
@@ -52,6 +53,21 @@ class WorkflowManager:
                 "lastActivity": workflow.lastActivity
             })
             
+            # Create final stopped message
+            stopped_message = {
+                "workflowId": workflow.id,
+                "role": "assistant",
+                "message": "🛑 Workflow stopped by user",
+                "status": "last",
+                "sequenceNr": len(workflow.messages) + 1,
+                "publishedAt": datetime.now(UTC).isoformat(),
+                "documentsLabel": "workflow_stopped",
+                "documents": []
+            }
+            message = self.chatInterface.createWorkflowMessage(stopped_message)
+            if message:
+                workflow.messages.append(message)
+            
             # Add log entry
             self.chatInterface.createWorkflowLog({
                 "workflowId": workflow.id,
@@ -99,6 +115,8 @@ class WorkflowManager:
     async def _sendFirstMessage(self, userInput: UserInputRequest, workflow: ChatWorkflow) -> ChatMessage:
         """Send first message to start workflow"""
         try:
+            self.chatManager.handlingTasks._checkWorkflowStopped()
+            
             # Create initial message using interface
             messageData = {
                 "workflowId": workflow.id,
@@ -130,6 +148,8 @@ class WorkflowManager:
     async def _generateWorkflowFeedback(self, workflow: ChatWorkflow) -> str:
         """Generate feedback message for workflow completion"""
         try:
+            self.chatManager.handlingTasks._checkWorkflowStopped()
+            
             # Count messages by role
             user_messages = [msg for msg in workflow.messages if msg.role == 'user']
             assistant_messages = [msg for msg in workflow.messages if msg.role == 'assistant']
@@ -155,9 +175,13 @@ class WorkflowManager:
     async def _sendLastMessage(self, workflow: ChatWorkflow) -> None:
         """Send last message to complete workflow"""
         try:
+            self.chatManager.handlingTasks._checkWorkflowStopped()
+            
             # Generate feedback
             feedback = await self._generateWorkflowFeedback(workflow)
             
+            self.chatManager.handlingTasks._checkWorkflowStopped()
+            
             # Create last message using interface
             messageData = {
                 "workflowId": workflow.id,
@@ -199,7 +223,60 @@ class WorkflowManager:
     async def _processWorkflowResults(self, workflow: ChatWorkflow, workflow_result: WorkflowResult, initial_message: ChatMessage) -> None:
         """Process workflow results and create appropriate messages"""
         try:
-            if workflow_result.status == 'failed':
+            try:
+                self.chatManager.handlingTasks._checkWorkflowStopped()
+            except WorkflowStoppedException:
+                logger.info(f"Workflow {workflow.id} was stopped during result processing")
+                
+                # Create final stopped message
+                stopped_message = {
+                    "workflowId": workflow.id,
+                    "role": "assistant",
+                    "message": "🛑 Workflow stopped by user",
+                    "status": "last",
+                    "sequenceNr": len(workflow.messages) + 1,
+                    "publishedAt": datetime.now(UTC).isoformat(),
+                    "documentsLabel": "workflow_stopped",
+                    "documents": []
+                }
+                message = self.chatInterface.createWorkflowMessage(stopped_message)
+                if message:
+                    workflow.messages.append(message)
+                
+                # Update workflow status to stopped
+                workflow.status = "stopped"
+                workflow.lastActivity = datetime.now(UTC).isoformat()
+                self.chatInterface.updateWorkflow(workflow.id, {
+                    "status": "stopped",
+                    "lastActivity": workflow.lastActivity
+                })
+                return
+            
+            if workflow_result.status == 'stopped':
+                # Create stopped message
+                stopped_message = {
+                    "workflowId": workflow.id,
+                    "role": "assistant",
+                    "message": "🛑 Workflow stopped by user",
+                    "status": "last",
+                    "sequenceNr": len(workflow.messages) + 1,
+                    "publishedAt": datetime.now(UTC).isoformat(),
+                    "documentsLabel": "workflow_stopped",
+                    "documents": []
+                }
+                message = self.chatInterface.createWorkflowMessage(stopped_message)
+                if message:
+                    workflow.messages.append(message)
+                
+                # Update workflow status to stopped
+                workflow.status = "stopped"
+                workflow.lastActivity = datetime.now(UTC).isoformat()
+                self.chatInterface.updateWorkflow(workflow.id, {
+                    "status": "stopped",
+                    "lastActivity": workflow.lastActivity
+                })
+                return
+            elif workflow_result.status == 'failed':
                 # Create error message
                 error_message = {
                     "workflowId": workflow.id,
diff --git a/requirements.txt b/requirements.txt
index 28085d1d..7802da0b 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -25,6 +25,7 @@ PyMuPDF>=1.23.7     # Statt dem ungenauen 'fitz'
 PyPDF2==3.0.1
 python-docx>=0.8.11 # Für Word-Dokumente
 openpyxl>=3.1.2     # Für Excel-Dateien
+python-pptx>=0.6.21 # Für PowerPoint-Dateien
 
 ## Data Processing & Analysis
 numpy==1.26.3       # Version die mit pandas und matplotlib kompatibel ist
@@ -52,3 +53,14 @@ sortedcontainers>=2.4.0     # Required by trio
 
 ## MSFT Integration
 msal==1.24.1
+
+# Enhanced Office document processing
+# NOTE: python-docx, openpyxl, python-pptx, PyPDF2 and PyMuPDF are already
+# listed earlier in this file. They are intentionally not repeated here: a
+# second, looser specifier (e.g. openpyxl>=3.0.9 next to openpyxl>=3.1.2, or
+# PyPDF2>=3.0.0 next to PyPDF2==3.0.1) only obscures which constraint is
+# authoritative.
+xlrd>=2.0.1  # For legacy .xls files
+Pillow>=9.0.0  # For image processing
+beautifulsoup4>=4.11.0
+chardet>=4.0.0  # For encoding detection
diff --git a/test_documentExtraction.py b/test_documentExtraction.py
new file mode 100644
index 00000000..2e34e1a3
--- /dev/null
+++ b/test_documentExtraction.py
@@ -0,0 +1,855 @@
+#!/usr/bin/env python3
+"""
+Test script for DocumentExtraction class.
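+Processes all supported files in an input folder (default: d:/temp/test-extraction) and stores the extracted content in <input>/extracted (AI mode) or <input>/extracted-raw (content-only mode).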
+
+Features:
+- Option to extract content WITH AI processing (default)
+- Option to extract content WITHOUT AI processing (content-only mode)
+- Supports all document types: text, images, PDFs, Office documents, etc.
+- Detailed logging and progress tracking
+- Separate output directories for AI vs content-only modes
+
+Usage:
+- Interactive mode: python test_documentExtraction.py
+- Content-only mode: python test_documentExtraction.py --no-ai
+- Content-only mode: python test_documentExtraction.py --content-only
+- Specify custom input/output: python test_documentExtraction.py --input-dir /path/to/input --output-dir /path/to/output --no-ai
+"""
+
+import os
+import asyncio
+import logging
+import sys
+import argparse
+from pathlib import Path
+from typing import List, Optional
+from datetime import datetime, UTC
+
+# Configure logging
+logging.basicConfig(
+    level=logging.DEBUG,  # Changed from INFO to DEBUG
+    format='%(asctime)s - %(levelname)s - %(message)s'
+)
+logger = logging.getLogger(__name__)
+
+# Filter out specific unwanted log messages
+class LogFilter(logging.Filter):
+    """Drop known-noisy log records (workflow stats misses and OpenAI HTTP chatter)."""
+
+    def filter(self, record):
+        """Return False for records that should be hidden, True for everything else."""
+        text = record.getMessage()
+
+        # Workflow stats update errors
+        stats_noise = "Workflow" in text and "not found for stats update" in text
+        # HTTP request info messages for calls to the OpenAI API
+        request_noise = "HTTP Request:" in text and "POST https://api.openai.com" in text
+        # HTTP response info messages
+        response_noise = "HTTP/1.1 200 OK" in text
+
+        if stats_noise or request_noise or response_noise:
+            return False
+        return True
+
+root_logger = logging.getLogger()
+for _root_handler in root_logger.handlers:  # handler-level filters also see records propagated from child loggers; a logger-level filter does not
+    _root_handler.addFilter(LogFilter())
+
+def check_dependencies():
+    """Check if required dependencies are available and provide installation instructions."""
+    missing_deps = []
+    
+    # Check for required dependencies
+    try:
+        import bs4
+        logger.info("✓ beautifulsoup4 is available")
+    except ImportError:
+        missing_deps.append("beautifulsoup4")
+        logger.error("✗ beautifulsoup4 is missing")
+    
+    try:
+        import PyPDF2
+        logger.info("✓ PyPDF2 is available")
+    except ImportError:
+        missing_deps.append("PyPDF2")
+        logger.error("✗ PyPDF2 is missing")
+    
+    try:
+        import fitz
+        logger.info("✓ PyMuPDF (fitz) is available")
+    except ImportError:
+        missing_deps.append("PyMuPDF")
+        logger.error("✗ PyMuPDF (fitz) is missing")
+    
+    try:
+        import docx
+        logger.info("✓ python-docx is available")
+    except ImportError:
+        missing_deps.append("python-docx")
+        logger.error("✗ python-docx is missing")
+    
+    try:
+        import openpyxl
+        logger.info("✓ openpyxl is available")
+    except ImportError:
+        missing_deps.append("openpyxl")
+        logger.error("✗ openpyxl is missing")
+    
+    try:
+        import pptx
+        logger.info("✓ python-pptx is available")
+    except ImportError:
+        missing_deps.append("python-pptx")
+        logger.error("✗ python-pptx is missing")
+    
+    try:
+        from PIL import Image
+        logger.info("✓ Pillow (PIL) is available")
+    except ImportError:
+        missing_deps.append("Pillow")
+        logger.error("✗ Pillow (PIL) is missing")
+    
+    if missing_deps:
+        logger.error("\n" + "="*60)
+        logger.error("MISSING DEPENDENCIES DETECTED!")
+        logger.error("="*60)
+        logger.error("The following packages are required but not installed:")
+        for dep in missing_deps:
+            logger.error(f"  - {dep}")
+        logger.error("\nTo install all dependencies, run:")
+        logger.error("pip install -r requirements.txt")
+        logger.error("\nOr install individual packages:")
+        for dep in missing_deps:
+            if dep == "beautifulsoup4":
+                logger.error(f"  pip install {dep}")
+            elif dep == "PyMuPDF":
+                logger.error(f"  pip install {dep}")
+            elif dep == "Pillow":
+                logger.error(f"  pip install {dep}")
+            else:
+                logger.error(f"  pip install {dep}")
+        logger.error("="*60)
+        return False
+    
+    logger.info("✓ All required dependencies are available!")
+    return True
+
+def check_module_imports():
+    """Return True if the project modules used by this script can be imported, False otherwise."""
+    try:
+        # Make the project modules importable without growing sys.path on repeated calls
+        gateway_root = os.path.join(os.path.dirname(__file__), '..', '..', '..')
+        if gateway_root not in sys.path:
+            sys.path.append(gateway_root)
+        from modules.chat.documents.documentExtraction import DocumentExtraction
+        from modules.chat.serviceCenter import ServiceCenter
+        from modules.interfaces.interfaceAppModel import User, UserConnection
+        from modules.interfaces.interfaceChatModel import ChatWorkflow, TaskItem
+        logger.info("✓ All required modules imported successfully")
+        return True
+    except ImportError as e:
+        logger.error(f"✗ Failed to import required modules: {e}")
+        logger.error("Make sure you're running this script from the gateway directory")
+        return False
+    except Exception as e:
+        logger.error(f"✗ Unexpected error importing modules: {e}")
+        return False
+
+def create_mock_service_center():
+    """Create a proper ServiceCenter for testing purposes with all required fields."""
+    try:
+        from modules.chat.serviceCenter import ServiceCenter
+        from modules.interfaces.interfaceAppModel import User, UserPrivilege, AuthAuthority
+        from modules.interfaces.interfaceChatModel import ChatWorkflow, TaskItem, TaskStatus
+        from modules.interfaces.interfaceChatModel import ChatLog, ChatMessage, ChatStat
+        
+        # Create proper user with all required fields
+        mock_user = User(
+            id="test_user_001",
+            username="testuser",
+            email="test@example.com",
+            fullName="Test User",
+            language="en",
+            enabled=True,
+            privilege=UserPrivilege.USER,
+            authenticationAuthority=AuthAuthority.LOCAL,
+            mandateId="test_mandate_001"
+        )
+        
+        # Create proper workflow with all required fields
+        current_time = datetime.now(UTC).isoformat()
+        mock_workflow = ChatWorkflow(
+            id="test_workflow_001",
+            mandateId="test_mandate_001",
+            status="active",
+            name="Test Document Extraction Workflow",
+            currentRound=1,
+            lastActivity=current_time,
+            startedAt=current_time,
+            logs=[],
+            messages=[],
+            stats=None,
+            tasks=[]
+        )
+        
+        # Create service center
+        service_center = ServiceCenter(mock_user, mock_workflow)
+        logger.info("✓ ServiceCenter created successfully with proper objects")
+        return service_center
+        
+    except Exception as e:
+        logger.error(f"✗ Failed to create ServiceCenter: {e}")
+        return None
+
+class DocumentExtractionTester:
+    """Test class for DocumentExtraction functionality."""
+    
+    def __init__(self, input_dir: str = "d:/temp/test-extraction", output_dir: str = None, enable_ai: bool = True):
+        """
+        Initialize the tester.
+        
+        Args:
+            input_dir: Directory containing files to process
+            output_dir: Directory to store extracted content (auto-generated if None)
+            enable_ai: Whether to enable AI processing (default: True)
+        """
+        self.input_dir = Path(input_dir)
+        
+        # Auto-generate output directory if not specified
+        if output_dir is None:
+            if enable_ai:
+                self.output_dir = Path(input_dir) / "extracted"
+            else:
+                self.output_dir = Path(input_dir) / "extracted-raw"
+        else:
+            self.output_dir = Path(output_dir)
+            
+        self.extractor = None
+        self.service_center = None
+        self.enable_ai = enable_ai
+        
+        if enable_ai:
+            self.prompt = "Make a summary of each sentence for each page or chapter of the document"
+        else:
+            self.prompt = None  # No prompt needed for content-only extraction
+        
+        # Track processing results for summary
+        self.processing_results = []
+        
+        # Ensure output directory exists
+        logger.info(f"Creating output directory: {self.output_dir}")
+        self.output_dir.mkdir(parents=True, exist_ok=True)
+        
+        # Verify directory was created
+        if self.output_dir.exists():
+            logger.info(f"✓ Output directory created/verified: {self.output_dir}")
+            logger.info(f"Output directory absolute path: {self.output_dir.absolute()}")
+        else:
+            logger.error(f"✗ Failed to create output directory: {self.output_dir}")
+        
+        # Log configuration
+        logger.info(f"Configuration: AI processing = {'ENABLED' if self.enable_ai else 'DISABLED'}")
+        logger.info(f"Input directory: {self.input_dir}")
+        logger.info(f"Output directory: {self.output_dir}")
+        
+        # Test basic file writing capability
+        test_file = self.output_dir / "test_write_capability.txt"
+        try:
+            logger.info(f"Testing file write capability to: {test_file}")
+            logger.info(f"Absolute path: {test_file.absolute()}")
+            
+            with open(test_file, 'w', encoding='utf-8') as f:
+                f.write("Test file to verify write capability")
+            
+            if test_file.exists():
+                actual_size = test_file.stat().st_size
+                logger.info(f"✓ Basic file writing test passed: {test_file} (size: {actual_size} bytes)")
+                
+                # Test reading the file back
+                with open(test_file, 'r', encoding='utf-8') as f:
+                    content = f.read()
+                logger.info(f"✓ File read test passed: content length = {len(content)}")
+                
+                # Clean up test file
+                test_file.unlink()
+                logger.info("✓ Test file cleaned up")
+            else:
+                logger.error(f"✗ Basic file writing test failed: {test_file}")
+        except Exception as e:
+            logger.error(f"✗ Basic file writing test failed with error: {e}")
+            import traceback
+            traceback.print_exc()
+        
+        # Supported file extensions for content extraction
+        self.supported_extensions = {
+            # Text and data files
+            '.txt', '.csv', '.json', '.xml', '.html', '.htm', '.svg',
+            '.md', '.markdown', '.rst', '.log', '.ini', '.cfg', '.conf',
+            
+            # Programming languages
+            '.js', '.ts', '.jsx', '.tsx', '.py', '.java', '.c', '.cpp', '.cc', '.cxx',
+            '.h', '.hpp', '.cs', '.php', '.rb', '.go', '.rs', '.swift', '.kt', '.scala',
+            '.r', '.m', '.pl', '.sh', '.bash', '.zsh', '.fish', '.ps1', '.bat', '.cmd',
+            '.vbs', '.lua', '.sql', '.r', '.dart', '.elm', '.clj', '.hs', '.fs', '.ml',
+            
+            # Web technologies
+            '.css', '.scss', '.sass', '.less', '.vue', '.svelte', '.astro',
+            
+            # Configuration and build files
+            '.yaml', '.yml', '.toml', '.env', '.gitignore', '.dockerfile', '.dockerignore',
+            '.makefile', '.cmake', '.gradle', '.maven', '.pom', '.sln', '.vcxproj',
+            '.csproj', '.fsproj', '.vbproj', '.xcodeproj', '.pbxproj',
+            
+            # Documentation and markup
+            '.tex', '.bib', '.adoc', '.asciidoc', '.wiki', '.creole',
+            
+            # Images
+            '.jpg', '.jpeg', '.png', '.gif', '.webp', '.bmp', '.tiff', '.ico',
+            
+            # Documents
+            '.pdf', '.docx', '.xlsx', '.pptx', '.odt', '.ods', '.odp',
+            
+            # Legacy Office formats
+            '.doc', '.xls', '.ppt',
+            
+            # Archives and binaries
+            '.zip', '.tar', '.gz', '.7z', '.rar', '.exe', '.dll', '.so', '.dylib'
+        }
+    
+    def initialize_extractor(self):
+        """Initialize the DocumentExtraction instance with a proper ServiceCenter."""
+        try:
+            # First create the service center
+            self.service_center = create_mock_service_center()
+            if not self.service_center:
+                logger.error("Failed to create ServiceCenter!")
+                return False
+            
+            # Now create DocumentExtraction with the service center
+            from modules.chat.documents.documentExtraction import DocumentExtraction
+            self.extractor = DocumentExtraction(self.service_center)
+            logger.info("✓ DocumentExtraction initialized successfully with ServiceCenter")
+            return True
+        except Exception as e:
+            logger.error(f"✗ Failed to initialize DocumentExtraction: {e}")
+            return False
+    
+    def get_files_to_process(self) -> List[Path]:
+        """Return the supported files in the input directory, creating the directory with a sample file if it is missing."""
+        if not self.input_dir.exists():
+            logger.error(f"Input directory {self.input_dir} does not exist!")
+            logger.info("Creating input directory and adding a test file...")
+            self.input_dir.mkdir(parents=True, exist_ok=True)
+            
+            # Write the sample as UTF-8 explicitly: it contains non-ASCII characters and the platform default encoding may differ
+            test_file = self.input_dir / "test.txt"
+            with open(test_file, 'w', encoding='utf-8') as f:
+                f.write("This is a test file for document extraction.\nIt contains multiple lines.\nAnd some special characters: äöüß")
+            logger.info(f"Created test file: {test_file}")
+        
+        files = []
+        all_files = sorted(self.input_dir.iterdir())  # iterdir() order is arbitrary; sort for reproducible runs
+        logger.info(f"All files in directory: {[f.name for f in all_files]}")
+        
+        for file_path in all_files:
+            if file_path.is_file():
+                logger.debug(f"Checking file: {file_path.name} (extension: {file_path.suffix})")
+                if file_path.suffix.lower() in self.supported_extensions:
+                    files.append(file_path)
+                    logger.debug(f"Added file: {file_path.name}")
+                else:
+                    logger.debug(f"Skipped file: {file_path.name} (unsupported extension)")
+        
+        logger.info(f"Found {len(files)} supported files to process")
+        if files:
+            logger.info(f"Files to process: {[f.name for f in files]}")
+        return files
+    
+    async def process_single_file(self, file_path: Path) -> bool:
+        """
+        Process a single file, write each extracted content item to the output directory and record the result.
+        
+        Args:
+            file_path: Path to the file to process
+            
+        Returns:
+            True if the recorded status is 'OK', False on any error or when no content was extracted
+        """
+        if not self.extractor:
+            logger.error("DocumentExtraction not initialized!")
+            return False
+            
+        try:
+            logger.info(f"Processing file: {file_path.name}")
+            
+            # Read file data
+            with open(file_path, 'rb') as f:
+                file_data = f.read()
+            
+            logger.debug(f"File size: {len(file_data)} bytes")
+            
+            # Determine MIME type based on extension
+            mime_type = self._get_mime_type(file_path.suffix)
+            logger.debug(f"MIME type: {mime_type}")
+            
+            # Process the file with or without AI based on configuration
+            extracted_content = await self.extractor.processFileData(
+                fileData=file_data,
+                filename=file_path.name,
+                mimeType=mime_type,
+                base64Encoded=False,
+                prompt=self.prompt,
+                enableAI=self.enable_ai
+            )
+            
+            logger.debug(f"Extracted {len(extracted_content.contents)} content items")
+            
+            # Debug: Show content details
+            for i, content_item in enumerate(extracted_content.contents):
+                logger.debug(f"Content item {i+1}: label='{content_item.label}', has_data={content_item.data is not None}, data_length={len(content_item.data) if content_item.data else 0}")
+            
+            # Special logging for JavaScript files
+            if mime_type == "application/javascript":
+                logger.debug(f"JavaScript file detected: {file_path.name}")
+                logger.debug(f"Original file size: {len(file_data)} bytes")
+                for i, content_item in enumerate(extracted_content.contents):
+                    if content_item.data:
+                        content_size = len(content_item.data.encode('utf-8'))
+                        logger.debug(f"JavaScript content item {i+1}: {content_size} bytes")
+                        # Check if content was truncated
+                        if content_size < len(file_data) * 0.9:  # If less than 90% of original
+                            logger.warning(f"JavaScript content may be truncated: {content_size} bytes vs {len(file_data)} bytes original")
+            
+            # Track processing result
+            result = {
+                'filename': file_path.name,
+                'status': 'OK',
+                'content_items': 0,
+                'output_files': [],
+                'total_content_size': 0
+            }
+            
+            # Save each content item as a separate file
+            if extracted_content.contents:
+                for i, content_item in enumerate(extracted_content.contents):
+                    if content_item.data:
+                        content_size = len(content_item.data.encode('utf-8'))
+                        result['total_content_size'] += content_size
+                        logger.debug(f"Content item {i+1}: {content_item.label}, size: {content_size} bytes")
+                        
+                        # Generate filename with new naming convention
+                        if len(extracted_content.contents) == 1:
+                            # Single content item
+                            output_filename = f"{file_path.stem} - {content_item.label} 1.txt"
+                        else:
+                            # Multiple content items - add sequence number
+                            output_filename = f"{file_path.stem} - {content_item.label} {i+1}.txt"
+                        
+                        output_file = self.output_dir / output_filename
+                        
+                        # Write only the raw extracted content
+                        logger.debug(f"Attempting to write to: {output_file}")
+                        try:
+                            with open(output_file, 'w', encoding='utf-8') as f:
+                                f.write(content_item.data)
+                            
+                            # Verify file was created
+                            if output_file.exists():
+                                actual_size = output_file.stat().st_size
+                                logger.info(f"✓ File created successfully: {output_filename} (expected: {content_size} bytes, actual: {actual_size} bytes)")
+                            else:
+                                logger.error(f"✗ File was not created: {output_file}")
+                            
+                            result['output_files'].append(output_filename)
+                            result['content_items'] += 1
+                        except Exception as write_error:
+                            logger.error(f"✗ Error writing file {output_filename}: {write_error}")
+                            import traceback
+                            traceback.print_exc()
+                    else:
+                        logger.warning(f"Content item {i+1} has no data, skipping")
+            else:
+                logger.warning(f"No content extracted from {file_path.name}")
+                result['status'] = 'FAIL'
+                result['error'] = 'No content extracted'
+            
+            # Add result to tracking list
+            self.processing_results.append(result)
+            if result['status'] != 'OK':
+                return False  # already logged and recorded as FAIL above; keep the return value consistent with it
+            logger.info(f"Successfully processed {file_path.name} - Total content: {result['total_content_size']} bytes")
+            return True
+        except Exception as e:
+            error_msg = str(e)
+            logger.error(f"Error processing {file_path.name}: {error_msg}")
+            
+            # Track failed result
+            result = {
+                'filename': file_path.name,
+                'status': 'FAIL',
+                'content_items': 0,
+                'output_files': [],
+                'error': error_msg,
+                'total_content_size': 0
+            }
+            self.processing_results.append(result)
+            
+            return False
+    
+    def _get_mime_type(self, extension: str) -> str:
+        """Get MIME type based on file extension."""
+        mime_types = {
+            # Text and data files
+            '.txt': 'text/plain',
+            '.csv': 'text/csv',
+            '.json': 'application/json',
+            '.xml': 'application/xml',
+            '.html': 'text/html',
+            '.htm': 'text/html',
+            '.svg': 'image/svg+xml',
+            '.md': 'text/markdown',
+            '.markdown': 'text/markdown',
+            '.rst': 'text/x-rst',
+            '.log': 'text/plain',
+            '.ini': 'text/plain',
+            '.cfg': 'text/plain',
+            '.conf': 'text/plain',
+            
+            # Programming languages
+            '.js': 'application/javascript',
+            '.ts': 'application/typescript',
+            '.jsx': 'text/jsx',
+            '.tsx': 'text/tsx',
+            '.py': 'text/x-python',
+            '.java': 'text/x-java-source',
+            '.c': 'text/x-c',
+            '.cpp': 'text/x-c++src',
+            '.cc': 'text/x-c++src',
+            '.cxx': 'text/x-c++src',
+            '.h': 'text/x-c',
+            '.hpp': 'text/x-c++hdr',
+            '.cs': 'text/x-csharp',
+            '.php': 'application/x-httpd-php',
+            '.rb': 'text/x-ruby',
+            '.go': 'text/x-go',
+            '.rs': 'text/x-rust',
+            '.swift': 'text/x-swift',
+            '.kt': 'text/x-kotlin',
+            '.scala': 'text/x-scala',
+            '.r': 'text/x-r',
+            '.m': 'text/x-matlab',
+            '.pl': 'text/x-perl',
+            '.sh': 'application/x-sh',
+            '.bash': 'application/x-sh',
+            '.zsh': 'application/x-sh',
+            '.fish': 'application/x-sh',
+            '.ps1': 'application/x-powershell',
+            '.bat': 'application/x-msdos-program',
+            '.cmd': 'application/x-msdos-program',
+            '.vbs': 'text/vbscript',
+            '.lua': 'text/x-lua',
+            '.sql': 'application/sql',
+            '.dart': 'application/dart',
+            '.elm': 'text/x-elm',
+            '.clj': 'text/x-clojure',
+            '.hs': 'text/x-haskell',
+            '.fs': 'text/x-fsharp',
+            '.ml': 'text/x-ocaml',
+            
+            # Web technologies
+            '.css': 'text/css',
+            '.scss': 'text/x-scss',
+            '.sass': 'text/x-sass',
+            '.less': 'text/x-less',
+            '.vue': 'text/x-vue',
+            '.svelte': 'text/x-svelte',
+            '.astro': 'text/x-astro',
+            
+            # Configuration and build files
+            '.yaml': 'application/x-yaml',
+            '.yml': 'application/x-yaml',
+            '.toml': 'application/toml',
+            '.env': 'text/plain',
+            '.gitignore': 'text/plain',
+            '.dockerfile': 'text/x-dockerfile',
+            '.dockerignore': 'text/plain',
+            '.makefile': 'text/x-makefile',
+            '.cmake': 'text/x-cmake',
+            '.gradle': 'text/x-gradle',
+            '.maven': 'text/x-maven',
+            '.pom': 'application/xml',
+            '.sln': 'text/plain',
+            '.vcxproj': 'application/xml',
+            '.csproj': 'application/xml',
+            '.fsproj': 'application/xml',
+            '.vbproj': 'application/xml',
+            '.xcodeproj': 'text/plain',
+            '.pbxproj': 'text/plain',
+            
+            # Documentation and markup
+            '.tex': 'application/x-tex',
+            '.bib': 'text/x-bibtex',
+            '.adoc': 'text/asciidoc',
+            '.asciidoc': 'text/asciidoc',
+            '.wiki': 'text/x-wiki',
+            '.creole': 'text/x-wiki',
+            
+            # Images
+            '.jpg': 'image/jpeg',
+            '.jpeg': 'image/jpeg',
+            '.png': 'image/png',
+            '.gif': 'image/gif',
+            '.webp': 'image/webp',
+            '.bmp': 'image/bmp',
+            '.tiff': 'image/tiff',
+            '.ico': 'image/x-icon',
+            
+            # Documents
+            '.pdf': 'application/pdf',
+            '.docx': 'application/vnd.openxmlformats-officedocument.wordprocessingml.document',
+            '.xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
+            '.pptx': 'application/vnd.openxmlformats-officedocument.presentationml.presentation',
+            '.odt': 'application/vnd.oasis.opendocument.text',
+            '.ods': 'application/vnd.oasis.opendocument.spreadsheet',
+            '.odp': 'application/vnd.oasis.opendocument.presentation',
+            
+            # Legacy Office formats
+            '.doc': 'application/msword',
+            '.xls': 'application/vnd.ms-excel',
+            '.ppt': 'application/vnd.ms-powerpoint',
+            
+            # Archives and binaries (will be processed as binary)
+            '.zip': 'application/zip',
+            '.tar': 'application/x-tar',
+            '.gz': 'application/gzip',
+            '.7z': 'application/x-7z-compressed',
+            '.rar': 'application/vnd.rar',
+            '.exe': 'application/x-msdownload',
+            '.dll': 'application/x-msdownload',
+            '.so': 'application/x-sharedlib',
+            '.dylib': 'application/x-mach-binary'
+        }
+        return mime_types.get(extension.lower(), 'application/octet-stream')
+    
+    async def run_tests(self) -> None:
+        """Run the document extraction tests on all files."""
+        mode = "WITH AI" if self.enable_ai else "CONTENT ONLY (No AI)"
+        logger.info(f"Starting document extraction tests - {mode}")
+        logger.info(f"Input directory: {self.input_dir}")
+        logger.info(f"Output directory: {self.output_dir}")
+        if self.enable_ai:
+            logger.info(f"Processing prompt: {self.prompt}")
+        else:
+            logger.info("AI processing: DISABLED - Raw content extraction only")
+        
+        # Initialize the extractor
+        if not self.initialize_extractor():
+            logger.error("Cannot proceed without DocumentExtraction!")
+            return
+        
+        # Get files to process
+        files = self.get_files_to_process()
+        
+        if not files:
+            logger.warning("No files found to process!")
+            return
+        
+        # Process each file
+        successful = 0
+        failed = 0
+        
+        logger.info(f"Starting to process {len(files)} files...")
+        for i, file_path in enumerate(files):
+            logger.info(f"Processing file {i+1}/{len(files)}: {file_path.name}")
+            try:
+                if await self.process_single_file(file_path):
+                    successful += 1
+                    logger.info(f"✓ File {i+1} processed successfully")
+                else:
+                    failed += 1
+                    logger.error(f"✗ File {i+1} processing failed")
+            except Exception as e:
+                failed += 1
+                logger.error(f"✗ Exception processing file {i+1}: {e}")
+                import traceback
+                traceback.print_exc()
+        
+        # Print detailed summary
+        mode = "WITH AI" if self.enable_ai else "CONTENT ONLY (No AI)"
+        logger.info("\n" + "=" * 80)
+        logger.info(f"DETAILED TEST SUMMARY - {mode}")
+        logger.info("=" * 80)
+        logger.info(f"Total files processed: {len(files)}")
+        logger.info(f"Successful: {successful}")
+        logger.info(f"Failed: {failed}")
+        logger.info(f"Output directory: {self.output_dir}")
+        if self.enable_ai:
+            logger.info("AI processing: ENABLED")
+        else:
+            logger.info("AI processing: DISABLED")
+        logger.info("=" * 80)
+        
+        # List all processed documents with results
+        logger.info("\nPROCESSING RESULTS:")
+        logger.info("-" * 80)
+        
+        for result in self.processing_results:
+            status_icon = "✅" if result['status'] == 'OK' else "❌"
+            logger.info(f"{status_icon} {result['filename']} - {result['status']}")
+            
+            if result['status'] == 'OK':
+                if result['content_items'] == 1:
+                    logger.info(f"   └─ Generated: {result['output_files'][0]} ({result['total_content_size']} bytes)")
+                else:
+                    logger.info(f"   └─ Generated {result['content_items']} files ({result['total_content_size']} total bytes):")
+                    for output_file in result['output_files']:
+                        logger.info(f"      └─ {output_file}")
+            else:
+                error_msg = result.get('error', 'Unknown error')
+                logger.info(f"   └─ Error: {error_msg}")
+        
+        logger.info("-" * 80)
+        logger.info("=" * 80)
+
+def parse_arguments():
+    """Build the command line parser for this script and return the parsed arguments."""
+    cli = argparse.ArgumentParser(description='Document Extraction Test Script')
+    # One (flags, keyword options) pair per option, registered in this order
+    option_specs = [
+        (('--no-ai', '--content-only'), dict(action='store_true', help='Run in content-only mode without AI processing')),
+        (('--input-dir',), dict(type=str, default='d:/temp/test-extraction', help='Input directory containing files to process (default: d:/temp/test-extraction)')),
+        (('--output-dir',), dict(type=str, help='Output directory for extracted content (auto-generated if not specified)')),
+        (('--verbose', '-v'), dict(action='store_true', help='Enable verbose logging')),
+    ]
+    for flags, options in option_specs:
+        cli.add_argument(*flags, **options)
+    return cli.parse_args()
+
+async def main():
+    """Parse the CLI, verify dependencies and imports, select the extraction mode, then run the tester."""
+    # Parse command line arguments
+    args = parse_arguments()
+    
+    # Set logging level based on verbosity
+    if args.verbose:
+        logging.getLogger().setLevel(logging.DEBUG)
+    else:
+        logging.getLogger().setLevel(logging.INFO)
+    
+    logger.info("DocumentExtraction Test Script")
+    logger.info("=" * 50)
+    logger.info(f"Source: {args.input_dir}")
+    
+    # Determine output directory
+    if args.output_dir:
+        output_dir = args.output_dir
+    else:
+        if args.no_ai:
+            output_dir = f"{args.input_dir}/extracted-raw"
+        else:
+            output_dir = f"{args.input_dir}/extracted"
+    
+    logger.info(f"Output: {output_dir}")
+    logger.info("=" * 50)
+    
+    # Check dependencies first
+    if not check_dependencies():
+        logger.error("Please install missing dependencies before running tests.")
+        return
+    
+    # Check module imports
+    if not check_module_imports():
+        logger.error("Cannot import required modules. Please check your setup.")
+        return
+    
+    # Determine mode based on command line arguments
+    if args.no_ai:
+        enable_ai = False
+        logger.info("Running in CONTENT ONLY mode (no AI processing)")
+    else:
+        # Interactive mode: ask user for choice
+        print("\n" + "=" * 50)
+        print("SELECT EXTRACTION MODE:")
+        print("=" * 50)
+        print("1. With AI processing (default)")
+        print("2. Content only (no AI processing)")
+        print("=" * 50)
+        
+        try:
+            choice = input("Enter your choice (1 or 2, default is 1): ").strip()
+            if choice == "2":
+                enable_ai = False
+                output_dir = args.output_dir or f"{args.input_dir}/extracted-raw"  # an explicit --output-dir always wins
+                logger.info("Selected: Content only mode (no AI processing)")
+            else:
+                enable_ai = True
+                output_dir = args.output_dir or f"{args.input_dir}/extracted"  # an explicit --output-dir always wins
+                logger.info("Selected: AI processing mode")
+        except (EOFError, KeyboardInterrupt):
+            # Default to AI mode if input fails
+            enable_ai = True
+            output_dir = args.output_dir or f"{args.input_dir}/extracted"  # an explicit --output-dir always wins
+            logger.info("Defaulting to AI processing mode")
+    
+    # Run tests with selected mode
+    tester = DocumentExtractionTester(
+        input_dir=args.input_dir,
+        output_dir=output_dir,
+        enable_ai=enable_ai
+    )
+    await tester.run_tests()
+
+if __name__ == "__main__":
+    # main() parses the command line itself and chooses between unattended
+    # (--no-ai / --content-only) and interactive mode, so checking
+    # len(sys.argv) here would only select between two identical calls.
+    # NOTE: extract_documents_content_only() is defined below this guard;
+    # that is safe only because main() never calls it.
+
+    asyncio.run(main())
+
+# Convenience function for easy content-only extraction
+async def extract_documents_content_only(input_folder: str, output_folder: Optional[str] = None) -> bool:
+    """
+    Run a content-only (no AI) extraction over every supported file in a folder.
+    
+    Args:
+        input_folder: Path to folder containing documents to extract
+        output_folder: Destination folder; defaults to "<input_folder>/extracted-raw"
+    
+    Returns:
+        False if a dependency or module-import check fails; True once run_tests() has returned.
+    
+    Example:
+        asyncio.run(extract_documents_content_only("d:/temp"))  # writes to d:/temp/extracted-raw
+        asyncio.run(extract_documents_content_only("c:/my_docs", "c:/my_docs/extracted"))
+    """
+    if output_folder is None:
+        output_folder = f"{input_folder}/extracted-raw"
+    
+    logger.info(f"Running content-only extraction from {input_folder} to {output_folder}")
+    
+    # Check dependencies and imports
+    if not check_dependencies():
+        logger.error("Missing dependencies. Please install required packages.")
+        return False
+    
+    if not check_module_imports():
+        logger.error("Cannot import required modules. Please check your setup.")
+        return False
+    
+    # Create tester and run
+    tester = DocumentExtractionTester(
+        input_dir=input_folder,
+        output_dir=output_folder,
+        enable_ai=False
+    )
+    
+    await tester.run_tests()
+    return True
+
+# Example usage (uncomment to use):
+# if __name__ == "__main__":
+#     # For content-only extraction from d:/temp to d:/temp/extracted-raw
+#     asyncio.run(extract_documents_content_only("d:/temp"))
diff --git a/test_excel_processing.py b/test_excel_processing.py
new file mode 100644
index 00000000..afc27bcf
--- /dev/null
+++ b/test_excel_processing.py
@@ -0,0 +1,189 @@
+#!/usr/bin/env python3
+"""
+Simple test script for enhanced Excel processing functionality.
+This script tests the DocumentExtraction class with Excel files.
+"""
+
+import os
+import sys
+import asyncio
+import logging
+from pathlib import Path
+
+# Configure logging: DEBUG level with timestamped records via basicConfig
+logging.basicConfig(
+    level=logging.DEBUG,
+    format='%(asctime)s - %(levelname)s - %(message)s'
+)
+logger = logging.getLogger(__name__)
+
+# Add this script's own directory (the one that holds `modules/`) to the import path
+sys.path.append(os.path.dirname(os.path.abspath(__file__)))
+
+async def _process_and_report(extractor, file_data, filename, success_message, preview_chars):
+    """Run the extractor on in-memory .xlsx bytes and log every content item.
+
+    Args:
+        extractor: Object exposing the async ``processFileData`` method.
+        file_data: Raw bytes of the workbook to process.
+        filename: File name handed to the extractor.
+        success_message: Line logged once processing has returned.
+        preview_chars: Number of leading characters of each item's data to log.
+    """
+    result = await extractor.processFileData(
+        fileData=file_data,
+        filename=filename,
+        mimeType="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
+        base64Encoded=False,
+        prompt=None,
+        enableAI=False
+    )
+
+    logger.info(success_message)
+    logger.info(f"Generated {len(result.contents)} content items:")
+
+    for position, item in enumerate(result.contents, start=1):
+        logger.info(f"  Item {position}: {item.label}")
+        logger.info(f"    MIME type: {item.metadata.mimeType}")
+        logger.info(f"    Size: {item.metadata.size} bytes")
+        if item.data:
+            logger.info(f"    Data preview: {item.data[:preview_chars]}...")
+        else:
+            logger.info("    Data: None")
+
+
+def _build_sample_workbook_bytes():
+    """Build a small workbook with openpyxl and return it serialized as .xlsx bytes.
+
+    Returns:
+        The bytes written by ``Workbook.save`` into an in-memory buffer.
+
+    Raises:
+        ImportError: If openpyxl cannot be imported.
+    """
+    from io import BytesIO
+    from openpyxl import Workbook
+
+    wb = Workbook()
+    ws = wb.active
+    ws.title = "Test Sheet"
+
+    # One header row followed by two data rows, keyed by cell reference.
+    sample_cells = {
+        "A1": "Name", "B1": "Age", "C1": "City",
+        "A2": "John Doe", "B2": 30, "C2": "New York",
+        "A3": "Jane Smith", "B3": 25, "C3": "Los Angeles",
+    }
+    for cell_ref, value in sample_cells.items():
+        ws[cell_ref] = value
+
+    # Document properties are set before saving and echoed to the log below.
+    wb.properties.title = "Test Workbook"
+    wb.properties.creator = "Test User"
+    wb.properties.subject = "Test Subject"
+
+    logger.info("✓ Test workbook created successfully")
+    logger.info(f"  Title: {wb.properties.title}")
+    logger.info(f"  Creator: {wb.properties.creator}")
+    logger.info(f"  Subject: {wb.properties.subject}")
+    logger.info(f"  Sheets: {wb.sheetnames}")
+
+    buffer = BytesIO()
+    wb.save(buffer)
+    # getvalue() returns the full buffer regardless of the stream position,
+    # so no seek(0) is needed before reading it back.
+    return buffer.getvalue()
+
+
+async def test_excel_processing(test_file_path="d:/temp/test-extraction/test.xlsx"):
+    """Test Excel processing functionality with AI processing disabled.
+
+    Builds a ServiceCenter from a mock user and workflow, wraps it in a
+    DocumentExtraction, and processes ``test_file_path`` when that file exists.
+    Otherwise a small workbook is generated in memory with openpyxl and
+    processed instead. Failures are logged rather than raised.
+
+    Args:
+        test_file_path: Path of an .xlsx file to process if it is present;
+            defaults to the location the script originally hard-coded.
+    """
+    try:
+        # Project imports stay inside the try so a wrong working directory is
+        # reported through the ImportError handler at the bottom.
+        from modules.chat.documents.documentExtraction import DocumentExtraction
+        from modules.chat.serviceCenter import ServiceCenter
+        from modules.interfaces.interfaceAppModel import User, UserPrivilege, AuthAuthority
+        from modules.interfaces.interfaceChatModel import ChatWorkflow
+        from datetime import datetime, UTC
+
+        logger.info("Testing Excel processing functionality...")
+
+        # Create mock service center
+        mock_user = User(
+            id="test_user_001",
+            username="testuser",
+            email="test@example.com",
+            fullName="Test User",
+            language="en",
+            enabled=True,
+            privilege=UserPrivilege.USER,
+            authenticationAuthority=AuthAuthority.LOCAL,
+            mandateId="test_mandate_001"
+        )
+
+        current_time = datetime.now(UTC).isoformat()
+        mock_workflow = ChatWorkflow(
+            id="test_workflow_001",
+            mandateId="test_mandate_001",
+            status="active",
+            name="Test Excel Processing Workflow",
+            currentRound=1,
+            lastActivity=current_time,
+            startedAt=current_time,
+            logs=[],
+            messages=[],
+            stats=None,
+            tasks=[]
+        )
+
+        service_center = ServiceCenter(mock_user, mock_workflow)
+        logger.info("✓ ServiceCenter created successfully")
+
+        extractor = DocumentExtraction(service_center)
+        logger.info("✓ DocumentExtraction created successfully")
+
+        if os.path.exists(test_file_path):
+            logger.info(f"Found test file: {test_file_path}")
+            with open(test_file_path, 'rb') as f:
+                file_data = f.read()
+            logger.info(f"File size: {len(file_data)} bytes")
+            logger.info("Processing Excel file...")
+            await _process_and_report(
+                extractor, file_data, os.path.basename(test_file_path),
+                "✓ Excel processing completed successfully!", 100
+            )
+        else:
+            logger.info("No test Excel file found. Creating a simple test...")
+
+            try:
+                file_data = _build_sample_workbook_bytes()
+                logger.info(f"Test workbook size: {len(file_data)} bytes")
+                await _process_and_report(
+                    extractor, file_data, "test_workbook.xlsx",
+                    "✓ Test workbook processing completed successfully!", 200
+                )
+            except ImportError as e:
+                logger.error(f"openpyxl not available: {e}")
+            except Exception as e:
+                logger.error(f"Error testing Excel functionality: {e}")
+
+        logger.info("Excel processing test completed!")
+
+    except ImportError as e:
+        logger.error(f"Failed to import required modules: {e}")
+        logger.error("Make sure you're running this script from the gateway directory")
+    except Exception as e:
+        logger.exception(f"Unexpected error: {e}")
+
+if __name__ == "__main__":  # only when executed as a script, not when imported
+    asyncio.run(test_excel_processing())  # run the async test coroutine to completion
diff --git a/web_search_20250717_140455.txt b/web_search_20250717_140455.txt
deleted file mode 100644
index e69de29b..00000000
diff --git a/web_search_20250717_144557.txt b/web_search_20250717_144557.txt
deleted file mode 100644
index e69de29b..00000000