gateway/modules/workflows/methods/methodAi/actions/process.py
2026-01-22 21:11:25 +01:00

278 lines
14 KiB
Python

# Copyright (c) 2025 Patrick Motsch
# All rights reserved.
import logging
import time
import json
from typing import Dict, Any, List, Optional
from modules.aichat.datamodelFeatureAiChat import ActionResult, ActionDocument
from modules.datamodels.datamodelAi import AiCallOptions
from modules.datamodels.datamodelExtraction import ContentPart
logger = logging.getLogger(__name__)
async def process(self, parameters: Dict[str, Any]) -> ActionResult:
    """Run the ai.process action: call the AI service and return documents.

    Reads from ``parameters``:
        aiPrompt (str, required): prompt sent to the AI service.
        documentList (DocumentReferenceList | str | list | None): input
            document references; plain strings/lists are converted.
        resultType (str, optional): desired output extension ("txt", "png",
            ...). If omitted, the AI service determines formats from the
            prompt.
        simpleMode (bool, default False): fast path that calls the AI
            directly, skipping the document-generation pipeline.
        contentParts (list[ContentPart] | object with ``.parts``, optional):
            pre-extracted content forwarded to the AI service.
        generationIntent (str, default "document"): intent hint for
            DATA_GENERATE operations.
        parentOperationId (str, optional): parent id for progress tracking.

    Returns:
        ActionResult: success carrying the generated documents, or a
        failure with the error message. All exceptions are caught and
        converted into a failure result.
    """
    # Pre-initialize so the except handler below can safely reference it
    # even when the failure happens before the id is built (previously a
    # NameError was silently masked by a bare except).
    operationId: Optional[str] = None
    try:
        # --- Progress tracking setup -----------------------------------
        workflowId = self.services.workflow.id if self.services.workflow else f"no-workflow-{int(time.time())}"
        operationId = f"ai_process_{workflowId}_{int(time.time())}"
        parentOperationId = parameters.get('parentOperationId')
        if not parentOperationId:
            logger.warning(f"ai.process: No parentOperationId provided in parameters. Operation '{operationId}' will appear at root level. Available parameters: {list(parameters.keys())}")
        else:
            logger.debug(f"ai.process: Using parentOperationId '{parentOperationId}' for operation '{operationId}'")
        self.services.chat.progressLogStart(
            operationId,
            "Generate",
            "AI Processing",
            f"Format: {parameters.get('resultType', 'txt')}",
            parentOperationId=parentOperationId
        )

        aiPrompt = parameters.get("aiPrompt")
        logger.info(f"aiPrompt extracted: '{aiPrompt}' (type: {type(aiPrompt)})")

        # --- Normalize documentList into a DocumentReferenceList -------
        self.services.chat.progressLogUpdate(operationId, 0.2, "Preparing parameters")
        from modules.datamodels.datamodelDocref import DocumentReferenceList
        documentListParam = parameters.get("documentList")
        if documentListParam is None:
            documentList = DocumentReferenceList(references=[])
            logger.debug("ai.process: documentList is None, using empty DocumentReferenceList")
        elif isinstance(documentListParam, DocumentReferenceList):
            documentList = documentListParam
            logger.info(f"ai.process: Received DocumentReferenceList with {len(documentList.references)} references")
            for idx, ref in enumerate(documentList.references):
                logger.info(f"  Reference {idx + 1}: documentId={ref.documentId}, type={type(ref).__name__}")
        elif isinstance(documentListParam, str):
            documentList = DocumentReferenceList.from_string_list([documentListParam])
            logger.info(f"ai.process: Converted string to DocumentReferenceList with {len(documentList.references)} references")
        elif isinstance(documentListParam, list):
            documentList = DocumentReferenceList.from_string_list(documentListParam)
            logger.info(f"ai.process: Converted list to DocumentReferenceList with {len(documentList.references)} references")
        else:
            # Unknown type: fail soft with an empty list rather than raising.
            logger.error(f"Invalid documentList type: {type(documentListParam)}")
            documentList = DocumentReferenceList(references=[])

        # Optional: if omitted, formats determined from prompt. Default "txt" is validation fallback only.
        resultType = parameters.get("resultType")
        simpleMode = parameters.get("simpleMode", False)
        if not aiPrompt:
            logger.error(f"aiPrompt is missing or empty. Parameters: {parameters}")
            return ActionResult.isFailure(
                error="AI prompt is required"
            )

        # --- Resolve output format --------------------------------------
        # If resultType is None the AI service determines formats from the
        # prompt; the three format variables stay None in that case.
        if resultType:
            normalized_result_type = (str(resultType).strip().lstrip('.').lower() or "txt")
            output_extension = f".{normalized_result_type}"
            output_format = output_extension.replace('.', '') or 'txt'
            logger.info(f"Using result type: {resultType} -> {output_extension}, simpleMode: {simpleMode}")
        else:
            normalized_result_type = None
            output_extension = None
            output_format = None
            logger.debug("resultType not provided - formats will be determined from prompt by AI")
        output_mime_type = "application/octet-stream"  # Prefer service-provided mimeType when available

        # --- Resolve optional contentParts -------------------------------
        # Phase 7.3: pass both documentList and contentParts to the AI
        # service (extraction logic removed - handled by AI service).
        contentParts: Optional[List[ContentPart]] = None
        if "contentParts" in parameters:
            contentPartsParam = parameters.get("contentParts")
            if contentPartsParam:
                if isinstance(contentPartsParam, list):
                    contentParts = contentPartsParam
                elif hasattr(contentPartsParam, 'parts'):
                    # Extract from ContentExtracted if it's an ActionDocument
                    contentParts = contentPartsParam.parts
                else:
                    logger.warning(f"Invalid contentParts type: {type(contentPartsParam)}, treating as empty")
                    contentParts = None

        self.services.chat.progressLogUpdate(operationId, 0.4, "Preparing AI call")

        if simpleMode:
            # --- Simple mode: direct AI call, no document pipeline -------
            self.services.chat.progressLogUpdate(operationId, 0.6, "Calling AI (simple mode)")
            # Only the simple-mode request uses this fallback format string,
            # so it is computed here instead of on both paths.
            output_format_for_call = output_extension.replace('.', '') if output_extension else (output_format or 'txt')
            # Best-effort: extract plain-text context from referenced
            # documents; failures are logged and the call proceeds without
            # context.
            context_text = ""
            if documentList and len(documentList.references) > 0:
                try:
                    documents = self.services.chat.getChatDocumentsFromDocumentList(documentList)
                    context_parts = []
                    for doc in documents:
                        if hasattr(doc, 'fileId') and doc.fileId:
                            fileData = self.services.interfaceDbComponent.getFileData(doc.fileId)
                            if fileData:
                                if isinstance(fileData, bytes):
                                    doc_text = fileData.decode('utf-8', errors='ignore')
                                else:
                                    doc_text = str(fileData)
                                context_parts.append(doc_text)
                    if context_parts:
                        context_text = "\n\n".join(context_parts)
                except Exception as e:
                    logger.warning(f"Error extracting context from documents in simple mode: {e}")
            from modules.datamodels.datamodelAi import AiCallRequest, OperationTypeEnum, ProcessingModeEnum
            request = AiCallRequest(
                prompt=aiPrompt,
                context=context_text if context_text else None,
                options=AiCallOptions(
                    resultFormat=output_format_for_call,
                    operationType=OperationTypeEnum.DATA_ANALYSE,
                    processingMode=ProcessingModeEnum.BASIC
                )
            )
            aiResponse_obj = await self.services.ai.callAi(request)
            # Convert AiCallResponse to the AiResponse shape the rest of
            # this function expects.
            from modules.datamodels.datamodelWorkflow import AiResponse, AiResponseMetadata
            aiResponse = AiResponse(
                content=aiResponse_obj.content,
                metadata=AiResponseMetadata(
                    additionalData={
                        "modelName": aiResponse_obj.modelName,
                        "priceUsd": aiResponse_obj.priceUsd,
                        "processingTime": aiResponse_obj.processingTime,
                        "bytesSent": aiResponse_obj.bytesSent,
                        "bytesReceived": aiResponse_obj.bytesReceived,
                        "errorCount": aiResponse_obj.errorCount
                    }
                ),
                documents=[]  # Simple mode doesn't generate documents
            )
        else:
            # --- Full mode: unified callAiContent pipeline ---------------
            # Detect image generation from resultType (if provided).
            imageFormats = ["png", "jpg", "jpeg", "gif", "webp"]
            isImageGeneration = normalized_result_type in imageFormats if normalized_result_type else False
            from modules.datamodels.datamodelAi import OperationTypeEnum
            # resultFormat can be None - formats determined by AI.
            options = AiCallOptions(
                resultFormat=output_format,
                operationType=OperationTypeEnum.IMAGE_GENERATE if isImageGeneration else OperationTypeEnum.DATA_GENERATE
            )
            # generationIntent is required for DATA_GENERATE; default to
            # "document" (most common case). For code generation, use the
            # ai.generateCode action or pass generationIntent="code".
            generationIntent = parameters.get("generationIntent", "document")
            self.services.chat.progressLogUpdate(operationId, 0.6, "Calling AI")
            # Extraction is handled by the AI service - ContentExtracted
            # documents are handled automatically in
            # _extractAndPrepareContent() (Phase 5B).
            logger.info(f"ai.process: Calling callAiContent with {len(documentList.references)} document references")
            if documentList.references:
                from modules.datamodels.datamodelDocref import DocumentListReference, DocumentItemReference
                for idx, ref in enumerate(documentList.references):
                    if isinstance(ref, DocumentItemReference):
                        logger.info(f"  Passing reference {idx + 1}: documentId={ref.documentId}")
                    elif isinstance(ref, DocumentListReference):
                        logger.info(f"  Passing reference {idx + 1}: label={ref.label}")
                    else:
                        logger.info(f"  Passing reference {idx + 1}: {ref}")
            aiResponse = await self.services.ai.callAiContent(
                prompt=aiPrompt,
                options=options,
                documentList=documentList,    # AI service handles extraction
                contentParts=contentParts,    # May be None
                outputFormat=output_format,   # Can be None - AI determines from prompt
                parentOperationId=operationId,
                generationIntent=generationIntent  # REQUIRED for DATA_GENERATE
            )

        # --- Build ActionDocuments from the AI response -------------------
        self.services.chat.progressLogUpdate(operationId, 0.8, "Processing result")
        if aiResponse.documents and len(aiResponse.documents) > 0:
            # Metadata is identical for every document; build it once.
            validationMetadata = {
                "actionType": "ai.process",
                "resultType": normalized_result_type,
                "outputFormat": output_format,
                "hasDocuments": True,
                "documentCount": len(aiResponse.documents)
            }
            final_documents = [
                ActionDocument(
                    documentName=doc.documentName,
                    documentData=doc.documentData,
                    mimeType=doc.mimeType or output_mime_type,
                    sourceJson=getattr(doc, 'sourceJson', None),  # Preserve source JSON for structure validation
                    validationMetadata=validationMetadata
                )
                for doc in aiResponse.documents
            ]
        else:
            # Text response - wrap content in a single document. A filename
            # needs an extension, so fall back to "txt" when none was given.
            extension = output_extension.lstrip('.') if output_extension else "txt"
            meaningful_name = self._generateMeaningfulFileName(
                base_name="ai",
                extension=extension,
                action_name="result"
            )
            validationMetadata = {
                "actionType": "ai.process",
                "resultType": normalized_result_type,
                "outputFormat": output_format,
                "hasDocuments": False,
                "contentType": "text"
            }
            final_documents = [ActionDocument(
                documentName=meaningful_name,
                documentData=aiResponse.content,
                mimeType=output_mime_type,
                validationMetadata=validationMetadata
            )]

        self.services.chat.progressLogFinish(operationId, True)
        return ActionResult.isSuccess(documents=final_documents)
    except Exception as e:
        # logger.exception records the traceback; the old logger.error call
        # dropped it.
        logger.exception(f"Error in AI processing: {str(e)}")
        # Close progress tracking best-effort; only if the id was created.
        if operationId is not None:
            try:
                self.services.chat.progressLogFinish(operationId, False)
            except Exception:
                pass  # Don't fail on progress logging errors
        return ActionResult.isFailure(
            error=str(e)
        )