adapted all renderers from flat to nested element.content.(...) structure

2025-12-29 02:22:01 +01:00 · 2025-12-29 02:22:01 +01:00 · bc2dd6687d
commit bc2dd6687d
parent bcbaf41f4f
4 changed files with 90 additions and 309 deletions
--- a/modules/services/serviceGeneration/renderers/rendererBaseTemplate.py
+++ b/modules/services/serviceGeneration/renderers/rendererBaseTemplate.py
@ -198,161 +198,6 @@ class BaseRenderer(ABC):
            return section.get("id", "unknown")
        return "unknown"
    def _extractTableData(self, sectionData: Dict[str, Any]) -> Tuple[List[str], List[List[str]]]:
        """Extract table headers and rows from section data. Expects nested content structure."""
        # Normalize when elements array was passed in
        if isinstance(sectionData, list):
            if sectionData and isinstance(sectionData[0], dict):
                sectionData = sectionData[0]
            else:
                return [], []
        # Ensure sectionData is a dict
        if not isinstance(sectionData, dict):
            return [], []
        # Extract from nested content structure
        content = sectionData.get("content", {})
        if not isinstance(content, dict):
            return [], []
        headers = content.get("headers", [])
        rows = content.get("rows", [])
        return headers, rows
    def _extractBulletListItems(self, sectionData: Dict[str, Any]) -> List[str]:
        """Extract bullet list items from section data. Expects nested content structure."""
        # Normalize when elements array was passed in
        if isinstance(sectionData, list):
            if sectionData and isinstance(sectionData[0], dict):
                sectionData = sectionData[0]
            else:
                return []
        # Ensure sectionData is a dict
        if not isinstance(sectionData, dict):
            return []
        # Extract from nested content structure
        content = sectionData.get("content", {})
        if not isinstance(content, dict):
            return []
        items = content.get("items", [])
        result = []
        for item in items:
            if isinstance(item, str):
                result.append(item)
            elif isinstance(item, dict) and "text" in item:
                result.append(item["text"])
        return result
    def _extractHeadingData(self, sectionData: Dict[str, Any]) -> Tuple[int, str]:
        """Extract heading level and text from section data. Expects nested content structure."""
        # Normalize when elements array was passed in
        if isinstance(sectionData, list):
            if sectionData and isinstance(sectionData[0], dict):
                sectionData = sectionData[0]
            else:
                return 1, ""
        # Ensure sectionData is a dict
        if not isinstance(sectionData, dict):
            return 1, ""
        # Extract from nested content structure
        content = sectionData.get("content", {})
        if not isinstance(content, dict):
            return 1, ""
        level = content.get("level", 1)
        text = content.get("text", "")
        return level, text
    def _extractParagraphText(self, sectionData: Dict[str, Any]) -> str:
        """Extract paragraph text from section data. Expects nested content structure."""
        if isinstance(sectionData, list):
            # Join multiple paragraph elements if provided as a list
            texts = []
            for el in sectionData:
                if isinstance(el, dict):
                    content = el.get("content", {})
                    if isinstance(content, dict):
                        text = content.get("text", "")
                    elif isinstance(content, str):
                        text = content
                    else:
                        text = ""
                    if text:
                        texts.append(text)
                elif isinstance(el, str):
                    texts.append(el)
            return "\n".join(texts)
        # Extract from nested content structure
        if not isinstance(sectionData, dict):
            return ""
        content = sectionData.get("content", {})
        if isinstance(content, dict):
            return content.get("text", "")
        elif isinstance(content, str):
            return content
        return ""
    def _extractCodeBlockData(self, sectionData: Dict[str, Any]) -> Tuple[str, str]:
        """Extract code and language from section data. Expects nested content structure."""
        # Normalize when elements array was passed in
        if isinstance(sectionData, list):
            if sectionData and isinstance(sectionData[0], dict):
                sectionData = sectionData[0]
            else:
                return "", ""
        # Ensure sectionData is a dict
        if not isinstance(sectionData, dict):
            return "", ""
        # Extract from nested content structure
        content = sectionData.get("content", {})
        if not isinstance(content, dict):
            return "", ""
        code = content.get("code", "")
        language = content.get("language", "")
        return code, language
    def _extractImageData(self, sectionData: Dict[str, Any]) -> Tuple[str, str]:
        """Extract base64 data and alt text from section data. Expects nested content structure."""
        # Normalize when elements array was passed in
        if isinstance(sectionData, list):
            if sectionData and isinstance(sectionData[0], dict):
                sectionData = sectionData[0]
            else:
                return "", "Image"
        # Ensure sectionData is a dict
        if not isinstance(sectionData, dict):
            return "", "Image"
        # Extract from nested content structure
        content = sectionData.get("content", {})
        if not isinstance(content, dict):
            return "", "Image"
        base64Data = content.get("base64Data", "")
        altText = content.get("altText", "Image")
        return base64Data, altText
    def _renderImageSection(self, section: Dict[str, Any], styles: Dict[str, Any] = None) -> Any:
        """
        Render an image section. This is a base implementation that should be overridden
        by format-specific renderers.
        Args:
            section: Image section data
            styles: Optional styling information
        Returns:
            Format-specific image representation
        """
        sectionData = self._getSectionData(section)
        base64Data, altText = self._extractImageData(sectionData)
        # Base implementation returns a simple dict
        # Format-specific renderers should override this method
        return {
            "content_type": "image",
            "base64Data": base64Data,
            "altText": altText,
            "width": sectionData.get("width", None),
            "height": sectionData.get("height", None),
            "caption": sectionData.get("caption", "")
        }
    def _validateImageData(self, base64Data: str, altText: str) -> bool:
        """Validate image data."""
        if not base64Data:
@ -429,64 +274,6 @@ class BaseRenderer(ABC):
        """Check if a section type is valid."""
        return sectionType in self._getSupportedSectionTypes()
    def _processSectionByType(self, section: Dict[str, Any]) -> Dict[str, Any]:
        """Process a section and return structured data based on its type."""
        sectionType = self._getSectionType(section)
        sectionData = self._getSectionData(section)
        if sectionType == "table":
            headers, rows = self._extractTableData(sectionData)
            return {"content_type": "table", "headers": headers, "rows": rows}
        elif sectionType == "bullet_list":
            items = self._extractBulletListItems(sectionData)
            return {"content_type": "bullet_list", "items": items}
        elif sectionType == "heading":
            level, text = self._extractHeadingData(sectionData)
            return {"content_type": "heading", "level": level, "text": text}
        elif sectionType == "paragraph":
            text = self._extractParagraphText(sectionData)
            return {"content_type": "paragraph", "text": text}
        elif sectionType == "code_block":
            code, language = self._extractCodeBlockData(sectionData)
            return {"content_type": "code_block", "code": code, "language": language}
        elif sectionType == "image":
            # Extract image data - preserve nested content structure
            if isinstance(sectionData, list) and sectionData:
                # Get first element from elements array
                element = sectionData[0] if isinstance(sectionData[0], dict) else {}
            elif isinstance(sectionData, dict):
                element = sectionData
            else:
                return {"content_type": "paragraph", "text": "[Image: Invalid data]"}
            # Extract from nested content structure (standard JSON format)
            content = element.get("content", {})
            if not isinstance(content, dict):
                return {"content_type": "paragraph", "text": "[Image: Invalid content]"}
            base64Data = content.get("base64Data", "")
            altText = content.get("altText", "Image")
            caption = content.get("caption", "")
            # Validate image data
            if self._validateImageData(base64Data, altText):
                # Return nested structure matching standard JSON format
                return {
                    "content_type": "image",
                    "content": {
                        "base64Data": base64Data,
                        "altText": altText,
                        "caption": caption
                    }
                }
            else:
                # Return placeholder if image data is invalid
                return {"content_type": "paragraph", "text": f"[Image: {altText}]"}
        else:
            # Fallback to paragraph
            text = self._extractParagraphText(sectionData)
            return {"content_type": "paragraph", "text": text}
    def _formatTimestamp(self, timestamp: str = None) -> str:
        """Format timestamp for display."""
        if timestamp:
--- a/modules/services/serviceGeneration/renderers/rendererHtml.py
+++ b/modules/services/serviceGeneration/renderers/rendererHtml.py
@ -366,39 +366,23 @@ class RendererHtml(BaseRenderer):
            # Process elements according to section's content_type, not just element types
            if sectionType == "table":
-                # Process the section data to extract table structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonTable(processedData, styles)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonTable(element, styles)
                return ""
            elif sectionType == "bullet_list":
-                # Process the section data to extract bullet list structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonBulletList(processedData, styles)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonBulletList(element, styles)
                return ""
            elif sectionType == "heading":
-                # Extract text from elements for heading rendering
+                # Work directly with elements like other renderers
-                if isinstance(sectionData, list):
+                if isinstance(sectionData, list) and sectionData:
-                    # Extract text from heading elements
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
-                    headingText = ""
+                    return self._renderJsonHeading(element, styles)
-                    for element in sectionData:
+                return ""
                        if isinstance(element, dict):
                            element_type = element.get("type", "")
                            if element_type == "heading":
                                headingText = element.get("content", element.get("text", ""))
                                break
                            elif element_type == "extracted_text":
                                # Use extracted text as heading if no heading element found
                                content = element.get("content", "")
                                if content and not headingText:
                                    # Extract first line or title from extracted text
                                    headingText = content.split('\n')[0].strip()
                                    # Remove markdown formatting
                                    headingText = headingText.replace('#', '').replace('**', '').strip()
                                    break
                            elif "text" in element:
                                headingText = element.get("text", "")
                                break
                    if headingText:
                        return self._renderJsonHeading({"text": headingText, "level": 2}, styles)
                return self._renderJsonHeading(sectionData, styles)
            elif sectionType == "paragraph":
                # Process paragraph elements, including extracted_text
                if isinstance(sectionData, list):
@ -435,13 +419,17 @@ class RendererHtml(BaseRenderer):
                        return '\n'.join(htmlParts)
                return self._renderJsonParagraph(sectionData, styles)
            elif sectionType == "code_block":
-                # Process the section data to extract code block structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonCodeBlock(processedData, styles)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonCodeBlock(element, styles)
                return ""
            elif sectionType == "image":
-                # Process the section data to extract image structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonImage(processedData, styles)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonImage(element, styles)
                return ""
            else:
                # Fallback: Check for special element types first
                if isinstance(sectionData, list):
@ -472,7 +460,7 @@ class RendererHtml(BaseRenderer):
    def _renderJsonTable(self, tableData: Dict[str, Any], styles: Dict[str, Any]) -> str:
        """Render a JSON table to HTML using AI-generated styles."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{headers, rows}
            content = tableData.get("content", {})
            if not isinstance(content, dict):
                return ""
@ -507,9 +495,9 @@ class RendererHtml(BaseRenderer):
            return ""
    def _renderJsonBulletList(self, listData: Dict[str, Any], styles: Dict[str, Any]) -> str:
-        """Render a JSON bullet list to HTML using AI-generated styles. Expects nested content structure."""
+        """Render a JSON bullet list to HTML using AI-generated styles."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{items}
            content = listData.get("content", {})
            if not isinstance(content, dict):
                return ""
@ -535,19 +523,7 @@ class RendererHtml(BaseRenderer):
    def _renderJsonHeading(self, headingData: Dict[str, Any], styles: Dict[str, Any]) -> str:
        """Render a JSON heading to HTML using AI-generated styles."""
        try:
-            # Normalize inputs - headingData is typically a list of elements from _getSectionData
+            # Extract from nested content structure: element.content.{text, level}
            if isinstance(headingData, list):
                # Extract first element from elements array
                if headingData and len(headingData) > 0:
                    headingData = headingData[0] if isinstance(headingData[0], dict) else {}
                else:
                    return ""
            elif isinstance(headingData, str):
                headingData = {"text": headingData, "level": 2}
            elif not isinstance(headingData, dict):
                return ""
            # Extract from nested content structure
            content = headingData.get("content", {})
            if not isinstance(content, dict):
                return ""
@ -611,9 +587,9 @@ class RendererHtml(BaseRenderer):
            return ""
    def _renderJsonCodeBlock(self, codeData: Dict[str, Any], styles: Dict[str, Any]) -> str:
-        """Render a JSON code block to HTML using AI-generated styles. Expects nested content structure."""
+        """Render a JSON code block to HTML using AI-generated styles."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{code, language}
            content = codeData.get("content", {})
            if not isinstance(content, dict):
                return ""
--- a/modules/services/serviceGeneration/renderers/rendererMarkdown.py
+++ b/modules/services/serviceGeneration/renderers/rendererMarkdown.py
@ -144,25 +144,37 @@ class RendererMarkdown(BaseRenderer):
                    return '\n\n'.join(markdownParts)
            if sectionType == "table":
-                # Process the section data to extract table structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonTable(processedData)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonTable(element)
                return ""
            elif sectionType == "bullet_list":
-                # Process the section data to extract bullet list structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonBulletList(processedData)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonBulletList(element)
                return ""
            elif sectionType == "heading":
-                return self._renderJsonHeading(sectionData)
+                # Work directly with elements like other renderers
                if isinstance(sectionData, list) and sectionData:
                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonHeading(element)
                return ""
            elif sectionType == "paragraph":
                return self._renderJsonParagraph(sectionData)
            elif sectionType == "code_block":
-                # Process the section data to extract code block structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonCodeBlock(processedData)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonCodeBlock(element)
                return ""
            elif sectionType == "image":
-                # Process the section data to extract image structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonImage(processedData)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonImage(element)
                return ""
            else:
                # Fallback to paragraph for unknown types
                return self._renderJsonParagraph(sectionData)
@ -174,7 +186,7 @@ class RendererMarkdown(BaseRenderer):
    def _renderJsonTable(self, tableData: Dict[str, Any]) -> str:
        """Render a JSON table to markdown."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{headers, rows}
            content = tableData.get("content", {})
            if not isinstance(content, dict):
                return ""
@ -208,7 +220,7 @@ class RendererMarkdown(BaseRenderer):
    def _renderJsonBulletList(self, listData: Dict[str, Any]) -> str:
        """Render a JSON bullet list to markdown."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{items}
            content = listData.get("content", {})
            if not isinstance(content, dict):
                return ""
@ -233,7 +245,7 @@ class RendererMarkdown(BaseRenderer):
    def _renderJsonHeading(self, headingData: Dict[str, Any]) -> str:
        """Render a JSON heading to markdown."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{text, level}
            content = headingData.get("content", {})
            if not isinstance(content, dict):
                return ""
@ -292,7 +304,7 @@ class RendererMarkdown(BaseRenderer):
    def _renderJsonImage(self, imageData: Dict[str, Any]) -> str:
        """Render a JSON image to markdown."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{base64Data, altText, caption}
            content = imageData.get("content", {})
            if not isinstance(content, dict):
                return ""
--- a/modules/services/serviceGeneration/renderers/rendererText.py
+++ b/modules/services/serviceGeneration/renderers/rendererText.py
@ -167,35 +167,41 @@ class RendererText(BaseRenderer):
                    return '\n\n'.join(textParts)
            if sectionType == "table":
-                # Process the section data to extract table structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonTable(processedData)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonTable(element)
                return ""
            elif sectionType == "bullet_list":
-                # Process the section data to extract bullet list structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonBulletList(processedData)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonBulletList(element)
                return ""
            elif sectionType == "heading":
-                # Render each heading element in the elements array
+                # Work directly with elements like other renderers
-                # sectionData is already the elements array from _getSectionData
+                if isinstance(sectionData, list) and sectionData:
-                renderedElements = []
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
-                for element in sectionData:
+                    return self._renderJsonHeading(element)
-                    renderedElements.append(self._renderJsonHeading(element))
+                return ""
                return "\n".join(renderedElements)
            elif sectionType == "paragraph":
                # Render each paragraph element in the elements array
                # sectionData is already the elements array from _getSectionData
                renderedElements = []
                for element in sectionData:
                    renderedElements.append(self._renderJsonParagraph(element))
                return "\n".join(renderedElements)
            elif sectionType == "code_block":
-                # Process the section data to extract code block structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonCodeBlock(processedData)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonCodeBlock(element)
                return ""
            elif sectionType == "image":
-                # Process the section data to extract image structure
+                # Work directly with elements like other renderers
-                processedData = self._processSectionByType(section)
+                if isinstance(sectionData, list) and sectionData:
-                return self._renderJsonImage(processedData)
+                    element = sectionData[0] if isinstance(sectionData[0], dict) else {}
                    return self._renderJsonImage(element)
                return ""
            else:
                # Fallback to paragraph for unknown types - render each element
                # sectionData is already the elements array from _getSectionData
@ -211,7 +217,7 @@ class RendererText(BaseRenderer):
    def _renderJsonTable(self, tableData: Dict[str, Any]) -> str:
        """Render a JSON table to text."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{headers, rows}
            content = tableData.get("content", {})
            if not isinstance(content, dict):
                return ""
@ -245,7 +251,7 @@ class RendererText(BaseRenderer):
    def _renderJsonBulletList(self, listData: Dict[str, Any]) -> str:
        """Render a JSON bullet list to text."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{items}
            content = listData.get("content", {})
            if not isinstance(content, dict):
                return ""
@ -270,7 +276,7 @@ class RendererText(BaseRenderer):
    def _renderJsonHeading(self, headingData: Dict[str, Any]) -> str:
        """Render a JSON heading to text."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{text, level}
            content = headingData.get("content", {})
            if not isinstance(content, dict):
                return ""
@ -312,7 +318,7 @@ class RendererText(BaseRenderer):
    def _renderJsonCodeBlock(self, codeData: Dict[str, Any]) -> str:
        """Render a JSON code block to text."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{code, language}
            content = codeData.get("content", {})
            if not isinstance(content, dict):
                return ""
@ -334,7 +340,7 @@ class RendererText(BaseRenderer):
    def _renderJsonImage(self, imageData: Dict[str, Any]) -> str:
        """Render a JSON image to text."""
        try:
-            # Extract from nested content structure
+            # Extract from nested content structure: element.content.{base64Data, altText, caption}
            content = imageData.get("content", {})
            if isinstance(content, dict):
                altText = content.get("altText", "Image")