From dfd76c7d11738649c8a79458f79f3a40e7acbbc9 Mon Sep 17 00:00:00 2001
From: Christopher Gondek <gondek.christopher@gmail.com>
Date: Mon, 25 Aug 2025 17:24:33 +0200
Subject: [PATCH 01/17] feat: add web search abstraction

---
 .../methods/web/web_search/web_search_base.py | 31 ++++++++
 .../web/web_search/web_search_tavily.py       | 70 +++++++++++++++++++
 2 files changed, 101 insertions(+)
 create mode 100644 modules/methods/web/web_search/web_search_base.py
 create mode 100644 modules/methods/web/web_search/web_search_tavily.py

diff --git a/modules/methods/web/web_search/web_search_base.py b/modules/methods/web/web_search/web_search_base.py
new file mode 100644
index 00000000..d655bfd3
--- /dev/null
+++ b/modules/methods/web/web_search/web_search_base.py
@@ -0,0 +1,31 @@
+"""Base class for web search classes."""
+
+from abc import ABC, abstractmethod
+from modules.interfaces.interfaceChatModel import ActionDocument, ActionResult
+
+
+from pydantic import BaseModel, Field
+from typing import List
+
+
+class WebSearchRequest(BaseModel):
+    query: str
+    max_results: int
+
+
+class WebSearchDocumentData(BaseModel):
+    title: str
+    url: str
+
+
+class WebSearchActionDocument(ActionDocument):
+    documentData: List[WebSearchDocumentData]
+
+
+class WebSearchActionResult(ActionResult):
+    documents: List[WebSearchActionDocument] = Field(default_factory=list)
+
+
+class WebSearchBase(ABC):
+    @abstractmethod
+    async def __call__(self, request: WebSearchRequest) -> WebSearchActionResult: ...
diff --git a/modules/methods/web/web_search/web_search_tavily.py b/modules/methods/web/web_search/web_search_tavily.py
new file mode 100644
index 00000000..dcbea35c
--- /dev/null
+++ b/modules/methods/web/web_search/web_search_tavily.py
@@ -0,0 +1,70 @@
+"""Tavily web search class."""
+
+import os
+from dataclasses import dataclass
+from web_search_base import (
+    WebSearchBase,
+    WebSearchRequest,
+    WebSearchActionResult,
+    WebSearchActionDocument,
+    WebSearchDocumentData,
+)
+
+# from modules.interfaces.interfaceChatModel import ActionResult, ActionDocument
+from tavily import AsyncTavilyClient
+from modules.shared.timezoneUtils import get_utc_timestamp
+
+
+@dataclass
+class WebSearchTavily(WebSearchBase):
+    client: AsyncTavilyClient = None
+
+    @classmethod
+    async def create(cls):
+        return cls(client=AsyncTavilyClient(api_key=os.getenv("TAVILY_API_KEY")))
+
+    async def __call__(self, request: WebSearchRequest) -> WebSearchActionResult:
+        """Handles the web search request."""
+        # Step 1: Search
+        try:
+            search_results = await self._search(request.query, request.max_results)
+        except Exception as e:
+            return WebSearchActionResult(success=False, error=str(e))
+
+        # Step 2: Build ActionResult
+        try:
+            result = self._build_action_result(search_results)
+        except Exception as e:
+            return WebSearchActionResult(success=False, error=str(e))
+
+        return result
+
+    async def _search(self, query: str, max_results: int) -> WebSearchActionResult:
+        """Calls the Tavily API to perform a web search."""
+        # Make sure max_results is within the allowed range
+        if max_results < 0 or max_results > 20:
+            raise ValueError("max_results must be between 0 and 20")
+
+        # Perform actual API call
+        response = await self.client.search(query=query, max_results=max_results)
+        return response["results"]
+
+    def _build_action_result(self, search_results: list) -> WebSearchActionResult:
+        """Builds the ActionResult from the search results."""
+        documents = []
+        for result in search_results:
+            document_name = f"web_search_{get_utc_timestamp()}.txt"
+            document_data = WebSearchDocumentData(
+                title=result["title"], url=result["url"]
+            )
+            mime_type = "text/plain"
+            doc = WebSearchActionDocument(
+                documentName=document_name,
+                documentData=document_data,
+                mimeType=mime_type,
+            )
+            documents.append(doc)
+
+        return WebSearchActionResult(
+            success=True, documents=documents, resultLabel="web_search_results"
+        )

From b37cd502cd7e3137bef5b062991448f9b4f218ff Mon Sep 17 00:00:00 2001
From: Christopher Gondek <gondek.christopher@gmail.com>
Date: Mon, 25 Aug 2025 17:25:11 +0200
Subject: [PATCH 02/17] chore: add tavily requirements

---
 requirements.txt | 1 +
 1 file changed, 1 insertion(+)

diff --git a/requirements.txt b/requirements.txt
index adf8d3c3..e6397aa6 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -42,6 +42,7 @@ requests==2.31.0
 chardet>=5.0.0      # Für Zeichensatzerkennung bei Webinhalten
 aiohttp>=3.8.0      # Required for SharePoint operations (async HTTP)
 selenium>=4.15.0    # Required for web automation and JavaScript-heavy pages
+tavily-python==0.7.11  # Tavily SDK
 
 ## Image Processing
 Pillow>=10.0.0      # Für Bildverarbeitung (als PIL importiert)

From d4b846c5980d6448b0ef41ea4c6ecbf67a74f22f Mon Sep 17 00:00:00 2001
From: Christopher Gondek <gondek.christopher@gmail.com>
Date: Fri, 29 Aug 2025 15:35:14 +0200
Subject: [PATCH 03/17] chore: restructure web search w/ tests

---
 modules/__init__.py                         |  0
 modules/connectors/connector_tavily.py      | 70 +++++++++++++++++++++
 modules/interfaces/interface_web_model.py   | 49 +++++++++++++++
 modules/interfaces/interface_web_objects.py | 24 +++++++
 modules/methods/method_web.py               | 43 +++++++++++++
 pytest.ini                                  | 11 ++++
 requirements.txt                            |  4 ++
 tests/__init__.py                           |  1 +
 tests/connectors/__init__.py                |  0
 tests/connectors/test_connector_tavily.py   | 39 ++++++++++++
 tests/methods/__init__.py                   |  0
 tests/methods/test_method_web.py            | 36 +++++++++++
 12 files changed, 277 insertions(+)
 create mode 100644 modules/__init__.py
 create mode 100644 modules/connectors/connector_tavily.py
 create mode 100644 modules/interfaces/interface_web_model.py
 create mode 100644 modules/interfaces/interface_web_objects.py
 create mode 100644 modules/methods/method_web.py
 create mode 100644 pytest.ini
 create mode 100644 tests/__init__.py
 create mode 100644 tests/connectors/__init__.py
 create mode 100644 tests/connectors/test_connector_tavily.py
 create mode 100644 tests/methods/__init__.py
 create mode 100644 tests/methods/test_method_web.py

diff --git a/modules/__init__.py b/modules/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/modules/connectors/connector_tavily.py b/modules/connectors/connector_tavily.py
new file mode 100644
index 00000000..4f57fb94
--- /dev/null
+++ b/modules/connectors/connector_tavily.py
@@ -0,0 +1,70 @@
+"""Tavily web search class."""
+
+import os
+from dataclasses import dataclass
+from modules.interfaces.interface_web_model import (
+    WebSearchBase,
+    WebSearchRequest,
+    WebSearchActionResult,
+    WebSearchActionDocument,
+    WebSearchDocumentData,
+)
+
+# from modules.interfaces.interfaceChatModel import ActionResult, ActionDocument
+from tavily import AsyncTavilyClient
+from modules.shared.timezoneUtils import get_utc_timestamp
+
+
+@dataclass
+class ConnectorTavily(WebSearchBase):
+    client: AsyncTavilyClient = None
+
+    @classmethod
+    async def create(cls):
+        return cls(client=AsyncTavilyClient(api_key=os.getenv("TAVILY_API_KEY")))
+
+    async def search_urls(self, request: WebSearchRequest) -> WebSearchActionResult:
+        """Handles the web search request."""
+        # Step 1: Search
+        try:
+            search_results = await self._search(request.query, request.max_results)
+        except Exception as e:
+            return WebSearchActionResult(success=False, error=str(e))
+
+        # Step 2: Build ActionResult
+        try:
+            result = self._build_action_result(search_results)
+        except Exception as e:
+            return WebSearchActionResult(success=False, error=str(e))
+
+        return result
+
+    async def _search(self, query: str, max_results: int) -> WebSearchActionResult:
+        """Calls the Tavily API to perform a web search."""
+        # Make sure max_results is within the allowed range
+        if max_results < 0 or max_results > 20:
+            raise ValueError("max_results must be between 0 and 20")
+
+        # Perform actual API call
+        response = await self.client.search(query=query, max_results=max_results)
+        return response["results"]
+
+    def _build_action_result(self, search_results: list) -> WebSearchActionResult:
+        """Builds the ActionResult from the search results."""
+        documents = []
+        for result in search_results:
+            document_name = f"web_search_{get_utc_timestamp()}.txt"
+            document_data = WebSearchDocumentData(
+                title=result["title"], url=result["url"]
+            )
+            mime_type = "application/json"
+            doc = WebSearchActionDocument(
+                documentName=document_name,
+                documentData=document_data,
+                mimeType=mime_type,
+            )
+            documents.append(doc)
+
+        return WebSearchActionResult(
+            success=True, documents=documents, resultLabel="web_search_results"
+        )
diff --git a/modules/interfaces/interface_web_model.py b/modules/interfaces/interface_web_model.py
new file mode 100644
index 00000000..8dc01fc8
--- /dev/null
+++ b/modules/interfaces/interface_web_model.py
@@ -0,0 +1,49 @@
+"""Base class for web classes."""
+
+from abc import ABC, abstractmethod
+from modules.interfaces.interfaceChatModel import ActionDocument, ActionResult
+
+
+from pydantic import BaseModel, Field
+from typing import List
+
+
+# --- Web search ---
+
+# query -> list of URLs
+
+
+class WebSearchRequest(BaseModel):
+    query: str
+    max_results: int
+
+
+class WebSearchDocumentData(BaseModel):
+    title: str
+    url: str
+
+
+class WebSearchActionDocument(ActionDocument):
+    documentData: WebSearchDocumentData
+
+
+class WebSearchActionResult(ActionResult):
+    documents: List[WebSearchActionDocument] = Field(default_factory=list)
+
+
+class WebSearchBase(ABC):
+    @abstractmethod
+    async def search_urls(self, request: WebSearchRequest) -> WebSearchActionResult: ...
+
+
+# --- Web crawl ---
+
+# list of URLs -> list of extracted HTML content
+
+# TODO
+
+# --- Web query ---
+
+# query -> list of extracted text
+
+# TODO
diff --git a/modules/interfaces/interface_web_objects.py b/modules/interfaces/interface_web_objects.py
new file mode 100644
index 00000000..b38db6a3
--- /dev/null
+++ b/modules/interfaces/interface_web_objects.py
@@ -0,0 +1,24 @@
+from modules.interfaces.interface_web_model import (
+    WebSearchActionResult,
+    WebSearchRequest,
+)
+
+from dataclasses import dataclass
+from modules.connectors.connector_tavily import ConnectorTavily
+
+
+@dataclass
+class WebInterface:
+    connector_tavily: ConnectorTavily = None
+
+    @classmethod
+    async def create(cls) -> "WebInterface":
+        connector_tavily = await ConnectorTavily.create()
+
+        return WebInterface(connector_tavily=connector_tavily)
+
+    async def search(
+        self, web_search_request: WebSearchRequest
+    ) -> WebSearchActionResult:
+        # NOTE: Add connectors here
+        return await self.connector_tavily.search_urls(web_search_request)
diff --git a/modules/methods/method_web.py b/modules/methods/method_web.py
new file mode 100644
index 00000000..27b82ba5
--- /dev/null
+++ b/modules/methods/method_web.py
@@ -0,0 +1,43 @@
+import logging
+from typing import Any, Dict
+from modules.chat.methodBase import MethodBase, action
+from modules.interfaces.interfaceChatModel import ActionResult
+from modules.interfaces.interface_web_objects import WebInterface
+from modules.interfaces.interface_web_model import WebSearchRequest
+
+
+logger = logging.getLogger(__name__)
+
+
+class MethodWeb(MethodBase):
+    """Web method implementation for web operations."""
+
+    def __init__(self, serviceCenter: Any):
+        super().__init__(serviceCenter)
+
+    @action
+    async def search(self, parameters: Dict[str, Any]) -> ActionResult:
+        """
+        Perform a web search and output a .txt file with a plain list of URLs (one per line).
+
+        Parameters:
+            query (str): Search query to perform
+            maxResults (int, optional): Maximum number of results (default: 10)
+        """
+        # TODO: Fix docstrings - do we need that format for parsing?
+
+        try:
+            # Prepare request data
+            web_search_request = WebSearchRequest(
+                query=parameters.get("query"),
+                max_results=parameters.get("maxResults", 10),
+            )
+
+            # Perform request
+            web_interface = await WebInterface.create()
+            web_search_result = await web_interface.search(web_search_request)
+
+            return web_search_result
+
+        except Exception as e:
+            return ActionResult(success=False, error=str(e))
diff --git a/pytest.ini b/pytest.ini
new file mode 100644
index 00000000..b606fa5f
--- /dev/null
+++ b/pytest.ini
@@ -0,0 +1,11 @@
+[pytest]
+testpaths = tests
+python_paths = .
+addopts = -v --tb=short
+python_files = test_*.py
+python_classes = Test*
+python_functions = test_*
+log_file = logs/test_logs.log
+log_file_level = INFO
+log_file_format = %(asctime)s %(levelname)s %(message)s
+log_file_date_format = %Y-%m-%d %H:%M:%S
\ No newline at end of file
diff --git a/requirements.txt b/requirements.txt
index e6397aa6..75bd81b6 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -68,3 +68,7 @@ PyPDF2>=3.0.0
 PyMuPDF>=1.20.0
 beautifulsoup4>=4.11.0
 chardet>=4.0.0  # For encoding detection
+
+## Testing Dependencies
+pytest>=8.0.0
+pytest-asyncio>=0.21.0
diff --git a/tests/__init__.py b/tests/__init__.py
new file mode 100644
index 00000000..4ede8e6d
--- /dev/null
+++ b/tests/__init__.py
@@ -0,0 +1 @@
+# noqa
diff --git a/tests/connectors/__init__.py b/tests/connectors/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/tests/connectors/test_connector_tavily.py b/tests/connectors/test_connector_tavily.py
new file mode 100644
index 00000000..54ea382c
--- /dev/null
+++ b/tests/connectors/test_connector_tavily.py
@@ -0,0 +1,39 @@
+"""Tests for Tavliy web search."""
+
+import pytest
+import logging
+
+from modules.interfaces.interfaceChatModel import ActionResult
+from modules.interfaces.interface_web_model import WebSearchRequest
+from modules.connectors.connector_tavily import ConnectorTavily
+
+logger = logging.getLogger(__name__)
+
+
+@pytest.mark.asyncio
+async def test_tavily_connector_search_test_live_api():
+    logger.info("Testing Tavliy connector with live API calls")
+
+    # Test request
+    request = WebSearchRequest(query="How old is the Earth?", max_results=5)
+
+    # Tavily instance
+    connector_tavily = await ConnectorTavily.create()
+
+    # Search test
+    action_result = await connector_tavily.search_urls(request=request)
+
+    # Check results
+    assert isinstance(action_result, ActionResult)
+
+    logger.info("=" * 20)
+    logger.info(f"Action result success status: {action_result.success}")
+    logger.info(f"Action result error: {action_result.error}")
+    logger.info(f"Action result label: {action_result.resultLabel}")
+
+    logger.info("Documents:")
+    for doc in action_result.documents:
+        logger.info("-" * 10)
+        logger.info(f" - Document Name: {doc.documentName}")
+        logger.info(f" - Document Mime Type: {doc.mimeType}")
+        logger.info(f" - Document Data: {doc.documentData}")
diff --git a/tests/methods/__init__.py b/tests/methods/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/tests/methods/test_method_web.py b/tests/methods/test_method_web.py
new file mode 100644
index 00000000..078d2902
--- /dev/null
+++ b/tests/methods/test_method_web.py
@@ -0,0 +1,36 @@
+"""Tests for method web.py"""
+
+import logging
+
+import pytest
+from modules.methods.method_web import MethodWeb
+
+logger = logging.getLogger(__name__)
+
+
+@pytest.mark.asyncio
+async def test_method_web_search_live():
+    """Tests method web search with live API calls."""
+
+    method_web = MethodWeb(serviceCenter=None)
+
+    # Actual request
+    action_result = await method_web.search(
+        {"query": "How old is the earth", "maxResults": 5}
+    )
+
+    # Evaluate results
+    assert action_result.success
+    assert len(action_result.documents) > 0
+
+    logger.info("=" * 20)
+    logger.info(f"Action result success status: {action_result.success}")
+    logger.info(f"Action result error: {action_result.error}")
+    logger.info(f"Action result label: {action_result.resultLabel}")
+
+    logger.info("Documents:")
+    for doc in action_result.documents:
+        logger.info("-" * 10)
+        logger.info(f" - Document Name: {doc.documentName}")
+        logger.info(f" - Document Mime Type: {doc.mimeType}")
+        logger.info(f" - Document Data: {doc.documentData}")

From 6b05ad206727961f3e7a815f42523cb210bc60cd Mon Sep 17 00:00:00 2001
From: Christopher Gondek <gondek.christopher@gmail.com>
Date: Fri, 29 Aug 2025 20:50:40 +0200
Subject: [PATCH 04/17] chore: add method web test w/ patched tavily api
 response

---
 modules/connectors/connector_tavily.py    |  7 ++++
 tests/connectors/test_connector_tavily.py |  1 +
 tests/fixtures/__init__.py                |  0
 tests/fixtures/tavily_responses.py        | 47 +++++++++++++++++++++++
 tests/methods/test_method_web.py          | 36 +++++++++++++++++
 5 files changed, 91 insertions(+)
 create mode 100644 tests/fixtures/__init__.py
 create mode 100644 tests/fixtures/tavily_responses.py

diff --git a/modules/connectors/connector_tavily.py b/modules/connectors/connector_tavily.py
index 4f57fb94..bcb38e3f 100644
--- a/modules/connectors/connector_tavily.py
+++ b/modules/connectors/connector_tavily.py
@@ -1,5 +1,6 @@
 """Tavily web search class."""
 
+import logging
 import os
 from dataclasses import dataclass
 from modules.interfaces.interface_web_model import (
@@ -15,6 +16,9 @@ from tavily import AsyncTavilyClient
 from modules.shared.timezoneUtils import get_utc_timestamp
 
 
+logger = logging.getLogger(__name__)
+
+
 @dataclass
 class ConnectorTavily(WebSearchBase):
     client: AsyncTavilyClient = None
@@ -47,6 +51,9 @@ class ConnectorTavily(WebSearchBase):
 
         # Perform actual API call
         response = await self.client.search(query=query, max_results=max_results)
+
+        logger.info(f"Tavily API response:\n{response}")
+
         return response["results"]
 
     def _build_action_result(self, search_results: list) -> WebSearchActionResult:
diff --git a/tests/connectors/test_connector_tavily.py b/tests/connectors/test_connector_tavily.py
index 54ea382c..3b23f69a 100644
--- a/tests/connectors/test_connector_tavily.py
+++ b/tests/connectors/test_connector_tavily.py
@@ -11,6 +11,7 @@ logger = logging.getLogger(__name__)
 
 
 @pytest.mark.asyncio
+@pytest.mark.expensive
 async def test_tavily_connector_search_test_live_api():
     logger.info("Testing Tavliy connector with live API calls")
 
diff --git a/tests/fixtures/__init__.py b/tests/fixtures/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/tests/fixtures/tavily_responses.py b/tests/fixtures/tavily_responses.py
new file mode 100644
index 00000000..789f62f0
--- /dev/null
+++ b/tests/fixtures/tavily_responses.py
@@ -0,0 +1,47 @@
+"""Sample tavily responses for patching responses in tests."""
+
+RESPONSE_HOW_OLD_IS_EARTH_NO_ANSWER = {
+    "query": "How old is the earth",
+    "follow_up_questions": None,
+    "answer": None,
+    "images": [],
+    "results": [
+        {
+            "url": "https://en.wikipedia.org/wiki/Age_of_Earth",
+            "title": "Age of Earth - Wikipedia",
+            "content": 'Scientific dating of the age of Earth The **age of Earth** is estimated to be 4.54 ± 0.05 billion years. In 1862, the physicist William Thomson, 1st Baron Kelvin published calculations that fixed the age of Earth at between 20 million and 400 million years. This suggested that it might be possible to measure the age of Earth by determining the relative proportions of radioactive materials in geological samples. Holmes published *The Age of the Earth, an Introduction to Geological Ideas* in 1927 in which he presented a range of 1.6 to 3.0 billion years. "The age of the Earth and the invention of geological time".',
+            "score": 0.8775715,
+            "raw_content": None,
+        },
+        {
+            "url": "https://answersingenesis.org/age-of-the-earth/how-old-earth/?srsltid=AfmBOorqG4wgNP3fQ457C11mdj7kVx0IcByShaqH3wwc1VivvrqvJnCF",
+            "title": "How Old Is the Earth? | Answers in Genesis",
+            "content": "If you ask this question of most scientifically literate people, they will answer that the earth is about 4.54 billion years old.",
+            "score": 0.8703443,
+            "raw_content": None,
+        },
+        {
+            "url": "https://sites.nd.edu/james-applewhite/2020/03/22/age-of-our-earth/",
+            "title": "Age of Our Earth: 6000 or 4.5 billion years old? - Notre Dame Sites",
+            "content": "If the Earth is only 6,000 years old, why does radiometric dating techniques used by geologists suggest the age is around much older? Each technique demonstrates the earth is much older than 6,000 years old and when combined with the various different techniques of relative dating using rock strata and formations, it becomes apparent that we have solid scientific evidence that the earth is much older than what AIG thinks. With this, as they try to discount radiometric dating as evidence since we were not around back then, they invalidate their own argument as they suggest that we should accept the words of the Bible as evidence.",
+            "score": 0.7975099,
+            "raw_content": None,
+        },
+        {
+            "url": "https://www.tomorrowsworld.org/magazines/2013/march-april/how-old-is-the-earth",
+            "title": "How Old Is the Earth? | Tomorrow's World",
+            "content": "Was it billions of years ago—close to the scientists' estimate of a 4.5 billion-year-old Earth? Or was it earlier or later? On these details, the Bible is",
+            "score": 0.78944516,
+            "raw_content": None,
+        },
+        {
+            "url": "https://www.planetary.org/articles/how-old-is-the-earth",
+            "title": "How old is the Earth? | The Planetary Society",
+            "content": "Skip to main content Community Account Renew Search * Become A Member * Renew Back To Main Menu Learn how our members and community are changing the worlds. Back To Main Menu * ### The Planetary Report Back To Main Menu + Become A Member + Action Center + Renew Membership Back To Main Menu Back To Main Menu + Become A Member + Renew Membership * Take Action * Member Community * Account Center * Search Public Education Specialist, The Planetary Society    Along with other planets, the Earth was born in the early days of the Solar System, which first started forming about 4.6 billion years ago. thanks to techniques including radiometric dating of rocks and minerals,",
+            "score": 0.7756902,
+            "raw_content": None,
+        },
+    ],
+    "response_time": 0.96,
+    "request_id": "3c36cccd-0918-49fd-bd1c-23c62ba7ec2d",
+}
diff --git a/tests/methods/test_method_web.py b/tests/methods/test_method_web.py
index 078d2902..9c0b7671 100644
--- a/tests/methods/test_method_web.py
+++ b/tests/methods/test_method_web.py
@@ -3,12 +3,15 @@
 import logging
 
 import pytest
+from unittest.mock import patch
 from modules.methods.method_web import MethodWeb
+from tests.fixtures.tavily_responses import RESPONSE_HOW_OLD_IS_EARTH_NO_ANSWER
 
 logger = logging.getLogger(__name__)
 
 
 @pytest.mark.asyncio
+@pytest.mark.expensive
 async def test_method_web_search_live():
     """Tests method web search with live API calls."""
 
@@ -34,3 +37,36 @@ async def test_method_web_search_live():
         logger.info(f" - Document Name: {doc.documentName}")
         logger.info(f" - Document Mime Type: {doc.mimeType}")
         logger.info(f" - Document Data: {doc.documentData}")
+
+
+@pytest.mark.asyncio
+async def test_method_web_search_dummy():
+    """Tests method web search with dummy response data - no external API calls."""
+
+    method_web = MethodWeb(serviceCenter=None)
+
+    # Mock the Tavily API response
+    with patch(
+        "tavily.AsyncTavilyClient.search",
+        return_value=RESPONSE_HOW_OLD_IS_EARTH_NO_ANSWER,
+    ) as mock_client:
+        action_result = await method_web.search(
+            {"query": "How old is the earth", "maxResults": 5}
+        )
+        mock_client.assert_called_once()
+
+    # Evaluate results
+    assert action_result.success
+    assert len(action_result.documents) > 0
+
+    logger.info("=" * 20)
+    logger.info(f"Action result success status: {action_result.success}")
+    logger.info(f"Action result error: {action_result.error}")
+    logger.info(f"Action result label: {action_result.resultLabel}")
+
+    logger.info("Documents:")
+    for doc in action_result.documents:
+        logger.info("-" * 10)
+        logger.info(f" - Document Name: {doc.documentName}")
+        logger.info(f" - Document Mime Type: {doc.mimeType}")
+        logger.info(f" - Document Data: {doc.documentData}")

From 181f55359b2399e33cb85ef3aca484b6013fff07 Mon Sep 17 00:00:00 2001
From: Christopher Gondek <gondek.christopher@gmail.com>
Date: Fri, 29 Aug 2025 20:51:11 +0200
Subject: [PATCH 05/17] chore: exclude real api calling tests by default

---
 pytest.ini | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/pytest.ini b/pytest.ini
index b606fa5f..e3d8c35e 100644
--- a/pytest.ini
+++ b/pytest.ini
@@ -1,11 +1,13 @@
 [pytest]
 testpaths = tests
 python_paths = .
-addopts = -v --tb=short
 python_files = test_*.py
 python_classes = Test*
 python_functions = test_*
 log_file = logs/test_logs.log
 log_file_level = INFO
 log_file_format = %(asctime)s %(levelname)s %(message)s
-log_file_date_format = %Y-%m-%d %H:%M:%S
\ No newline at end of file
+log_file_date_format = %Y-%m-%d %H:%M:%S
+# Only run non-expensive tests by default, verbose log, short traceback
+# Use 'pytest -m ""' to run ALL tests.
+addopts = -v --tb=short -m 'not expensive'

From 31177063dee00d7c734de8f7c66c7ba5d94c0ffc Mon Sep 17 00:00:00 2001
From: Christopher Gondek <gondek.christopher@gmail.com>
Date: Mon, 1 Sep 2025 09:49:57 +0200
Subject: [PATCH 06/17] feat: add web crawl connector; interface

---
 modules/connectors/connector_tavily.py    | 61 +++++++++++++++++++++--
 modules/interfaces/interface_web_model.py | 29 +++++++++--
 2 files changed, 82 insertions(+), 8 deletions(-)

diff --git a/modules/connectors/connector_tavily.py b/modules/connectors/connector_tavily.py
index bcb38e3f..783fea8c 100644
--- a/modules/connectors/connector_tavily.py
+++ b/modules/connectors/connector_tavily.py
@@ -4,11 +4,16 @@ import logging
 import os
 from dataclasses import dataclass
 from modules.interfaces.interface_web_model import (
+    WebCrawlBase,
+    WebCrawlDocumentData,
+    WebCrawlRequest,
     WebSearchBase,
     WebSearchRequest,
     WebSearchActionResult,
     WebSearchActionDocument,
     WebSearchDocumentData,
+    WebCrawlActionDocument,
+    WebCrawlActionResult,
 )
 
 # from modules.interfaces.interfaceChatModel import ActionResult, ActionDocument
@@ -20,7 +25,7 @@ logger = logging.getLogger(__name__)
 
 
 @dataclass
-class ConnectorTavily(WebSearchBase):
+class ConnectorTavily(WebSearchBase, WebCrawlBase):
     client: AsyncTavilyClient = None
 
     @classmethod
@@ -28,7 +33,10 @@ class ConnectorTavily(WebSearchBase):
         return cls(client=AsyncTavilyClient(api_key=os.getenv("TAVILY_API_KEY")))
 
     async def search_urls(self, request: WebSearchRequest) -> WebSearchActionResult:
-        """Handles the web search request."""
+        """Handles the web search request.
+
+        Takes a query and returns a list of URLs.
+        """
         # Step 1: Search
         try:
             search_results = await self._search(request.query, request.max_results)
@@ -37,12 +45,28 @@ class ConnectorTavily(WebSearchBase):
 
         # Step 2: Build ActionResult
         try:
-            result = self._build_action_result(search_results)
+            result = self._build_search_action_result(search_results)
         except Exception as e:
             return WebSearchActionResult(success=False, error=str(e))
 
         return result
 
+    async def crawl_urls(self, request: WebCrawlRequest) -> WebCrawlActionResult:
+        """Crawls the given URLs and returns the extracted text content."""
+        # Step 1: Crawl
+        try:
+            crawl_results = await self._crawl(request.urls)
+        except Exception as e:
+            return WebCrawlActionResult(success=False, error=str(e))
+
+        # Step 2: Build ActionResult
+        try:
+            result = self._build_crawl_action_result(crawl_results)
+        except Exception as e:
+            return WebCrawlActionResult(success=False, error=str(e))
+
+        return result
+
     async def _search(self, query: str, max_results: int) -> WebSearchActionResult:
         """Calls the Tavily API to perform a web search."""
         # Make sure max_results is within the allowed range
@@ -56,7 +80,9 @@ class ConnectorTavily(WebSearchBase):
 
         return response["results"]
 
-    def _build_action_result(self, search_results: list) -> WebSearchActionResult:
+    def _build_search_action_result(
+        self, search_results: list
+    ) -> WebSearchActionResult:
         """Builds the ActionResult from the search results."""
         documents = []
         for result in search_results:
@@ -75,3 +101,30 @@ class ConnectorTavily(WebSearchBase):
         return WebSearchActionResult(
             success=True, documents=documents, resultLabel="web_search_results"
         )
+
+    async def _crawl(self, urls: list) -> list[str]:
+        """Calls the Tavily API to extract text content from URLs."""
+        response = await self.client.extract(
+            urls=urls, extract_depth="advanced", format="text"
+        )
+        return response["results"]
+
+    def _build_crawl_action_result(self, crawl_results: list) -> WebCrawlActionResult:
+        """Builds the ActionResult from the crawl results."""
+        documents = []
+        for result in crawl_results:
+            document_name = f"web_crawl_{get_utc_timestamp()}.txt"
+            doc_data = WebCrawlDocumentData(
+                url=result["url"], content=result["raw_content"]
+            )
+            mime_type = "application/json"
+            doc = WebCrawlActionDocument(
+                documentName=document_name,
+                documentData=doc_data,
+                mimeType=mime_type,
+            )
+            documents.append(doc)
+
+        return WebCrawlActionResult(
+            success=True, documents=documents, resultLabel="web_crawl_results"
+        )
diff --git a/modules/interfaces/interface_web_model.py b/modules/interfaces/interface_web_model.py
index 8dc01fc8..0a258623 100644
--- a/modules/interfaces/interface_web_model.py
+++ b/modules/interfaces/interface_web_model.py
@@ -40,10 +40,31 @@ class WebSearchBase(ABC):
 
 # list of URLs -> list of extracted HTML content
 
-# TODO
+
+class WebCrawlRequest(BaseModel):
+    urls: List[str]
+
+
+class WebCrawlDocumentData(BaseModel):
+    url: str
+    content: str
+
+
+class WebCrawlActionDocument(ActionDocument):
+    documentData: WebCrawlDocumentData = Field(
+        description="The data extracted from a single crawled URL"
+    )
+
+
+class WebCrawlActionResult(ActionResult):
+    documents: List[WebCrawlActionDocument] = Field(default_factory=list)
+
+
+class WebCrawlBase(ABC):
+    @abstractmethod
+    async def crawl_urls(self, request: WebCrawlRequest) -> WebCrawlActionResult: ...
+
 
 # --- Web query ---
 
-# query -> list of extracted text
-
-# TODO
+# query -> list of extracted text; combines web search and crawl in one step

From 0816e7c45cb64a6014204aac3c17a40c6444eed5 Mon Sep 17 00:00:00 2001
From: Christopher Gondek <gondek.christopher@gmail.com>
Date: Mon, 1 Sep 2025 10:15:10 +0200
Subject: [PATCH 07/17] feat: finish implementing web interface w/ tavily
 connector (untested)

---
 modules/connectors/connector_tavily.py      | 84 ++++++++++++++++++---
 modules/interfaces/interface_web_model.py   | 29 ++++++-
 modules/interfaces/interface_web_objects.py | 14 ++++
 3 files changed, 116 insertions(+), 11 deletions(-)

diff --git a/modules/connectors/connector_tavily.py b/modules/connectors/connector_tavily.py
index 783fea8c..786dc1f1 100644
--- a/modules/connectors/connector_tavily.py
+++ b/modules/connectors/connector_tavily.py
@@ -7,6 +7,11 @@ from modules.interfaces.interface_web_model import (
     WebCrawlBase,
     WebCrawlDocumentData,
     WebCrawlRequest,
+    WebScrapeActionDocument,
+    WebScrapeActionResult,
+    WebScrapeBase,
+    WebScrapeDocumentData,
+    WebScrapeRequest,
     WebSearchBase,
     WebSearchRequest,
     WebSearchActionResult,
@@ -25,7 +30,19 @@ logger = logging.getLogger(__name__)
 
 
 @dataclass
-class ConnectorTavily(WebSearchBase, WebCrawlBase):
+class TavilySearchResult:
+    title: str
+    url: str
+
+
+@dataclass
+class TavilyCrawlResult:
+    url: str
+    content: str
+
+
+@dataclass
+class ConnectorTavily(WebSearchBase, WebCrawlBase, WebScrapeBase):
     client: AsyncTavilyClient = None
 
     @classmethod
@@ -67,7 +84,30 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase):
 
         return result
 
-    async def _search(self, query: str, max_results: int) -> WebSearchActionResult:
+    async def scrape(self, request: WebScrapeRequest) -> WebScrapeActionResult:
+        """Turns a query in a list of urls with extracted content."""
+        # Step 1: Search
+        try:
+            search_results = await self._search(request.query, request.max_results)
+        except Exception as e:
+            return WebScrapeActionResult(success=False, error=str(e))
+
+        # Step 2: Crawl
+        try:
+            urls = [result.url for result in search_results]
+            crawl_results = await self._crawl(urls)
+        except Exception as e:
+            return WebScrapeActionResult(success=False, error=str(e))
+
+        # Step 3: Build ActionResult
+        try:
+            result = self._build_scrape_action_result(crawl_results)
+        except Exception as e:
+            return WebScrapeActionResult(success=False, error=str(e))
+
+        return result
+
+    async def _search(self, query: str, max_results: int) -> list[TavilySearchResult]:
         """Calls the Tavily API to perform a web search."""
         # Make sure max_results is within the allowed range
         if max_results < 0 or max_results > 20:
@@ -78,18 +118,19 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase):
 
         logger.info(f"Tavily API response:\n{response}")
 
-        return response["results"]
+        return [
+            TavilySearchResult(title=result["title"], url=result["url"])
+            for result in response["results"]
+        ]
 
     def _build_search_action_result(
-        self, search_results: list
+        self, search_results: list[TavilySearchResult]
     ) -> WebSearchActionResult:
         """Builds the ActionResult from the search results."""
         documents = []
         for result in search_results:
             document_name = f"web_search_{get_utc_timestamp()}.txt"
-            document_data = WebSearchDocumentData(
-                title=result["title"], url=result["url"]
-            )
+            document_data = WebSearchDocumentData(title=result.title, url=result.url)
             mime_type = "application/json"
             doc = WebSearchActionDocument(
                 documentName=document_name,
@@ -107,9 +148,14 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase):
         response = await self.client.extract(
             urls=urls, extract_depth="advanced", format="text"
         )
-        return response["results"]
+        return [
+            TavilyCrawlResult(url=result["url"], content=result["raw_content"])
+            for result in response["results"]
+        ]
 
-    def _build_crawl_action_result(self, crawl_results: list) -> WebCrawlActionResult:
+    def _build_crawl_action_result(
+        self, crawl_results: list[TavilyCrawlResult]
+    ) -> WebCrawlActionResult:
         """Builds the ActionResult from the crawl results."""
         documents = []
         for result in crawl_results:
@@ -128,3 +174,23 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase):
         return WebCrawlActionResult(
             success=True, documents=documents, resultLabel="web_crawl_results"
         )
+
+    def _build_scrape_action_result(
+        self, crawl_results: list[TavilyCrawlResult]
+    ) -> WebScrapeActionResult:
+        """Builds the ActionResult from the scrape results."""
+        documents = []
+        for result in crawl_results:
+            document_name = f"web_scrape_{get_utc_timestamp()}.txt"
+            doc_data = WebScrapeDocumentData(url=result.url, content=result.content)
+            mime_type = "application/json"
+            doc = WebScrapeActionDocument(
+                documentName=document_name,
+                documentData=doc_data,
+                mimeType=mime_type,
+            )
+            documents.append(doc)
+
+        return WebScrapeActionResult(
+            success=True, documents=documents, resultLabel="web_scrape_results"
+        )
diff --git a/modules/interfaces/interface_web_model.py b/modules/interfaces/interface_web_model.py
index 0a258623..389cd7ed 100644
--- a/modules/interfaces/interface_web_model.py
+++ b/modules/interfaces/interface_web_model.py
@@ -65,6 +65,31 @@ class WebCrawlBase(ABC):
     async def crawl_urls(self, request: WebCrawlRequest) -> WebCrawlActionResult: ...
 
 
-# --- Web query ---
+# --- Web scrape ---
 
-# query -> list of extracted text; combines web search and crawl in one step
+# scrape -> list of extracted text; combines web search and crawl in one step
+
+
+class WebScrapeRequest(BaseModel):
+    query: str
+    max_results: int
+
+
+class WebScrapeDocumentData(BaseModel):
+    url: str
+    content: str
+
+
+class WebScrapeActionDocument(ActionDocument):
+    documentData: WebScrapeDocumentData = Field(
+        description="The data extracted from a single scraped URL"
+    )
+
+
+class WebScrapeActionResult(ActionResult):
+    documents: List[WebScrapeActionDocument] = Field(default_factory=list)
+
+
+class WebScrapeBase(ABC):
+    @abstractmethod
+    async def scrape(self, request: WebScrapeRequest) -> WebScrapeActionResult: ...
diff --git a/modules/interfaces/interface_web_objects.py b/modules/interfaces/interface_web_objects.py
index b38db6a3..0ea43bd7 100644
--- a/modules/interfaces/interface_web_objects.py
+++ b/modules/interfaces/interface_web_objects.py
@@ -1,6 +1,10 @@
 from modules.interfaces.interface_web_model import (
+    WebCrawlActionResult,
     WebSearchActionResult,
     WebSearchRequest,
+    WebCrawlRequest,
+    WebScrapeActionResult,
+    WebScrapeRequest,
 )
 
 from dataclasses import dataclass
@@ -22,3 +26,13 @@ class WebInterface:
     ) -> WebSearchActionResult:
         # NOTE: Add connectors here
         return await self.connector_tavily.search_urls(web_search_request)
+
+    async def crawl(self, web_crawl_request: WebCrawlRequest) -> WebCrawlActionResult:
+        # NOTE: Add connectors here
+        return await self.connector_tavily.crawl_urls(web_crawl_request)
+
+    async def scrape(
+        self, web_scrape_request: WebScrapeRequest
+    ) -> WebScrapeActionResult:
+        # NOTE: Add connectors here
+        return await self.connector_tavily.scrape(web_scrape_request)

From 4c3592d7d9aaa7c811a5afa54283a75ecec14ce8 Mon Sep 17 00:00:00 2001
From: Christopher Gondek <gondek.christopher@gmail.com>
Date: Mon, 1 Sep 2025 11:21:37 +0200
Subject: [PATCH 08/17] feat: switch to single file approach

---
 modules/connectors/connector_tavily.py    | 115 +++++++++-------
 modules/interfaces/interface_web_model.py |  42 +++++-
 modules/methods/method_web.py             | 160 +++++++++++++++++++++-
 3 files changed, 261 insertions(+), 56 deletions(-)

diff --git a/modules/connectors/connector_tavily.py b/modules/connectors/connector_tavily.py
index 786dc1f1..af802790 100644
--- a/modules/connectors/connector_tavily.py
+++ b/modules/connectors/connector_tavily.py
@@ -7,16 +7,19 @@ from modules.interfaces.interface_web_model import (
     WebCrawlBase,
     WebCrawlDocumentData,
     WebCrawlRequest,
+    WebCrawlResultItem,
     WebScrapeActionDocument,
     WebScrapeActionResult,
     WebScrapeBase,
     WebScrapeDocumentData,
     WebScrapeRequest,
+    WebScrapeResultItem,
     WebSearchBase,
     WebSearchRequest,
     WebSearchActionResult,
     WebSearchActionDocument,
     WebSearchDocumentData,
+    WebSearchResultItem,
     WebCrawlActionDocument,
     WebCrawlActionResult,
 )
@@ -62,7 +65,7 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase, WebScrapeBase):
 
         # Step 2: Build ActionResult
         try:
-            result = self._build_search_action_result(search_results)
+            result = self._build_search_action_result(search_results, request.query)
         except Exception as e:
             return WebSearchActionResult(success=False, error=str(e))
 
@@ -78,7 +81,7 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase, WebScrapeBase):
 
         # Step 2: Build ActionResult
         try:
-            result = self._build_crawl_action_result(crawl_results)
+            result = self._build_crawl_action_result(crawl_results, request.urls)
         except Exception as e:
             return WebCrawlActionResult(success=False, error=str(e))
 
@@ -101,7 +104,7 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase, WebScrapeBase):
 
         # Step 3: Build ActionResult
         try:
-            result = self._build_scrape_action_result(crawl_results)
+            result = self._build_scrape_action_result(crawl_results, request.query)
         except Exception as e:
             return WebScrapeActionResult(success=False, error=str(e))
 
@@ -124,26 +127,32 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase, WebScrapeBase):
         ]
 
     def _build_search_action_result(
-        self, search_results: list[TavilySearchResult]
+        self, search_results: list[TavilySearchResult], query: str = ""
     ) -> WebSearchActionResult:
         """Builds the ActionResult from the search results."""
-        documents = []
-        for result in search_results:
-            document_name = f"web_search_{get_utc_timestamp()}.txt"
-            document_data = WebSearchDocumentData(title=result.title, url=result.url)
-            mime_type = "application/json"
-            doc = WebSearchActionDocument(
-                documentName=document_name,
-                documentData=document_data,
-                mimeType=mime_type,
-            )
-            documents.append(doc)
+        # Convert to result items
+        result_items = [
+            WebSearchResultItem(title=result.title, url=result.url)
+            for result in search_results
+        ]
 
-        return WebSearchActionResult(
-            success=True, documents=documents, resultLabel="web_search_results"
+        # Create document data with all results
+        document_data = WebSearchDocumentData(
+            query=query, results=result_items, total_count=len(result_items)
         )
 
-    async def _crawl(self, urls: list) -> list[str]:
+        # Create single document
+        document = WebSearchActionDocument(
+            documentName=f"web_search_results_{get_utc_timestamp()}.json",
+            documentData=document_data,
+            mimeType="application/json",
+        )
+
+        return WebSearchActionResult(
+            success=True, documents=[document], resultLabel="web_search_results"
+        )
+
+    async def _crawl(self, urls: list) -> list[TavilyCrawlResult]:
         """Calls the Tavily API to extract text content from URLs."""
         response = await self.client.extract(
             urls=urls, extract_depth="advanced", format="text"
@@ -154,43 +163,57 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase, WebScrapeBase):
         ]
 
     def _build_crawl_action_result(
-        self, crawl_results: list[TavilyCrawlResult]
+        self, crawl_results: list[TavilyCrawlResult], urls: list[str] = None
     ) -> WebCrawlActionResult:
         """Builds the ActionResult from the crawl results."""
-        documents = []
-        for result in crawl_results:
-            document_name = f"web_crawl_{get_utc_timestamp()}.txt"
-            doc_data = WebCrawlDocumentData(
-                url=result["url"], content=result["raw_content"]
-            )
-            mime_type = "application/json"
-            doc = WebCrawlActionDocument(
-                documentName=document_name,
-                documentData=doc_data,
-                mimeType=mime_type,
-            )
-            documents.append(doc)
+        # Convert to result items
+        result_items = [
+            WebCrawlResultItem(url=result.url, content=result.content)
+            for result in crawl_results
+        ]
+
+        # Create document data with all results
+        document_data = WebCrawlDocumentData(
+            urls=urls or [result.url for result in crawl_results],
+            results=result_items,
+            total_count=len(result_items),
+        )
+
+        # Create single document
+        document = WebCrawlActionDocument(
+            documentName=f"web_crawl_results_{get_utc_timestamp()}.json",
+            documentData=document_data,
+            mimeType="application/json",
+        )
 
         return WebCrawlActionResult(
-            success=True, documents=documents, resultLabel="web_crawl_results"
+            success=True, documents=[document], resultLabel="web_crawl_results"
         )
 
     def _build_scrape_action_result(
-        self, crawl_results: list[TavilyCrawlResult]
+        self, crawl_results: list[TavilyCrawlResult], query: str = ""
     ) -> WebScrapeActionResult:
         """Builds the ActionResult from the scrape results."""
-        documents = []
-        for result in crawl_results:
-            document_name = f"web_scrape_{get_utc_timestamp()}.txt"
-            doc_data = WebScrapeDocumentData(url=result.url, content=result.content)
-            mime_type = "application/json"
-            doc = WebScrapeActionDocument(
-                documentName=document_name,
-                documentData=doc_data,
-                mimeType=mime_type,
-            )
-            documents.append(doc)
+        # Convert to result items
+        result_items = [
+            WebScrapeResultItem(url=result.url, content=result.content)
+            for result in crawl_results
+        ]
+
+        # Create document data with all results
+        document_data = WebScrapeDocumentData(
+            query=query,
+            results=result_items,
+            total_count=len(result_items),
+        )
+
+        # Create single document
+        document = WebScrapeActionDocument(
+            documentName=f"web_scrape_results_{get_utc_timestamp()}.json",
+            documentData=document_data,
+            mimeType="application/json",
+        )
 
         return WebScrapeActionResult(
-            success=True, documents=documents, resultLabel="web_scrape_results"
+            success=True, documents=[document], resultLabel="web_scrape_results"
         )
diff --git a/modules/interfaces/interface_web_model.py b/modules/interfaces/interface_web_model.py
index 389cd7ed..86f19e08 100644
--- a/modules/interfaces/interface_web_model.py
+++ b/modules/interfaces/interface_web_model.py
@@ -2,8 +2,6 @@
 
 from abc import ABC, abstractmethod
 from modules.interfaces.interfaceChatModel import ActionDocument, ActionResult
-
-
 from pydantic import BaseModel, Field
 from typing import List
 
@@ -18,11 +16,21 @@ class WebSearchRequest(BaseModel):
     max_results: int
 
 
-class WebSearchDocumentData(BaseModel):
+class WebSearchResultItem(BaseModel):
+    """Individual search result"""
+
     title: str
     url: str
 
 
+class WebSearchDocumentData(BaseModel):
+    """Complete search results document"""
+
+    query: str
+    results: List[WebSearchResultItem]
+    total_count: int
+
+
 class WebSearchActionDocument(ActionDocument):
     documentData: WebSearchDocumentData
 
@@ -45,14 +53,24 @@ class WebCrawlRequest(BaseModel):
     urls: List[str]
 
 
-class WebCrawlDocumentData(BaseModel):
+class WebCrawlResultItem(BaseModel):
+    """Individual crawl result"""
+
     url: str
     content: str
 
 
+class WebCrawlDocumentData(BaseModel):
+    """Complete crawl results document"""
+
+    urls: List[str]
+    results: List[WebCrawlResultItem]
+    total_count: int
+
+
 class WebCrawlActionDocument(ActionDocument):
     documentData: WebCrawlDocumentData = Field(
-        description="The data extracted from a single crawled URL"
+        description="The data extracted from crawled URLs"
     )
 
 
@@ -75,14 +93,24 @@ class WebScrapeRequest(BaseModel):
     max_results: int
 
 
-class WebScrapeDocumentData(BaseModel):
+class WebScrapeResultItem(BaseModel):
+    """Individual scrape result"""
+
     url: str
     content: str
 
 
+class WebScrapeDocumentData(BaseModel):
+    """Complete scrape results document"""
+
+    query: str
+    results: List[WebScrapeResultItem]
+    total_count: int
+
+
 class WebScrapeActionDocument(ActionDocument):
     documentData: WebScrapeDocumentData = Field(
-        description="The data extracted from a single scraped URL"
+        description="The data extracted from scraped URLs"
     )
 
 
diff --git a/modules/methods/method_web.py b/modules/methods/method_web.py
index 27b82ba5..ccb0f185 100644
--- a/modules/methods/method_web.py
+++ b/modules/methods/method_web.py
@@ -3,7 +3,11 @@ from typing import Any, Dict
 from modules.chat.methodBase import MethodBase, action
 from modules.interfaces.interfaceChatModel import ActionResult
 from modules.interfaces.interface_web_objects import WebInterface
-from modules.interfaces.interface_web_model import WebSearchRequest
+from modules.interfaces.interface_web_model import (
+    WebSearchRequest,
+    WebCrawlRequest,
+    WebScrapeRequest,
+)
 
 
 logger = logging.getLogger(__name__)
@@ -14,11 +18,14 @@ class MethodWeb(MethodBase):
 
     def __init__(self, serviceCenter: Any):
         super().__init__(serviceCenter)
+        self.name = "web"
+        self.description = "Web search, crawling, and scraping operations using Tavily"
 
     @action
     async def search(self, parameters: Dict[str, Any]) -> ActionResult:
-        """
-        Perform a web search and output a .txt file with a plain list of URLs (one per line).
+        """Perform a web search and outputs a .json file with a list of found URLs.
+
+        Each result contains "title" and "url".
 
         Parameters:
             query (str): Search query to perform
@@ -41,3 +48,150 @@ class MethodWeb(MethodBase):
 
         except Exception as e:
             return ActionResult(success=False, error=str(e))
+
+    @action
+    async def crawl(self, parameters: Dict[str, Any]) -> ActionResult:
+        """Crawls a list of URLs and extracts information from them.
+
+        Parameters:
+            document (str): Document reference containing URL list from search results
+            expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
+        """
+        try:
+            document_ref = parameters.get("document")
+
+            if not document_ref:
+                return ActionResult(
+                    success=False, error="No document reference provided."
+                )
+
+            # Resolve document reference to ChatDocument objects
+            chat_documents = self.service.getChatDocumentsFromDocumentList(
+                [document_ref]
+            )
+
+            if not chat_documents:
+                return ActionResult(
+                    success=False,
+                    error=f"No documents found for reference: {document_ref}",
+                )
+
+            # Get the first document (search results)
+            search_doc = chat_documents[0]
+
+            # Get file data using the service center
+            file_data = self.service.getFileData(search_doc.fileId)
+            if not file_data:
+                return ActionResult(
+                    success=False, error="Could not retrieve file data for document"
+                )
+
+            content = file_data.decode("utf-8")
+
+            # Parse JSON to extract URLs from search results
+            import json
+
+            try:
+                # The document structure from WebSearchActionResult
+                search_data = json.loads(content)
+
+                # Extract URLs from the search results structure
+                urls = []
+                if isinstance(search_data, dict):
+                    # Handle the document structure: documentData contains the actual search results
+                    doc_data = search_data.get("documentData", search_data)
+                    if "results" in doc_data and isinstance(doc_data["results"], list):
+                        urls = [
+                            result["url"]
+                            for result in doc_data["results"]
+                            if isinstance(result, dict) and "url" in result
+                        ]
+                    elif "urls" in doc_data and isinstance(doc_data["urls"], list):
+                        # Fallback: if URLs are stored directly in a 'urls' field
+                        urls = [url for url in doc_data["urls"] if isinstance(url, str)]
+
+                # Fallback: try to parse as plain text with regex (for backward compatibility)
+                if not urls:
+                    logger.warning(
+                        "Could not extract URLs from JSON structure, trying plain text parsing"
+                    )
+                    import re
+
+                    urls = re.split(r"[\n,;]+", content)
+                    urls = [
+                        u.strip()
+                        for u in urls
+                        if u.strip()
+                        and (
+                            u.strip().startswith("http://")
+                            or u.strip().startswith("https://")
+                        )
+                    ]
+
+            except json.JSONDecodeError:
+                # Fallback to plain text parsing if JSON parsing fails
+                logger.warning("Document is not valid JSON, trying plain text parsing")
+                import re
+
+                urls = re.split(r"[\n,;]+", content)
+                urls = [
+                    u.strip()
+                    for u in urls
+                    if u.strip()
+                    and (
+                        u.strip().startswith("http://")
+                        or u.strip().startswith("https://")
+                    )
+                ]
+
+            if not urls:
+                return ActionResult(
+                    success=False, error="No valid URLs found in the document."
+                )
+
+            logger.info(f"Extracted {len(urls)} URLs from document: {urls}")
+
+            # Prepare request data
+            web_crawl_request = WebCrawlRequest(urls=urls)
+
+            # Perform request
+            web_interface = await WebInterface.create()
+            web_crawl_result = await web_interface.crawl(web_crawl_request)
+
+            return web_crawl_result
+
+        except Exception as e:
+            logger.error(f"Error in crawl method: {str(e)}")
+            return ActionResult(success=False, error=str(e))
+
+    @action
+    async def scrape(self, parameters: Dict[str, Any]) -> ActionResult:
+        """Scrapes web content by searching for URLs and then extracting their content.
+
+        Combines search and crawl operations in one step.
+
+        Parameters:
+            query (str): Search query to perform
+            maxResults (int, optional): Maximum number of results (default: 10)
+        """
+        try:
+            query = parameters.get("query")
+            max_results = parameters.get("maxResults", 10)
+
+            if not query:
+                return ActionResult(success=False, error="Search query is required")
+
+            # Prepare request data
+            web_scrape_request = WebScrapeRequest(
+                query=query,
+                max_results=max_results,
+            )
+
+            # Perform request
+            web_interface = await WebInterface.create()
+            web_scrape_result = await web_interface.scrape(web_scrape_request)
+
+            return web_scrape_result
+
+        except Exception as e:
+            return ActionResult(success=False, error=str(e))

From cfc83a7f42d990a391ba6a3d469f13ce089892e4 Mon Sep 17 00:00:00 2001
From: Christopher Gondek <gondek.christopher@gmail.com>
Date: Mon, 1 Sep 2025 15:36:32 +0200
Subject: [PATCH 09/17] chore: add tests

---
 modules/connectors/connector_tavily.py    |   6 +-
 tests/connectors/test_connector_tavily.py |  72 +++++++-
 tests/fixtures/tavily_responses.py        |  26 ++-
 tests/methods/test_method_web.py          | 196 ++++++++++++++++++++--
 4 files changed, 286 insertions(+), 14 deletions(-)

diff --git a/modules/connectors/connector_tavily.py b/modules/connectors/connector_tavily.py
index af802790..8a05e781 100644
--- a/modules/connectors/connector_tavily.py
+++ b/modules/connectors/connector_tavily.py
@@ -119,7 +119,7 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase, WebScrapeBase):
         # Perform actual API call
         response = await self.client.search(query=query, max_results=max_results)
 
-        logger.info(f"Tavily API response:\n{response}")
+        logger.info(f"Tavily API search response:\n{response}")
 
         return [
             TavilySearchResult(title=result["title"], url=result["url"])
@@ -157,6 +157,10 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase, WebScrapeBase):
         response = await self.client.extract(
             urls=urls, extract_depth="advanced", format="text"
         )
+
+        # Log the result
+        logger.info(f"Tavily API extract (crawl) response:\n{response}")
+
         return [
             TavilyCrawlResult(url=result["url"], content=result["raw_content"])
             for result in response["results"]
diff --git a/tests/connectors/test_connector_tavily.py b/tests/connectors/test_connector_tavily.py
index 3b23f69a..81ce64c3 100644
--- a/tests/connectors/test_connector_tavily.py
+++ b/tests/connectors/test_connector_tavily.py
@@ -4,7 +4,11 @@ import pytest
 import logging
 
 from modules.interfaces.interfaceChatModel import ActionResult
-from modules.interfaces.interface_web_model import WebSearchRequest
+from modules.interfaces.interface_web_model import (
+    WebSearchRequest,
+    WebCrawlRequest,
+    WebScrapeRequest,
+)
 from modules.connectors.connector_tavily import ConnectorTavily
 
 logger = logging.getLogger(__name__)
@@ -13,7 +17,7 @@ logger = logging.getLogger(__name__)
 @pytest.mark.asyncio
 @pytest.mark.expensive
 async def test_tavily_connector_search_test_live_api():
-    logger.info("Testing Tavliy connector with live API calls")
+    logger.info("Testing Tavliy connector search with live API calls")
 
     # Test request
     request = WebSearchRequest(query="How old is the Earth?", max_results=5)
@@ -38,3 +42,67 @@ async def test_tavily_connector_search_test_live_api():
         logger.info(f" - Document Name: {doc.documentName}")
         logger.info(f" - Document Mime Type: {doc.mimeType}")
         logger.info(f" - Document Data: {doc.documentData}")
+
+
+@pytest.mark.asyncio
+@pytest.mark.expensive
+async def test_tavily_connector_crawl_test_live_api():
+    logger.info("Testing Tavily connector crawl with live API calls")
+
+    # Test request
+    urls = [
+        "https://en.wikipedia.org/wiki/Earth",
+        "https://valueon.ch",
+    ]
+    request = WebCrawlRequest(urls=urls)
+
+    # Tavily instance
+    connector_tavily = await ConnectorTavily.create()
+
+    # Crawl test
+    action_result = await connector_tavily.crawl_urls(request=request)
+
+    # Check results
+    assert isinstance(action_result, ActionResult)
+
+    logger.info("=" * 20)
+    logger.info(f"Action result success status: {action_result.success}")
+    logger.info(f"Action result error: {action_result.error}")
+    logger.info(f"Action result label: {action_result.resultLabel}")
+
+    logger.info("Documents:")
+    for doc in action_result.documents:
+        logger.info("-" * 10)
+        logger.info(f" - Document Name: {doc.documentName}")
+        logger.info(f" - Document Mime Type: {doc.mimeType}")
+        logger.info(f" - Document Data: {doc.documentData}")
+
+
+@pytest.mark.asyncio
+@pytest.mark.expensive
+async def test_tavily_connector_scrape_test_live_api():
+    logger.info("Testing Tavily connector scrape with live API calls")
+
+    # Test request with query
+    request = WebScrapeRequest(query="How old is the Earth?", max_results=3)
+
+    # Tavily instance
+    connector_tavily = await ConnectorTavily.create()
+
+    # Scrape test
+    action_result = await connector_tavily.scrape(request=request)
+
+    # Check results
+    assert isinstance(action_result, ActionResult)
+
+    logger.info("=" * 20)
+    logger.info(f"Action result success status: {action_result.success}")
+    logger.info(f"Action result error: {action_result.error}")
+    logger.info(f"Action result label: {action_result.resultLabel}")
+
+    logger.info("Documents:")
+    for doc in action_result.documents:
+        logger.info("-" * 10)
+        logger.info(f" - Document Name: {doc.documentName}")
+        logger.info(f" - Document Mime Type: {doc.mimeType}")
+        logger.info(f" - Document Data: {doc.documentData}")
diff --git a/tests/fixtures/tavily_responses.py b/tests/fixtures/tavily_responses.py
index 789f62f0..ab94d353 100644
--- a/tests/fixtures/tavily_responses.py
+++ b/tests/fixtures/tavily_responses.py
@@ -1,6 +1,6 @@
 """Sample tavily responses for patching responses in tests."""
 
-RESPONSE_HOW_OLD_IS_EARTH_NO_ANSWER = {
+RESPONSE_SEARCH_HOW_OLD_IS_EARTH_NO_ANSWER = {
     "query": "How old is the earth",
     "follow_up_questions": None,
     "answer": None,
@@ -45,3 +45,27 @@ RESPONSE_HOW_OLD_IS_EARTH_NO_ANSWER = {
     "response_time": 0.96,
     "request_id": "3c36cccd-0918-49fd-bd1c-23c62ba7ec2d",
 }
+
+
+RESPONSE_EXTRACT_HOW_OLD_IS_EARTH_NO_ANSWER = {
+    "results": [
+        {
+            "url": "https://en.wikipedia.org/wiki/Age_of_Earth",
+            "raw_content": 'Jump to content\nAge of Earth\n\nAfrikaans\nالعربية\nAzərbaycanca\nবাংলা\nБеларуская\nБългарски\nCatalà\nČeština\nDansk\nΕλληνικά\nEspañol\nEsperanto\nEuskara\nفارسی\nFrançais\nGalego\n한국어\nՀայերեն\nBahasa Indonesia\nItaliano\nעברית\nҚазақша\nLatina\nLëtzebuergesch\nLietuvių\nBahasa Melayu\nNederlands\n日本語\nپښتو\nPortuguês\nRomnă\nРусский\nSimple English\nSlovenčina\nSlovenščina\nСрпски / srpski\nSrpskohrvatski / српскохрватски\nSvenska\nTürkçe\nУкраїнська\nاردو\nTiếng Việt\n文言\nYorùbá\n粵語\n中文\n\nEdit links\nFrom Wikipedia, the free encyclopedia\nScientific dating of the age of Earth\nThe age of Earth is estimated to be 4.54 ± 0.05 billion years. This age represents the final stages of Earth\'s accretion and planetary differentiation. Age estimates are based on evidence from radiometric age-dating of meteoritic material—consistent with the radiometric ages of the oldest-known terrestrial material and lunar samples—and astrophysical accretion models consistent with observations of planet formation in protoplanetary disks.\nFollowing the development of radiometric dating in the early 20th century, measurements of lead in uranium-rich minerals showed that some were in excess of a billion years old. The oldest such minerals analyzed to date—small crystals of zircon from the Jack Hills of Western Australia—are at least 4.404 billion years old. Calcium–aluminium-rich inclusions—the oldest known solid constituents within meteorites that are formed within the Solar System—are 4.5673 ± 0.00016 billion years old giving a lower limit for the age of the Solar System.\nIt is hypothesized that the accretion of Earth began soon after the formation of the calcium-aluminium-rich inclusions. Because the duration of this accretion process is not yet adequately constrained—predictions from different accretion models range from around 30 million to 100 million years—the difference between the age of Earth and of the oldest rocks is difficult to determine. 
It can also be difficult to determine the exact age of the oldest rocks on Earth, exposed at the surface, as they are aggregates of minerals of possibly different ages.\nDevelopment of modern geologic concepts\n|  |  |  |\n --- \n| Life timeline | | |\n| This box:    view  talk  edit | | |\n| −4500 —  –  —  –  −4000 —  –  —  –  −3500 —  –  —  –  −3000 —  –  —  –  −2500 —  –  —  –  −2000 —  –  —  –  −1500 —  –  —  –  −1000 —  –  —  –  −500 —  –  —  –  0 — | Water Single-celled life Photosynthesis Multicellular life Plants Arthropods Molluscs Flowers Dinosaurs Mammals Birds Primates Hadean Archean Proterozoic Phanerozoic | |  |  |  --- | | ← | Earth formed |  |  |  |  --- | | ← | Earliest water |  |  |  |  --- | | ← | LUCA |  |  |  |  --- | | ← | Earliest fossils |  |  |  |  --- | | ← | Atmospheric oxygen |  |  |  |  --- | | ← | Sexual reproduction |  |  |  |  --- | | ← | Earliest fungi |  |  |  |  --- | | ← | Neoproterozoic oxygenation event |  |  |  |  --- | | ← | Ediacaran biota |  |  |  |  --- | | ← | Cambrian explosion |  |  |  |  --- | | ← | Earliest tetrapods |  |  |  |  --- | | ← | Earliest hominoid | |\n| (million years ago) | | |\nMain article: History of geology\nFurther information: Relative dating\nStudies of strata—the layering of rocks and soil—gave naturalists an appreciation that Earth may have been through many changes during its existence. These layers often contained fossilized remains of unknown creatures, leading some to interpret a progression of organisms from layer to layer.\nNicolas Steno in the 17th century was one of the first naturalists to appreciate the connection between fossil remains and strata. His observations led him to formulate important stratigraphic concepts (i.e., the "law of superposition" and the "principle of original horizontality"). In the 1790s, William Smith hypothesized that if two layers of rock at widely differing locations contained similar fossils, then it was very plausible that the layers were the same age. 
Smith\'s nephew and student, John Phillips, later calculated by such means that Earth was about 96 million years old.\nIn the mid-18th century, the naturalist Mikhail Lomonosov suggested that Earth had been created separately from, and several hundred thousand years before, the rest of the universe.[citation needed] Lomonosov\'s ideas were mostly speculative.[citation needed] In 1779 the Comte du Buffon tried to obtain a value for the age of Earth using an experiment: he created a small globe that resembled Earth in composition and then measured its rate of cooling. This led him to estimate that Earth was about 75,000 years old. Even earlier, in 1687, in his Principia, the mathematician and physicist Isaac Newton was the first to calculate the age of the Earth by experiment, coming to a conclusion of 50,000 years.\nOther naturalists used these hypotheses to construct a history of Earth, though their timelines were inexact as they did not know how long it took to lay down stratigraphic layers. In 1830, geologist Charles Lyell, developing ideas found in James Hutton\'s works, popularized the concept that the features of Earth were in perpetual change, eroding and reforming continuously, and the rate of this change was roughly constant. This was a challenge to the traditional view, which saw the history of Earth as dominated by intermittent catastrophes. Many naturalists were influenced by Lyell to become "uniformitarians" who believed that changes were constant and uniform.[citation needed]\nEarly calculations\nFurther information: William Thomson, 1st Baron Kelvin § Age of the Earth: geology\nIn 1862, the physicist William Thomson, 1st Baron Kelvin published calculations that fixed the age of Earth at between 20 million and 400 million years. He assumed that Earth had formed as a completely molten object, and determined the amount of time it would take for the near-surface temperature gradient to decrease to its present value. 
His calculations did not account for heat produced via radioactive decay (a then unknown process) or, more significantly, convection inside Earth, which allows the temperature in the upper mantle to remain high much longer, maintaining a high thermal gradient in the crust much longer. Even more constraining were Thomson\'s estimates of the age of the Sun, which were based on estimates of its thermal output and a theory that the Sun obtains its energy from gravitational collapse; Thomson estimated that the Sun is about 20 million years old.\nGeologists such as Lyell had difficulty accepting such a short age for Earth. For biologists, even 100 million years seemed much too short to be plausible. In Charles Darwin\'s theory of evolution, the process of random heritable variation with cumulative selection requires great durations of time, and Darwin stated that Thomson\'s estimates did not appear to provide enough time. According to modern biology, the total evolutionary history from the beginning of life to today has taken place since 3.5 to 3.8 billion years ago, the amount of time which passed since the last universal ancestor of all living organisms as shown by geological dating.\nIn a lecture in 1869, Darwin\'s great advocate, Thomas Henry Huxley, attacked Thomson\'s calculations, suggesting they appeared precise in themselves but were based on faulty assumptions. The physicist Hermann von Helmholtz (in 1856) and astronomer Simon Newcomb (in 1892) contributed their own calculations of 22 and 18 million years, respectively, to the debate: they independently calculated the amount of time it would take for the Sun to condense down to its current diameter and brightness from the nebula of gas and dust from which it was born. Their values were consistent with Thomson\'s calculations. However, they assumed that the Sun was only glowing from the heat of its gravitational contraction. 
The process of solar nuclear fusion was not yet known to science.\nIn 1892, Thomson was ennobled as Lord Kelvin in appreciation of his many scientific accomplishments. In 1895 John Perry challenged Kelvin\'s figure on the basis of his assumptions on conductivity, and Oliver Heaviside entered the dialogue, considering it "a vehicle to display the ability of his operator method to solve problems of astonishing complexity." Other scientists backed up Kelvin\'s figures. Darwin\'s son, the astronomer George H. Darwin, proposed that Earth and Moon had broken apart in their early days when they were both molten. He calculated the amount of time it would have taken for tidal friction to give Earth its current 24-hour day. His value of 56 million years was additional evidence that Thomson was on the right track. The last estimate Kelvin gave, in 1897, was: "that it was more than 20 and less than 40 million year old, and probably much nearer 20 than 40". In 1899 and 1900, John Joly calculated the rate at which the oceans should have accumulated salt from erosion processes and determined that the oceans were about 80 to 100 million years old.\nRadiometric dating\nMain article: Radiometric dating\nOverview\nBy their chemical nature, rock minerals contain certain elements and not others; but in rocks containing radioactive isotopes, the process of radioactive decay generates exotic elements over time. By measuring the concentration of the stable end product of the decay, coupled with knowledge of the half life and initial concentration of the decaying element, the age of the rock can be calculated. Typical radioactive end products are argon from decay of potassium-40, and lead from decay of uranium and thorium. If the rock becomes molten, as happens in Earth\'s mantle, such nonradioactive end products typically escape or are redistributed. 
Thus the age of the oldest terrestrial rock gives a minimum for the age of Earth, assuming that no rock has been intact for longer than Earth itself.\nConvective mantle and radioactivity\nThe discovery of radioactivity introduced another factor in the calculation. After Henri Becquerel\'s initial discovery in 1896, Marie and Pierre Curie discovered the radioactive elements polonium and radium in 1898; and in 1903, Pierre Curie and Albert Laborde announced that radium produces enough heat to melt its own weight in ice in less than an hour. Geologists quickly realized that this upset the assumptions underlying most calculations of the age of Earth. These had assumed that the original heat of Earth and the Sun had dissipated steadily into space, but radioactive decay meant that this heat had been continually replenished. George Darwin and John Joly were the first to point this out, in 1903.\nInvention of radiometric dating\nRadioactivity, which had overthrown the old calculations, yielded a bonus by providing a basis for new calculations, in the form of radiometric dating.\nErnest Rutherford and Frederick Soddy jointly had continued their work on radioactive materials and concluded that radioactivity was caused by a spontaneous transmutation of atomic elements. In radioactive decay, an element breaks down into another, lighter element, releasing alpha, beta, or gamma radiation in the process. They also determined that a particular isotope of a radioactive element decays into another element at a distinctive rate. This rate is given in terms of a "half-life", or the amount of time it takes half of a mass of that radioactive material to break down into its "decay product".\nSome radioactive materials have short half-lives; some have long half-lives. Uranium and thorium have long half-lives and so persist in Earth\'s crust, but radioactive elements with short half-lives have generally disappeared. 
This suggested that it might be possible to measure the age of Earth by determining the relative proportions of radioactive materials in geological samples. In reality, radioactive elements do not always decay into nonradioactive ("stable") elements directly, instead, decaying into other radioactive elements that have their own half-lives and so on, until they reach a stable element. These "decay chains", such as the uranium-radium and thorium series, were known within a few years of the discovery of radioactivity and provided a basis for constructing techniques of radiometric dating.\nThe pioneers of radioactivity were chemist Bertram B. Boltwood and physicist Rutherford. Boltwood had conducted studies of radioactive materials as a consultant, and when Rutherford lectured at Yale in 1904, Boltwood was inspired to describe the relationships between elements in various decay series. Late in 1904, Rutherford took the first step toward radiometric dating by suggesting that the alpha particles released by radioactive decay could be trapped in a rocky material as helium atoms. At the time, Rutherford was only guessing at the relationship between alpha particles and helium atoms, but he would prove the connection four years later.\nSoddy and Sir William Ramsay had just determined the rate at which radium produces alpha particles, and Rutherford proposed that he could determine the age of a rock sample by measuring its concentration of helium. He dated a rock in his possession to an age of 40 million years by this technique. Rutherford wrote of addressing a meeting of the Royal Institution in 1904:\n\nI came into the room, which was half dark, and presently spotted Lord Kelvin in the audience and realized that I was in trouble at the last part of my speech dealing with the age of the Earth, where my views conflicted with his. 
To my relief, Kelvin fell fast asleep, but as I came to the important point, I saw the old bird sit up, open an eye, and cock a baleful glance at me! Then a sudden inspiration came, and I said, "Lord Kelvin had limited the age of the Earth, provided no new source was discovered. That prophetic utterance refers to what we are now considering tonight, radium!" Behold! the old boy beamed upon me.\n\nRutherford assumed that the rate of decay of radium as determined by Ramsay and Soddy was accurate and that helium did not escape from the sample over time. Rutherford\'s scheme was inaccurate, but it was a useful first step. Boltwood focused on the end products of decay series. In 1905, he suggested that lead was the final stable product of the decay of radium. It was already known that radium was an intermediate product of the decay of uranium. Rutherford joined in, outlining a decay process in which radium emitted five alpha particles through various intermediate products to end up with lead, and speculated that the radium–lead decay chain could be used to date rock samples. Boltwood did the legwork and by the end of 1905 had provided dates for 26 separate rock samples, ranging from 92 to 570 million years. He did not publish these results, which was fortunate because they were flawed by measurement errors and poor estimates of the half-life of radium. Boltwood refined his work and finally published the results in 1907.\nBoltwood\'s paper pointed out that samples taken from comparable layers of strata had similar lead-to-uranium ratios, and that samples from older layers had a higher proportion of lead, except where there was evidence that lead had leached out of the sample. His studies were flawed by the fact that the decay series of thorium was not understood, which led to incorrect results for samples that contained both uranium and thorium. However, his calculations were far more accurate than any that had been performed to that time. 
Refinements in the technique would later give ages for Boltwood\'s 26 samples of 410 million to 2.2 billion years.\nArthur Holmes establishes radiometric dating\nAlthough Boltwood published his paper in a prominent geological journal, the geological community had little interest in radioactivity.[citation needed] Boltwood gave up work on radiometric dating and went on to investigate other decay series. Rutherford remained mildly curious about the issue of the age of Earth but did little work on it.\nRobert Strutt tinkered with Rutherford\'s helium method until 1910 and then ceased. However, Strutt\'s student Arthur Holmes became interested in radiometric dating and continued to work on it after everyone else had given up. Holmes focused on lead dating because he regarded the helium method as unpromising. He performed measurements on rock samples and concluded in 1911 that the oldest (a sample from Ceylon) was about 1.6 billion years old. These calculations were not particularly trustworthy. For example, he assumed that the samples had contained only uranium and no lead when they were formed.\nMore important research was published in 1913. It showed that elements generally exist in multiple variants with different masses, or "isotopes". In the 1930s, isotopes would be shown to have nuclei with differing numbers of the neutral particles known as "neutrons". In that same year, other research was published establishing the rules for radioactive decay, allowing more precise identification of decay series.\nMany geologists felt these new discoveries made radiometric dating so complicated as to be worthless.[citation needed] Holmes felt that they gave him tools to improve his techniques, and he plodded ahead with his research, publishing before and after the First World War. 
His work was generally ignored until the 1920s, though in 1917 Joseph Barrell, a professor of geology at Yale, redrew geological history as it was understood at the time to conform to Holmes\'s findings in radiometric dating. Barrell\'s research determined that the layers of strata had not all been laid down at the same rate, and so current rates of geological change could not be used to provide accurate timelines of the history of Earth.[citation needed]\nHolmes\' persistence finally began to pay off in 1921, when the speakers at the yearly meeting of the British Association for the Advancement of Science came to a rough consensus that Earth was a few billion years old and that radiometric dating was credible. Holmes published The Age of the Earth, an Introduction to Geological Ideas in 1927 in which he presented a range of 1.6 to 3.0 billion years. No great push to embrace radiometric dating followed, however, and the die-hards in the geological community stubbornly resisted. They had never cared for attempts by physicists to intrude in their domain, and had successfully ignored them so far. The growing weight of evidence finally tilted the balance in 1931, when the National Research Council of the US National Academy of Sciences decided to resolve the question of the age of Earth by appointing a committee to investigate.\nHolmes, being one of the few people who was trained in radiometric dating techniques, was a committee member and in fact wrote most of the final report. Thus, Holmes\' report concluded that radioactive dating was the only reliable means of pinning down a geologic time scale. Questions of bias were deflected by the great and exacting detail of the report. It described the methods used, the care with which measurements were made, and their error bars and limitations.[citation needed]\nModern radiometric dating\nRadiometric dating continues to be the predominant way scientists date geologic time scales. 
Techniques for radioactive dating have been tested and fine-tuned on an ongoing basis since the 1960s. Forty or so different dating techniques have been utilized to date, working on a wide variety of materials. Dates for the same sample using these different techniques are in very close agreement on the age of the material.[citation needed] Possible contamination problems do exist, but they have been studied and dealt with by careful investigation, leading to sample preparation procedures being minimized to limit the chance of contamination.[citation needed]\nUse of meteorites\nAn age of 4.55 ± 0.07 billion years, very close to today\'s accepted age, was determined by Clair Cameron Patterson using uranium–lead isotope dating (specifically lead–lead dating) on several meteorites including the Canyon Diablo meteorite and published in 1956. The quoted age of Earth is derived, in part, from the Canyon Diablo meteorite for several important reasons and is built upon a modern understanding of cosmochemistry built up over decades of research.\nMost geological samples from Earth are unable to give a direct date of the formation of Earth from the solar nebula because Earth has undergone differentiation into the core, mantle, and crust, and this has then undergone a long history of mixing and unmixing of these sample reservoirs by plate tectonics, weathering and hydrothermal circulation.\nAll of these processes may adversely affect isotopic dating mechanisms because the sample cannot always be assumed to have remained as a closed system, by which it is meant that either the parent or daughter nuclide (a species of atom characterised by the number of neutrons and protons an atom contains) or an intermediate daughter nuclide may have been partially removed from the sample, which will skew the resulting isotopic date. To mitigate this effect it is usual to date several minerals in the same sample, to provide an isochron. 
Alternatively, more than one dating system may be used on a sample to check the date.\nSome meteorites are furthermore considered to represent the primitive material from which the accreting solar disk was formed. Some have behaved as closed systems (for some isotopic systems) soon after the solar disk and the planets formed.[citation needed] To date, these assumptions are supported by much scientific observation and repeated isotopic dates, and it is certainly a more robust hypothesis than that which assumes a terrestrial rock has retained its original composition.\nNevertheless, ancient Archaean lead ores of galena have been used to date the formation of Earth as these represent the earliest formed lead-only minerals on the planet and record the earliest homogeneous lead–lead isotope systems on the planet. These have returned age dates of 4.54 billion years with a precision of as little as 1% margin for error.\nStatistics for several meteorites that have undergone isochron dating are as follows:\n| 1. St. Severin (ordinary chondrite) | | | |\n ---  --- |\n|  | 1. | Pb-Pb isochron | 4.543 ± 0.019 billion years |\n|  | 2. | Sm-Nd isochron | 4.55 ± 0.33 billion years |\n|  | 3. | Rb-Sr isochron | 4.51 ± 0.15 billion years |\n|  | 4. | Re-Os isochron | 4.68 ± 0.15 billion years |\n| 2. Juvinas (basaltic achondrite) | | | |\n|  | 1. | Pb-Pb isochron | 4.556 ± 0.012 billion years |\n|  | 2. | Pb-Pb isochron | 4.540 ± 0.001 billion years |\n|  | 3. | Sm-Nd isochron | 4.56 ± 0.08 billion years |\n|  | 4. | Rb-Sr isochron | 4.50 ± 0.07 billion years |\n| 3. Allende (carbonaceous chondrite) | | | |\n|  | 1. | Pb-Pb isochron | 4.553 ± 0.004 billion years |\n|  | 2. | Ar-Ar age spectrum | 4.52 ± 0.02 billion years |\n|  | 3. | Ar-Ar age spectrum | 4.55 ± 0.03 billion years |\n|  | 4. 
| Ar-Ar age spectrum | 4.56 ± 0.05 billion years |\nCanyon Diablo meteorite\nFurther information: Age of the Solar System and Canyon Diablo (meteorite)\nThe Canyon Diablo meteorite was used because it is both large and representative of a particularly rare type of meteorite that contains sulfide minerals (particularly troilite, FeS), metallic nickel-iron alloys, plus silicate minerals. This is important because the presence of the three mineral phases allows investigation of isotopic dates using samples that provide a great separation in concentrations between parent and daughter nuclides. This is particularly true of uranium and lead. Lead is strongly chalcophilic and is found in the sulfide at a much greater concentration than in the silicate, versus uranium. Because of this segregation in the parent and daughter nuclides during the formation of the meteorite, this allowed a much more precise date of the formation of the solar disk and hence the planets than ever before.\nThe age determined from the Canyon Diablo meteorite has been confirmed by hundreds of other age determinations, from both terrestrial samples and other meteorites. The meteorite samples, however, show a spread from 4.53 to 4.58 billion years ago. This is interpreted as the duration of formation of the solar nebula and its collapse into the solar disk to form the Sun and the planets. This 50 million year time span allows for accretion of the planets from the original solar dust and meteorites.\nThe Moon, as another extraterrestrial body that has not undergone plate tectonics and that has no atmosphere, provides quite precise age dates from the samples returned from the Apollo missions. Rocks returned from the Moon have been dated at a maximum of 4.51 billion years old. Martian meteorites that have landed upon Earth have also been dated to around 4.5 billion years old by lead–lead dating. 
Lunar samples, since they have not been disturbed by weathering, plate tectonics or material moved by organisms, can also provide dating by direct electron microscope examination of cosmic ray tracks. The accumulation of dislocations generated by high energy cosmic ray particle impacts provides another confirmation of the isotopic dates. Cosmic ray dating is only useful on material that has not been melted, since melting erases the crystalline structure of the material, and wipes away the tracks left by the particles.\nSee also\n\nWorld portal\n\nAge of the universe\n\nCreation myth\nGeochronology\nHistory of Earth\nNatural history\nOldest dated rocks\nTimeline of natural history\n\nReferences\n\n^ "Age of the Earth". U.S. Geological Survey. 1997. Archived from the original on 23 December 2005. Retrieved 2006-01-10.\n^ Dalrymple, G. Brent (2001). "The age of the Earth in the twentieth century: a problem (mostly) solved". Special Publications, Geological Society of London. 190 (1): 205–221. Bibcode:2001GSLSP.190..205D. doi:10.1144/GSL.SP.2001.190.01.14. S2CID 130092094.\n^ Manhesa, Gérard; Allègre, Claude J.; Dupréa, Bernard & Hamelin, Bruno (1980). "Lead isotope study of basic-ultrabasic layered complexes: Speculations about the age of the earth and primitive mantle characteristics". Earth and Planetary Science Letters. 47 (3): 370–382. Bibcode:1980E&PSL..47..370M. doi:10.1016/0012-821X(80)90024-2.\n^ Braterman, Paul S. (2013). "How Science Figured Out the Age of Earth". Scientific American. Archived from the original on 2016-04-12.\n^ a b Mezger, K.; Schönbächler, M.; Bouvier, A. (2020-03-04). "Accretion of the Earth—Missing Components?". Space Science Reviews. 216 (2): 27. doi:10.1007/s11214-020-00649-y. hdl:20.500.11850/405628. ISSN 1572-9672.\n^ Hedman, Matthew (2007). "9: Meteorites and the Age of the Solar System". The Age of Everything. University of Chicago Press. pp. 142–162. ISBN 9780226322940. Archived from the original on 2018-02-14.\n^ a b Wilde, S. 
A.; Valley, J. W.; Peck, W. H.; Graham C. M. (2001-01-11). "Evidence from detrital zircons for the existence of continental crust and oceans on the Earth 4.4 Gyr ago". Nature. 409 (6817): 175–178. Bibcode:2001Natur.409..175W. doi:10.1038/35051550. PMID 11196637. S2CID 4319774.\n^ Barboni, Melanie; Boehnke, Patrick; Keller, Brenhin; Kohl, Issaku E.; Schoene, Blair; Young, Edward D.; McKeegan, Kevin D. (2017-01-06). "Early formation of the Moon 4.51 billion years ago". Science Advances. 3 (1): e1602365. Bibcode:2017SciA....3E2365B. doi:10.1126/sciadv.1602365. ISSN 2375-2548. PMC 5226643. PMID 28097222.\n^ Halliday, Alex N.; Canup, Robin M. (2022-11-29). "The accretion of planet Earth". Nature Reviews Earth & Environment. 4 (1): 19–35. doi:10.1038/s43017-022-00370-0. ISSN 2662-138X.\n^ Pfalzner, S; Davies, M B; Gounelle, M; Johansen, A; Münker, C; Lacerda, P; Zwart, S Portegies; Testi, L; Trieloff, M; Veras, D (2015-06-01). "The formation of the solar system". Physica Scripta. 90 (6): 068001. arXiv:1501.03101. doi:10.1088/0031-8949/90/6/068001. ISSN 0031-8949.\n^ a b c Boltwood, B. B. (1907). "On the ultimate disintegration products of the radio-active elements. Part II. The disintegration products of uranium". American Journal of Science. 23 (134): 77–88. doi:10.2475/ajs.s4-23.134.78. S2CID 131688682.\n    For the abstract, see: Chemical Abstracts Service, American Chemical Society (1907). Chemical Abstracts. New York, London: American Chemical Society. p. 817. Retrieved 2008-12-19.\n^ Valley, John W.; Peck, William H.; Kin, Elizabeth M. (1999). "Zircons Are Forever" (PDF). The Outcrop, Geology Alumni Newsletter. University of Wisconsin-Madison. pp. 34–35. Archived (PDF) from the original on 2009-02-26. Retrieved 2008-12-22.\n^ Wyche, S.; Nelson, D. R.; Riganti, A. (2004). "4350–3130 Ma detrital zircons in the Southern Cross Granite–Greenstone Terrane, Western Australia: implications for the early evolution of the Yilgarn Craton". 
Australian Journal of Earth Sciences. 51 (1): 31–45. Bibcode:2004AuJES..51...31W. doi:10.1046/j.1400-0952.2003.01042.x.\n^ Amelin, Yuri; Kaltenbach, Angela; Iizuka, Tsuyoshi; Stirling, Claudine H.; Ireland, Trevor R.; Petaev, Michail; Jacobsen, Stein B. (2010-12-01). "U–Pb chronology of the Solar System\'s oldest solids with variable 238U/235U". Earth and Planetary Science Letters. 300 (3): 343–350. doi:10.1016/j.epsl.2010.10.015. hdl:1885/21305. ISSN 0012-821X.\n^ Connelly, James N.; Bizzarro, Martin; Krot, Alexander N.; Nordlund, Åke; Wielandt, Daniel; Ivanova, Marina A. (2012-11-02). "The Absolute Chronology and Thermal Processing of Solids in the Solar Protoplanetary Disk". Science. 338 (6107): 651–655. doi:10.1126/science.1226919.\n^ Sossi, Paolo A.; Stotz, Ingo L.; Jacobson, Seth A.; Morbidelli, Alessandro; O’Neill, Hugh St C. (2022-07-07). "Stochastic accretion of the Earth". Nature Astronomy. 6 (8): 951–960. doi:10.1038/s41550-022-01702-2. ISSN 2397-3366. PMC 7613298.\n^ Lyell, Charles, Sir (1866). Elements of Geology; or, The Ancient Changes of the Earth and its Inhabitants as Illustrated by Geological Monuments (Sixth ed.). New York: D. Appleton and company. Retrieved 2008-12-19.{{cite book}}: CS1 maint: multiple names: authors list (link)\n^ a b Stiebing, William H. (1994). Uncovering the Past. Oxford University Press US. ISBN 978-0-19-508921-9.\n^ a b Brookfield, Michael E. (2004). Principles of Stratigraphy. Blackwell Publishing. p. 116. ISBN 978-1-4051-1164-5.\n^ Fuller, J. G. C. M. (2007-07-17). "Smith\'s other debt, John Strachey, William Smith and the strata of England 1719–1801". Geoscientist. The Geological Society. Archived from the original on 24 November 2008. Retrieved 2008-12-19.\n^ Burchfield, Joe D. (1998). "The age of the Earth and the invention of geological time". Geological Society, London, Special Publications. 143 (1): 137–143. Bibcode:1998GSLSP.143..137B. CiteSeerX 10.1.1.557.2702. doi:10.1144/GSL.SP.1998.143.01.12. 
S2CID 129443412.\n^ BUFFON, GEORGES LOUIS LECLERC (2022). HISTOIRE NATURELLE, GA (C)NA (C)RALE ET PARTICULIARE, : introduction a l\'histoire... des mina (c)raux (classic reprint). [S.l.]: FORGOTTEN BOOKS. ISBN 978-0-265-92735-9. OCLC 1354275595.\n^ Merrill, Ronald T. (2010). Our Magnetic Earth: The Science of Geomagnetism. Chicago: University of Chicago Press. p. 86. ISBN 978-0-226-52053-7.\n^ Simms, D. L. (2004). "Newton\'s Contribution to the Science of Heat". Annals of Science. 61 (1): 33–77. doi:10.1080/00033790210123810. ISSN 0003-3790.\n^ a b England, P.; Molnar, P.; Righter, F. (January 2007). "John Perry\'s neglected critique of Kelvin\'s age for the Earth: A missed opportunity in geodynamics". GSA Today. 17 (1): 4–9. Bibcode:2007GSAT...17R...4E. doi:10.1130/GSAT01701A.1.\n^ Dalrymple (1994) pp. 14–17, 38\n^ Burchfield, Joe D. (1990-05-15). Lord Kelvin and the Age of the Earth. University of Chicago Press. pp. 69 ff. ISBN 9780226080437. Archived from the original on 2018-02-14.\n^ Stacey, Frank D. (2000). "Kelvin\'s age of the Earth paradox revisited". Journal of Geophysical Research. 105 (B6): 13155–13158. Bibcode:2000JGR...10513155S. doi:10.1029/2000JB900028.\n^ Origin of Species, Charles Darwin, 1872 edition, page 286\n^ Borenstein, Seth (November 13, 2013). "Oldest fossil found: Meet your microbial mom". Excite. Yonkers, NY: Mindspark Interactive Network. Associated Press. Archived from the original on June 29, 2015. Retrieved 2015-03-02.)\n^ a b c Dalrymple (1994) pp. 14–17\n^ Paul J. Nahin (1985) Oliver Heaviside, Fractional Operators, and the Age of the Earth, IEEE Transactions on Education E-28(2): 94–104, link from IEEE Explore\n^ Dalrymple (1994) pp. 14, 43\n^ a b c Nichols, Gary (2009). "21.2 Radiometric Dating". Sedimentology and Stratigraphy. John Wiley & Sons. pp. 325–327. ISBN 978-1405193795.\n^ Henri Becquerel (1896). "Sur les radiations émises par phosphorescence". Comptes Rendus. 
122: 420–421.\n^ Comptes Rendus 122: 420 (1896), translated by Carmen Giunta. Accessed 12 April 2021.\n^ Henri Becquerel (1896). "Sur les radiations invisibles émises par les corps phosphorescents". Comptes Rendus. 122: 501–503.\n^ Comptes Rendus 122: 501–503 (1896), translated by Carmen Giunta. Accessed 12 April 2021.\n^ Curie, Pierre; Curie, Marie & Bémont, Gustave (1898). "Sur une nouvelle substance fortement radio-active, contenue dans la pechblende (On a new, strongly radioactive substance contained in pitchblende)". Comptes Rendus. 127: 1215–1217. Archived from the original on 6 August 2009. Retrieved 12 April 2021.\n^ Curie, Pierre; Laborde, Albert (1903). "Sur la chaleur dégagée spontanément par les sels de radium". Comptes Rendus. 136: 673–675.\n^ Joly, John (1909). Radioactivity and Geology: An Account of the Influence of Radioactive Energy on Terrestrial History (1st ed.). London, UK: Archibald Constable & Co., ltd. p. 36. Reprinted by BookSurge Publishing (2004) ISBN 1-4021-3577-7.\n^ Rutherford, E. (1906). Radioactive Transformations. London: Charles Scribner\'s Sons. Reprinted by Juniper Grove (2007) ISBN 978-1-60355-054-3.\n^ Eve, Arthur Stewart (1939). Rutherford: Being the life and letters of the Rt. Hon. Lord Rutherford, O. M.. Cambridge: Cambridge University Press.\n^ Dalrymple (1994) p. 74\n^ The Age of the Earth Debate Badash, L Scientific American 1989 esp p95 Archived 2016-11-05 at the Wayback Machine\n^ Dalrymple (1994) pp. 77–78\n^ Patterson, Claire (1956). "Age of meteorites and the earth" (PDF). Geochimica et Cosmochimica Acta. 10 (4): 230–237. Bibcode:1956GeCoA..10..230P. doi:10.1016/0016-7037(56)90036-9. Archived (PDF) from the original on 2010-06-21. Retrieved 2009-07-07.\n^ Carlson, R. W.; Tera, F. (December 1–3, 1998). "Lead–Lead Constraints on the Timescale of Early Planetary Differentiation" (PDF). Conference Proceedings, Origin of the Earth and Moon. Houston, Texas: Lunar and Planetary Institute. p. 6. 
Archived (PDF) from the original on 16 December 2008. Retrieved 2008-12-22.\n^ Dalrymple (1994) pp. 310–341\n^ Dalrymple, Brent G. (2004). Ancient Earth, Ancient Skies: The Age of the Earth and Its Cosmic Surroundings. Stanford University Press. pp. 147, 169. ISBN 978-0-8047-4933-6.\n^ Terada, K.; Sano, Y. (May 20–24, 2001). "In-situ ion microprobe U-Pb dating of phosphates in H-chondrites" (PDF). Proceedings, Eleventh Annual V. M. Goldschmidt Conference. Hot Springs, Virginia: Lunar and Planetary Institute. Bibcode:2001eag..conf.3306T. Archived (PDF) from the original on 16 December 2008. Retrieved 2008-12-22.\n\nBibliography\n\nDalrymple, G. Brent (1994-02-01). The Age of the Earth. Stanford University Press. ISBN 978-0-8047-2331-2.\n\nFurther reading\n\nBaadsgaard, H.; Lerbekmo, J.F.; Wijbrans, J.R., 1993. Multimethod radiometric age for a bentonite near the top of the Baculites reesidei Zone of southwestern Saskatchewan (Campanian-Maastrichtian stage boundary?). Canadian Journal of Earth Sciences, v.30, p. 769–775.\nBaadsgaard, H. and Lerbekmo, J.F., 1988. A radiometric age for the Cretaceous-Tertiary boundary based on K-Ar, Rb-Sr, and U-Pb ages of bentonites from Alberta, Saskatchewan, and Montana. Canadian Journal of Earth Sciences, v.25, p. 1088–1097.\nEberth, D.A. and Braman, D., 1990. Stratigraphy, sedimentology, and vertebrate paleontology of the Judith River Formation (Campanian) near Muddy Lake, west-central Saskatchewan. Bulletin of Canadian Petroleum Geology, v.38, no.4, p. 387–406.\nGoodwin, M.B. and Deino, A.L., 1989. The first radiometric ages from the Judith River Formation (Upper Cretaceous), Hill County, Montana. Canadian Journal of Earth Sciences, v.26, p. 1384–1391.\nGradstein, F. M.; Agterberg, F.P.; Ogg, J.G.; Hardenbol, J.; van Veen, P.; Thierry, J. and Zehui Huang., 1995. A Triassic, Jurassic and Cretaceous time scale. IN: Bergren, W. A.; Kent, D.V.; Aubry, M-P. and Hardenbol, J. 
(eds.), Geochronology, Time Scales, and Global Stratigraphic Correlation. Society of Economic Paleontologists and Mineralogists, Special Publication No. 54, p. 95–126.\nHarland, W.B., Cox, A.V.; Llewellyn, P.G.; Pickton, C.A.G.; Smith, A.G.; and Walters, R., 1982. A Geologic Time Scale: 1982 edition. Cambridge University Press: Cambridge, 131p.\nHarland, W.B.; Armstrong, R.L.; Cox, A.V.; Craig, L.E.; Smith, A.G.; Smith, D.G., 1990. A Geologic Time Scale, 1989 edition. Cambridge University Press: Cambridge, p. 1–263. ISBN 0-521-38765-5\nHarper, C.W. Jr (1980). "Relative age inference in paleontology". Lethaia. 13 (3): 239–248. Bibcode:1980Letha..13..239H. doi:10.1111/j.1502-3931.1980.tb00638.x.\nObradovich, J.D., 1993. A Cretaceous time scale. IN: Caldwell, W.G.E. and Kauffman, E.G. (eds.). Evolution of the Western Interior Basin. Geological Association of Canada, Special Paper 39, p. 379–396.\nPalmer, Allison R (1983). "The Decade of North American Geology 1983 Geologic Time Scale". Geology. 11 (9): 503–504. Bibcode:1983Geo....11..503P. 
doi:10.1130/0091-7613(1983)11<503:tdonag>2.0.co;2.\nPowell, James Lawrence, 2001, Mysteries of Terra Firma: the Age and Evolution of the Earth, Simon & Schuster, ISBN 0-684-87282-X\n\nExternal links\n\nThe Age of the Earth by Chris Stassen (TalkOrigins.org)\nUSGS preface on the Age of the Earth\nNASA exposition on the age of Martian meteorites\nAgeing the Earth on In Our Time at the BBC\nPre-1900 Non-Religious Estimates of the Age of the Earth\n\n|  | |\n --- |\n|  Outline  History | |\n| Atmosphere |  Atmosphere of Earth  Prebiotic atmosphere  Troposphere  Stratosphere  Mesosphere  Thermosphere  Exosphere  Weather |\n| Climate |  Climate system  Energy balance  Climate change  Climate variability and change  Climatology  Paleoclimatology |\n| Continents |  Africa  Antarctica  Asia  Australia  Europe  North America  South America |\n| Culture and society |  List of sovereign states   + dependent territories  In culture  Earth Day  Flag  Symbol  World economy  Etymology  World history  Time zones  World |\n| Environment |  Biome  Biosphere  Biogeochemical cycles  Ecology  Ecosystem  Human impact on the environment  Evolutionary history of life  Nature |\n| Geodesy |  Cartography   + Computer cartography  Earth\'s orbit  Geodetic astronomy  Geomatics  Gravity  Navigation  Remote Sensing  Geopositioning  Virtual globe |\n| Geophysics |  Earth structure  Fluid dynamics  Geomagnetism  Magnetosphere  Mineral physics  Seismology  Plate tectonics  Signal processing  Tomography |\n| Geology |  Age of Earth  Earth science  Extremes on Earth  Future  Geological history   + Geologic time scale  Geologic record  History of Earth |\n| Oceans |  Antarctic/Southern Ocean  Arctic Ocean  Atlantic Ocean  Indian Ocean  Pacific Ocean  Oceanography |\n| Planetary science |  The Moon  Evolution of the Solar System  Geology of solar terrestrial planets  Location in the Universe  Solar System |\n|  | |\n| Authority control databases | |\n --- |\n| National |  United States  Israel |\n| 
Other |  Yale LUX |\nRetrieved from "\nCategories:\n\nGeochronology\nHistory of Earth science\nGeology theories\n\nHidden categories:\n\nCS1 maint: multiple names: authors list\nWebarchive template wayback links\nArticles with short description\nShort description is different from Wikidata\nWikipedia pages semi-protected against vandalism\nAll articles with unsourced statements\nArticles with unsourced statements from February 2023\nArticles with unsourced statements from March 2015',
+            "images": [],
+        },
+        {
+            "url": "https://www.planetary.org/articles/how-old-is-the-earth",
+            "raw_content": "Skip to main content\nCommunity Account Renew Search\nJoin\n\nBecome A Member\nRenew\nGift Membership\nKids Membership\nOther Ways to Give\n\nDonate\nJoin\nDonate\nBack To Main Menu\n\nWhat We Do\n\nExplore Worlds\n\nFind Life\nDefend Earth\n\nHow We Work\n\nEducation & Public Outreach\n\nSpace Policy & Advocacy\nScience & Technology\nGlobal Collaboration\n\nOur Results\n\nOur Impact\nLearn how our members and community are changing the worlds.\n  + LightSail\nOur citizen-funded spacecraft successfully demonstrated solar sailing for CubeSats.\n\nBack To Main Menu\n\nSpace Topics\n\nPlanets & Other Worlds\n\nSpace Missions\nNight Sky\nSpace Policy\nFor Kids\n\nLearn\n\nArticles\n\nPlanetary Radio\nSpace Images\nVideos\nCourses\n\nThe Planetary Report\n\n#### Solar Maximum\nOur dynamic star's reach throughout the Solar System.\nBack To Main Menu\n\nGet Involved\n\nBecome A Member\nMembership programs for explorers of all ages.\n  + Email Signup\nGet updates and weekly tools to learn, share, and advocate for space exploration.\n  + Action Center\nVolunteer as a space advocate.\n ### Support Our Mission\n\nRenew Membership\n\nSociety Projects\nTravel\nOther Ways to Give\nStore\n\nThe Planetary Fund\n\nAccelerate progress in our three core enterprises — Explore Worlds, Find Life, and Defend Earth. 
You can support the entire fund, or designate a core enterprise of your choice.\nGive Today\nBack To Main Menu\n\nAbout Us\n\nOverview\n\nStrategic Framework\nNews & Press\nCareers\nContact Us\nOur Story\n\nThe Planetary Society\n\n#### Our Vision\nKnow the Cosmos and our place within it.\n#### Our Mission\nEmpowering the world's citizens to advance space science and exploration.\nBack To Main Menu\n\nMembership\n\nBecome A Member\n\nRenew Membership\nGift Membership\nKids Membership\nOther Ways to Give\n\nContact Us\n\nOur Work\n\nExplore Space\nTake Action\nAbout\nMembership\nMember Community\nAccount Center\n\nSearch\n\n“Exploration is in our nature.” - Carl Sagan\n\nHow old is the Earth?\nWritten by\nKate Howells\nPublic Education Specialist, The Planetary Society \nNovember 14, 2023\nThe Earth is thought to be about 4.54 billion years old. Along with other planets, the Earth was born in the early days of the Solar System, which first started forming about 4.6 billion years ago.\nHow did the Earth form?\nThe Solar System formed about 4.6 billion years ago from material in a massive, rotating cloud of gas and dust called the solar nebula. Gravity caused this cloud to collapse in on itself, spin, and flatten into a disk shape. Most of the material in that cloud was pulled toward the center, forming the protostar that would eventually become our Sun. The rest of the material began to come together into clumps called planetesimals. These in turn gradually came together with other planetesimals, forming larger bodies called protoplanets. Earth started as one of these protoplanets, likely about 4.5 billion years ago.\nThe Earth’s history\nAs the proto-Earth grew, heavier elements within it began to sink toward the center, forming the core, and lighter elements rose to the surface. 
This process, called differentiation, likely took place over tens of millions of years.\nDuring these early stages a Mars-sized protoplanet, often referred to as Theia, collided with the young Earth, ejecting material from both protoplanets into space. Some of this material fell back to Earth, but some of the material eventually coalesced in orbit around Earth to form the Moon.\nThe Earth continued to experience impacts throughout its early life, though none as dramatic as the collision with Theia. During a period called the Late Heavy Bombardment, which likely happened between 4.1 and 3.8 billion years ago, there was an increased rate of asteroid and comet impacts in the inner Solar System. The Late Heavy Bombardment had major geological consequences, including causing Earth’s crust to melt and differentiate and shaping the early atmosphere and oceans. Although geological activity has erased the craters from this time on Earth, they are preserved on the Moon. These are some of the craters you can see from Earth.\nBy about 4.3 billion years ago, the Earth's surface had cooled enough for water vapor in the atmosphere to condense on the surface, leading to the formation of oceans. Volcanic activity, which was more widespread at the time, released gasses that shaped the early atmosphere. Life emerged around 3.5 to 4 billion years ago in the form of simple, single-celled organisms.\nThe Earth has probably been as we know it today — with recognizable continents, oceans, a hospitable climate, and diverse life — for the past few hundred million years. 
But it continues to evolve through its own gradual tectonic and volcanic activity, and through the more rapid effects of climate change.\nHow do scientists determine the age of the Earth?\nScientists have been able to piece together our planet’s timeline\nthanks to techniques including radiometric dating of rocks and minerals,\nexamining layers of sedimentary rock, and studying the Earth's magnetic\nfield.\nThe most precise method is radiometric dating,\nwhich measures the decay of radioactive isotopes in rocks. Because\ngeologists know how long these isotopes take to decay, they can\ndetermine a rock’s age by looking at the ratio of parent (pre-decay) and\ndaughter (post-decay) isotopes in a sample.\nOne challenge with dating the Earth via rocks is that most of the\noriginal rocks that formed on our planet at the earliest stages of its\ncreation have likely been recycled into the mantle since then. Because\nof this, geologists also learn about the history of the Solar System by\nstudying rocks from beyond Earth, including meteorites that were formed\nbillions of years before falling to Earth, meteorites of Earth material\nthat have been found on the Moon,\nand asteroids that have coasted through space undisturbed for billions\nof years without undergoing any major composition-altering change. The\nasteroid Bennu,\nfor example, is thought to have formed in the first 10 million years of\nthe Solar System’s history. By studying the samples returned to Earth\nby the OSIRIS-REx mission, scientists can learn a lot about the early Solar System.\nEarth's First Line of Defense\nSupport the team of astronomers defending Earth with a gift today.\nDonate",
+            "images": [],
+        },
+        {
+            "url": "https://answersingenesis.org/age-of-the-earth/how-old-earth/?srsltid=AfmBOoqSX0LqvRa1nZM5V8YjVoWspP8t9WHAhFQRrQUEVoHW8DukYZf4",
+            "raw_content": "Published Time: Sept. 1, 2018, 6 a.m.\nHow Old Is the Earth? | Answers in Genesis \n\nInternet Explorer is no longer supported. Try downloading another browser like Chrome or Firefox.\n\nCart\nAccount\nUnited States / English\n\nIf you already have an account, Sign in.\nView Cart\n×\nUnited States / English\n\nAnswers\nStore\nEvents\nVideos\nKids\nEducation\nDonate\n\nSubscribe\n\nAnswers in Genesis\nAnswers\nScience\nGeology\nAge of the Earth\nHow Old Is the Earth?\n\nHow Old Is the Earth?\nIs the earth 4.54 billion years old?\nby Dr. Danny R. Faulkner on September 1, 2018; last featured November 26, 2023\nFeatured in Answers Magazine\nAudio Version\nShare\n\nWatch the video on YouTube.\nIf you ask this question of most scientifically literate people, they will answer that the earth is about 4.54 billion years old. But if you ask biblically literate people, many will answer that the earth is little more than 6,000 years old. Why the huge difference? We look at the same world but come to different conclusions because our worldviews are different.\n Latest Answers -------------- Stay up to date each week with top articles, blogs, news, videos, and more. Sign Up Now\nTo fully understand the issue, we must look beyond this earth. Literally. Let me explain.\nThe Biblical Date\nHow do we arrive at the biblical date? The genealogies of Genesis 5 and 11 make it clear that Abraham lived about 2,000 years after creation. And we know from chronologies found elsewhere in the Bible that Abraham lived about 2,000 years before the birth of Jesus Christ. Furthermore, we know that Jesus’ ministry was about 2,000 years ago. Summing these lengths of time, we get about 6,000 years (technically just a little more).\nWhat Most Scientists Think\nHow do many scientists arrive at the age of 4.54 billion years? They rely on radiometric dating, though the story is a bit more complicated than it sounds. Some rocks contain trace amounts of radioactive atoms. 
Those radioactive atoms decay into stable atoms over time. By knowing the decay rate and measuring the amount of both kinds of atoms in a rock, scientists can compute the amount of time it took to produce the stable atoms.\nSome assumptions are involved, however. Were some of the stable atoms present in the rock to begin with? Did some of either type of atom leave or enter the rock during the time being measured for decay? To make matters worse, measuring the age of a rock by different kinds of radioactive atoms (such as uranium or rubidium) often yields very different ages. There are many examples of such discordant ages.\nBut even if we accept these ages as correct, there are many other assumptions that cause even more problems. You see, we never find rocks on earth that date back 4.54 billion years. The earth is a very dynamic place, with volcanic eruptions and tectonic plate movements that constantly recycle old rocks into new rocks. When rocks are recycled this way, it is believed that their radiometric dates are reset.\nSo we wouldn’t expect to find the original “primordial” rocks on earth. Instead, scientists must look to other bodies in the solar system that are less active geologically. The search for primordial rocks was one of the scientific reasons we sent men to the moon a half-century ago. Scientists thought that since the moon has far less geological activity than the earth, its rocks would be older.\nIndeed, the moon’s rocks generally yield old radiometric dates, but even they don’t yield dates of 4.54 billion years. Why?\nWhile the moon is far less active than the earth, that hasn’t always been the case. Most scientists think that the moon was very active early in its history. So while moon rocks have relatively old radiometric dates, they aren’t primordial either. To find truly primordial rocks, planetary scientists think they must look at meteorites, debris that has fallen onto the earth’s surface from somewhere else in the solar system. 
The 4.54-billion-year age of the earth comes from radiometric dating of meteorites.\nHow can they know these are the earliest rocks? They have a theory that the whole solar system formed at the same time, around 4.54 billion years ago. This means the sun and planets would be about the same age. Material that didn’t become part of the sun supposedly coalesced into larger and larger pieces in outer space, eventually forming planets and their satellites, or moons. But many of the pieces never formed into planets or satellites. Fragments of these pieces are thought to be the origin of meteorites. Since meteorites didn’t form into planets, they must have avoided the geological process that reset radiometric ages on earth. This is particularly true of the carbonaceous chondrites.\nBut note all the unproven assumptions. Evolutionary assumptions at that.\nThe Real Agenda\nFor decades, scientists who believe the earth is billions of years old have said that radiometric dates are their reason for believing so. But this hasn’t always been the case. The methods for radiometric dating were developed only a hundred years ago. Prior to that, many scientists already believed the earth was billions of years old, not based upon radiometric dates but the assumption that modern life evolved from nonlife. Evolutionists recognize that we can’t see planets and life evolving before our eyes. They say it requires great time; so the earth must be very old.\nThere is a good lesson here. In the late 1800s, many scientists concluded that the earth must be at least 100 million years old because that was considered the minimum time necessary for evolution to account for the earth’s biology and geology. The need for time drives the claims of ancient dates.\nLord Kelvin, one of the most significant scientists of the 1800s, tested the then-popular age of 100 million years and produced two quantitative tests that showed the earth and sun could be no more than about one-third of this age. 
Yet his evolutionary colleagues persisted in their belief despite Lord Kelvin’s objections. Since then, many critics have noted that his objections have been explained to their satisfaction. But that misses the point. Many of Kelvin’s colleagues believed in great age despite the evidence, not because of it.\nToday many scientists continue to believe in a 4.54-billion-year-old earth, which evolution requires. They will continue to choose to believe that age, even though solid scientific reasons are available to doubt those dates.\nOur Job\nIt is the job of creation scientists to reevaluate scientific claims using their biblical worldview. Scientists have found many evidences that the earth is far younger than 4.54 billion years—even as young as 6,000 years—but these are usually swept under the rug.\n\nScientists have found many evidences that the earth is far younger than 4.54 billion years, but these are usually swept under the rug.\n\nCreationist literature (including this magazine) is filled with examples. They include the composition of the earth’s atmosphere and seawater, which would be much different if helium had been escaping the atmosphere and salt had been accumulating in the ocean for millions of years. Also, the moon’s tidal interaction with the earth is causing the moon to spiral outward, which limits how long it has been in orbit. (Just go online and search for “evidences of a young earth” for details and more examples.)\nMost importantly, we need to point people to the importance of starting in the right place—God’s Word—when interpreting the evidence.\nDr. Danny R. Faulkner joined the staff of Answers in Genesis after more than 26 years as professor of physics and astronomy at the University of South Carolina Lancaster. 
He has written numerous articles in astronomical journals, and he is the author of Universe by Design.\nRelated Videos\nWhy Shouldn’t Christians Accept Millions of Years?\n\nAnswers Magazine\nSeptember–October 2018\n\nEven as skepticism spreads around the globe, the creation movement is flourishing. Meet some of the new generation of creation scientists.\nBrowse IssueSubscribe\nRecommended Resources\n\nUniverse by Design$18.99 \nThe Heavens Declare Set$39.99 Sale \n\nAge of the Earth$12.99 \n\nScience\n\nWhat Is Science?\nAstronomy\nBiology\nChemistry\nEnvironmental Science\nFossils\nGenetics\nGeology\nHuman Body\nMathematics\nPhysics\n\nNewsletter\nGet the latest answers emailed to you.\nBy submitting this form, you accept our Privacy Policy and will be given an opportunity to receive emails from Answers in Genesis regarding our latest news, resources, and events.\nThank You!\nThank you for signing up to receive email newsletters from Answers in Genesis.\nYou can also sign up for our free print newsletter (US only).\nFinish your subscription\nYou're almost done! Please follow the instructions we emailed you in order to finish subscribing.\nYou can also sign up for our free print newsletter (US only).\nWhoops!\nYour newsletter signup did not work out. Please refresh the page and try again.\nSupport the creation/gospel message by donating or getting involved! \n\nAnswers in Genesis is an apologetics ministry, dedicated to helping Christians defend their faith and proclaim the good news of Jesus Christ.\nLearn more\n\nCustomer Service 800.778.3390\nAvailable Monday–Friday | 9 AM–5 PM ET\n© 2025 Answers in Genesis",
+            "images": [],
+        },
+    ],
+    "failed_results": [],
+    "response_time": 5.16,
+    "request_id": "81c3ce85-3014-4a81-b342-fd9f2a9fba32",
+}
diff --git a/tests/methods/test_method_web.py b/tests/methods/test_method_web.py
index 9c0b7671..2d9305a2 100644
--- a/tests/methods/test_method_web.py
+++ b/tests/methods/test_method_web.py
@@ -1,11 +1,15 @@
 """Tests for method web.py"""
 
+import json
 import logging
 
 import pytest
 from unittest.mock import patch
 from modules.methods.method_web import MethodWeb
-from tests.fixtures.tavily_responses import RESPONSE_HOW_OLD_IS_EARTH_NO_ANSWER
+from tests.fixtures.tavily_responses import (
+    RESPONSE_SEARCH_HOW_OLD_IS_EARTH_NO_ANSWER,
+    RESPONSE_EXTRACT_HOW_OLD_IS_EARTH_NO_ANSWER,
+)
 
 logger = logging.getLogger(__name__)
 
@@ -15,6 +19,9 @@ logger = logging.getLogger(__name__)
 async def test_method_web_search_live():
     """Tests method web search with live API calls."""
 
+    logger.info("=" * 50)
+    logger.info("==> Test: Method Web Search Live")
+
     method_web = MethodWeb(serviceCenter=None)
 
     # Actual request
@@ -26,29 +33,30 @@ async def test_method_web_search_live():
     assert action_result.success
     assert len(action_result.documents) > 0
 
-    logger.info("=" * 20)
     logger.info(f"Action result success status: {action_result.success}")
     logger.info(f"Action result error: {action_result.error}")
     logger.info(f"Action result label: {action_result.resultLabel}")
 
     logger.info("Documents:")
     for doc in action_result.documents:
-        logger.info("-" * 10)
         logger.info(f" - Document Name: {doc.documentName}")
-        logger.info(f" - Document Mime Type: {doc.mimeType}")
-        logger.info(f" - Document Data: {doc.documentData}")
+        logger.info(f" --> Document Mime Type: {doc.mimeType}")
+        logger.info(f" --> Document Data: {doc.documentData}")
 
 
 @pytest.mark.asyncio
 async def test_method_web_search_dummy():
     """Tests method web search with dummy response data - no external API calls."""
 
+    logger.info("=" * 50)
+    logger.info("==> Test: Method Web Search Dummy")
+
     method_web = MethodWeb(serviceCenter=None)
 
     # Mock the Tavily API response
     with patch(
         "tavily.AsyncTavilyClient.search",
-        return_value=RESPONSE_HOW_OLD_IS_EARTH_NO_ANSWER,
+        return_value=RESPONSE_SEARCH_HOW_OLD_IS_EARTH_NO_ANSWER,
     ) as mock_client:
         action_result = await method_web.search(
             {"query": "How old is the earth", "maxResults": 5}
@@ -59,14 +67,182 @@ async def test_method_web_search_dummy():
     assert action_result.success
     assert len(action_result.documents) > 0
 
-    logger.info("=" * 20)
     logger.info(f"Action result success status: {action_result.success}")
     logger.info(f"Action result error: {action_result.error}")
     logger.info(f"Action result label: {action_result.resultLabel}")
 
     logger.info("Documents:")
     for doc in action_result.documents:
-        logger.info("-" * 10)
         logger.info(f" - Document Name: {doc.documentName}")
-        logger.info(f" - Document Mime Type: {doc.mimeType}")
-        logger.info(f" - Document Data: {doc.documentData}")
+        logger.info(f" --> Document Mime Type: {doc.mimeType}")
+        logger.info(f" --> Document Data: {doc.documentData}")
+
+
+@pytest.mark.asyncio
+@pytest.mark.expensive
+async def test_method_web_crawl_live():
+    """Tests method web crawl with live API calls (only the service is mocked)."""
+
+    logger.info("=" * 50)
+    logger.info("==> Test: Method Web Crawl Live")
+
+    method_web = MethodWeb(serviceCenter=None)
+
+    # Fake search-result document; served below as the mocked getFileData payload
+    search_results_json = {
+        "documentData": {
+            "results": [
+                {"url": "https://en.wikipedia.org/wiki/Age_of_Earth"},
+                {"url": "https://www.planetary.org/articles/how-old-is-the-earth"},
+            ]
+        }
+    }
+
+    # Swap method_web.service for a mock: one doc stub (fileId only) + JSON bytes
+    with patch.object(method_web, "service") as mock_service:
+        mock_service.getChatDocumentsFromDocumentList.return_value = [
+            type("MockDoc", (), {"fileId": "test-file-id"})()
+        ]
+        mock_service.getFileData.return_value = json.dumps(search_results_json).encode(
+            "utf-8"
+        )
+
+        # Actual request, issued inside the patch so crawl() sees the mocked service
+        action_result = await method_web.crawl({"document": "test-document-ref"})
+
+    # Evaluate results: the action must succeed and return at least one document
+    assert action_result.success
+    assert len(action_result.documents) > 0
+
+    logger.info(f"Action result success status: {action_result.success}")
+    logger.info(f"Action result error: {action_result.error}")
+    logger.info(f"Action result label: {action_result.resultLabel}")
+
+    logger.info("Documents:")
+    for doc in action_result.documents:
+        logger.info(f" - Document Name: {doc.documentName}")
+        logger.info(f" --> Document Mime Type: {doc.mimeType}")
+        logger.info(f" --> Document Data: {doc.documentData}")
+
+
+@pytest.mark.asyncio
+async def test_method_web_crawl_dummy():
+    """Tests method web crawl with a canned extract response - no external API calls."""
+
+    logger.info("=" * 50)
+    logger.info("==> Test: Method Web Crawl Dummy")
+
+    method_web = MethodWeb(serviceCenter=None)
+
+    # Fake search-result document; served below as the mocked getFileData payload
+    search_results_json = {
+        "documentData": {
+            "results": [
+                {"url": "https://en.wikipedia.org/wiki/Age_of_Earth"},
+                {"url": "https://www.planetary.org/articles/how-old-is-the-earth"},
+            ]
+        }
+    }
+
+    # Mock the service and Tavily's extract call, which returns the canned fixture
+    with (
+        patch.object(method_web, "service") as mock_service,
+        patch(
+            "tavily.AsyncTavilyClient.extract",
+            return_value=RESPONSE_EXTRACT_HOW_OLD_IS_EARTH_NO_ANSWER,
+        ) as mock_client,
+    ):
+        mock_service.getChatDocumentsFromDocumentList.return_value = [
+            type("MockDoc", (), {"fileId": "test-file-id"})()
+        ]
+        mock_service.getFileData.return_value = json.dumps(search_results_json).encode(
+            "utf-8"
+        )
+
+        action_result = await method_web.crawl({"document": "test-document-ref"})
+        mock_client.assert_called_once()  # extract must be invoked exactly once
+
+    # Evaluate results: the action must succeed and return at least one document
+    assert action_result.success
+    assert len(action_result.documents) > 0
+
+    logger.info(f"Action result success status: {action_result.success}")
+    logger.info(f"Action result error: {action_result.error}")
+    logger.info(f"Action result label: {action_result.resultLabel}")
+
+    logger.info("Documents:")
+    for doc in action_result.documents:
+        logger.info(f" - Document Name: {doc.documentName}")
+        logger.info(f" --> Document Mime Type: {doc.mimeType}")
+        logger.info(f" --> Document Data: {doc.documentData}")
+
+
+@pytest.mark.asyncio
+@pytest.mark.expensive
+async def test_method_web_scrape_live():
+    """Tests method web scrape with live API calls; nothing is mocked here."""
+
+    logger.info("=" * 50)
+    logger.info("==> Test: Method Web Scrape Live")
+
+    method_web = MethodWeb(serviceCenter=None)
+
+    # Actual request: scrape() takes the query and result cap in a single dict
+    action_result = await method_web.scrape(
+        {"query": "How old is the earth", "maxResults": 3}
+    )
+
+    # Evaluate results: the action must succeed and return at least one document
+    assert action_result.success
+    assert len(action_result.documents) > 0
+
+    logger.info(f"Action result success status: {action_result.success}")
+    logger.info(f"Action result error: {action_result.error}")
+    logger.info(f"Action result label: {action_result.resultLabel}")
+
+    logger.info("Documents:")
+    for doc in action_result.documents:
+        logger.info(f" - Document Name: {doc.documentName}")
+        logger.info(f" --> Document Mime Type: {doc.mimeType}")
+        logger.info(f" --> Document Data: {doc.documentData}")
+
+
+@pytest.mark.asyncio
+async def test_method_web_scrape_dummy():
+    """Tests method web scrape with canned search + extract data - no external API calls."""
+
+    logger.info("=" * 50)
+    logger.info("==> Test: Method Web Scrape Dummy")
+
+    method_web = MethodWeb(serviceCenter=None)
+
+    # Mock both Tavily client calls (search + extract) with the canned fixtures
+    with (
+        patch(
+            "tavily.AsyncTavilyClient.search",
+            return_value=RESPONSE_SEARCH_HOW_OLD_IS_EARTH_NO_ANSWER,
+        ) as mock_search,
+        patch(
+            "tavily.AsyncTavilyClient.extract",
+            return_value=RESPONSE_EXTRACT_HOW_OLD_IS_EARTH_NO_ANSWER,
+        ) as mock_extract,
+    ):
+        action_result = await method_web.scrape(
+            {"query": "How old is the earth", "maxResults": 3}
+        )
+        mock_search.assert_called_once()  # exactly one search call expected
+        mock_extract.assert_called_once()  # exactly one extract call expected
+
+    # Evaluate results: the action must succeed and return at least one document
+    assert action_result.success
+    assert len(action_result.documents) > 0
+
+    logger.info(f"Action result success status: {action_result.success}")
+    logger.info(f"Action result error: {action_result.error}")
+    logger.info(f"Action result label: {action_result.resultLabel}")
+
+    logger.info("Documents:")
+    for doc in action_result.documents:
+        logger.info(f" - Document Name: {doc.documentName}")
+        logger.info(f" --> Document Mime Type: {doc.mimeType}")
+        logger.info(f" --> Document Data: {doc.documentData}")

From 017b7f1ca04d5be5397a9479eebd266d0b151741 Mon Sep 17 00:00:00 2001
From: Christopher Gondek <gondek.christopher@gmail.com>
Date: Mon, 1 Sep 2025 16:06:29 +0200
Subject: [PATCH 10/17] chore: type checking; input validation for web
 interface

---
 modules/interfaces/interface_web_model.py   | 24 ++++++++++-----------
 modules/interfaces/interface_web_objects.py | 12 +++++++++--
 2 files changed, 22 insertions(+), 14 deletions(-)

diff --git a/modules/interfaces/interface_web_model.py b/modules/interfaces/interface_web_model.py
index 86f19e08..bb4a82e0 100644
--- a/modules/interfaces/interface_web_model.py
+++ b/modules/interfaces/interface_web_model.py
@@ -2,7 +2,7 @@
 
 from abc import ABC, abstractmethod
 from modules.interfaces.interfaceChatModel import ActionDocument, ActionResult
-from pydantic import BaseModel, Field
+from pydantic import BaseModel, Field, HttpUrl
 from typing import List
 
 
@@ -12,21 +12,21 @@ from typing import List
 
 
 class WebSearchRequest(BaseModel):
-    query: str
-    max_results: int
+    query: str = Field(min_length=1, max_length=400)
+    max_results: int = Field(ge=1, le=20)
 
 
 class WebSearchResultItem(BaseModel):
     """Individual search result"""
 
     title: str
-    url: str
+    url: HttpUrl
 
 
 class WebSearchDocumentData(BaseModel):
     """Complete search results document"""
 
-    query: str
+    query: str = Field(min_length=1, max_length=400)
     results: List[WebSearchResultItem]
     total_count: int
 
@@ -50,20 +50,20 @@ class WebSearchBase(ABC):
 
 
 class WebCrawlRequest(BaseModel):
-    urls: List[str]
+    urls: List[HttpUrl]
 
 
 class WebCrawlResultItem(BaseModel):
     """Individual crawl result"""
 
-    url: str
+    url: HttpUrl
     content: str
 
 
 class WebCrawlDocumentData(BaseModel):
     """Complete crawl results document"""
 
-    urls: List[str]
+    urls: List[HttpUrl]
     results: List[WebCrawlResultItem]
     total_count: int
 
@@ -89,21 +89,21 @@ class WebCrawlBase(ABC):
 
 
 class WebScrapeRequest(BaseModel):
-    query: str
-    max_results: int
+    query: str = Field(min_length=1, max_length=400)
+    max_results: int = Field(ge=1, le=20)
 
 
 class WebScrapeResultItem(BaseModel):
     """Individual scrape result"""
 
-    url: str
+    url: HttpUrl
     content: str
 
 
 class WebScrapeDocumentData(BaseModel):
     """Complete scrape results document"""
 
-    query: str
+    query: str = Field(min_length=1, max_length=400)
     results: List[WebScrapeResultItem]
     total_count: int
 
diff --git a/modules/interfaces/interface_web_objects.py b/modules/interfaces/interface_web_objects.py
index 0ea43bd7..f348f0bd 100644
--- a/modules/interfaces/interface_web_objects.py
+++ b/modules/interfaces/interface_web_objects.py
@@ -1,3 +1,4 @@
+from typing import Optional
 from modules.interfaces.interface_web_model import (
     WebCrawlActionResult,
     WebSearchActionResult,
@@ -11,9 +12,16 @@ from dataclasses import dataclass
 from modules.connectors.connector_tavily import ConnectorTavily
 
 
-@dataclass
+@dataclass(slots=True)
 class WebInterface:
-    connector_tavily: ConnectorTavily = None
+    connector_tavily: ConnectorTavily
+
+    def __post_init__(self) -> None:
+        if self.connector_tavily is None:
+            raise TypeError(
+                "connector_tavily must be provided. "
+                "Use `await WebInterface.create()` or pass a ConnectorTavily."
+            )
 
     @classmethod
     async def create(cls) -> "WebInterface":

From 91aff56e1c192b5770733943fbf69c18b7dd7ebe Mon Sep 17 00:00:00 2001
From: ValueOn AG <p.motsch@valueon.ch>
Date: Tue, 2 Sep 2025 11:47:39 +0200
Subject: [PATCH 11/17] messaging aligned

---
 modules/chat/handling/handlingTasks.py | 315 +++++--------------------
 modules/chat/handling/promptFactory.py |  10 +-
 modules/chat/serviceCenter.py          | 102 +++++++-
 modules/methods/methodDocument.py      |  24 +-
 modules/routes/routeWorkflows.py       |   9 -
 modules/workflow/managerWorkflow.py    |  10 +-
 notes/changelog.txt                    |   3 +-
 7 files changed, 177 insertions(+), 296 deletions(-)

diff --git a/modules/chat/handling/handlingTasks.py b/modules/chat/handling/handlingTasks.py
index 290fdf0a..6138932b 100644
--- a/modules/chat/handling/handlingTasks.py
+++ b/modules/chat/handling/handlingTasks.py
@@ -192,7 +192,8 @@ class HandlingTasks:
                 
             task_plan = TaskPlan(
                 overview=task_plan_dict.get('overview', ''),
-                tasks=tasks
+                tasks=tasks,
+                userMessage=task_plan_dict.get('userMessage', '')
             )
             
             # Set workflow totals for progress tracking
@@ -217,24 +218,19 @@ class HandlingTasks:
         """Create a chat message containing the task plan with user-friendly messages"""
         try:
             # Build task plan summary
-            task_summary = f"📋 **Task Plan Generated**\n\n"
-            task_summary += f"**Overview:** {task_plan.overview}\n\n"
-            task_summary += f"**Total Tasks:** {len(task_plan.tasks)}\n\n"
-            
-            # Add each task with its user message
-            for i, task in enumerate(task_plan.tasks):
-                task_summary += f"**Task {i+1}:** {task.objective}\n"
-                if task.userMessage:
-                    task_summary += f"  💬 {task.userMessage}\n"
-                if task.success_criteria:
-                    criteria_str = ', '.join(task.success_criteria)
-                    task_summary += f"  ✅ Success Criteria: {criteria_str}\n"
-                task_summary += "\n"
-            
+            task_summary = f"📋 **Task Plan**\n\n"
+
             # Get overall user message from task plan if available
             overall_message = task_plan.userMessage
             if overall_message:
-                task_summary += f"**Plan Summary:** {overall_message}\n\n"
+                task_summary += f"{overall_message}\n\n"
+
+            # Add each task with its user message
+            for i, task in enumerate(task_plan.tasks):
+                if task.userMessage:
+                    task_summary += f"💬 {task.userMessage}\n"
+                task_summary += "\n"
+        
             
             # Create workflow message
             message_data = {
@@ -269,76 +265,6 @@ class HandlingTasks:
         except Exception as e:
             logger.error(f"Error creating task plan message: {str(e)}")
 
-    async def createDocumentContextMessage(self, documents: List, workflow):
-        """Create a chat message with document context and workflow labeling"""
-        try:
-            # Get current workflow context and stats
-            workflow_context = self.service.getWorkflowContext()
-            workflow_stats = self.service.getWorkflowStats()
-            
-            # Create a simple document context message without AI dependency
-            message_text = f"📄 **Document Context**\n\n"
-            message_text += f"**Total Documents:** {len(documents)}\n\n"
-            
-            # Add workflow context information
-            current_round = workflow_context.get('currentRound', 0)
-            current_task = workflow_context.get('currentTask', 0)
-            total_tasks = workflow_stats.get('totalTasks', 0)
-            current_action = workflow_context.get('currentAction', 0)
-            total_actions = workflow_stats.get('totalActions', 0)
-            
-            message_text += f"**Workflow Context:**\n"
-            message_text += f"- Round: {current_round}\n"
-            if total_tasks > 0:
-                message_text += f"- Task: {current_task}/{total_tasks}\n"
-            else:
-                message_text += f"- Task: {current_task}\n"
-            if total_actions > 0:
-                message_text += f"- Action: {current_action}/{total_actions}\n"
-            else:
-                message_text += f"- Action: {current_action}\n"
-            message_text += f"- Status: {workflow_stats.get('workflowStatus', 'unknown')}\n\n"
-            
-            # Add document list
-            if documents:
-                message_text += "**Available Documents:**\n"
-                for i, doc in enumerate(documents[:5]):  # Show first 5 documents
-                    message_text += f"- {doc.fileName if hasattr(doc, 'fileName') else f'Document {i+1}'}\n"
-                if len(documents) > 5:
-                    message_text += f"- ... and {len(documents) - 5} more documents\n"
-                message_text += "\n"
-            
-            message_text += "Document context information is available for processing."
-            
-            # Create workflow message
-            message_data = {
-                "workflowId": workflow.id,
-                "role": "assistant",
-                "message": message_text,
-                "status": "step",
-                "sequenceNr": len(workflow.messages) + 1,
-                "publishedAt": get_utc_timestamp(),
-                "documentsLabel": "document_context",
-                "documents": [],  # Empty documents for context message
-                # Add workflow context fields
-                "roundNumber": workflow_context.get('currentRound', 0),
-                "taskNumber": workflow_context.get('currentTask', 0),
-                "actionNumber": workflow_context.get('currentAction', 0),
-                # Add progress status
-                "taskProgress": "pending",
-                "actionProgress": "pending"
-            }
-            
-            message = self.chatInterface.createWorkflowMessage(message_data)
-            if message:
-                workflow.messages.append(message)
-                logger.info(f"Document context message created with {len(documents)} documents")
-            else:
-                logger.error("Failed to create document context message")
-                
-        except Exception as e:
-            logger.error(f"Error creating document context message: {str(e)}")
-
     async def generateTaskActions(self, task_step, workflow, previous_results=None, enhanced_context=None) -> List[TaskAction]:
         """Generate actions for a given task step."""
         try:
@@ -546,25 +472,13 @@ class HandlingTasks:
         
         # Create database log entry for task start in format expected by frontend
         if task_index is not None:
-            if total_tasks is not None:
-                self.chatInterface.createWorkflowLog({
-                    "workflowId": workflow.id,
-                    "message": f"Executing task {task_index}/{total_tasks}",
-                    "type": "info"
-                })
-            else:
-                self.chatInterface.createWorkflowLog({
-                    "workflowId": workflow.id,
-                    "message": f"Executing task {task_index}/?",
-                    "type": "info"
-                })
-            
+
             # Create a task start message for the user
             task_progress = f"{task_index}/{total_tasks}" if total_tasks is not None else str(task_index)
             task_start_message = {
                 "workflowId": workflow.id,
                 "role": "assistant",
-                "message": f"🚀 Starting Task {task_progress}\n\nObjective: {task_step.objective}",
+                "message": f"🚀 **Task {task_progress}**",
                 "status": "step",
                 "sequenceNr": len(workflow.messages) + 1,
                 "publishedAt": get_utc_timestamp(),
@@ -617,11 +531,6 @@ class HandlingTasks:
                 logger.error("No actions defined for task step, aborting task execution")
                 break
             
-            # Create document context message if documents are available
-            available_docs = self.service.getAvailableDocuments(workflow)
-            if available_docs:
-                await self.createDocumentContextMessage(available_docs, workflow)
-            
             action_results = []
             for action_idx, action in enumerate(actions):
                 # Check workflow status before each action execution
@@ -639,18 +548,11 @@ class HandlingTasks:
                 # Log action start in format expected by frontend
                 logger.info(f"Task {task_index} - Starting action {action_number}/{total_actions}")
                 
-                # Create database log entry for action start
-                self.chatInterface.createWorkflowLog({
-                    "workflowId": workflow.id,
-                    "message": f"Task {task_index} - Starting action {action_number}/{total_actions}",
-                    "type": "info"
-                })
-                
                 # Create an action start message for the user
                 action_start_message = {
                     "workflowId": workflow.id,
                     "role": "assistant",
-                    "message": f"⚡ Task {task_index} - Action {action_number}/{total_actions}\n\nMethod: {action.execMethod}.{action.execAction}",
+                    "message": f"⚡ **Action {action_number}/{total_actions}** (Method {action.execMethod}.{action.execAction})",
                     "status": "step",
                     "sequenceNr": len(workflow.messages) + 1,
                     "publishedAt": get_utc_timestamp(),
@@ -694,34 +596,19 @@ class HandlingTasks:
             if success:
                 logger.info(f"=== TASK {task_index or '?'} COMPLETED SUCCESSFULLY: {task_step.objective} ===")
                 
-                # Create database log entry for task completion
-                if total_tasks is not None:
-                    self.chatInterface.createWorkflowLog({
-                        "workflowId": workflow.id,
-                        "message": f"🎯 Task {task_index}/{total_tasks} completed",
-                        "type": "success"
-                    })
-                else:
-                    self.chatInterface.createWorkflowLog({
-                        "workflowId": workflow.id,
-                        "message": f"🎯 Task {task_index}/? completed",
-                        "type": "success"
-                    })
-                
                 # Create a task completion message for the user
                 task_progress = f"{task_index}/{total_tasks}" if total_tasks is not None else str(task_index)
                 
                 # Enhanced completion message with criteria details
-                completion_message = f"🎯 Task {task_progress} Completed Successfully!\n\nObjective: {task_step.objective}\n\nFeedback: {feedback or 'Task completed successfully'}"
+                completion_message = f"🎯 **Task {task_progress}**\n\n✅ {feedback or 'Task completed successfully'}"
                 
                 # Add criteria status if available
                 if hasattr(review_result, 'met_criteria') and review_result.met_criteria:
-                    completion_message += f"\n\n✅ **Success Criteria Met:**\n"
                     for criterion in review_result.met_criteria:
-                        completion_message += f"• {criterion}\n"
+                        completion_message += f"\n• {criterion}\n"
                 
                 if hasattr(review_result, 'quality_score'):
-                    completion_message += f"\n📊 **Quality Score:** {review_result.quality_score}/10"
+                    completion_message += f"\n📊 Score {review_result.quality_score}/10"
                 
                 task_completion_message = {
                     "workflowId": workflow.id,
@@ -740,10 +627,6 @@ class HandlingTasks:
                     "taskProgress": "success"
                 }
                 
-                # Add user-friendly message if available
-                if task_step.userMessage:
-                    task_completion_message["message"] += f"\n\n💬 {task_step.userMessage}"
-                
                 message = self.chatInterface.createWorkflowMessage(task_completion_message)
                 if message:
                     workflow.messages.append(message)
@@ -824,7 +707,7 @@ class HandlingTasks:
                 retry_message = {
                     "workflowId": workflow.id,
                     "role": "assistant",
-                    "message": f"🔄 Task {task_index} requires retry: {review_result.improvements}",
+                    "message": f"🔄 **Task {task_index}** needs retry: {review_result.improvements}",
                     "status": "step",
                     "sequenceNr": len(workflow.messages) + 1,
                     "publishedAt": get_utc_timestamp(),
@@ -843,19 +726,19 @@ class HandlingTasks:
                 continue
             else:
                 logger.error(f"=== TASK {task_index or '?'} FAILED: {task_step.objective} after {attempt+1} attempts ===")
-                
+                task_progress = f"{task_index}/{total_tasks}" if total_tasks is not None else str(task_index)
+
                 # Create user-facing error message for task failure
-                error_message = f"❌ Task {task_index or '?'} - '{task_step.objective}' failed after {attempt+1} attempts\n\n"
-                error_message += f"Objective: {task_step.objective}\n\n"
+                error_message = f"**Task {task_progress}**\n\n❌ '{task_step.objective}' {attempt+1}x failed\n\n"
                 
                 # Add specific error details if available
                 if review_result and hasattr(review_result, 'reason') and review_result.reason:
-                    error_message += f"Reason: {review_result.reason}\n\n"
+                    error_message += f"{review_result.reason}\n\n"
                 
                 # Add criteria progress information if available
                 if retry_context and hasattr(retry_context, 'criteria_progress'):
                     progress = retry_context.criteria_progress
-                    error_message += f"📊 **Progress Summary:**\n"
+                    error_message += f"📊 **Details**\n"
                     if progress.get('met_criteria'):
                         error_message += f"✅ Met criteria: {', '.join(progress['met_criteria'])}\n"
                     if progress.get('unmet_criteria'):
@@ -908,19 +791,18 @@ class HandlingTasks:
         logger.error(f"=== TASK {task_index or '?'} FAILED AFTER ALL RETRIES: {task_step.objective} ===")
         
         # Create user-facing error message for task failure
-        error_message = f"❌ Task {task_index or '?'} - '{task_step.objective}' failed after all retries\n\n"
-        error_message += f"Objective: {task_step.objective}\n\n"
+        error_message = f"**Task {task_index or '?'}**\n\n❌ '{task_step.objective}' failed after all retries\n\n"
+        error_message += f"{task_step.objective}\n\n"
         
         # Add specific error details if available
         if retry_context and hasattr(retry_context, 'previous_review_result') and retry_context.previous_review_result:
             reason = retry_context.previous_review_result.get('reason', '')
             if reason and reason != "Task failed after all retries.":
-                error_message += f"Reason: {reason}\n\n"
+                error_message += f"{reason}\n\n"
         
         # Add retry information
         error_message += f"Retries attempted: {retry_context.retry_count if retry_context else 'Unknown'}\n"
-        error_message += f"Status: Task failed permanently\n\n"
-        error_message += "Please check the connection and try again, or contact support if the issue persists."
+        error_message += f"Status: Task failed permanently"
         
         # Create workflow message for user
         message_data = {
@@ -1170,7 +1052,8 @@ class HandlingTasks:
                 processingTime=createdAction.get("processingTime"),
                 timestamp=float(createdAction.get("timestamp", get_utc_timestamp())),
                 result=createdAction.get("result"),
-                resultDocuments=createdAction.get("resultDocuments", [])
+                resultDocuments=createdAction.get("resultDocuments", []),
+                userMessage=createdAction.get("userMessage")
             )
             
         except Exception as e:
@@ -1241,20 +1124,6 @@ class HandlingTasks:
                 # Log action results
                 logger.info(f"Action completed successfully")
                 
-                # Create database log entry for action completion
-                if total_actions is not None:
-                    self.chatInterface.createWorkflowLog({
-                        "workflowId": workflow.id,
-                        "message": f"✅ Task {task_num} - Action {action_num}/{total_actions} completed",
-                        "type": "success"
-                    })
-                else:
-                    self.chatInterface.createWorkflowLog({
-                        "workflowId": workflow.id,
-                        "message": f"✅ Task {task_num} - Action {action_num}/? completed",
-                        "type": "success"
-                    })
-                
                 if created_documents:
                     logger.info(f"Output documents ({len(created_documents)}):")
                     for i, doc in enumerate(created_documents):
@@ -1276,19 +1145,12 @@ class HandlingTasks:
                 await self.createActionMessage(action, result, workflow, result_label, [], task_step, task_index)
                 
                 # Create database log entry for action failure
-                if total_actions is not None:
-                    self.chatInterface.createWorkflowLog({
-                        "workflowId": workflow.id,
-                        "message": f"❌ Task {task_num} - Action {action_num}/{total_actions} failed: {result.error}",
-                        "type": "error"
-                    })
-                else:
-                    self.chatInterface.createWorkflowLog({
-                        "workflowId": workflow.id,
-                        "message": f"❌ Task {task_num} - Action {action_num}/? failed: {result.error}",
-                        "type": "error"
-                    })
-            
+                self.chatInterface.createWorkflowLog({
+                    "workflowId": workflow.id,
+                    "message": f"❌ **Task {task_num}**\n\n❌ **Action {action_num}/{total_actions}** failed: {result.error}",
+                    "type": "error"
+                })
+
             # Log action summary
             logger.info(f"=== TASK {task_num} ACTION {action_num} COMPLETED ===")
             
@@ -1336,89 +1198,25 @@ class HandlingTasks:
             
             # Create a more meaningful message that includes task context
             task_objective = task_step.objective if task_step else 'Unknown task'
-            
+
+            # Add comprehensive workflow context
+            current_round = workflow_context.get('currentRound', 0)
+            current_task = workflow_context.get('currentTask', 0)
+            total_tasks = workflow_stats.get('totalTasks', 0)
+            current_action = workflow_context.get('currentAction', 0)
+            total_actions = workflow_stats.get('totalActions', 0)
+
             # Build a user-friendly message based on success/failure
             if result.success:
-                if created_documents and len(created_documents) > 0:
-                    doc_names = [doc.fileName for doc in created_documents[:3]]
-                    if len(created_documents) > 3:
-                        doc_names.append(f"... and {len(created_documents) - 3} more")
-                    
-                    # Enhanced message with workflow context
-                    message_text = f"✅ **Task {task_index or '?'} - Action {action.execMethod}.{action.execAction} Completed**\n\n"
-                    message_text += f"**Objective:** {task_objective}\n\n"
-                    message_text += f"**Generated {len(created_documents)} document(s):** {', '.join(doc_names)}\n\n"
-                    message_text += f"**Result Label:** {result_label}\n"
-                    
-                    # Add comprehensive workflow context
-                    current_round = workflow_context.get('currentRound', 0)
-                    current_task = workflow_context.get('currentTask', 0)
-                    total_tasks = workflow_stats.get('totalTasks', 0)
-                    current_action = workflow_context.get('currentAction', 0)
-                    total_actions = workflow_stats.get('totalActions', 0)
-                    
-                    message_text += f"**Workflow Context:**\n"
-                    message_text += f"- Round: {current_round}\n"
-                    if total_tasks > 0:
-                        message_text += f"- Task: {current_task}/{total_tasks}\n"
-                    else:
-                        message_text += f"- Task: {current_task}\n"
-                    if total_actions > 0:
-                        message_text += f"- Action: {current_action}/{total_actions}\n"
-                    else:
-                        message_text += f"- Action: {current_action}\n"
-                    message_text += f"- Status: {workflow_stats.get('workflowStatus', 'unknown')}"
-                else:
-                    message_text = f"✅ **Task {task_index or '?'} - Action {action.execMethod}.{action.execAction} Completed**\n\n"
-                    message_text += f"**Objective:** {task_objective}\n\n"
-                    message_text += "**Action executed successfully**\n\n"
-                    message_text += f"**Result Label:** {result_label}\n"
-                    
-                    # Add comprehensive workflow context
-                    current_round = workflow_context.get('currentRound', 0)
-                    current_task = workflow_context.get('currentTask', 0)
-                    total_tasks = workflow_stats.get('totalTasks', 0)
-                    current_action = workflow_context.get('currentAction', 0)
-                    total_actions = workflow_stats.get('totalActions', 0)
-                    
-                    message_text += f"**Workflow Context:**\n"
-                    message_text += f"- Round: {current_round}\n"
-                    if total_tasks > 0:
-                        message_text += f"- Task: {current_task}/{total_tasks}\n"
-                    else:
-                        message_text += f"- Task: {current_task}\n"
-                    if total_actions > 0:
-                        message_text += f"- Action: {current_action}/{total_actions}\n"
-                    else:
-                        message_text += f"- Action: {current_action}\n"
-                    message_text += f"- Status: {workflow_stats.get('workflowStats', 'unknown')}"
+                message_text = f"**Action {current_action}/{total_actions} ({action.execMethod}.{action.execAction})**\n\n"
+                message_text += f"✅ {task_objective}\n\n"
             else:
                 # ⚠️ FAILURE MESSAGE - Show error details to user
                 error_details = result.error if result.error else "Unknown error occurred"
-                message_text = f"❌ **Task {task_index or '?'} - Action {action.execMethod}.{action.execAction} Failed**\n\n"
-                message_text += f"**Objective:** {task_objective}\n\n"
-                message_text += f"**Error:** {error_details}\n\n"
-                message_text += f"**Result Label:** {result_label}\n"
-                
-                # Add comprehensive workflow context
-                current_round = workflow_context.get('currentRound', 0)
-                current_task = workflow_context.get('currentTask', 0)
-                total_tasks = workflow_stats.get('totalTasks', 0)
-                current_action = workflow_context.get('currentAction', 0)
-                total_actions = workflow_stats.get('totalActions', 0)
-                
-                message_text += f"**Workflow Context:**\n"
-                message_text += f"- Round: {current_round}\n"
-                if total_tasks > 0:
-                    message_text += f"- Task: {current_task}/{total_tasks}\n"
-                else:
-                    message_text += f"- Task: {current_task}\n"
-                if total_actions > 0:
-                    message_text += f"- Action: {current_action}/{total_actions}\n"
-                    message_text += f"- Action: {current_action}\n"
-                message_text += f"- Status: {workflow_stats.get('workflowStatus', 'unknown')}\n\n"
-                message_text += "Please check the connection and try again."
-            
+                message_text = f"**Action {current_action}/{total_actions} ({action.execMethod}.{action.execAction})**\n\n"
+                message_text += f"❌ {task_objective}\n\n"
+                message_text += f"{error_details}\n\n"
+                            
             message_data = {
                 "workflowId": workflow.id,
                 "role": "assistant",
@@ -1432,19 +1230,12 @@ class HandlingTasks:
                 "documentsLabel": result_label,
                 "documents": created_documents,
                 # Add workflow context fields - extract from result_label to match document reference
-                "roundNumber": workflow_context.get('currentRound', 0),
-                "taskNumber": task_index,
-                "actionNumber": self._extractActionNumberFromLabel(result_label) if result_label else workflow_context.get('currentAction', 0),
+                "roundNumber": current_round,
+                "taskNumber": current_task,
+                "actionNumber": current_action,
                 "actionProgress": "success" if result.success else "fail"
             }
             
-            # Add user-friendly message if available
-            if action.userMessage:
-                if result.success:
-                    message_data["message"] += f"\n\n💬 {action.userMessage}"
-                else:
-                    message_data["message"] += f"\n\n💬 Action was intended to: {action.userMessage}"
-            
             # Add debugging for error messages
             if not result.success:
                 logger.info(f"Creating ERROR message: {message_text}")
diff --git a/modules/chat/handling/promptFactory.py b/modules/chat/handling/promptFactory.py
index 884606e4..4587cce4 100644
--- a/modules/chat/handling/promptFactory.py
+++ b/modules/chat/handling/promptFactory.py
@@ -34,8 +34,8 @@ INSTRUCTIONS:
 3. Focus on business outcomes, not technical operations
 4. Each task should produce meaningful, usable outputs
 5. Ensure proper handover between tasks using result labels
-6. Generate user-friendly messages for each task in the user's language ({user_language})
-7. Detect the language of the user request and include it in languageUserDetected
+6. Detect the language of the user request and include it in languageUserDetected
+7. Generate user-friendly messages for each task in the user's request language
 8. Return a JSON object with the exact structure shown below
 
 TASK GROUPING PRINCIPLES:
@@ -63,15 +63,15 @@ TASK PLANNING PRINCIPLES:
 - Keep tasks at a meaningful level of abstraction
 - Each task should produce results that can be used by subsequent tasks
 - Ensure clear dependencies and handovers between tasks
-- Provide clear, actionable user messages in the user's language ({user_language})
+- Provide clear, actionable user messages in the user's request language
 - Group related activities to minimize task fragmentation
 - Only create multiple tasks when dealing with truly different, independent objectives
 
 REQUIRED JSON STRUCTURE:
 {{
     "overview": "Brief description of the overall plan",
-    "userMessage": "User-friendly message explaining the task plan in {user_language}",
     "languageUserDetected": "en",  // Language code detected from user request (en, de, fr, it, es, etc.)
+    "userMessage": "User-friendly message explaining the task plan in user's request language",
     "tasks": [
         {{
             "id": "task_1",
@@ -79,7 +79,7 @@ REQUIRED JSON STRUCTURE:
             "dependencies": ["task_0"],  // IDs of tasks that must complete first
             "success_criteria": ["criteria1", "criteria2"],
             "estimated_complexity": "low|medium|high",
-            "userMessage": "User-friendly message explaining what this task will accomplish in {user_language}"
+            "userMessage": "User-friendly message explaining what this task will accomplish in user's request language"
         }}
     ]
 }}
diff --git a/modules/chat/serviceCenter.py b/modules/chat/serviceCenter.py
index 9a37030c..13545001 100644
--- a/modules/chat/serviceCenter.py
+++ b/modules/chat/serviceCenter.py
@@ -350,16 +350,19 @@ class ServiceCenter:
             doc_exchange = None
             if message.documents:
                 if message.actionId and message.documentsLabel:
-                    # Use new document label format
+                    # Validate that we use the same label as in the message
+                    validated_label = self._validateDocumentLabelConsistency(message)
+                    
+                    # Use the message's actual documentsLabel
                     doc_refs = []
                     for doc in message.documents:
                         doc_ref = self.getDocumentReferenceFromChatDocument(doc, message)
                         doc_refs.append(doc_ref)
                     
-                        doc_exchange = DocumentExchange(
-                            documentsLabel=message.documentsLabel,
+                    doc_exchange = DocumentExchange(
+                        documentsLabel=validated_label,
                         documents=doc_refs
-                        )
+                    )
                 else:
                     # Generate new labels for documents without explicit labels
                     doc_refs = []
@@ -444,8 +447,21 @@ class ServiceCenter:
             if document_list["chat"]:
                 context += "CURRENT ROUND DOCUMENTS:\n"
                 for exchange in document_list["chat"]:
-                    # Generate docList reference for the exchange (using message ID)
-                    doc_list_ref = f"docList:{exchange.documentsLabel}"
+                    # Generate docList reference for the exchange (using message ID and label)
+                    # Find the message that corresponds to this exchange
+                    message_id = None
+                    for message in self.workflow.messages:
+                        if hasattr(message, 'documentsLabel') and message.documentsLabel == exchange.documentsLabel:
+                            message_id = message.id
+                            break
+                    
+                    if message_id:
+                        doc_list_ref = f"docList:{message_id}:{exchange.documentsLabel}"
+                    else:
+                        # Fallback to label-only format if message ID not found
+                        doc_list_ref = f"docList:{exchange.documentsLabel}"
+                    
+                    logger.debug(f"Using document label for action planning: {exchange.documentsLabel} (message_id: {message_id})")
                     context += f"- {doc_list_ref} contains:\n"
                     # Generate docItem references for each document in the list
                     for doc_ref in exchange.documents:
@@ -460,8 +476,21 @@ class ServiceCenter:
             if document_list["history"]:
                 context += "WORKFLOW HISTORY DOCUMENTS:\n"
                 for exchange in document_list["history"]:
-                    # Generate docList reference for the exchange (using message ID)
-                    doc_list_ref = f"docList:{exchange.documentsLabel}"
+                    # Generate docList reference for the exchange (using message ID and label)
+                    # Find the message that corresponds to this exchange
+                    message_id = None
+                    for message in self.workflow.messages:
+                        if hasattr(message, 'documentsLabel') and message.documentsLabel == exchange.documentsLabel:
+                            message_id = message.id
+                            break
+                    
+                    if message_id:
+                        doc_list_ref = f"docList:{message_id}:{exchange.documentsLabel}"
+                    else:
+                        # Fallback to label-only format if message ID not found
+                        doc_list_ref = f"docList:{exchange.documentsLabel}"
+                    
+                    logger.debug(f"Using history document label for action planning: {exchange.documentsLabel} (message_id: {message_id})")
                     context += f"- {doc_list_ref} contains:\n"
                     # Generate docItem references for each document in the list
                     for doc_ref in exchange.documents:
@@ -481,6 +510,16 @@ class ServiceCenter:
             logger.error(f"Error generating enhanced document context: {str(e)}")
             return "NO DOCUMENTS AVAILABLE - Error generating document context."
 
+    def _validateDocumentLabelConsistency(self, message) -> str:
+        """Validate that the document label used for references matches the message's actual label"""
+        if not hasattr(message, 'documentsLabel') or not message.documentsLabel:
+            logger.debug(f"Message {message.id} has no documentsLabel, returning None")
+            return None
+            
+        # Simply return the message's actual documentsLabel - no correction, just validation
+        logger.debug(f"Using message's documentsLabel for references: '{message.documentsLabel}'")
+        return message.documentsLabel
+
     def _extractDocumentInfoFromReference(self, doc_ref: str) -> Dict[str, str]:
         """Extract document information from reference string"""
         try:
@@ -569,19 +608,56 @@ class ServiceCenter:
                             if message.documents:
                                 for doc in message.documents:
                                     if doc.id == doc_id:
+                                        doc_name = getattr(doc, 'fileName', 'unknown')
+                                        logger.debug(f"Found docItem reference {doc_ref}: {doc_name}")
                                         all_documents.append(doc)
                                         break
                 elif doc_ref.startswith("docList:"):
-                    # docList:<messageId>:<label> - extract message ID and find document list
+                    # docList:<messageId>:<label> or docList:<label> - extract message ID and find document list
                     parts = doc_ref.split(':')
-                    if len(parts) >= 2:
+                    if len(parts) >= 3:
+                        # Format: docList:<messageId>:<label>
                         message_id = parts[1]
+                        label = parts[2]
                         # Find the message by ID and get all its documents
                         for message in self.workflow.messages:
                             if str(message.id) == message_id:
                                 if message.documents:
+                                    doc_names = [doc.fileName for doc in message.documents if hasattr(doc, 'fileName')]
+                                    logger.debug(f"Found docList reference {doc_ref}: {len(message.documents)} documents - {doc_names}")
                                     all_documents.extend(message.documents)
+                                else:
+                                    logger.debug(f"Found docList reference {doc_ref} but message has no documents")
                                 break
+                    elif len(parts) >= 2:
+                        # Format: docList:<label> - find message by documentsLabel
+                        label = parts[1]
+                        logger.debug(f"Looking for message with documentsLabel: {label}")
+                        # Find messages with matching documentsLabel
+                        matching_messages = []
+                        for message in self.workflow.messages:
+                            # Read documentsLabel from the message attribute (None if the attribute is missing)
+                            msg_label = getattr(message, 'documentsLabel', None)
+                            if msg_label == label:
+                                matching_messages.append(message)
+                                logger.debug(f"Found message {message.id} with matching documentsLabel: {msg_label}")
+                            else:
+                                # Debug: show what labels we're comparing
+                                logger.debug(f"Message {message.id} has documentsLabel: '{msg_label}' (looking for: '{label}')")
+                        
+                        if matching_messages:
+                            # Use the newest message (highest publishedAt)
+                            matching_messages.sort(key=lambda msg: getattr(msg, 'publishedAt', 0), reverse=True)
+                            newest_message = matching_messages[0]
+                            
+                            if newest_message.documents:
+                                doc_names = [doc.fileName for doc in newest_message.documents if hasattr(doc, 'fileName')]
+                                logger.debug(f"Found docList reference {doc_ref}: {len(newest_message.documents)} documents - {doc_names}")
+                                all_documents.extend(newest_message.documents)
+                            else:
+                                logger.debug(f"Found docList reference {doc_ref} but message has no documents")
+                        else:
+                            logger.debug(f"No messages found with documentsLabel: {label}")
                 else:
                     # Direct label reference (round1_task2_action3_contextinfo)
                     # Search for messages with matching documentsLabel to find the actual documents
@@ -619,8 +695,9 @@ class ServiceCenter:
                                 logger.debug(f"Newest message has {len(newest_message.documents) if newest_message.documents else 0} documents")
                                 
                                 if newest_message.documents:
+                                    doc_names = [doc.fileName for doc in newest_message.documents if hasattr(doc, 'fileName')]
+                                    logger.debug(f"Added {len(newest_message.documents)} documents from newest message {newest_message.id}: {doc_names}")
                                     all_documents.extend(newest_message.documents)
-                                    logger.debug(f"Added {len(newest_message.documents)} documents from newest message {newest_message.id}")
                                 else:
                                     logger.debug(f"No documents found in newest message {newest_message.id}")
                             else:
@@ -641,8 +718,9 @@ class ServiceCenter:
                                     
                                     logger.debug(f"Using fallback message {newest_fallback.id} with documentsLabel: {getattr(newest_fallback, 'documentsLabel', 'unknown')}")
                                     if newest_fallback.documents:
+                                        doc_names = [doc.fileName for doc in newest_fallback.documents if hasattr(doc, 'fileName')]
+                                        logger.debug(f"Added {len(newest_fallback.documents)} documents from fallback message {newest_fallback.id}: {doc_names}")
                                         all_documents.extend(newest_fallback.documents)
-                                        logger.debug(f"Added {len(newest_fallback.documents)} documents from fallback message {newest_fallback.id}")
                                     else:
                                         logger.debug(f"No documents found in fallback message {newest_fallback.id}")
                                 else:
diff --git a/modules/methods/methodDocument.py b/modules/methods/methodDocument.py
index 0bad2d67..72d6d81b 100644
--- a/modules/methods/methodDocument.py
+++ b/modules/methods/methodDocument.py
@@ -441,6 +441,10 @@ class MethodDocument(MethodBase):
                 if len(lines) > 2:
                     formatted_content = '\n'.join(lines[1:-1])
             
+            # For HTML format, check if AI returned complete HTML document
+            if extension == ".html" and (formatted_content.startswith('<!DOCTYPE') or formatted_content.startswith('<html')):
+                return formatted_content
+            
             return formatted_content
             
         except Exception as e:
@@ -643,7 +647,22 @@ class MethodDocument(MethodBase):
                 raise Exception("AI report generation failed - AI is required for report generation")
             
             # Clean up the AI response and ensure it's valid HTML
-            if not aiReport.strip().startswith('<html'):
+            aiReport = aiReport.strip()
+
+            # Strip fenced code blocks like ```html ... ``` if present
+            if aiReport.startswith("```") and aiReport.endswith("```"):
+                lines = aiReport.split('\n')
+                if len(lines) >= 2:
+                    # remove first and last fence lines (language tag allowed on first)
+                    aiReport = '\n'.join(lines[1:-1]).strip()
+
+            # Check if AI response starts with DOCTYPE or html tag (complete HTML document)
+            if aiReport.startswith('<!DOCTYPE') or aiReport.startswith('<html'):
+                # AI returned complete HTML document, use it directly
+                return aiReport
+            else:
+                # AI returned HTML content without document structure, wrap it
+                
                 # Check if AI response already contains a title/header
                 has_title = any(title.lower() in aiReport.lower() for title in [title, "outlook", "report", "status"])
                 
@@ -660,9 +679,6 @@ class MethodDocument(MethodBase):
                 html.append(aiReport)
                 html.append("</body></html>")
                 return '\n'.join(html)
-            else:
-                # AI returned complete HTML, use it directly
-                return aiReport
                 
         except Exception as e:
             logger.error(f"Error generating AI report: {str(e)}")
diff --git a/modules/routes/routeWorkflows.py b/modules/routes/routeWorkflows.py
index 95947dde..565052ce 100644
--- a/modules/routes/routeWorkflows.py
+++ b/modules/routes/routeWorkflows.py
@@ -270,15 +270,6 @@ async def get_workflow_messages(
         # Get all messages
         allMessages = interfaceChat.getWorkflowMessages(workflowId)
         
-        # Debug logging: Log attributes for each message
-        logger.debug(f"Retrieved {len(allMessages)} messages for workflow {workflowId}")
-        for i, message in enumerate(allMessages):
-            logger.debug(f"Message {i+1} (ID: {message.id}): {message}")
-            logger.debug(f"  - Type: {getattr(message, 'type', 'N/A')}")
-            logger.debug(f"  - Content: {getattr(message, 'content', 'N/A')[:100]}...")
-            logger.debug(f"  - PublishedAt: {getattr(message, 'publishedAt', 'N/A')}")
-            logger.debug(f"  - All attributes: {message.__dict__}")
-        
         # Apply selective data transfer if messageId is provided
         if messageId:
             # Find the index of the message with the given ID
diff --git a/modules/workflow/managerWorkflow.py b/modules/workflow/managerWorkflow.py
index b30b9c4b..59aa338a 100644
--- a/modules/workflow/managerWorkflow.py
+++ b/modules/workflow/managerWorkflow.py
@@ -141,6 +141,12 @@ class WorkflowManager:
             self.chatManager.handlingTasks._checkWorkflowStopped()
             
             # Create initial message using interface
+            # Generate the correct documentsLabel that matches what getDocumentReferenceList() will create
+            round_num = workflow.currentRound
+            task_num = 0
+            action_num = 0
+            context_label = f"round{round_num}_task{task_num}_action{action_num}_context"
+            
             messageData = {
                 "workflowId": workflow.id,
                 "role": "user",
@@ -148,7 +154,7 @@ class WorkflowManager:
                 "status": "first",
                 "sequenceNr": 1,
                 "publishedAt": get_utc_timestamp(),
-                "documentsLabel": "workflow_start",
+                "documentsLabel": context_label,
                 "documents": [],
                 # Add workflow context fields
                 "roundNumber": workflow.currentRound,
@@ -390,7 +396,7 @@ class WorkflowManager:
             summary_message = {
                 "workflowId": workflow.id,
                 "role": "assistant",
-                "message": f"Workflow completed successfully. Completed {workflow_result.completed_tasks}/{workflow_result.total_tasks} tasks in {workflow_result.execution_time:.2f} seconds.",
+                "message": f"Workflow completed successfully.",
                 "status": "last",
                 "sequenceNr": len(workflow.messages) + 1,
                 "publishedAt": get_utc_timestamp(),
diff --git a/notes/changelog.txt b/notes/changelog.txt
index 22df65b7..9004403d 100644
--- a/notes/changelog.txt
+++ b/notes/changelog.txt
@@ -2,8 +2,7 @@
 TODO
 
 # System
-- Backend/UI fix Table Connections mit korrekten Token Infos, View jedesmal neu laden im formGeneric
-- model reference diagram for all models. who uses who? --> to see the basic building blocks
+- chat workflow: messages to user in user language
 - neutralizer to activate AND put back placeholders to the returned data
 
 # Tests

From 13bf17cd64efe905d762f5884c34791e0944e24a Mon Sep 17 00:00:00 2001
From: ValueOn AG <p.motsch@valueon.ch>
Date: Tue, 2 Sep 2025 13:09:56 +0200
Subject: [PATCH 12/17] msg cleanup

---
 modules/chat/handling/handlingTasks.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/modules/chat/handling/handlingTasks.py b/modules/chat/handling/handlingTasks.py
index 6138932b..d99521f2 100644
--- a/modules/chat/handling/handlingTasks.py
+++ b/modules/chat/handling/handlingTasks.py
@@ -605,7 +605,7 @@ class HandlingTasks:
                 # Add criteria status if available
                 if hasattr(review_result, 'met_criteria') and review_result.met_criteria:
                     for criterion in review_result.met_criteria:
-                        completion_message += f"\n• {criterion}\n"
+                        completion_message += f"\n• {criterion}"
                 
                 if hasattr(review_result, 'quality_score'):
                     completion_message += f"\n📊 Score {review_result.quality_score}/10"

From ba6bb3d09f0d0415322888b76cd09899005652e6 Mon Sep 17 00:00:00 2001
From: ValueOn AG <p.motsch@valueon.ch>
Date: Tue, 2 Sep 2025 13:43:40 +0200
Subject: [PATCH 13/17] web integration

---
 notes/changelog.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/notes/changelog.txt b/notes/changelog.txt
index 9004403d..5e017239 100644
--- a/notes/changelog.txt
+++ b/notes/changelog.txt
@@ -2,7 +2,7 @@
 TODO
 
 # System
-- chat workflow: messages to user in user language
+- web
 - neutralizer to activate AND put back placeholders to the returned data
 
 # Tests

From 3c1f66cb6d88ae77bce49e64d77a778d54700449 Mon Sep 17 00:00:00 2001
From: ValueOn AG <p.motsch@valueon.ch>
Date: Tue, 2 Sep 2025 18:58:30 +0200
Subject: [PATCH 14/17] web integrated

---
 AI_ENGINE_MIGRATION_PLAN.md                   |  276 +++++
 config.ini                                    |   27 +-
 modules/__init__.py                           |    0
 modules/chat/serviceCenter.py                 |    5 -
 modules/chat/serviceCenter_ai_engine.py       |  266 +++++
 modules/connectors/connectorAiOpenai.py       |   21 +
 ...nector_tavily.py => connectorWebTavily.py} |   79 +-
 modules/engines/aiEngine.py                   |  544 +++++++++
 modules/interfaces/interfaceAiCalls.py        |   22 +-
 modules/interfaces/interfaceAiEngine.py       |  115 ++
 ...face_web_model.py => interfaceWebModel.py} |   29 +-
 modules/interfaces/interfaceWebObjects.py     |  118 ++
 modules/interfaces/interface_web_objects.py   |   46 -
 modules/methods/methodWeb.py                  | 1043 ++++-------------
 modules/methods/method_web.py                 |  197 ----
 .../methods/web/web_search/web_search_base.py |   31 -
 .../web/web_search/web_search_tavily.py       |   70 --
 notes/changelog.txt                           |    8 +-
 requirements.txt                              |   19 +
 test_ai_calls.md                              |  235 ++++
 test_ai_fallback.py                           |  103 ++
 test_methodWeb.py                             |  658 +++++++++++
 test_web_csv_functionality.py                 |  207 ++++
 tests/connectors/test_connector_tavily.py     |   16 +-
 tests/methods/test_method_web.py              |   10 +-
 25 files changed, 2953 insertions(+), 1192 deletions(-)
 create mode 100644 AI_ENGINE_MIGRATION_PLAN.md
 delete mode 100644 modules/__init__.py
 create mode 100644 modules/chat/serviceCenter_ai_engine.py
 rename modules/connectors/{connector_tavily.py => connectorWebTavily.py} (70%)
 create mode 100644 modules/engines/aiEngine.py
 create mode 100644 modules/interfaces/interfaceAiEngine.py
 rename modules/interfaces/{interface_web_model.py => interfaceWebModel.py} (69%)
 create mode 100644 modules/interfaces/interfaceWebObjects.py
 delete mode 100644 modules/interfaces/interface_web_objects.py
 delete mode 100644 modules/methods/method_web.py
 delete mode 100644 modules/methods/web/web_search/web_search_base.py
 delete mode 100644 modules/methods/web/web_search/web_search_tavily.py
 create mode 100644 test_ai_calls.md
 create mode 100644 test_ai_fallback.py
 create mode 100644 test_methodWeb.py
 create mode 100644 test_web_csv_functionality.py

diff --git a/AI_ENGINE_MIGRATION_PLAN.md b/AI_ENGINE_MIGRATION_PLAN.md
new file mode 100644
index 00000000..71077e6f
--- /dev/null
+++ b/AI_ENGINE_MIGRATION_PLAN.md
@@ -0,0 +1,276 @@
+# AI Engine Migration Plan
+
+## Overview
+This document outlines the migration strategy from the current AI call system to the new Smart AI Engine architecture.
+
+## Benefits of the New Architecture
+
+### 1. **Separation of Concerns**
+- Applications no longer need to worry about content size limits
+- Centralized AI model selection and failover
+- Intelligent content reduction strategies
+
+### 2. **Improved Reliability**
+- Automatic handling of "content too large" errors
+- Multiple fallback strategies
+- Model-specific optimization
+
+### 3. **Better Performance**
+- Optimal model selection based on content characteristics
+- Intelligent chunking and processing strategies
+- Reduced API costs through smart model selection
+
+### 4. **Enhanced Maintainability**
+- Single point of AI logic
+- Easy to add new models and strategies
+- Consistent error handling
+
+## Migration Phases
+
+### Phase 1: Infrastructure Setup (Week 1-2)
+1. **Create AI Engine Interface**
+   - ✅ `interfaceAiEngine.py` - Core interfaces and data structures
+   - ✅ `aiEngine.py` - Smart AI Engine implementation
+   - ✅ `serviceCenter_ai_engine.py` - ServiceCenter integration
+
+2. **Update Dependencies**
+   - Add new imports to existing modules
+   - Update configuration for AI model selection
+   - Add logging for AI engine operations
+
+### Phase 2: ServiceCenter Integration (Week 3)
+1. **Update ServiceCenter Class**
+   ```python
+   # Add to ServiceCenter.__init__
+   self.ai_engine = ServiceCenterAIEngine(self)
+   
+   # Replace existing AI methods
+   async def callAiTextAdvanced(self, prompt: str, context: str = None) -> str:
+       return await self.ai_engine.callAiTextAdvanced(prompt, context)
+   
+   async def callAiTextBasic(self, prompt: str, context: str = None) -> str:
+       return await self.ai_engine.callAiTextBasic(prompt, context)
+   
+   async def extractContentFromDocument(self, prompt: str, document: ChatDocument) -> str:
+       return await self.ai_engine.extractContentFromDocument(prompt, document)
+   
+   async def summarizeChat(self, messages: List[ChatMessage]) -> str:
+       return await self.ai_engine.summarizeChat(messages)
+   ```
+
+2. **Add New Document-Aware Methods**
+   ```python
+   async def callAiWithDocuments(
+       self,
+       prompt: str,
+       documents: List[ChatDocument] = None,
+       operation_type: str = "general"
+   ) -> str:
+       return await self.ai_engine.callAiWithDocuments(
+           prompt, documents, operation_type=operation_type
+       )
+   ```
+
+### Phase 3: Method Updates (Week 4-5)
+1. **Update methodWeb.py**
+   ```python
+   # Before
+   web_scrape_result = await web_interface.scrape(web_scrape_request)
+   
+   # After - no changes needed, but can be enhanced
+   # The AI engine will automatically handle large content
+   ```
+
+2. **Update methodDocument.py**
+   ```python
+   # Before
+   formatted_content = await self.service.callAiTextBasic(ai_prompt, content)
+   
+   # After
+   formatted_content = await self.service.callAiForReportGeneration(
+       prompt=ai_prompt,
+       documents=chat_documents
+   )
+   ```
+
+3. **Update MethodAi.py**
+   ```python
+   # Before
+   result = await self.service.callAiTextAdvanced(enhanced_prompt, context)
+   
+   # After
+   result = await self.service.callAiWithDocuments(
+       prompt=enhanced_prompt,
+       documents=document_list,
+       operation_type="ai_processing"
+   )
+   ```
+
+4. **Update MethodOutlook.py**
+   ```python
+   # Before
+   composed_email = await self.service.interfaceAiCalls.callAiTextAdvanced(ai_prompt)
+   
+   # After
+   composed_email = await self.service.callAiForEmailComposition(
+       prompt=ai_prompt,
+       documents=attached_documents
+   )
+   ```
+
+### Phase 4: Task Handling Updates (Week 6)
+1. **Update handlingTasks.py**
+   ```python
+   # Before
+   prompt = await self.service.callAiTextAdvanced(task_planning_prompt)
+   
+   # After
+   prompt = await self.service.callAiForTaskPlanning(
+       prompt=task_planning_prompt,
+       documents=available_documents,
+       context=workflow_context
+   )
+   ```
+
+2. **Update promptFactory.py**
+   ```python
+   # Before
+   messageSummary = await service.summarizeChat(context.workflow.messages)
+   
+   # After - no changes needed, method signature stays the same
+   # But internally uses the new AI engine
+   ```
+
+### Phase 5: Testing and Optimization (Week 7-8)
+1. **Unit Tests**
+   - Test AI engine with various content sizes
+   - Test fallback strategies
+   - Test model selection logic
+
+2. **Integration Tests**
+   - Test with real documents of various sizes
+   - Test error scenarios
+   - Test performance improvements
+
+3. **Performance Monitoring**
+   - Monitor AI call success rates
+   - Monitor processing times
+   - Monitor cost savings
+
+## Code Changes Required
+
+### 1. ServiceCenter Updates
+```python
+# Add to ServiceCenter.__init__
+from modules.chat.serviceCenter_ai_engine import ServiceCenterAIEngine
+self.ai_engine = ServiceCenterAIEngine(self)
+
+# Update existing methods to use AI engine
+async def callAiTextAdvanced(self, prompt: str, context: str = None) -> str:
+    return await self.ai_engine.callAiTextAdvanced(prompt, context)
+
+async def callAiTextBasic(self, prompt: str, context: str = None) -> str:
+    return await self.ai_engine.callAiTextBasic(prompt, context)
+
+async def extractContentFromDocument(self, prompt: str, document: ChatDocument) -> str:
+    return await self.ai_engine.extractContentFromDocument(prompt, document)
+
+async def summarizeChat(self, messages: List[ChatMessage]) -> str:
+    return await self.ai_engine.summarizeChat(messages)
+```
+
+### 2. Method Updates (Optional Enhancements)
+```python
+# Enhanced method calls with document awareness
+async def process_documents_with_ai(self, prompt: str, documents: List[ChatDocument]):
+    return await self.service.callAiWithDocuments(
+        prompt=prompt,
+        documents=documents,
+        operation_type="document_processing"
+    )
+```
+
+### 3. Configuration Updates
+```ini
+# Add to config.ini
+[AI_ENGINE]
+DEFAULT_MODEL=anthropic_claude
+FALLBACK_MODEL=openai_gpt35
+MAX_CONTENT_SIZE=100000
+ENABLE_CONTENT_REDUCTION=true
+CONTENT_REDUCTION_THRESHOLD=0.8
+```
+
+## Backward Compatibility
+
+### 1. **Method Signatures**
+- All existing method signatures remain unchanged
+- Internal implementation uses new AI engine
+- No breaking changes for existing code
+
+### 2. **Error Handling**
+- Same error types and messages
+- Enhanced error recovery with fallback strategies
+- Better error reporting with processing details
+
+### 3. **Performance**
+- Same or better performance
+- Automatic optimization based on content
+- Reduced API costs through smart model selection
+
+## Risk Mitigation
+
+### 1. **Gradual Rollout**
+- Deploy with feature flags
+- A/B testing with a subset of users
+- Rollback capability
+
+### 2. **Monitoring**
+- Comprehensive logging of AI engine operations
+- Performance metrics tracking
+- Error rate monitoring
+
+### 3. **Fallback Strategy**
+- Keep original AI call methods as backup
+- Automatic fallback to original methods on errors
+- Manual override capability
+
+## Expected Benefits
+
+### 1. **Immediate Benefits**
+- Elimination of "content too large" errors
+- Better handling of large documents
+- Improved user experience
+
+### 2. **Long-term Benefits**
+- Easier addition of new AI models
+- Better cost optimization
+- Enhanced content processing capabilities
+- Improved system reliability
+
+### 3. **Developer Benefits**
+- Simplified AI integration
+- No need to worry about content size limits
+- Consistent AI behavior across the system
+- Better debugging and monitoring
+
+## Success Metrics
+
+### 1. **Error Reduction**
+- 90% reduction in "content too large" errors
+- 50% reduction in AI call failures
+- 95% success rate for document processing
+
+### 2. **Performance Improvement**
+- 20% faster processing for large documents
+- 30% reduction in API costs
+- 50% reduction in retry attempts
+
+### 3. **User Experience**
+- Faster response times
+- More reliable document processing
+- Better content extraction quality
+
+## Conclusion
+
+The new AI Engine architecture provides a robust, scalable solution for handling AI calls with large content. The migration can be done gradually with full backward compatibility, ensuring minimal risk while providing significant benefits in reliability, performance, and maintainability.
diff --git a/config.ini b/config.ini
index 0ba1e0bf..9c529400 100644
--- a/config.ini
+++ b/config.ini
@@ -36,20 +36,6 @@ Security_LOCK_DURATION_MINUTES = 30
 # Content Neutralization configuration
 Content_Neutralization_ENABLED = False
 
-# Agent Webcrawler configuration
-Agent_Webcrawler_SERPAPI_ENGINE = google
-Agent_Webcrawler_SERPAPI_APIKEY = 7304bd34bca767aa52dd3233297e30a9edc0abc57871f702b3f8238b9d3ee7bc
-Agent_Webcrawler_SERPAPI_MAX_URLS = 3
-Agent_Webcrawler_SERPAPI_MAX_SEARCH_KEYWORDS = 3
-Agent_Webcrawler_SERPAPI_MAX_SEARCH_RESULTS = 5
-Agent_Webcrawler_SERPAPI_TIMEOUT = 10
-Agent_Webcrawler_SERPAPI_USER_AGENT = Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36
-
-# Agent Coder configuration
-Agent_Coder_INSTALL_TIMEOUT = 180
-Agent_Coder_EXECUTION_TIMEOUT = 60
-Agent_Coder_EXECUTION_RETRY = 5
-
 # Agent Mail configuration
 Service_MSFT_CLIENT_ID = c7e7112d-61dc-4f3a-8cd3-08cc4cd7504c
 Service_MSFT_CLIENT_SECRET = Kxf8Q~2lJIteZ~JaI32kMf1lfaWKATqxXiNiFbzV
@@ -58,3 +44,16 @@ Service_MSFT_TENANT_ID = common
 # Google Service configuration
 Service_GOOGLE_CLIENT_ID = 354925410565-aqs2b2qaiqmm73qpjnel6al8eid78uvg.apps.googleusercontent.com
 Service_GOOGLE_CLIENT_SECRET = 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
+
+# Tavily Web Search configuration
+Connector_WebTavily_API_KEY = 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
+
+# Web Search configuration
+Web_Search_MAX_QUERY_LENGTH = 400
+Web_Search_MAX_RESULTS = 20
+Web_Search_MIN_RESULTS = 1
+
+# Web Crawl configuration
+Web_Crawl_TIMEOUT = 30
+Web_Crawl_MAX_RETRIES = 3
+Web_Crawl_RETRY_DELAY = 2
\ No newline at end of file
diff --git a/modules/__init__.py b/modules/__init__.py
deleted file mode 100644
index e69de29b..00000000
diff --git a/modules/chat/serviceCenter.py b/modules/chat/serviceCenter.py
index 13545001..703531f0 100644
--- a/modules/chat/serviceCenter.py
+++ b/modules/chat/serviceCenter.py
@@ -283,7 +283,6 @@ class ServiceCenter:
                     methodList.append(signature)
         return methodList
 
-        
     def generateDocumentLabel(self, document: ChatDocument, message: ChatMessage) -> str:
         """Generate new document label: round+task+action+filename.extension"""
         try:
@@ -1302,10 +1301,6 @@ Please provide a comprehensive summary of this conversation."""
             except Exception as e:
                 logger.error(f"Error refreshing file attributes for document {doc.id}: {e}")
 
-    # Note: Workflow progress update methods have been moved to handlingTasks.py
-    # where they belong since that's where the actual workflow execution happens
-    # This avoids circular import issues between ServiceCenter and ChatInterface
-
     def diagnoseDocumentAccess(self, document: ChatDocument) -> Dict[str, Any]:
         """
         Diagnose document access issues and provide recovery information.
diff --git a/modules/chat/serviceCenter_ai_engine.py b/modules/chat/serviceCenter_ai_engine.py
new file mode 100644
index 00000000..a33a5813
--- /dev/null
+++ b/modules/chat/serviceCenter_ai_engine.py
@@ -0,0 +1,266 @@
+"""
+ServiceCenter integration with Smart AI Engine
+"""
+
+import logging
+from typing import List, Dict, Any, Optional
+from modules.interfaces.interfaceChatModel import ChatDocument
+from modules.interfaces.interfaceAiEngine import (
+    AIRequest, AIResponse, AIModelType, ProcessingStrategy, 
+    ContentReductionStrategy
+)
+from modules.engines.aiEngine import SmartAIEngine
+
+logger = logging.getLogger(__name__)
+
+
+class ServiceCenterAIEngine:
+    """Facade that routes ServiceCenter AI calls through the Smart AI Engine"""
+
+    def __init__(self, service_center):
+        self.service_center = service_center
+        self.ai_engine = SmartAIEngine(service_center)
+
+    async def callAiWithDocuments(
+        self,
+        prompt: str,
+        documents: Optional[List[ChatDocument]] = None,
+        context: Optional[str] = None,
+        preferred_model: Optional[AIModelType] = None,
+        operation_type: str = "general",
+        processing_strategy: Optional[ProcessingStrategy] = None,
+        reduction_strategy: Optional[ContentReductionStrategy] = None,
+        **kwargs
+    ) -> str:
+        """
+        Unified AI call method that handles documents and prompts separately
+
+        Args:
+            prompt: The AI prompt
+            documents: List of documents to process (None is treated as an empty list)
+            context: Additional context
+            preferred_model: Preferred AI model
+            operation_type: Type of operation (for strategy selection)
+            processing_strategy: Explicit processing strategy
+            reduction_strategy: Explicit content reduction strategy
+            **kwargs: Additional parameters, merged into the request metadata
+
+        Returns:
+            AI response content
+
+        Raises:
+            Exception: If the engine reports failure or the request itself fails
+        """
+        try:
+            # Create AI request
+            request = AIRequest(
+                prompt=prompt,
+                documents=documents or [],
+                context=context,
+                preferred_model=preferred_model,
+                processing_strategy=processing_strategy,
+                reduction_strategy=reduction_strategy,
+                metadata={
+                    "operation_type": operation_type,
+                    **kwargs
+                }
+            )
+
+            response = await self.ai_engine.process_request(request)
+            if response.success:
+                return response.content
+            raise Exception(f"AI processing failed: {response.error}")
+
+        except Exception as e:
+            logger.error(f"Error in AI call with documents: {str(e)}")
+            raise  # bare raise keeps the original traceback intact
+
+    # Convenience methods for different operation types
+
+    async def callAiForTaskPlanning(
+        self,
+        prompt: str,
+        documents: Optional[List[ChatDocument]] = None,
+        context: Optional[str] = None
+    ) -> str:
+        """AI call optimized for task planning"""
+        return await self.callAiWithDocuments(
+            prompt=prompt,
+            documents=documents,
+            context=context,
+            operation_type="task_planning",
+            preferred_model=AIModelType.ANTHROPIC_CLAUDE  # Better for complex planning
+        )
+
+    async def callAiForActionDefinition(
+        self,
+        prompt: str,
+        documents: Optional[List[ChatDocument]] = None,
+        context: Optional[str] = None
+    ) -> str:
+        """AI call optimized for action definition"""
+        return await self.callAiWithDocuments(
+            prompt=prompt,
+            documents=documents,
+            context=context,
+            operation_type="action_definition",
+            preferred_model=AIModelType.ANTHROPIC_CLAUDE
+        )
+
+    async def callAiForDocumentExtraction(
+        self,
+        prompt: str,
+        documents: List[ChatDocument],
+        context: Optional[str] = None
+    ) -> str:
+        """AI call optimized for document extraction (one document at a time)"""
+        return await self.callAiWithDocuments(
+            prompt=prompt,
+            documents=documents,
+            context=context,
+            operation_type="document_extraction",
+            processing_strategy=ProcessingStrategy.DOCUMENT_BY_DOCUMENT
+        )
+
+    async def callAiForReportGeneration(
+        self,
+        prompt: str,
+        documents: List[ChatDocument],
+        context: Optional[str] = None
+    ) -> str:
+        """AI call optimized for report generation (chunked processing)"""
+        return await self.callAiWithDocuments(
+            prompt=prompt,
+            documents=documents,
+            context=context,
+            operation_type="report_generation",
+            processing_strategy=ProcessingStrategy.CHUNKED_PROCESSING
+        )
+
+    async def callAiForEmailComposition(
+        self,
+        prompt: str,
+        documents: Optional[List[ChatDocument]] = None,
+        context: Optional[str] = None
+    ) -> str:
+        """AI call optimized for email composition"""
+        return await self.callAiWithDocuments(
+            prompt=prompt,
+            documents=documents,
+            context=context,
+            operation_type="email_composition",
+            preferred_model=AIModelType.OPENAI_GPT4  # Better for creative writing
+        )
+
+    async def callAiForChatSummarization(
+        self,
+        prompt: str,
+        documents: Optional[List[ChatDocument]] = None,
+        context: Optional[str] = None
+    ) -> str:
+        """AI call optimized for chat summarization (documents are summarized first)"""
+        return await self.callAiWithDocuments(
+            prompt=prompt,
+            documents=documents,
+            context=context,
+            operation_type="chat_summarization",
+            processing_strategy=ProcessingStrategy.SUMMARIZED_CONTENT
+        )
+
+    async def callAiForImageAnalysis(
+        self,
+        prompt: str,
+        documents: List[ChatDocument],
+        context: Optional[str] = None
+    ) -> str:
+        """AI call optimized for image analysis (requires_vision is passed as request metadata)"""
+        return await self.callAiWithDocuments(
+            prompt=prompt,
+            documents=documents,
+            context=context,
+            operation_type="image_analysis",
+            preferred_model=AIModelType.OPENAI_VISION,
+            requires_vision=True
+        )
+
+    # Backward compatibility methods
+
+    async def callAiTextAdvanced(self, prompt: str, context: Optional[str] = None) -> str:
+        """Backward compatibility method"""
+        return await self.callAiWithDocuments(
+            prompt=prompt,
+            context=context,
+            operation_type="general",
+            preferred_model=AIModelType.ANTHROPIC_CLAUDE
+        )
+
+    async def callAiTextBasic(self, prompt: str, context: Optional[str] = None) -> str:
+        """Backward compatibility method"""
+        return await self.callAiWithDocuments(
+            prompt=prompt,
+            context=context,
+            operation_type="general",
+            preferred_model=AIModelType.OPENAI_GPT35
+        )
+
+    async def callAiImageBasic(self, prompt: str, image_data: str, mime_type: str) -> str:
+        """Backward compatibility method for image processing"""
+        # Create a document from image data
+        image_doc = self.service_center.createDocument(
+            "image_analysis.jpg",
+            mime_type,
+            image_data,
+            base64encoded=True
+        )
+
+        return await self.callAiForImageAnalysis(
+            prompt=prompt,
+            documents=[image_doc]
+        )
+
+    async def extractContentFromDocument(self, prompt: str, document: ChatDocument) -> str:
+        """Extract document content via the AI engine, falling back to the document processor"""
+        try:
+            return await self.callAiForDocumentExtraction(
+                prompt=prompt,
+                documents=[document]
+            )
+        except Exception as e:
+            logger.error(f"Error in enhanced document extraction: {str(e)}")
+            # Fall back to the original extraction path through the ServiceCenter's
+            # document processor when the AI engine call fails
+            extracted = await self.service_center.documentProcessor.processFileData(
+                fileData=self.service_center.getFileData(document.fileId),
+                fileName=document.fileName,
+                mimeType=document.mimeType,
+                prompt=prompt,
+                documentId=document.id
+            )
+            if extracted and extracted.contents:
+                return "\n".join([item.data for item in extracted.contents])
+            return ""
+
+    async def summarizeChat(self, messages: List) -> str:
+        """Summarize chat messages via the AI engine, falling back to callAiTextBasic on error"""
+        # Built before the try block so the fallback below can always reference it
+        chat_content = "\n".join([f"{msg.role}: {msg.message}" for msg in messages if hasattr(msg, 'message')])
+        try:
+
+            # Create a document from chat content
+            chat_doc = self.service_center.createDocument(
+                "chat_history.txt",
+                "text/plain",
+                chat_content,
+                base64encoded=False
+            )
+
+            return await self.callAiForChatSummarization(
+                prompt="Summarize this chat conversation, focusing on key decisions, outcomes, and next steps.",
+                documents=[chat_doc]
+            )
+        except Exception as e:
+            logger.error(f"Error in enhanced chat summarization: {str(e)}")
+            # Fall back to original method
+            return await self.service_center.callAiTextBasic(
+                f"Summarize this chat conversation: {chat_content}"
+            )
diff --git a/modules/connectors/connectorAiOpenai.py b/modules/connectors/connectorAiOpenai.py
index b81991d3..4a9f4888 100644
--- a/modules/connectors/connectorAiOpenai.py
+++ b/modules/connectors/connectorAiOpenai.py
@@ -8,6 +8,10 @@ from modules.shared.configuration import APP_CONFIG
 # Configure logger
 logger = logging.getLogger(__name__)
 
+class ContextLengthExceededException(Exception):
+    """Raised when the OpenAI API rejects a request because it exceeds the model's context length"""
+    pass
+
 def loadConfigData():
     """Load configuration data for OpenAI connector"""
     return {
@@ -75,12 +79,29 @@ class AiOpenai:
             
             if response.status_code != 200:
                 logger.error(f"OpenAI API error: {response.status_code} - {response.text}")
+                
+                # Check for context length exceeded error
+                if response.status_code == 400:
+                    try:
+                        error_data = response.json()
+                        if (error_data.get("error", {}).get("code") == "context_length_exceeded" or
+                            "context length" in error_data.get("error", {}).get("message", "").lower()):
+                            # Raise a specific exception for context length issues
+                            raise ContextLengthExceededException(
+                                f"Context length exceeded: {error_data.get('error', {}).get('message', 'Unknown error')}"
+                            )
+                    except (ValueError, KeyError):
+                        pass  # If we can't parse the error, fall through to generic error
+                
                 raise HTTPException(status_code=500, detail="Error communicating with OpenAI API")
             
             responseJson = response.json()
             content = responseJson["choices"][0]["message"]["content"]
             return content
             
+        except ContextLengthExceededException:
+            # Re-raise context length exceptions without wrapping
+            raise
         except Exception as e:
             logger.error(f"Error calling OpenAI API: {str(e)}")
             raise HTTPException(status_code=500, detail=f"Error calling OpenAI API: {str(e)}")
diff --git a/modules/connectors/connector_tavily.py b/modules/connectors/connectorWebTavily.py
similarity index 70%
rename from modules/connectors/connector_tavily.py
rename to modules/connectors/connectorWebTavily.py
index 8a05e781..7a9ec038 100644
--- a/modules/connectors/connector_tavily.py
+++ b/modules/connectors/connectorWebTavily.py
@@ -3,7 +3,7 @@
 import logging
 import os
 from dataclasses import dataclass
-from modules.interfaces.interface_web_model import (
+from modules.interfaces.interfaceWebModel import (
     WebCrawlBase,
     WebCrawlDocumentData,
     WebCrawlRequest,
@@ -22,16 +22,35 @@ from modules.interfaces.interface_web_model import (
     WebSearchResultItem,
     WebCrawlActionDocument,
     WebCrawlActionResult,
+    get_web_search_min_results,
+    get_web_search_max_results,
 )
 
 # from modules.interfaces.interfaceChatModel import ActionResult, ActionDocument
 from tavily import AsyncTavilyClient
 from modules.shared.timezoneUtils import get_utc_timestamp
+from modules.shared.configuration import APP_CONFIG
 
 
 logger = logging.getLogger(__name__)
 
 
+# Configuration loading functions
+def get_web_crawl_timeout() -> int:
+    """Return the per-attempt crawl timeout in seconds from Web_Crawl_TIMEOUT (default 30)"""
+    return int(APP_CONFIG.get("Web_Crawl_TIMEOUT", "30"))
+
+
+def get_web_crawl_max_retries() -> int:
+    """Return the number of crawl retries after the first attempt, from Web_Crawl_MAX_RETRIES (default 3)"""
+    return int(APP_CONFIG.get("Web_Crawl_MAX_RETRIES", "3"))
+
+
+def get_web_crawl_retry_delay() -> int:
+    """Return the pause between crawl attempts in seconds, from Web_Crawl_RETRY_DELAY (default 2)"""
+    return int(APP_CONFIG.get("Web_Crawl_RETRY_DELAY", "2"))
+
+
 @dataclass
 class TavilySearchResult:
     title: str
@@ -50,7 +69,10 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase, WebScrapeBase):
 
     @classmethod
     async def create(cls):
-        return cls(client=AsyncTavilyClient(api_key=os.getenv("TAVILY_API_KEY")))
+        api_key = APP_CONFIG.get("Connector_WebTavily_API_KEY")
+        if not api_key:
+            raise ValueError("Tavily API key not configured. Please set Connector_WebTavily_API_KEY in config.ini")
+        return cls(client=AsyncTavilyClient(api_key=api_key))
 
     async def search_urls(self, request: WebSearchRequest) -> WebSearchActionResult:
         """Handles the web search request.
@@ -113,14 +135,14 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase, WebScrapeBase):
     async def _search(self, query: str, max_results: int) -> list[TavilySearchResult]:
         """Calls the Tavily API to perform a web search."""
         # Make sure max_results is within the allowed range
-        if max_results < 0 or max_results > 20:
-            raise ValueError("max_results must be between 0 and 20")
+        min_results = get_web_search_min_results()
+        max_allowed_results = get_web_search_max_results()
+        if max_results < min_results or max_results > max_allowed_results:
+            raise ValueError(f"max_results must be between {min_results} and {max_allowed_results}")
 
         # Perform actual API call
         response = await self.client.search(query=query, max_results=max_results)
 
-        logger.info(f"Tavily API search response:\n{response}")
-
         return [
             TavilySearchResult(title=result["title"], url=result["url"])
             for result in response["results"]
@@ -153,18 +175,41 @@ class ConnectorTavily(WebSearchBase, WebCrawlBase, WebScrapeBase):
         )
 
     async def _crawl(self, urls: list) -> list[TavilyCrawlResult]:
-        """Calls the Tavily API to extract text content from URLs."""
-        response = await self.client.extract(
-            urls=urls, extract_depth="advanced", format="text"
-        )
+        """Calls the Tavily API to extract text content from URLs, retrying on timeout or error."""
+        import asyncio
+
+        max_retries = get_web_crawl_max_retries()
+        retry_delay = get_web_crawl_retry_delay()
+        timeout = get_web_crawl_timeout()
+
+        for attempt in range(max_retries + 1):
+            try:
+                # Bound each attempt with asyncio.wait_for so a hung request times out
+                response = await asyncio.wait_for(
+                    self.client.extract(urls=urls, extract_depth="advanced", format="text"),
+                    timeout=timeout
+                )
 
-        # Log the result
-        logger.info(f"Tavily API extract (crawl) response:\n{response}")
-
-        return [
-            TavilyCrawlResult(url=result["url"], content=result["raw_content"])
-            for result in response["results"]
-        ]
+                return [
+                    TavilyCrawlResult(url=result["url"], content=result["raw_content"])
+                    for result in response["results"]
+                ]
+
+            except asyncio.TimeoutError as e:
+                logger.warning(f"Crawl attempt {attempt + 1} timed out after {timeout} seconds")
+                if attempt < max_retries:
+                    logger.info(f"Retrying in {retry_delay} seconds...")
+                    await asyncio.sleep(retry_delay)
+                else:
+                    raise Exception(f"Crawl failed after {max_retries + 1} attempts due to timeout") from e
+
+            except Exception as e:
+                logger.warning(f"Crawl attempt {attempt + 1} failed: {str(e)}")
+                if attempt < max_retries:
+                    logger.info(f"Retrying in {retry_delay} seconds...")
+                    await asyncio.sleep(retry_delay)
+                else:
+                    raise Exception(f"Crawl failed after {max_retries + 1} attempts: {str(e)}") from e
 
     def _build_crawl_action_result(
         self, crawl_results: list[TavilyCrawlResult], urls: list[str] = None
diff --git a/modules/engines/aiEngine.py b/modules/engines/aiEngine.py
new file mode 100644
index 00000000..f2f74c27
--- /dev/null
+++ b/modules/engines/aiEngine.py
@@ -0,0 +1,544 @@
+"""
+Smart AI Engine with intelligent content management and model selection
+"""
+
+import logging
+import asyncio
+from typing import List, Dict, Any, Optional, Tuple
+from modules.interfaces.interfaceAiEngine import (
+    AIEngine, AIRequest, AIResponse, AIModelType, ProcessingStrategy, 
+    ContentReductionStrategy, ModelCapabilities, ContentReducer
+)
+from modules.interfaces.interfaceChatModel import ChatDocument
+from modules.interfaces.interfaceAiCalls import AiCalls
+from modules.chat.documents.documentExtraction import DocumentExtraction
+from modules.shared.configuration import APP_CONFIG
+
+logger = logging.getLogger(__name__)
+
+
+class SmartAIEngine(AIEngine):
+    """Smart AI Engine with automatic content management and model selection"""
+    
+    def __init__(self, service_center=None):
+        """Create the engine's collaborators and its model/strategy lookup tables"""
+        self.service_center = service_center
+        self.ai_calls = AiCalls()
+        self.document_processor = DocumentExtraction(service_center)
+        self.content_reducer = SmartContentReducer(service_center)
+        # Per-model limits and features, consulted when a model is selected
+        self.model_capabilities = {
+            AIModelType.OPENAI_GPT4: ModelCapabilities(
+                max_tokens=8192,
+                max_input_tokens=128000,
+                supports_vision=False,
+                supports_function_calling=True,
+                cost_per_1k_tokens=0.03,
+                processing_speed="medium"
+            ),
+            AIModelType.OPENAI_GPT35: ModelCapabilities(
+                max_tokens=4096,
+                max_input_tokens=16384,
+                supports_vision=False,
+                supports_function_calling=True,
+                cost_per_1k_tokens=0.002,
+                processing_speed="fast"
+            ),
+            AIModelType.ANTHROPIC_CLAUDE: ModelCapabilities(
+                max_tokens=4096,
+                max_input_tokens=200000,
+                supports_vision=False,
+                supports_function_calling=False,
+                cost_per_1k_tokens=0.015,
+                processing_speed="medium"
+            ),
+            AIModelType.OPENAI_VISION: ModelCapabilities(
+                max_tokens=4096,
+                max_input_tokens=128000,
+                supports_vision=True,
+                supports_function_calling=False,
+                cost_per_1k_tokens=0.01,
+                processing_speed="slow"
+            )
+        }
+
+        # Default processing strategy per metadata "operation_type" value
+        self.strategy_preferences = {
+            "task_planning": ProcessingStrategy.SINGLE_CALL,
+            "action_definition": ProcessingStrategy.SINGLE_CALL,
+            "document_extraction": ProcessingStrategy.DOCUMENT_BY_DOCUMENT,
+            "report_generation": ProcessingStrategy.CHUNKED_PROCESSING,
+            "email_composition": ProcessingStrategy.SINGLE_CALL,
+            "chat_summarization": ProcessingStrategy.SUMMARIZED_CONTENT
+        }
+    
+    async def process_request(self, request: AIRequest) -> AIResponse:
+        """Run an AI request end to end: pick a strategy, estimate size, pick a model, dispatch"""
+        try:
+            # Resolve the strategy first and record it on the request itself
+            chosen_strategy = self._determine_processing_strategy(request)
+            request.processing_strategy = chosen_strategy
+
+            # The token estimate feeds the model selection
+            token_estimate = await self.estimate_token_usage(request)
+            chosen_model = self._select_optimal_model(request, token_estimate)
+
+            # Map the strategy to its handler, then run it with the chosen model
+            if chosen_strategy == ProcessingStrategy.SINGLE_CALL:
+                handler = self._process_single_call
+            elif chosen_strategy == ProcessingStrategy.DOCUMENT_BY_DOCUMENT:
+                handler = self._process_document_by_document
+            elif chosen_strategy == ProcessingStrategy.CHUNKED_PROCESSING:
+                handler = self._process_chunked
+            elif chosen_strategy == ProcessingStrategy.SUMMARIZED_CONTENT:
+                handler = self._process_with_summarization
+            else:
+                raise ValueError(f"Unknown processing strategy: {chosen_strategy}")
+            return await handler(request, chosen_model)
+
+        except Exception as e:
+            # Every failure is reported as an unsuccessful response instead of raising
+            logger.error(f"Error processing AI request: {str(e)}")
+            return AIResponse(
+                success=False,
+                content="",
+                model_used=AIModelType.OPENAI_GPT35,
+                processing_strategy=ProcessingStrategy.SINGLE_CALL,
+                error=str(e)
+            )
+    
+    def _determine_processing_strategy(self, request: AIRequest) -> ProcessingStrategy:
+        """
+        Pick a processing strategy: explicit choice, then operation type, then heuristics
+        """
+
+        # 1) An explicit strategy on the request always wins
+        explicit_strategy = request.processing_strategy
+        if explicit_strategy:
+            return explicit_strategy
+
+        # 2) Otherwise use the configured preference for the operation type, if any
+        request_metadata = request.metadata or {}
+        operation_type = request_metadata.get("operation_type", "general")
+        if operation_type in self.strategy_preferences:
+            return self.strategy_preferences[operation_type]
+
+        # 3) Otherwise decide from the document count and the prompt length
+        document_count = len(request.documents)
+        prompt_chars = len(request.prompt)
+
+        # Zero or one document, or up to three with a short prompt, use one call
+        few_documents = document_count <= 3 and prompt_chars < 1000
+        if document_count <= 1 or few_documents:
+            return ProcessingStrategy.SINGLE_CALL
+
+        # More than five documents are handled one by one; the rest is chunked
+        if document_count > 5:
+            return ProcessingStrategy.DOCUMENT_BY_DOCUMENT
+        return ProcessingStrategy.CHUNKED_PROCESSING
+    
+    def _select_optimal_model(self, request: AIRequest, estimated_tokens: int) -> AIModelType:
+        """
+        Select the AI model for a request.
+
+        A preferred model is used when the estimate fits its input limit. Otherwise the
+        heuristic pick is used only if it meets the token limit and the metadata flags
+        "requires_vision" / "requires_function_calling"; else the cheapest model that does.
+        """
+        if request.preferred_model:
+            capabilities = self.get_model_capabilities(request.preferred_model)
+            if estimated_tokens <= capabilities.max_input_tokens:
+                return request.preferred_model
+
+        metadata = request.metadata or {}
+        requires_vision = metadata.get("requires_vision", False)
+        requires_function_calling = metadata.get("requires_function_calling", False)
+        suitable_models = {
+            model: capabilities
+            for model, capabilities in self.model_capabilities.items()
+            if estimated_tokens <= capabilities.max_input_tokens
+            and (capabilities.supports_vision or not requires_vision)
+            and (capabilities.supports_function_calling or not requires_function_calling)
+        }
+        if not suitable_models:
+            # Nothing qualifies: fall back to the model with the largest input limit
+            best_model = max(self.model_capabilities.items(), key=lambda x: x[1].max_input_tokens)
+            logger.warning(f"No model can handle {estimated_tokens} tokens, using {best_model[0]}")
+            return best_model[0]
+
+        # Prefer Claude for large content, GPT-4 for complex tasks, GPT-3.5 for simple tasks
+        if estimated_tokens > 50000:
+            heuristic_choice = AIModelType.ANTHROPIC_CLAUDE
+        elif metadata.get("complex_task", False):
+            heuristic_choice = AIModelType.OPENAI_GPT4
+        else:
+            heuristic_choice = AIModelType.OPENAI_GPT35
+        if heuristic_choice in suitable_models:
+            return heuristic_choice
+        return min(suitable_models, key=lambda m: suitable_models[m].cost_per_1k_tokens)
+    
+    async def _process_single_call(self, request: AIRequest, model: AIModelType) -> AIResponse:
+        """Process request with a single AI call, reducing content (at most 3 rounds) on size errors"""
+        try:
+            content = await self._prepare_content_for_single_call(request)
+
+            # Every supported text model currently goes through the same AiCalls entry point
+            if model not in (AIModelType.OPENAI_GPT4, AIModelType.OPENAI_GPT35, AIModelType.ANTHROPIC_CLAUDE):
+                raise ValueError(f"Unsupported model for single call: {model}")
+            response = await self.ai_calls.callAiTextAdvanced(content, request.context)
+
+            return AIResponse(
+                success=True,
+                content=response,
+                model_used=model,
+                processing_strategy=ProcessingStrategy.SINGLE_CALL
+            )
+
+        except Exception as e:
+            # Content reduction calls back into this method, so count the rounds in the
+            # request metadata; without a cap a persistent "400" error would recurse forever.
+            metadata = dict(request.metadata or {})
+            rounds = metadata.get("_reduction_rounds", 0)
+            size_error = "too large" in str(e).lower() or "400" in str(e)
+            if not size_error or rounds >= 3:
+                raise
+            request.metadata = {**metadata, "_reduction_rounds": rounds + 1}
+            return await self._process_with_content_reduction(request, model)
+    
+    async def _process_document_by_document(self, request: AIRequest, model: AIModelType) -> AIResponse:
+        """Run the prompt against every document on its own and join the labelled answers"""
+        try:
+            sections = []
+
+            # Documents are handled strictly in order, one request per document
+            for position, document in enumerate(request.documents, start=1):
+                single_request = AIRequest(
+                    prompt=request.prompt,
+                    documents=[document],
+                    context=request.context,
+                    preferred_model=model,
+                    metadata=request.metadata
+                )
+                outcome = await self._process_single_call(single_request, model)
+
+                # An unsuccessful response is reported inline; the batch continues
+                if not outcome.success:
+                    sections.append(f"Document {position} ({document.fileName}): Error - {outcome.error}")
+                    continue
+                sections.append(f"Document {position} ({document.fileName}):\n{outcome.content}")
+
+            # Sections are separated by one empty line
+            combined = "\n\n".join(sections)
+
+            return AIResponse(
+                success=True,
+                content=combined,
+                model_used=model,
+                processing_strategy=ProcessingStrategy.DOCUMENT_BY_DOCUMENT
+            )
+
+        except Exception as e:
+            logger.error(f"Error in document-by-document processing: {str(e)}")
+            return AIResponse(
+                success=False,
+                content="",
+                model_used=model,
+                processing_strategy=ProcessingStrategy.DOCUMENT_BY_DOCUMENT,
+                error=str(e)
+            )
+    
+    async def _process_chunked(self, request: AIRequest, model: AIModelType) -> AIResponse:
+        """Chunked processing entry point; currently delegates to per-document processing"""
+        try:
+            # No dedicated chunking logic exists yet, so every document is
+            # processed separately and the delegate's response is passed through
+            delegated = await self._process_document_by_document(request, model)
+        except Exception as e:
+            logger.error(f"Error in chunked processing: {str(e)}")
+            return AIResponse(
+                success=False,
+                content="",
+                model_used=model,
+                processing_strategy=ProcessingStrategy.CHUNKED_PROCESSING,
+                error=str(e)
+            )
+        return delegated
+    
+    async def _process_with_summarization(self, request: AIRequest, model: AIModelType) -> AIResponse:
+        """Summarize every document first, then answer the prompt from the summaries"""
+        try:
+            # Summaries are awaited one after another, in document order
+            condensed_documents = [
+                await self.content_reducer.summarize_document(
+                    document,
+                    f"Summarize this document for: {request.prompt}"
+                )
+                for document in request.documents
+            ]
+
+            # Same prompt, context and metadata, but summaries instead of originals
+            condensed_request = AIRequest(
+                prompt=request.prompt,
+                documents=condensed_documents,
+                context=request.context,
+                preferred_model=model,
+                metadata=request.metadata
+            )
+
+            # Answer the original prompt from the summaries in one call
+            return await self._process_single_call(condensed_request, model)
+
+        except Exception as e:
+            logger.error(f"Error in summarization processing: {str(e)}")
+            return AIResponse(
+                success=False,
+                content="",
+                model_used=model,
+                processing_strategy=ProcessingStrategy.SUMMARIZED_CONTENT,
+                error=str(e)
+            )
+    
+    async def _process_with_content_reduction(self, request: AIRequest, model: AIModelType) -> AIResponse:
+        """Shrink prompt/documents with the content reducer, then retry as a single call.
+
+        The reduction strategy comes from ``_determine_reduction_strategy`` and the
+        reducer is called with ``target_reduction=0.5``. Any exception is logged and
+        returned as a failed ``AIResponse`` tagged ``SINGLE_CALL``.
+        """
+        try:
+            strategy = self._determine_reduction_strategy(request)
+            reduced_docs, reduced_prompt = await self.content_reducer.reduce_content(
+                request.documents,
+                request.prompt,
+                strategy,
+                target_reduction=0.5,
+            )
+            # Carry max_tokens/temperature over so the derived request keeps the caller's settings.
+            reduced_request = AIRequest(
+                prompt=reduced_prompt,
+                documents=reduced_docs,
+                context=request.context,
+                preferred_model=model,
+                max_tokens=request.max_tokens,
+                temperature=request.temperature,
+                metadata=request.metadata,
+            )
+            return await self._process_single_call(reduced_request, model)
+        except Exception as e:
+            logger.error(f"Error in content reduction processing: {str(e)}")
+            return AIResponse(
+                success=False,
+                content="",
+                model_used=model,
+                processing_strategy=ProcessingStrategy.SINGLE_CALL,
+                error=f"Content reduction failed: {str(e)}",
+            )
+    
+    def _determine_reduction_strategy(self, request: AIRequest) -> ContentReductionStrategy:
+        """Pick the content reduction strategy for a request.
+
+        An explicit ``request.reduction_strategy`` always wins. Otherwise the choice is
+        driven by ``request.metadata["operation_type"]`` (treated as "general" when
+        metadata or the key is missing).
+        """
+        explicit = request.reduction_strategy
+        if explicit:
+            return explicit
+
+        operation_type = (request.metadata or {}).get("operation_type", "general")
+
+        # Planning-style operations depend on the full prompt, so only documents shrink.
+        if operation_type in ["task_planning", "action_definition"]:
+            return ContentReductionStrategy.REDUCE_DOCUMENTS_ONLY
+
+        # NOTE(review): "document_extraction"/"report_generation" were singled out as
+        # document-critical, yet they resolve to the same strategy as every other
+        # operation type — confirm whether a gentler strategy was intended for them.
+        return ContentReductionStrategy.REDUCE_PROMPT_AND_DOCS
+    
+    async def _prepare_content_for_single_call(self, request: AIRequest) -> str:
+        """Assemble prompt, optional context and extracted document text into one string.
+
+        Sections are joined with blank lines. Documents whose extraction yields nothing
+        or raises are represented by a bracketed placeholder instead of aborting.
+        """
+        sections = [request.prompt]
+        if request.context:
+            sections.append(f"Context: {request.context}")
+
+        for i, document in enumerate(request.documents):
+            try:
+                extracted = await self.service_center.extractContentFromDocument(
+                    "Extract all relevant text content",
+                    document
+                )
+                if not (extracted and extracted.contents):
+                    sections.append(f"Document {i+1} ({document.fileName}): [No content extracted]")
+                    continue
+                doc_content = "\n".join(item.data for item in extracted.contents)
+                sections.append(f"Document {i+1} ({document.fileName}):\n{doc_content}")
+            except Exception as e:
+                # Best effort: one unreadable document must not fail the whole request.
+                logger.warning(f"Could not extract content from document {document.fileName}: {str(e)}")
+                sections.append(f"Document {i+1} ({document.fileName}): [Error extracting content]")
+
+        return "\n\n".join(sections)
+    
+    def get_model_capabilities(self, model: AIModelType) -> ModelCapabilities:
+        """Return the capabilities registered for ``model``, defaulting to the OPENAI_GPT35 entry."""
+        return self.model_capabilities.get(model, self.model_capabilities[AIModelType.OPENAI_GPT35])  # default is looked up eagerly, so the GPT35 entry must exist
+    
+    async def estimate_token_usage(self, request: AIRequest) -> int:
+        """Roughly estimate the token count of a request without extracting any content.
+
+        Uses the ~4 characters per token heuristic for prompt and context, and treats
+        each document's ``fileSize`` the same way (size // 4).
+        """
+        chars_per_token = 4
+        text_tokens = len(request.prompt) // chars_per_token
+        text_tokens += len(request.context or "") // chars_per_token
+
+        doc_tokens = sum(document.fileSize // chars_per_token for document in request.documents)
+
+        return text_tokens + doc_tokens
+
+
+class SmartContentReducer(ContentReducer):
+    """Content reducer that shrinks documents by re-extracting them through the service center."""
+
+    def __init__(self, service_center):
+        self.service_center = service_center
+        self.document_processor = DocumentExtraction(service_center)
+
+    async def reduce_content(
+        self,
+        documents: List[ChatDocument],
+        prompt: str,
+        strategy: ContentReductionStrategy,
+        target_reduction: float = 0.5
+    ) -> Tuple[List[ChatDocument], str]:
+        """Reduce every document with a strategy-specific prompt; return (documents, prompt)."""
+
+        reduced_docs = []
+        reduced_prompt = prompt
+
+        # Largest documents first; the returned list keeps this order, not the input order.
+        sorted_docs = sorted(documents, key=lambda d: d.fileSize, reverse=True)
+
+        for document in sorted_docs:
+            try:
+                # Pick the extraction prompt that matches the requested strategy
+                if strategy == ContentReductionStrategy.REDUCE_DOCUMENTS_ONLY:
+                    reduction_prompt = f"""
+                    Summarize this document to {int(100 * (1 - target_reduction))}% of its original size.
+                    Focus on the most important information relevant to: {prompt}
+                    Preserve key facts, data, and conclusions.
+                    """
+                elif strategy == ContentReductionStrategy.SUMMARIZE_DOCUMENTS:
+                    reduction_prompt = f"""
+                    Create a concise summary of this document focusing on: {prompt}
+                    Include only the most relevant information.
+                    """
+                else:  # REDUCE_PROMPT_AND_DOCS or EXTRACT_KEY_INFO
+                    reduction_prompt = f"""
+                    Extract only the key information from this document that is relevant to: {prompt}
+                    Be very selective and concise.
+                    """
+
+                # Re-extract the document using the reduction prompt as the instruction
+                extracted = await self.service_center.extractContentFromDocument(
+                    reduction_prompt,
+                    document
+                )
+
+                if extracted and extracted.contents:
+                    # Store the reduced text as a new document that replaces the original
+                    reduced_content = "\n".join([item.data for item in extracted.contents])
+                    reduced_doc = await self._create_reduced_document(document, reduced_content)
+                    reduced_docs.append(reduced_doc)
+                else:
+                    # Nothing was extracted: keep the original document unchanged
+                    reduced_docs.append(document)
+
+            except Exception as e:
+                logger.warning(f"Could not reduce document {document.fileName}: {str(e)}")
+                reduced_docs.append(document)
+
+        # Only REDUCE_PROMPT_AND_DOCS also shortens the prompt itself
+        if strategy == ContentReductionStrategy.REDUCE_PROMPT_AND_DOCS:
+            reduced_prompt = self._reduce_prompt(prompt, target_reduction)
+
+        return reduced_docs, reduced_prompt
+
+    async def summarize_document(
+        self,
+        document: ChatDocument,
+        focus_prompt: str
+    ) -> ChatDocument:
+        """Return a summarized copy of ``document``; the original is returned if that fails."""
+
+        summary_prompt = f"""
+        Create a comprehensive summary of this document focusing on: {focus_prompt}
+        
+        Include:
+        - Key points and main ideas
+        - Important data and statistics
+        - Conclusions and recommendations
+        - Any relevant details
+        
+        Keep the summary concise but informative.
+        """
+
+        try:
+            extracted = await self.service_center.extractContentFromDocument(
+                summary_prompt,
+                document
+            )
+
+            if extracted and extracted.contents:
+                summary_content = "\n".join([item.data for item in extracted.contents])
+                return await self._create_reduced_document(document, summary_content)
+            else:
+                return document
+
+        except Exception as e:
+            logger.warning(f"Could not summarize document {document.fileName}: {str(e)}")
+            return document
+
+    async def _create_reduced_document(self, original_doc: ChatDocument, reduced_content: str) -> ChatDocument:
+        """Store ``reduced_content`` as a new text file/document; return the original on failure."""
+        try:
+            # Persist the reduced text as a plain-text file named after the original
+            file_id = self.service_center.createFile(
+                f"reduced_{original_doc.fileName}",
+                "text/plain",
+                reduced_content,
+                base64encoded=False
+            )
+
+            # Wrap the stored file in a document so it can stand in for the original
+            return self.service_center.createDocument(
+                f"reduced_{original_doc.fileName}",
+                "text/plain",
+                reduced_content,
+                base64encoded=False,
+                existing_file_id=file_id
+            )
+
+        except Exception as e:
+            logger.error(f"Could not create reduced document: {str(e)}")
+            return original_doc
+
+    def _reduce_prompt(self, prompt: str, target_reduction: float) -> str:
+        """Shorten a multi-line prompt to its first ~30% and last ~20% of lines plus a marker."""
+        # NOTE: target_reduction is currently unused; the 30%/20% split is fixed.
+        lines = prompt.split('\n')
+        if len(lines) <= 3:
+            return prompt
+        # int() truncates 20% of 4 lines to 0, and lines[-0:] would then return the
+        # WHOLE prompt (making it longer), so always keep at least one trailing line.
+        keep_start = int(len(lines) * 0.3)
+        keep_end = max(1, int(len(lines) * 0.2))
+
+        reduced_lines = lines[:keep_start] + ["... (content reduced) ..."] + lines[-keep_end:]
+        return '\n'.join(reduced_lines)
diff --git a/modules/interfaces/interfaceAiCalls.py b/modules/interfaces/interfaceAiCalls.py
index 2c47ff33..fe93105f 100644
--- a/modules/interfaces/interfaceAiCalls.py
+++ b/modules/interfaces/interfaceAiCalls.py
@@ -1,6 +1,6 @@
 import logging
 from typing import Dict, Any, List, Union, Optional
-from modules.connectors.connectorAiOpenai import AiOpenai
+from modules.connectors.connectorAiOpenai import AiOpenai, ContextLengthExceededException
 from modules.connectors.connectorAiAnthropic import AiAnthropic
 
 logger = logging.getLogger(__name__)
@@ -53,14 +53,23 @@ class AiCalls:
         
         try:
             return await self.openaiService.callAiBasic(messages)
+        except ContextLengthExceededException as e:
+            logger.warning(f"OpenAI context length exceeded, falling back to Anthropic: {str(e)}")
+            # Fallback to Anthropic (AI Advanced) when context length is exceeded
+            return await self.callAiTextAdvanced(prompt, context, _is_fallback=True)
         except Exception as e:
             logger.error(f"Error in OpenAI call: {str(e)}")
             return f"Error: {str(e)}"
 
-    async def callAiTextAdvanced(self, prompt: str, context: Optional[str] = None) -> str:
+    async def callAiTextAdvanced(self, prompt: str, context: Optional[str] = None, _is_fallback: bool = False) -> str:
         """
         Advanced text processing using Anthropic.
         Fallback to OpenAI if Anthropic is overloaded or rate-limited.
+        
+        Args:
+            prompt: The user prompt to process
+            context: Optional system context/prompt
+            _is_fallback: Internal flag to prevent infinite recursion
         """
         # For Anthropic, we need to handle system content differently
         # Anthropic expects system content in a top-level parameter, not as a message role
@@ -97,8 +106,13 @@ class AiCalls:
         except Exception as e:
             err_str = str(e)
             logger.warning(f"[UI NOTICE] Advanced AI failed, falling back to Basic AI (OpenAI). Reason: {err_str}")
-            # Fallback to OpenAI basic
-            return await self.callAiTextBasic(prompt, context)
+            # Fallback to OpenAI basic, but only if we're not already in a fallback
+            if not _is_fallback:
+                return await self.callAiTextBasic(prompt, context)
+            else:
+                # If we're already in a fallback, return error to prevent infinite recursion
+                logger.error("Both AI services failed, cannot provide fallback")
+                return f"Error: Both AI services failed. Anthropic error: {err_str}"
 
     async def callAiImageBasic(self, prompt: str, imageData: Union[str, bytes], mimeType: str = None) -> str:
         """
diff --git a/modules/interfaces/interfaceAiEngine.py b/modules/interfaces/interfaceAiEngine.py
new file mode 100644
index 00000000..2ccdd70e
--- /dev/null
+++ b/modules/interfaces/interfaceAiEngine.py
@@ -0,0 +1,115 @@
+"""
+Centralized AI Engine Interface for intelligent content processing
+"""
+
+from abc import ABC, abstractmethod
+from typing import List, Dict, Any, Optional, Union, Tuple
+from enum import Enum
+from dataclasses import dataclass
+from modules.interfaces.interfaceChatModel import ChatDocument, ExtractedContent
+
+
+class AIModelType(Enum):
+    """Identifiers for the AI models a request may prefer and a response reports as used."""
+    OPENAI_GPT4 = "openai_gpt4"
+    OPENAI_GPT35 = "openai_gpt35"
+    ANTHROPIC_CLAUDE = "anthropic_claude"
+    OPENAI_VISION = "openai_vision"
+    ANTHROPIC_VISION = "anthropic_vision"
+
+
+class ProcessingStrategy(Enum):
+    """How request content is fed to the model; requested on AIRequest and reported on AIResponse."""
+    SINGLE_CALL = "single_call"           # One AI call with full content
+    DOCUMENT_BY_DOCUMENT = "doc_by_doc"   # One call per document, merge results
+    CHUNKED_PROCESSING = "chunked"        # Process in chunks, merge results
+    SUMMARIZED_CONTENT = "summarized"     # Summarize content first, then process
+
+
+class ContentReductionStrategy(Enum):
+    """What a ContentReducer is allowed to shrink (documents, prompt, or both) and how."""
+    REDUCE_DOCUMENTS_ONLY = "reduce_docs"      # Keep prompt, reduce documents
+    REDUCE_PROMPT_AND_DOCS = "reduce_both"     # Reduce both prompt and documents
+    SUMMARIZE_DOCUMENTS = "summarize_docs"     # Summarize documents to key points
+    EXTRACT_KEY_INFO = "extract_key"           # Extract only relevant information
+
+
+@dataclass
+class AIRequest:
+    """Standardized AI request: a prompt, the documents it applies to, and optional settings."""
+    prompt: str
+    documents: List[ChatDocument]
+    context: Optional[str] = None  # optional extra context text accompanying the prompt
+    preferred_model: Optional[AIModelType] = None  # model the caller would like used, if any
+    max_tokens: Optional[int] = None  # presumably the completion token limit — TODO confirm
+    temperature: Optional[float] = None  # presumably the sampling temperature — TODO confirm
+    processing_strategy: Optional[ProcessingStrategy] = None  # presumably None lets the engine choose — TODO confirm
+    reduction_strategy: Optional[ContentReductionStrategy] = None  # explicit reduction strategy, if any
+    metadata: Optional[Dict[str, Any]] = None  # free-form caller metadata
+
+
+@dataclass
+class AIResponse:
+    """Standardized AI response: outcome flag, produced content, and how it was produced."""
+    success: bool
+    content: str
+    model_used: AIModelType
+    processing_strategy: ProcessingStrategy
+    tokens_used: Optional[int] = None  # presumably total tokens consumed — TODO confirm
+    processing_time: Optional[float] = None  # unit not visible here (presumably seconds) — TODO confirm
+    error: Optional[str] = None  # error description when the request failed
+    metadata: Optional[Dict[str, Any]] = None  # free-form additional information
+
+
+@dataclass
+class ModelCapabilities:
+    """Static limits and feature flags describing one AI model."""
+    max_tokens: int  # NOTE(review): relation to max_input_tokens (total vs. output) is not visible here
+    max_input_tokens: int
+    supports_vision: bool
+    supports_function_calling: bool
+    cost_per_1k_tokens: float  # currency not specified here — TODO confirm
+    processing_speed: str  # "fast", "medium", "slow"
+
+
+class AIEngine(ABC):
+    """Abstract interface every AI engine implementation must provide."""
+    
+    @abstractmethod
+    async def process_request(self, request: AIRequest) -> AIResponse:
+        """Process ``request`` and return the outcome as an ``AIResponse``."""
+        pass
+    
+    @abstractmethod
+    def get_model_capabilities(self, model: AIModelType) -> ModelCapabilities:
+        """Return the ``ModelCapabilities`` record describing ``model``."""
+        pass
+    
+    @abstractmethod
+    async def estimate_token_usage(self, request: AIRequest) -> int:
+        """Return an estimated token count for ``request``."""
+        pass
+
+
+class ContentReducer(ABC):
+    """Abstract interface for components that shrink documents and prompts."""
+    
+    @abstractmethod
+    async def reduce_content(
+        self, 
+        documents: List[ChatDocument], 
+        prompt: str,
+        strategy: ContentReductionStrategy,
+        target_reduction: float = 0.5
+    ) -> Tuple[List[ChatDocument], str]:
+        """Reduce ``documents`` (and possibly ``prompt``) per ``strategy``; return both as a tuple."""
+        pass
+    
+    @abstractmethod
+    async def summarize_document(
+        self, 
+        document: ChatDocument, 
+        focus_prompt: str
+    ) -> ChatDocument:
+        """Return a document that summarizes ``document`` with respect to ``focus_prompt``."""
+        pass
diff --git a/modules/interfaces/interface_web_model.py b/modules/interfaces/interfaceWebModel.py
similarity index 69%
rename from modules/interfaces/interface_web_model.py
rename to modules/interfaces/interfaceWebModel.py
index bb4a82e0..26a16560 100644
--- a/modules/interfaces/interface_web_model.py
+++ b/modules/interfaces/interfaceWebModel.py
@@ -4,6 +4,23 @@ from abc import ABC, abstractmethod
 from modules.interfaces.interfaceChatModel import ActionDocument, ActionResult
 from pydantic import BaseModel, Field, HttpUrl
 from typing import List
+from modules.shared.configuration import APP_CONFIG
+
+
+# Configuration loading functions
+def get_web_search_max_query_length() -> int:
+    """Return the ``Web_Search_MAX_QUERY_LENGTH`` setting from APP_CONFIG as an int (default 400)."""
+    return int(APP_CONFIG.get("Web_Search_MAX_QUERY_LENGTH", "400"))
+
+
+def get_web_search_max_results() -> int:
+    """Return the ``Web_Search_MAX_RESULTS`` setting from APP_CONFIG as an int (default 20)."""
+    return int(APP_CONFIG.get("Web_Search_MAX_RESULTS", "20"))
+
+
+def get_web_search_min_results() -> int:
+    """Return the ``Web_Search_MIN_RESULTS`` setting from APP_CONFIG as an int (default 1)."""
+    return int(APP_CONFIG.get("Web_Search_MIN_RESULTS", "1"))
 
 
 # --- Web search ---
@@ -12,8 +29,8 @@ from typing import List
 
 
 class WebSearchRequest(BaseModel):
-    query: str = Field(min_length=1, max_length=400)
-    max_results: int = Field(ge=1, le=20)
+    query: str = Field(min_length=1, max_length=get_web_search_max_query_length())
+    max_results: int = Field(ge=get_web_search_min_results(), le=get_web_search_max_results())
 
 
 class WebSearchResultItem(BaseModel):
@@ -26,7 +43,7 @@ class WebSearchResultItem(BaseModel):
 class WebSearchDocumentData(BaseModel):
     """Complete search results document"""
 
-    query: str = Field(min_length=1, max_length=400)
+    query: str = Field(min_length=1, max_length=get_web_search_max_query_length())
     results: List[WebSearchResultItem]
     total_count: int
 
@@ -89,8 +106,8 @@ class WebCrawlBase(ABC):
 
 
 class WebScrapeRequest(BaseModel):
-    query: str = Field(min_length=1, max_length=400)
-    max_results: int = Field(ge=1, le=20)
+    query: str = Field(min_length=1, max_length=get_web_search_max_query_length())
+    max_results: int = Field(ge=get_web_search_min_results(), le=get_web_search_max_results())
 
 
 class WebScrapeResultItem(BaseModel):
@@ -103,7 +120,7 @@ class WebScrapeResultItem(BaseModel):
 class WebScrapeDocumentData(BaseModel):
     """Complete scrape results document"""
 
-    query: str = Field(min_length=1, max_length=400)
+    query: str = Field(min_length=1, max_length=get_web_search_max_query_length())
     results: List[WebScrapeResultItem]
     total_count: int
 
diff --git a/modules/interfaces/interfaceWebObjects.py b/modules/interfaces/interfaceWebObjects.py
new file mode 100644
index 00000000..bdd1fd53
--- /dev/null
+++ b/modules/interfaces/interfaceWebObjects.py
@@ -0,0 +1,118 @@
+from typing import Optional
+import json
+import csv
+import io
+from modules.interfaces.interfaceWebModel import (
+    WebCrawlActionResult,
+    WebSearchActionResult,
+    WebSearchRequest,
+    WebCrawlRequest,
+    WebScrapeActionResult,
+    WebScrapeRequest,
+    WebCrawlDocumentData,
+    WebScrapeDocumentData,
+    WebSearchDocumentData,
+)
+
+from dataclasses import dataclass
+from modules.connectors.connectorWebTavily import ConnectorTavily
+from modules.interfaces.interfaceChatModel import ActionDocument
+
+
+@dataclass(slots=True)
+class WebInterface:
+    """Facade over the web connector: search, crawl and scrape plus result formatting helpers."""
+    connectorWebTavily: ConnectorTavily
+
+    def __post_init__(self) -> None:
+        if self.connectorWebTavily is None:
+            raise TypeError(
+                "connectorWebTavily must be provided. "
+                "Use `await WebInterface.create()` or pass a ConnectorTavily."
+            )
+
+    @classmethod
+    async def create(cls) -> "WebInterface":
+        """Build an instance of ``cls`` (subclass-safe) around a freshly created Tavily connector."""
+        return cls(connectorWebTavily=await ConnectorTavily.create())
+
+    async def search(
+        self, web_search_request: WebSearchRequest
+    ) -> WebSearchActionResult:
+        # NOTE: Add connectors here
+        return await self.connectorWebTavily.search_urls(web_search_request)
+
+    async def crawl(self, web_crawl_request: WebCrawlRequest) -> WebCrawlActionResult:
+        # NOTE: Add connectors here
+        return await self.connectorWebTavily.crawl_urls(web_crawl_request)
+
+    async def scrape(
+        self, web_scrape_request: WebScrapeRequest
+    ) -> WebScrapeActionResult:
+        # NOTE: Add connectors here
+        return await self.connectorWebTavily.scrape(web_scrape_request)
+
+    def convert_web_result_to_json(self, web_result) -> str:
+        """Serialize the first document of a crawl/scrape result to JSON (success/error only on failure)."""
+        if not web_result.success or not web_result.documents:
+            return json.dumps({"success": web_result.success, "error": web_result.error})
+
+        # Only the first document is serialized
+        document_data = web_result.documents[0].documentData
+
+        # Flatten each result item to its url (as a string) and content
+        result_dict = {
+            "success": web_result.success,
+            "results": [
+                {
+                    "url": str(result.url),
+                    "content": result.content
+                }
+                for result in document_data.results
+            ],
+            "total_count": document_data.total_count
+        }
+
+        # Add the field that identifies what was requested (urls takes precedence over query)
+        if hasattr(document_data, 'urls'):
+            # WebCrawlDocumentData has urls field
+            result_dict["urls"] = [str(url) for url in document_data.urls]
+        elif hasattr(document_data, 'query'):
+            # WebScrapeDocumentData has query field
+            result_dict["query"] = document_data.query
+
+        return json.dumps(result_dict, indent=2, ensure_ascii=False)
+
+    def convert_web_search_result_to_csv(self, web_search_result: WebSearchActionResult) -> str:
+        """Render the first search document as ';'-separated CSV (url;title); "" when there is none."""
+        if not web_search_result.success or not web_search_result.documents:
+            return ""
+
+        output = io.StringIO()
+        writer = csv.writer(output, delimiter=';')
+
+        # Header row
+        writer.writerow(['url', 'title'])
+
+        # One row per search hit of the first document
+        document_data = web_search_result.documents[0].documentData
+        for result in document_data.results:
+            writer.writerow([str(result.url), result.title])
+
+        return output.getvalue()
+
+    def create_json_action_document(self, json_content: str, document_name: str) -> ActionDocument:
+        """Wrap ``json_content`` in an ActionDocument with mime type application/json."""
+        return ActionDocument(
+            documentName=document_name,
+            documentData=json_content,
+            mimeType="application/json"
+        )
+
+    def create_csv_action_document(self, csv_content: str, document_name: str) -> ActionDocument:
+        """Wrap ``csv_content`` in an ActionDocument with mime type text/csv."""
+        return ActionDocument(
+            documentName=document_name,
+            documentData=csv_content,
+            mimeType="text/csv"
+        )
\ No newline at end of file
diff --git a/modules/interfaces/interface_web_objects.py b/modules/interfaces/interface_web_objects.py
deleted file mode 100644
index f348f0bd..00000000
--- a/modules/interfaces/interface_web_objects.py
+++ /dev/null
@@ -1,46 +0,0 @@
-from typing import Optional
-from modules.interfaces.interface_web_model import (
-    WebCrawlActionResult,
-    WebSearchActionResult,
-    WebSearchRequest,
-    WebCrawlRequest,
-    WebScrapeActionResult,
-    WebScrapeRequest,
-)
-
-from dataclasses import dataclass
-from modules.connectors.connector_tavily import ConnectorTavily
-
-
-@dataclass(slots=True)
-class WebInterface:
-    connector_tavily: ConnectorTavily
-
-    def __post_init__(self) -> None:
-        if self.connector_tavily is None:
-            raise TypeError(
-                "connector_tavily must be provided. "
-                "Use `await WebInterface.create()` or pass a ConnectorTavily."
-            )
-
-    @classmethod
-    async def create(cls) -> "WebInterface":
-        connector_tavily = await ConnectorTavily.create()
-
-        return WebInterface(connector_tavily=connector_tavily)
-
-    async def search(
-        self, web_search_request: WebSearchRequest
-    ) -> WebSearchActionResult:
-        # NOTE: Add connectors here
-        return await self.connector_tavily.search_urls(web_search_request)
-
-    async def crawl(self, web_crawl_request: WebCrawlRequest) -> WebCrawlActionResult:
-        # NOTE: Add connectors here
-        return await self.connector_tavily.crawl_urls(web_crawl_request)
-
-    async def scrape(
-        self, web_scrape_request: WebScrapeRequest
-    ) -> WebScrapeActionResult:
-        # NOTE: Add connectors here
-        return await self.connector_tavily.scrape(web_scrape_request)
diff --git a/modules/methods/methodWeb.py b/modules/methods/methodWeb.py
index d3535916..96c597db 100644
--- a/modules/methods/methodWeb.py
+++ b/modules/methods/methodWeb.py
@@ -1,817 +1,284 @@
-"""
-Web operations method module.
-Handles web scraping, crawling, and search operations.
-"""
-
 import logging
-import requests
-import json
-import re
-import copy
-from typing import Dict, Any, List, Optional
-from datetime import datetime, UTC
-from urllib.parse import urlparse, urljoin
-import time
-import random
-from bs4 import BeautifulSoup
-import os
-
-# Selenium imports for JavaScript-heavy pages
-from selenium import webdriver
-from selenium.webdriver.chrome.options import Options
-from selenium.common.exceptions import WebDriverException
-from selenium.webdriver.common.by import By
-from selenium.webdriver.support.ui import WebDriverWait
-from selenium.webdriver.support import expected_conditions as EC
-
+import csv
+import io
+from typing import Any, Dict
 from modules.chat.methodBase import MethodBase, action
-from modules.interfaces.interfaceChatModel import ActionResult
-from modules.shared.configuration import APP_CONFIG
-from modules.shared.timezoneUtils import get_utc_timestamp
+from modules.interfaces.interfaceChatModel import ActionResult, ActionDocument
+from modules.interfaces.interfaceWebObjects import WebInterface
+from modules.interfaces.interfaceWebModel import (
+    WebSearchRequest,
+    WebCrawlRequest,
+    WebScrapeRequest,
+)
+
 
 logger = logging.getLogger(__name__)
 
+
 class MethodWeb(MethodBase):
-    """
-    Web method implementation for web operations.
-    - web.search: Uses Google SerpAPI to find relevant URLs for a query. Returns only search result metadata (title, URL, snippet). Does NOT fetch or extract page content.
-    - web.crawl: Fetches and extracts main content from a list of URLs, either provided directly or via referenced documents. Uses a headless browser for JavaScript-heavy pages.
-    """
-    
+    """Web method implementation for web operations."""
+
     def __init__(self, serviceCenter: Any):
         super().__init__(serviceCenter)
         self.name = "web"
-        self.description = "Handle web operations like search and crawling"
-        self.srcApikey = APP_CONFIG.get("Agent_Webcrawler_SERPAPI_APIKEY", "")
-        self.srcEngine = APP_CONFIG.get("Agent_Webcrawler_SERPAPI_ENGINE", "google")
-        self.srcCountry = APP_CONFIG.get("Agent_Webcrawler_SERPAPI_COUNTRY", "auto")
-        self.maxResults = int(APP_CONFIG.get("Agent_Webcrawler_SERPAPI_MAX_SEARCH_RESULTS", "5"))
-        self.user_agent = "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36"
-        self.timeout = 30
-
-    def _format_timestamp_for_filename(self) -> str:
-        """Format current timestamp as YYYYMMDD-hhmmss for filenames."""
-        return datetime.now(UTC).strftime("%Y%m%d-%H%M%S")
-
-    def _readUrl(self, url: str) -> BeautifulSoup:
-        """Read a URL and return a BeautifulSoup parser for the content with enhanced error handling"""
-        if not url or not url.startswith(('http://', 'https://')):
-            logger.error(f"Invalid URL: {url}")
-            return None
-        
-        # Enhanced headers to mimic real browser
-        headers = {
-            'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36',
-            'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8',
-            'Accept-Language': 'en-US,en;q=0.9,de;q=0.8',
-            'Accept-Encoding': 'gzip, deflate, br',
-            'DNT': '1',
-            'Connection': 'keep-alive',
-            'Upgrade-Insecure-Requests': '1',
-            'Sec-Fetch-Dest': 'document',
-            'Sec-Fetch-Mode': 'navigate',
-            'Sec-Fetch-Site': 'none',
-            'Cache-Control': 'max-age=0'
-        }
-        
-        try:
-            # Use session for better connection handling
-            session = requests.Session()
-            session.headers.update(headers)
-            
-            # Initial request with allow_redirects
-            response = session.get(url, timeout=self.timeout, allow_redirects=True)
-            
-            # Handle various status codes
-            if response.status_code == 200:
-                # Success - parse content
-                logger.debug(f"Successfully read URL: {url}")
-                return BeautifulSoup(response.text, 'html.parser')
-                
-            elif response.status_code == 202:
-                # Accepted - retry with backoff
-                logger.info(f"Status 202 for {url}, retrying with backoff...")
-                backoff_times = [1.0, 2.0, 5.0, 10.0]
-                
-                for wait_time in backoff_times:
-                    time.sleep(wait_time)
-                    retry_response = session.get(url, timeout=self.timeout, allow_redirects=True)
-                    
-                    if retry_response.status_code == 200:
-                        logger.debug(f"Successfully read URL after retry: {url}")
-                        return BeautifulSoup(retry_response.text, 'html.parser')
-                    elif retry_response.status_code != 202:
-                        break
-                
-                logger.warning(f"Failed to read URL after retries: {url}")
-                return None
-                
-            elif response.status_code in [301, 302, 307, 308]:
-                # Redirect - should be handled by allow_redirects=True
-                logger.warning(f"Unexpected redirect status {response.status_code} for {url}")
-                return None
-                
-            elif response.status_code == 403:
-                # Forbidden - try with different user agent
-                logger.warning(f"403 Forbidden for {url}, trying with different user agent...")
-                headers['User-Agent'] = 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36'
-                session.headers.update(headers)
-                
-                retry_response = session.get(url, timeout=self.timeout, allow_redirects=True)
-                if retry_response.status_code == 200:
-                    logger.debug(f"Successfully read URL with different user agent: {url}")
-                    return BeautifulSoup(retry_response.text, 'html.parser')
-                else:
-                    logger.error(f"Still getting {retry_response.status_code} for {url}")
-                    return None
-                    
-            elif response.status_code == 429:
-                # Rate limited - wait and retry
-                logger.warning(f"Rate limited for {url}, waiting 30 seconds...")
-                time.sleep(30)
-                retry_response = session.get(url, timeout=self.timeout, allow_redirects=True)
-                if retry_response.status_code == 200:
-                    logger.debug(f"Successfully read URL after rate limit: {url}")
-                    return BeautifulSoup(retry_response.text, 'html.parser')
-                else:
-                    logger.error(f"Still getting {retry_response.status_code} after rate limit wait for {url}")
-                    return None
-                    
-            else:
-                # Other error status codes
-                logger.error(f"HTTP {response.status_code} for {url}")
-                return None
-                
-        except requests.exceptions.Timeout:
-            logger.error(f"Timeout reading URL: {url}")
-            return None
-        except requests.exceptions.ConnectionError:
-            logger.error(f"Connection error reading URL: {url}")
-            return None
-        except requests.exceptions.RequestException as e:
-            logger.error(f"Request error reading URL {url}: {str(e)}")
-            return None
-        except Exception as e:
-            logger.error(f"Unexpected error reading URL {url}: {str(e)}")
-            return None
-    
-    def _extractTitle(self, soup: BeautifulSoup, url: str) -> str:
-        """Extract the title from a webpage"""
-        if not soup:
-            return f"Error with {url}"
-        
-        # Extract title from title tag
-        title_tag = soup.find('title')
-        title = title_tag.text.strip() if title_tag else "No title"
-        
-        # Alternative: Also look for h1 tags if title tag is missing
-        if title == "No title":
-            h1_tag = soup.find('h1')
-            if h1_tag:
-                title = h1_tag.text.strip()
-        
-        return title
-    
-    def _extractMainContent(self, soup: BeautifulSoup, max_chars: int = 50000) -> str:
-        """Extract the main content from an HTML page with enhanced content detection"""
-        if not soup:
-            return ""
-        
-        # Try to find main content elements in priority order with more selectors
-        main_content = None
-        content_selectors = [
-            'main',
-            'article',
-            '#content',
-            '.content',
-            '#main',
-            '.main',
-            '.post-content',
-            '.entry-content',
-            '.article-content',
-            '.page-content',
-            '[role="main"]',
-            '.container',
-            '.wrapper'
-        ]
-        
-        for selector in content_selectors:
-            content = soup.select_one(selector)
-            if content:
-                main_content = content
-                logger.debug(f"Found main content using selector: {selector}")
-                break
-        
-        # If no main content found, use the body
-        if not main_content:
-            main_content = soup.find('body') or soup
-            logger.debug("Using body as main content")
-        
-        # Safely copy the main_content element
-        if main_content is None:
-            return ""
-        try:
-            content_copy = copy.copy(main_content)
-        except Exception:
-            content_copy = main_content
-        
-        # Remove elements that don't contribute to main content (less aggressive)
-        elements_to_remove = [
-            'script', 'style', 'noscript',
-            'nav', 'footer', 'header', 'aside',
-            '.sidebar', '#sidebar', '.comments', '#comments',
-            '.advertisement', '.ads', '.ad', '.banner',
-            'iframe', '.social-share', '.share-buttons',
-            '.breadcrumb', '.breadcrumbs', '.pagination',
-            '.related-posts', '.related-articles',
-            '.newsletter', '.subscribe', '.signup',
-            '.cookie-notice', '.privacy-notice',
-            '.popup', '.modal', '.overlay'
-        ]
-        
-        for selector in elements_to_remove:
-            for element in content_copy.select(selector):
-                element.extract()
-        
-        # Extract text content with better formatting
-        text_content = content_copy.get_text(separator='\n', strip=True)
-        
-        # Clean up the text
-        lines = text_content.split('\n')
-        cleaned_lines = []
-        
-        for line in lines:
-            line = line.strip()
-            if line and len(line) > 10:  # Only keep meaningful lines
-                cleaned_lines.append(line)
-        
-        # Join lines with proper spacing
-        cleaned_content = '\n\n'.join(cleaned_lines)
-        
-        # If content is too short, try alternative extraction
-        if len(cleaned_content) < 500:
-            logger.debug("Content too short, trying alternative extraction...")
-            
-            # Try to extract from all paragraphs
-            paragraphs = soup.find_all(['p', 'div', 'section'])
-            alt_content = []
-            
-            for p in paragraphs:
-                text = p.get_text(strip=True)
-                if text and len(text) > 20:  # Only meaningful paragraphs
-                    alt_content.append(text)
-            
-            if alt_content:
-                cleaned_content = '\n\n'.join(alt_content[:20])  # Limit to first 20 paragraphs
-        
-        # Limit to max_chars but preserve complete sentences
-        if len(cleaned_content) > max_chars:
-            # Try to cut at a sentence boundary
-            sentences = cleaned_content.split('. ')
-            truncated_content = ""
-            
-            for sentence in sentences:
-                if len(truncated_content + sentence) < max_chars:
-                    truncated_content += sentence + ". "
-                else:
-                    break
-            
-            cleaned_content = truncated_content.strip()
-        
-        logger.debug(f"Extracted {len(cleaned_content)} characters of content")
-        return cleaned_content
-    
-    def _checkAccessibility(self, soup: BeautifulSoup) -> Dict[str, Any]:
-        """Check basic accessibility features"""
-        issues = []
-        warnings = []
-        
-        # Check for alt text on images
-        images_without_alt = soup.find_all('img', alt='')
-        if images_without_alt:
-            issues.append(f"Found {len(images_without_alt)} images without alt text")
-        
-        # Check for proper heading structure
-        headings = soup.find_all(['h1', 'h2', 'h3', 'h4', 'h5', 'h6'])
-        if not headings:
-            warnings.append("No headings found - poor document structure")
-        
-        # Check for form labels
-        forms = soup.find_all('form')
-        for form in forms:
-            inputs = form.find_all('input')
-            for input_elem in inputs:
-                if input_elem.get('type') not in ['submit', 'button', 'hidden']:
-                    if not input_elem.get('id') or not soup.find('label', attrs={'for': input_elem.get('id')}):
-                        warnings.append("Form input without proper label")
-        
-        return {
-            "status": "warning" if warnings else "pass",
-            "issues": issues,
-            "warnings": warnings
-        }
-    
-    def _checkSEO(self, soup: BeautifulSoup) -> Dict[str, Any]:
-        """Check basic SEO features"""
-        issues = []
-        warnings = []
-        
-        # Check for title tag
-        title = soup.find('title')
-        if not title:
-            issues.append("Missing title tag")
-        elif len(title.get_text()) < 10:
-            warnings.append("Title tag is too short")
-        elif len(title.get_text()) > 60:
-            warnings.append("Title tag is too long")
-        
-        # Check for meta description
-        meta_desc = soup.find('meta', attrs={'name': 'description'})
-        if not meta_desc:
-            warnings.append("Missing meta description")
-        elif meta_desc.get('content'):
-            if len(meta_desc.get('content')) < 50:
-                warnings.append("Meta description is too short")
-            elif len(meta_desc.get('content')) > 160:
-                warnings.append("Meta description is too long")
-        
-        # Check for h1 tag
-        h1_tags = soup.find_all('h1')
-        if not h1_tags:
-            warnings.append("No H1 tag found")
-        elif len(h1_tags) > 1:
-            warnings.append("Multiple H1 tags found")
-        
-        return {
-            "status": "warning" if warnings else "pass",
-            "issues": issues,
-            "warnings": warnings
-        }
-    
-    def _checkPerformance(self, soup: BeautifulSoup, url: str) -> Dict[str, Any]:
-        """Check basic performance indicators"""
-        warnings = []
-        
-        # Count images
-        images = soup.find_all('img')
-        if len(images) > 20:
-            warnings.append(f"Many images found ({len(images)}) - may impact loading speed")
-        
-        # Check for external resources
-        external_scripts = soup.find_all('script', src=True)
-        external_styles = soup.find_all('link', rel='stylesheet')
-        
-        if len(external_scripts) > 10:
-            warnings.append(f"Many external scripts ({len(external_scripts)}) - may impact loading speed")
-        
-        if len(external_styles) > 5:
-            warnings.append(f"Many external stylesheets ({len(external_styles)}) - may impact loading speed")
-        
-        return {
-            "status": "warning" if warnings else "pass",
-            "warnings": warnings,
-            "metrics": {
-                "images": len(images),
-                "external_scripts": len(external_scripts),
-                "external_styles": len(external_styles)
-            }
-        }
-    
-    def _detectJavaScriptRendering(self, soup: BeautifulSoup) -> bool:
-        """Detect if a page likely requires JavaScript rendering"""
-        if not soup:
-            return False
-        
-        # Check for common indicators of JavaScript-rendered content
-        indicators = [
-            # Angular, React, Vue indicators
-            soup.find('div', {'ng-app': True}),
-            soup.find('div', {'id': 'root'}),
-            soup.find('div', {'id': 'app'}),
-            soup.find('div', {'id': 'react-root'}),
-            
-            # SPA indicators
-            soup.find('div', {'id': 'spa-root'}),
-            soup.find('div', {'class': 'spa-container'}),
-            
-            # Modern framework indicators
-            soup.find('div', {'data-reactroot': True}),
-            soup.find('div', {'data-ng-controller': True}),
-            
-            # Empty content with scripts
-            len(soup.get_text(strip=True)) < 100 and len(soup.find_all('script')) > 2
-        ]
-        
-        return any(indicators)
-    
-    def _extractMetaInformation(self, soup: BeautifulSoup, url: str) -> Dict[str, Any]:
-        """Extract meta information from the page"""
-        meta_info = {
-            "url": url,
-            "title": self._extractTitle(soup, url),
-            "description": "",
-            "keywords": "",
-            "author": "",
-            "language": "",
-            "robots": "",
-            "viewport": "",
-            "charset": "",
-            "canonical": ""
-        }
-        
-        # Extract meta tags
-        meta_tags = soup.find_all('meta')
-        for meta in meta_tags:
-            name = meta.get('name', '').lower()
-            property = meta.get('property', '').lower()
-            content = meta.get('content', '')
-            
-            if name == 'description' or property == 'og:description':
-                meta_info['description'] = content
-            elif name == 'keywords':
-                meta_info['keywords'] = content
-            elif name == 'author':
-                meta_info['author'] = content
-            elif name == 'language':
-                meta_info['language'] = content
-            elif name == 'robots':
-                meta_info['robots'] = content
-            elif name == 'viewport':
-                meta_info['viewport'] = content
-            elif property == 'og:title':
-                meta_info['title'] = content
-            elif property == 'og:url':
-                meta_info['canonical'] = content
-        
-        # Extract charset
-        charset_meta = soup.find('meta', charset=True)
-        if charset_meta:
-            meta_info['charset'] = charset_meta.get('charset', '')
-        
-        # Extract canonical URL
-        canonical_link = soup.find('link', rel='canonical')
-        if canonical_link:
-            meta_info['canonical'] = canonical_link.get('href', '')
-        
-        return meta_info
-    
-    def _getAlternativeApproaches(self, url: str, requires_js: bool, content_length: int) -> List[str]:
-        """Get alternative approaches for sites that are difficult to crawl"""
-        approaches = []
-        
-        if requires_js:
-            approaches.extend([
-                "Site requires JavaScript rendering - consider using a headless browser",
-                "Try accessing the site's API endpoints directly",
-                "Look for RSS feeds or sitemaps",
-                "Check if the site has a mobile version that's easier to parse"
-            ])
-        
-        if content_length < 100:
-            approaches.extend([
-                "Site may have anti-bot protection - try with different user agents",
-                "Check if the site requires authentication",
-                "Look for alternative URLs (www vs non-www, http vs https)",
-                "Try accessing the site's robots.txt for crawling guidelines"
-            ])
-        
-        # Add general suggestions
-        approaches.extend([
-            "Use the web.search action to find alternative sources",
-            "Try the web.scrape action with specific CSS selectors",
-            "Check if the site has a public API or data export"
-        ])
-        
-        return approaches
+        self.description = "Web search, crawling, and scraping operations using Tavily"
 
     @action
     async def search(self, parameters: Dict[str, Any]) -> ActionResult:
-        """
-        Perform a web search and output a .txt file with a plain list of URLs (one per line).
-        
+        """Perform a web search and outputs a csv file with a list of found URLs
+
+        Each result contains columns "url" and "title".
+
         Parameters:
             query (str): Search query to perform
             maxResults (int, optional): Maximum number of results (default: 10)
-            filter (str, optional): Filter criteria for search results
+        """
+
+        try:
+            query = parameters.get("query")
+            if not query:
+                # Same guard scrape uses: reject a missing/empty query up front.
+                return ActionResult(success=False, error="Search query is required")
+
+            # Prepare request data
+            web_search_request = WebSearchRequest(
+                query=query,
+                max_results=parameters.get("maxResults", 10),
+            )
+
+            # Perform request
+            web_interface = await WebInterface.create()
+            web_search_result = await web_interface.search(web_search_request)
+
+            # Failed or empty searches are passed through unchanged.
+            if not (web_search_result.success and web_search_result.documents):
+                return web_search_result
+
+            # Convert search results to CSV format and wrap them in a document
+            csv_content = web_interface.convert_web_search_result_to_csv(web_search_result)
+            csv_document = web_interface.create_csv_action_document(
+                csv_content, "web_search_results.csv"
+            )
+            return ActionResult(success=True, documents=[csv_document])
+
+        except Exception as e:
+            logger.error(f"Error in search method: {str(e)}")
+            return ActionResult(success=False, error=str(e))
+
+
+
+    def _read_csv_with_urls(self, csv_content: str) -> list:
+        """Extract http(s) URLs from CSV text that has a ``url`` column.
+
+        Tries ``;`` and then ``,`` as delimiter, matching the header name
+        case-insensitively; the first delimiter that yields URLs wins. Rows
+        whose ``url`` cell is missing or not http(s) are skipped. If neither
+        delimiter yields a URL, every line of the text that itself starts
+        with http:// or https:// is returned instead.
+        """
+        schemes = ('http://', 'https://')
+        for delimiter in (';', ','):
+            # Start each attempt empty so a failed pass cannot leak partial results.
+            urls = []
+            try:
+                reader = csv.DictReader(io.StringIO(csv_content), delimiter=delimiter)
+                for row in reader:
+                    for key, value in row.items():
+                        # DictReader uses a None key for surplus cells and a None
+                        # value for missing ones; neither can hold the URL.
+                        if not isinstance(key, str) or key.strip().lower() != 'url':
+                            continue
+                        url = value.strip() if isinstance(value, str) else ''
+                        if url.startswith(schemes):
+                            urls.append(url)
+                        break
+            except csv.Error:
+                # Malformed CSV for this delimiter; try the next one.
+                continue
+
+            if urls:
+                return urls
+
+        # No usable CSV: treat the content as plain text, one URL per line.
+        lines = (line.strip() for line in csv_content.split('\n'))
+        return [line for line in lines if line.startswith(schemes)]
+
+    @action
+    async def crawl(self, parameters: Dict[str, Any]) -> ActionResult:
+        """Crawls a list of URLs and extracts information from them.
+
+        Parameters:
+            documentList (str): Document list reference containing URL lists from search results
             expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
         """
+        try:
+            # Imported here because the module no longer imports them at file level.
+            import json
+            import re
+
+            def plain_text_urls(text: str) -> list:
+                """Return the http(s) tokens of text split on newlines, ',' and ';'.
+
+                Shared fallback for documents that are not usable JSON.
+                """
+                tokens = (token.strip() for token in re.split(r"[\n,;]+", text))
+                return [t for t in tokens if t.startswith(("http://", "https://"))]
+
+            def json_urls(payload: Any) -> list:
+                """Return the URLs found in a parsed JSON search result.
+
+                Looks for a ``results`` list of dicts carrying ``url``, else a
+                ``urls`` list of strings, either at the top level or nested
+                under ``documentData``. Any other shape yields an empty list.
+                """
+                if not isinstance(payload, dict):
+                    return []
+                doc_data = payload.get("documentData", payload)
+                if not isinstance(doc_data, dict):
+                    return []
+                results = doc_data.get("results")
+                if isinstance(results, list):
+                    return [
+                        result["url"]
+                        for result in results
+                        if isinstance(result, dict) and "url" in result
+                    ]
+                direct_urls = doc_data.get("urls")
+                if isinstance(direct_urls, list):
+                    return [url for url in direct_urls if isinstance(url, str)]
+                return []
+
+            document_list = parameters.get("documentList")
+            if not document_list:
+                return ActionResult(
+                    success=False, error="No document list reference provided."
+                )
+
+            # Resolve document list reference to ChatDocument objects
+            chat_documents = self.service.getChatDocumentsFromDocumentList(document_list)
+            if not chat_documents:
+                return ActionResult(
+                    success=False,
+                    error=f"No documents found for reference: {document_list}",
+                )
+
+            # Extract URLs from all documents and combine them
+            all_urls = []
+            for i, doc in enumerate(chat_documents):
+                logger.info(f"Processing document {i+1}/{len(chat_documents)}: {doc.fileName}")
+
+                # Get file data using the service center
+                file_data = self.service.getFileData(doc.fileId)
+                if not file_data:
+                    logger.warning(f"Could not retrieve file data for document: {doc.fileName}")
+                    continue
+
+                try:
+                    content = file_data.decode("utf-8")
+                except UnicodeDecodeError:
+                    # One unreadable document must not abort the whole crawl.
+                    logger.warning(f"Document {doc.fileName} is not valid UTF-8, skipping")
+                    continue
+
+                # NOTE(review): assumes fileName/mimeType may be unset; then "not CSV".
+                file_name = (doc.fileName or "").lower()
+                mime_type = (doc.mimeType or "").lower()
+
+                if file_name.endswith(".csv") or "csv" in mime_type:
+                    logger.info(f"Processing CSV file: {doc.fileName}")
+                    doc_urls = self._read_csv_with_urls(content)
+                else:
+                    try:
+                        doc_urls = json_urls(json.loads(content))
+                    except json.JSONDecodeError:
+                        # Fallback to plain text parsing if JSON parsing fails
+                        logger.warning(f"Document {doc.fileName} is not valid JSON, trying plain text parsing")
+                        doc_urls = plain_text_urls(content)
+                    else:
+                        # Valid JSON without a known URL field (backward compatibility)
+                        if not doc_urls:
+                            logger.warning(
+                                f"Could not extract URLs from JSON structure in {doc.fileName}, trying plain text parsing"
+                            )
+                            doc_urls = plain_text_urls(content)
+
+                if doc_urls:
+                    all_urls.extend(doc_urls)
+                    logger.info(f"Extracted {len(doc_urls)} URLs from {doc.fileName}")
+                else:
+                    logger.warning(f"No valid URLs found in document: {doc.fileName}")
+
+            if not all_urls:
+                return ActionResult(
+                    success=False, error="No valid URLs found in any of the documents."
+                )
+
+            # Remove duplicates while preserving order
+            unique_urls = list(dict.fromkeys(all_urls))
+            logger.info(f"Extracted {len(unique_urls)} unique URLs from {len(chat_documents)} documents")
+
+            # Prepare request data
+            web_crawl_request = WebCrawlRequest(urls=unique_urls)
+
+            # Perform request
+            web_interface = await WebInterface.create()
+            web_crawl_result = await web_interface.crawl(web_crawl_request)
+
+            # A failed crawl is returned to the caller unchanged.
+            if not web_crawl_result.success:
+                return web_crawl_result
+
+            # Convert to proper JSON format
+            json_content = web_interface.convert_web_result_to_json(web_crawl_result)
+            json_document = web_interface.create_json_action_document(
+                json_content, "web_crawl_results.json"
+            )
+            return ActionResult(success=True, documents=[json_document])
+
+        except Exception as e:
+            logger.error(f"Error in crawl method: {str(e)}")
+            return ActionResult(success=False, error=str(e))
+
+    @action
+    async def scrape(self, parameters: Dict[str, Any]) -> ActionResult:
+        """Scrapes web content by searching for URLs and then extracting their content.
+
+        Combines search and crawl operations in one step.
+
+        Parameters:
+            query (str): Search query to perform
+            maxResults (int, optional): Maximum number of results (default: 10)
+        """
         try:
             query = parameters.get("query")
             max_results = parameters.get("maxResults", 10)
-            filter_param = parameters.get("filter")
-            expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
-            
+
             if not query:
-                return ActionResult.isFailure(error="Search query is required")
-            
-            if not self.srcApikey:
-                return ActionResult.isFailure(error="SerpAPI key not configured")
-            
-            userLanguage = "en"
-            if hasattr(self.service, 'user') and hasattr(self.service.user, 'language'):
-                userLanguage = self.service.user.language
-            
-            params = {
-                "engine": self.srcEngine,
-                "q": query,
-                "api_key": self.srcApikey,
-                "num": min(max_results, self.maxResults),
-                "hl": userLanguage
-            }
-            
-            if filter_param:
-                params["filter"] = filter_param
-            
-            response = requests.get("https://serpapi.com/search", params=params, timeout=self.timeout)
-            response.raise_for_status()
-            search_results = response.json()
-            results = []
-            
-            if "organic_results" in search_results:
-                results = search_results["organic_results"][:max_results]
-            
-            # Assume 'results' is a list of dicts with 'url' keys
-            urls = [item['url'] for item in results if 'url' in item and isinstance(item['url'], str)]
-            url_list_str = "\n".join(urls)
-            
-            # Determine output format based on expected formats
-            output_extension = ".txt"  # Default
-            output_mime_type = "text/plain"  # Default
-            
-            if expectedDocumentFormats and len(expectedDocumentFormats) > 0:
-                # Use the first expected format
-                expected_format = expectedDocumentFormats[0]
-                output_extension = expected_format.get("extension", ".txt")
-                output_mime_type = expected_format.get("mimeType", "text/plain")
-                logger.info(f"Using expected format: {output_extension} ({output_mime_type})")
-            else:
-                logger.info("No expected format specified, using default .txt format")
-            
-            # Create result data
-            result_data = {
-                "query": query,
-                "maxResults": max_results,
-                "filter": filter_param,
-                "totalResults": len(urls),
-                "urls": urls,
-                "urlList": url_list_str,
-                "timestamp": get_utc_timestamp()
-            }
-            
-            return ActionResult(
-                success=True,
-                documents=[
-                    {
-                        "documentName": f"web_search_{self._format_timestamp_for_filename()}{output_extension}",
-                        "documentData": result_data,
-                        "mimeType": output_mime_type
-                    }
-                ]
-            )
-            
-        except Exception as e:
-            logger.error(f"Error searching web: {str(e)}")
-            return ActionResult(
-                success=False,
-                error=str(e)
+                return ActionResult(success=False, error="Search query is required")
+
+            # Prepare request data
+            web_scrape_request = WebScrapeRequest(
+                query=query,
+                max_results=max_results,
             )
 
-    def _selenium_extract_content(self, url: str) -> Optional[str]:
-        """Use Selenium to fetch and extract main content from a JS-heavy page."""
-        options = Options()
-        options.headless = True
-        options.add_argument('--no-sandbox')
-        options.add_argument('--disable-dev-shm-usage')
-        options.add_argument(f'user-agent={self.user_agent}')
-        try:
-            driver = webdriver.Chrome(options=options)
-            driver.set_page_load_timeout(self.timeout)
-            driver.get(url)
-            # Wait for body to load
-            WebDriverWait(driver, 10).until(EC.presence_of_element_located((By.TAG_NAME, "body")))
-            html = driver.page_source
-            driver.quit()
-            soup = BeautifulSoup(html, 'html.parser')
-            return self._extractMainContent(soup)
-        except WebDriverException as e:
-            logger.warning(f"Selenium failed for {url}: {str(e)}")
-            return None
-        except Exception as e:
-            logger.warning(f"Selenium error for {url}: {str(e)}")
-            return None
+            # Perform request
+            web_interface = await WebInterface.create()
+            web_scrape_result = await web_interface.scrape(web_scrape_request)
 
-    @action
-    async def crawl(self, parameters: Dict[str, Any]) -> ActionResult:
-        """
-        Crawl a list of URLs provided in a document (.txt) with URLs separated by newline, comma, or semicolon.
-        
-        Parameters:
-            document (str): Document containing URL list
-            expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
-        """
-        try:
-            document = parameters.get("document")
-            expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
-            
-            if not document:
-                return ActionResult.isFailure(error="No document with URL list provided.")
-            
-            # Read the document content
-            with open(document, "r", encoding="utf-8") as f:
-                content = f.read()
-            
-            # Split URLs by newline, comma, or semicolon
-            import re
-            urls = re.split(r'[\n,;]+', content)
-            urls = [u.strip() for u in urls if u.strip()]
-            
-            if not urls:
-                return ActionResult.isFailure(error="No valid URLs provided in the document.")
-            
-            crawl_results = []
-            for url in urls:
-                try:
-                    logger.info(f"Crawling URL: {url}")
-                    # Try Selenium first
-                    content = self._selenium_extract_content(url)
-                    if not content:
-                        # Fallback to requests/BeautifulSoup
-                        soup = self._readUrl(url)
-                        content = self._extractMainContent(soup)
-                    
-                    title = self._extractTitle(BeautifulSoup(content, 'html.parser'), url) if content else "No title"
-                    meta_info = {"url": url, "title": title}
-                    content_length = len(content) if content else 0
-                    
-                    crawl_results.append({
-                        "url": url,
-                        "title": title,
-                        "content": content,
-                        "content_length": content_length,
-                        "meta_info": meta_info,
-                        "timestamp": get_utc_timestamp()
-                    })
-                    logger.info(f"Successfully crawled {url} - extracted {content_length} characters")
-                    
-                except Exception as e:
-                    logger.error(f"Error crawling web page {url}: {str(e)}")
-                    crawl_results.append({
-                        "error": str(e),
-                        "url": url,
-                        "suggestions": [
-                            "Check if the URL is accessible",
-                            "Try with a different user agent",
-                            "Verify the site doesn't block automated access"
-                        ]
-                    })
-            
-            # Determine output format based on expected formats
-            output_extension = ".json"  # Default
-            output_mime_type = "application/json"  # Default
-            
-            if expectedDocumentFormats and len(expectedDocumentFormats) > 0:
-                # Use the first expected format
-                expected_format = expectedDocumentFormats[0]
-                output_extension = expected_format.get("extension", ".json")
-                output_mime_type = expected_format.get("mimeType", "application/json")
-                logger.info(f"Using expected format: {output_extension} ({output_mime_type})")
-            else:
-                logger.info("No expected format specified, using default .json format")
-            
-            result_data = {
-                "urls": urls,
-                "maxDepth": 1, # Simplified crawl
-                "includeImages": False,
-                "followLinks": True,
-                "crawlResults": crawl_results,
-                "summary": {
-                    "total_urls": len(urls),
-                    "successful_crawls": len([r for r in crawl_results if "error" not in r]),
-                    "failed_crawls": len([r for r in crawl_results if "error" in r]),
-                    "total_content_chars": sum([r.get("content_length", 0) for r in crawl_results if "content_length" in r])
-                },
-                "timestamp": get_utc_timestamp()
-            }
-            
-            return ActionResult(
-                success=True,
-                documents=[
-                    {
-                        "documentName": f"web_crawl_{self._format_timestamp_for_filename()}{output_extension}",
-                        "documentData": result_data,
-                        "mimeType": output_mime_type
-                    }
-                ]
-            )
-            
-        except Exception as e:
-            logger.error(f"Error crawling web pages: {str(e)}")
-            return ActionResult(
-                success=False,
-                error=str(e)
-            )
-    
-    @action
-    async def scrape(self, parameters: Dict[str, Any]) -> ActionResult:
-        """
-        Scrape specific data from web pages
-        
-        Parameters:
-            url (str): URL to scrape
-            selectors (Dict[str, str]): CSS selectors for data extraction
-            format (str, optional): Output format (default: "json")
-            expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
-        """
-        try:
-            url = parameters.get("url")
-            selectors = parameters.get("selectors")
-            format = parameters.get("format", "json")
-            expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
-            
-            if not url or not selectors:
-                return ActionResult(
-                    success=False,
-                    error="URL and selectors are required"
+            # Convert to proper JSON format
+            if web_scrape_result.success:
+                json_content = web_interface.convert_web_result_to_json(web_scrape_result)
+                json_document = web_interface.create_json_action_document(
+                    json_content, 
+                    f"web_scrape_results.json"
                 )
-            
-            # Read the URL
-            soup = self._readUrl(url)
-            if not soup:
                 return ActionResult(
-                    success=False,
-                    error="Failed to read URL"
+                    success=True,
+                    documents=[json_document]
                 )
-            
-            extracted_content = {}
-            
-            if selectors:
-                # Extract content using provided selectors
-                for selector_name, selector in selectors.items():
-                    elements = soup.select(selector)
-                    if elements:
-                        if format == "text":
-                            extracted_content[selector_name] = [elem.get_text(strip=True) for elem in elements]
-                        elif format == "html":
-                            extracted_content[selector_name] = [str(elem) for elem in elements]
-                        else:
-                            extracted_content[selector_name] = [elem.get_text(strip=True) for elem in elements]
-                    else:
-                        extracted_content[selector_name] = []
             else:
-                # Auto-extract common elements
-                extracted_content = {
-                    "title": self._extractTitle(soup, url),
-                    "main_content": self._extractMainContent(soup),
-                    "headings": [h.get_text(strip=True) for h in soup.find_all(['h1', 'h2', 'h3'])],
-                    "links": [a.get('href') for a in soup.find_all('a', href=True) if a.get('href').startswith(('http://', 'https://'))],
-                    "images": [img.get('src') for img in soup.find_all('img', src=True)]
-                }
-            
-            scrape_result = {
-                "url": url,
-                "selectors": selectors,
-                "format": format,
-                "content": extracted_content,
-                "timestamp": get_utc_timestamp()
-            }
-            
-            # Create result data
-            result_data = {
-                "url": url,
-                "selectors": selectors,
-                "format": format,
-                "scrapedData": scrape_result,
-                "timestamp": get_utc_timestamp()
-            }
-            
-            # Determine output format based on expected formats
-            output_extension = f".{format}"  # Default to format parameter
-            output_mime_type = "application/json"  # Default
-            
-            if expectedDocumentFormats and len(expectedDocumentFormats) > 0:
-                # Use the first expected format
-                expected_format = expectedDocumentFormats[0]
-                output_extension = expected_format.get("extension", f".{format}")
-                output_mime_type = expected_format.get("mimeType", "application/json")
-                logger.info(f"Using expected format: {output_extension} ({output_mime_type})")
-            else:
-                logger.info(f"No expected format specified, using format parameter: {format}")
-            
-            return ActionResult(
-                success=True,
-                documents=[
-                    {
-                        "documentName": f"web_scrape_{self._format_timestamp_for_filename()}{output_extension}",
-                        "documentData": result_data,
-                        "mimeType": output_mime_type
-                    }
-                ]
-            )
-            
+                return web_scrape_result
+
         except Exception as e:
-            logger.error(f"Error scraping web page: {str(e)}")
-            return ActionResult(
-                success=False,
-                error=str(e)
-            )
-    
+            return ActionResult(success=False, error=str(e))
diff --git a/modules/methods/method_web.py b/modules/methods/method_web.py
deleted file mode 100644
index ccb0f185..00000000
--- a/modules/methods/method_web.py
+++ /dev/null
@@ -1,197 +0,0 @@
-import logging
-from typing import Any, Dict
-from modules.chat.methodBase import MethodBase, action
-from modules.interfaces.interfaceChatModel import ActionResult
-from modules.interfaces.interface_web_objects import WebInterface
-from modules.interfaces.interface_web_model import (
-    WebSearchRequest,
-    WebCrawlRequest,
-    WebScrapeRequest,
-)
-
-
-logger = logging.getLogger(__name__)
-
-
-class MethodWeb(MethodBase):
-    """Web method implementation for web operations."""
-
-    def __init__(self, serviceCenter: Any):
-        super().__init__(serviceCenter)
-        self.name = "web"
-        self.description = "Web search, crawling, and scraping operations using Tavily"
-
-    @action
-    async def search(self, parameters: Dict[str, Any]) -> ActionResult:
-        """Perform a web search and outputs a .json file with a list of found URLs.
-
-        Each result contains "title" and "url".
-
-        Parameters:
-            query (str): Search query to perform
-            maxResults (int, optional): Maximum number of results (default: 10)
-        """
-        # TODO: Fix docstrings - do we need that format for parsing?
-
-        try:
-            # Prepare request data
-            web_search_request = WebSearchRequest(
-                query=parameters.get("query"),
-                max_results=parameters.get("maxResults", 10),
-            )
-
-            # Perform request
-            web_interface = await WebInterface.create()
-            web_search_result = await web_interface.search(web_search_request)
-
-            return web_search_result
-
-        except Exception as e:
-            return ActionResult(success=False, error=str(e))
-
-    @action
-    async def crawl(self, parameters: Dict[str, Any]) -> ActionResult:
-        """Crawls a list of URLs and extracts information from them.
-
-        Parameters:
-            document (str): Document reference containing URL list from search results
-            expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
-        """
-        try:
-            document_ref = parameters.get("document")
-
-            if not document_ref:
-                return ActionResult(
-                    success=False, error="No document reference provided."
-                )
-
-            # Resolve document reference to ChatDocument objects
-            chat_documents = self.service.getChatDocumentsFromDocumentList(
-                [document_ref]
-            )
-
-            if not chat_documents:
-                return ActionResult(
-                    success=False,
-                    error=f"No documents found for reference: {document_ref}",
-                )
-
-            # Get the first document (search results)
-            search_doc = chat_documents[0]
-
-            # Get file data using the service center
-            file_data = self.service.getFileData(search_doc.fileId)
-            if not file_data:
-                return ActionResult(
-                    success=False, error="Could not retrieve file data for document"
-                )
-
-            content = file_data.decode("utf-8")
-
-            # Parse JSON to extract URLs from search results
-            import json
-
-            try:
-                # The document structure from WebSearchActionResult
-                search_data = json.loads(content)
-
-                # Extract URLs from the search results structure
-                urls = []
-                if isinstance(search_data, dict):
-                    # Handle the document structure: documentData contains the actual search results
-                    doc_data = search_data.get("documentData", search_data)
-                    if "results" in doc_data and isinstance(doc_data["results"], list):
-                        urls = [
-                            result["url"]
-                            for result in doc_data["results"]
-                            if isinstance(result, dict) and "url" in result
-                        ]
-                    elif "urls" in doc_data and isinstance(doc_data["urls"], list):
-                        # Fallback: if URLs are stored directly in a 'urls' field
-                        urls = [url for url in doc_data["urls"] if isinstance(url, str)]
-
-                # Fallback: try to parse as plain text with regex (for backward compatibility)
-                if not urls:
-                    logger.warning(
-                        "Could not extract URLs from JSON structure, trying plain text parsing"
-                    )
-                    import re
-
-                    urls = re.split(r"[\n,;]+", content)
-                    urls = [
-                        u.strip()
-                        for u in urls
-                        if u.strip()
-                        and (
-                            u.strip().startswith("http://")
-                            or u.strip().startswith("https://")
-                        )
-                    ]
-
-            except json.JSONDecodeError:
-                # Fallback to plain text parsing if JSON parsing fails
-                logger.warning("Document is not valid JSON, trying plain text parsing")
-                import re
-
-                urls = re.split(r"[\n,;]+", content)
-                urls = [
-                    u.strip()
-                    for u in urls
-                    if u.strip()
-                    and (
-                        u.strip().startswith("http://")
-                        or u.strip().startswith("https://")
-                    )
-                ]
-
-            if not urls:
-                return ActionResult(
-                    success=False, error="No valid URLs found in the document."
-                )
-
-            logger.info(f"Extracted {len(urls)} URLs from document: {urls}")
-
-            # Prepare request data
-            web_crawl_request = WebCrawlRequest(urls=urls)
-
-            # Perform request
-            web_interface = await WebInterface.create()
-            web_crawl_result = await web_interface.crawl(web_crawl_request)
-
-            return web_crawl_result
-
-        except Exception as e:
-            logger.error(f"Error in crawl method: {str(e)}")
-            return ActionResult(success=False, error=str(e))
-
-    @action
-    async def scrape(self, parameters: Dict[str, Any]) -> ActionResult:
-        """Scrapes web content by searching for URLs and then extracting their content.
-
-        Combines search and crawl operations in one step.
-
-        Parameters:
-            query (str): Search query to perform
-            maxResults (int, optional): Maximum number of results (default: 10)
-        """
-        try:
-            query = parameters.get("query")
-            max_results = parameters.get("maxResults", 10)
-
-            if not query:
-                return ActionResult(success=False, error="Search query is required")
-
-            # Prepare request data
-            web_scrape_request = WebScrapeRequest(
-                query=query,
-                max_results=max_results,
-            )
-
-            # Perform request
-            web_interface = await WebInterface.create()
-            web_scrape_result = await web_interface.scrape(web_scrape_request)
-
-            return web_scrape_result
-
-        except Exception as e:
-            return ActionResult(success=False, error=str(e))
diff --git a/modules/methods/web/web_search/web_search_base.py b/modules/methods/web/web_search/web_search_base.py
deleted file mode 100644
index d655bfd3..00000000
--- a/modules/methods/web/web_search/web_search_base.py
+++ /dev/null
@@ -1,31 +0,0 @@
-"""Base class for web search classes."""
-
-from abc import ABC, abstractmethod
-from modules.interfaces.interfaceChatModel import ActionDocument, ActionResult
-
-
-from pydantic import BaseModel, Field
-from typing import List
-
-
-class WebSearchRequest(BaseModel):
-    query: str
-    max_results: int
-
-
-class WebSearchDocumentData(BaseModel):
-    title: str
-    url: str
-
-
-class WebSearchActionDocument(ActionDocument):
-    documentData: List[WebSearchDocumentData]
-
-
-class WebSearchActionResult(ActionResult):
-    documents: List[WebSearchActionDocument] = Field(default_factory=list)
-
-
-class WebSearchBase(ABC):
-    @abstractmethod
-    async def __call__(self, request: WebSearchRequest) -> WebSearchActionResult: ...
diff --git a/modules/methods/web/web_search/web_search_tavily.py b/modules/methods/web/web_search/web_search_tavily.py
deleted file mode 100644
index dcbea35c..00000000
--- a/modules/methods/web/web_search/web_search_tavily.py
+++ /dev/null
@@ -1,70 +0,0 @@
-"""Tavily web search class."""
-
-import os
-from dataclasses import dataclass
-from web_search_base import (
-    WebSearchBase,
-    WebSearchRequest,
-    WebSearchActionResult,
-    WebSearchActionDocument,
-    WebSearchDocumentData,
-)
-
-# from modules.interfaces.interfaceChatModel import ActionResult, ActionDocument
-from tavily import AsyncTavilyClient
-from modules.shared.timezoneUtils import get_utc_timestamp
-
-
-@dataclass
-class WebSearchTavily(WebSearchBase):
-    client: AsyncTavilyClient = None
-
-    @classmethod
-    async def create(cls):
-        return cls(client=AsyncTavilyClient(api_key=os.getenv("TAVILY_API_KEY")))
-
-    async def __call__(self, request: WebSearchRequest) -> WebSearchActionResult:
-        """Handles the web search request."""
-        # Step 1: Search
-        try:
-            search_results = await self._search(request.query, request.max_results)
-        except Exception as e:
-            return WebSearchActionResult(success=False, error=str(e))
-
-        # Step 2: Build ActionResult
-        try:
-            result = self._build_action_result(search_results)
-        except Exception as e:
-            return WebSearchActionResult(success=False, error=str(e))
-
-        return result
-
-    async def _search(self, query: str, max_results: int) -> WebSearchActionResult:
-        """Calls the Tavily API to perform a web search."""
-        # Make sure max_results is within the allowed range
-        if max_results < 0 or max_results > 20:
-            raise ValueError("max_results must be between 0 and 20")
-
-        # Perform actual API call
-        response = await self.client.search(query=query, max_results=max_results)
-        return response["results"]
-
-    def _build_action_result(self, search_results: list) -> WebSearchActionResult:
-        """Builds the ActionResult from the search results."""
-        documents = []
-        for result in search_results:
-            document_name = f"web_search_{get_utc_timestamp()}.txt"
-            document_data = WebSearchDocumentData(
-                title=result["title"], url=result["url"]
-            )
-            mime_type = "text/plain"
-            doc = WebSearchActionDocument(
-                documentName=document_name,
-                documentData=document_data,
-                mimeType=mime_type,
-            )
-            documents.append(doc)
-
-        return WebSearchActionResult(
-            success=True, documents=documents, resultLabel="web_search_results"
-        )
diff --git a/notes/changelog.txt b/notes/changelog.txt
index 5e017239..fca700df 100644
--- a/notes/changelog.txt
+++ b/notes/changelog.txt
@@ -19,7 +19,13 @@ TODO
 - check zusammenfassung von 10 dokumenten >10 MB
 - test case bewerbung
 
-
+# DOCUMENTATION
+Design principles
+- UI: Module classes for data management (CRUD tables & forms --> formGeneric)
+- Basic: All timestamps to be timezone-aware; error-handling routines (Fehlerabfangroutinen)
+- Backend: All external components attach via connectorXxx --> interfaceXxx --> our codebase
+- all model definitions in interfaceXxxModel
+- Action functions for AI: why use documentList rather than a single document as the input parameter? --> for full flexibility to pass either a list of documents or a documentList
 
 ********************
 
diff --git a/requirements.txt b/requirements.txt
index 75bd81b6..783db728 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -72,3 +72,22 @@ chardet>=4.0.0  # For encoding detection
 ## Testing Dependencies
 pytest>=8.0.0
 pytest-asyncio>=0.21.0
+
+## Missing Dependencies for IPython and other tools
+decorator>=5.0.0
+jedi>=0.16
+matplotlib-inline>=0.1.0
+stack-data>=0.1.0
+traitlets>=5.0.0
+docutils>=0.13.1
+markdown-it-py>=2.2.0
+keyring>=15.1
+pkginfo>=1.8.1
+
+## Missing Dependencies for Panel 1.3.8
+bleach>=4.0.0
+bokeh>=3.2.0,<3.4.0
+linkify-it-py>=1.0.0
+mdit-py-plugins>=0.3.0
+pyviz-comms>=2.0.0
+xyzservices>=2021.09.1
\ No newline at end of file
diff --git a/test_ai_calls.md b/test_ai_calls.md
new file mode 100644
index 00000000..75ed3310
--- /dev/null
+++ b/test_ai_calls.md
@@ -0,0 +1,235 @@
+# AI Call Functions Test and Content Size Analysis
+
+## Overview
+This file documents the ServiceCenter AI functions that risk sending oversized content to the AI model,
+along with their usage patterns and potential size issues.
+
+## High-Risk AI Functions
+
+### 1. summarizeChat() -> callAiTextBasic()
+**Location**: gateway/modules/chat/handling/promptFactory.py:122
+**Risk Level**: MEDIUM
+**Content**: Entire workflow message history
+**Usage**:
+```python
+messageSummary = await service.summarizeChat(context.workflow.messages) if context.workflow else ""
+```
+**Potential Issues**:
+- Long conversations can generate very large summaries
+- Includes all previous messages in workflow
+- No size limits or truncation
+
+### 2. callAiTextAdvanced() -> interfaceAiCalls.callAiTextAdvanced()
+**Risk Level**: HIGH
+**Multiple Usage Points**:
+
+#### A. Task Planning (handlingTasks.py:116)
+```python
+prompt = await self.service.callAiTextAdvanced(task_planning_prompt)
+```
+**Content**: User input + document context + connection context + previous results
+**Risk**: VERY HIGH - includes all available documents and context
+
+#### B. Action Definition (handlingTasks.py:388)
+```python
+prompt = await self.service.callAiTextAdvanced(action_prompt)
+```
+**Content**: Task context + available documents + connections + previous results
+**Risk**: HIGH - comprehensive context for action planning
+
+#### C. Result Review (handlingTasks.py:894)
+```python
+response = await self.service.callAiTextAdvanced(prompt)
+```
+**Content**: Action results + success criteria + context
+**Risk**: MEDIUM-HIGH - depends on result size
+
+#### D. Email Composition (methodOutlook.py:1609)
+```python
+composed_email = await self.service.interfaceAiCalls.callAiTextAdvanced(ai_prompt)
+```
+**Content**: Document content + email requirements
+**Risk**: MEDIUM - depends on document size
+
+#### E. AI Processing (methodAi.py:175)
+```python
+result = await self.service.callAiTextAdvanced(enhanced_prompt, context)
+```
+**Content**: User prompt + extracted document content
+**Risk**: HIGH - includes full document content
+
+### 3. callAiTextBasic() -> interfaceAiCalls.callAiTextBasic()
+**Risk Level**: MEDIUM
+**Multiple Usage Points**:
+
+#### A. Document Format Conversion (methodDocument.py:429)
+```python
+formatted_content = await self.service.callAiTextBasic(ai_prompt, content)
+```
+**Content**: Document content + format requirements
+**Risk**: MEDIUM - depends on document size
+
+#### B. HTML Report Generation (methodDocument.py:642)
+```python
+aiReport = await self.service.callAiTextBasic(aiPrompt, combinedContent)
+```
+**Content**: Combined content from multiple documents
+**Risk**: HIGH - combines multiple documents
+
+#### C. AI Processing Fallback (methodAi.py:177)
+```python
+result = await self.service.callAiTextBasic(enhanced_prompt, context)
+```
+**Content**: User prompt + document context
+**Risk**: MEDIUM - includes document content
+
+#### D. Document Content Processing (documentExtraction.py:1459)
+```python
+processedContent = await self._serviceCenter.callAiTextBasic(aiPrompt, contentToProcess)
+```
+**Content**: Document chunks + AI prompt
+**Risk**: MEDIUM - processes document chunks
+
+### 4. extractContentFromDocument() -> documentProcessor.processFileData()
+**Risk Level**: HIGH
+**Multiple Usage Points**:
+
+#### A. Document Content Extraction (methodDocument.py:74)
+```python
+extracted_content = await self.service.extractContentFromDocument(
+    prompt=aiPrompt,
+    document=chatDocument
+)
+```
+**Content**: Full document + extraction prompt
+**Risk**: HIGH - processes entire documents
+
+#### B. HTML Report Generation (methodDocument.py:581)
+```python
+extracted_content = await self.service.extractContentFromDocument(
+    prompt="Extract readable text content for HTML report generation", 
+    document=doc
+)
+```
+**Content**: Full document content
+**Risk**: HIGH - processes documents for reports
+
+#### C. Email Composition (methodOutlook.py:1510)
+```python
+extracted_content = await self.service.extractContentFromDocument(
+    prompt="Extract readable text content for email composition", 
+    document=doc
+)
+```
+**Content**: Full document content
+**Risk**: HIGH - processes documents for emails
+
+#### D. AI Processing (methodAi.py:94)
+```python
+extracted_content = await self.service.extractContentFromDocument(
+    prompt=extraction_prompt.strip(), 
+    document=doc
+)
+```
+**Content**: Full document content
+**Risk**: HIGH - processes documents for AI analysis
+
+## Risk Assessment Summary
+
+### CRITICAL RISK (Immediate Attention Required)
+1. **Task Planning** (handlingTasks.py:116) - Entire workflow context
+2. **Action Definition** (handlingTasks.py:388) - Comprehensive context
+3. **Document Processing** (all extractContentFromDocument calls) - Full documents
+4. **AI Method Processing** (methodAi.py:175) - Document content + context
+5. **Report Generation** (methodDocument.py:642) - Multiple documents combined
+
+### HIGH RISK (Monitor Closely)
+1. **Chat Summarization** (promptFactory.py:122) - Message history
+2. **Document Format Conversion** (methodDocument.py:429) - Single documents
+3. **Email Composition** (methodOutlook.py:1609) - Document content
+
+## Potential Issues
+
+### Content Size Problems
+- Large documents (PDFs, Word docs, Excel files) can exceed AI model limits
+- Combined document content in reports can be massive
+- Long conversation histories in chat summarization
+- Full workflow context in task planning
+
+### Performance Issues
+- Timeout errors for large content
+- Memory issues with large document processing
+- API rate limiting with large requests
+- Cost implications for large AI calls
+
+### Error Scenarios
+- OpenAI API 400 errors (content too large)
+- Timeout errors (processing too slow)
+- Memory exhaustion (large document processing)
+- Incomplete processing (truncated content)
+
+## Recommended Solutions
+
+### 1. Content Size Limits
+- Implement maximum content size checks before AI calls
+- Truncate large content with appropriate warnings
+- Split large documents into chunks
+
+### 2. Content Filtering
+- Remove unnecessary context from prompts
+- Filter out large binary content
+- Use document summaries instead of full content
+
+### 3. Chunking Strategy
+- Process large documents in smaller chunks
+- Implement progressive processing
+- Use streaming for large responses
+
+### 4. Caching and Optimization
+- Cache processed document content
+- Reuse extracted content across operations
+- Implement smart content selection
+
+### 5. Error Handling
+- Graceful degradation for oversized content
+- Fallback strategies for failed AI calls
+- User notifications for content size issues
+
+## Test Scenarios
+
+### Test Case 1: Large Document Processing
+- Upload a 10MB PDF document
+- Try to extract content for AI processing
+- Monitor for size limit errors
+
+### Test Case 2: Multiple Document Reports
+- Upload 5+ large documents
+- Generate HTML report
+- Check for combined content size issues
+
+### Test Case 3: Long Conversation History
+- Create workflow with 50+ messages
+- Test chat summarization
+- Monitor for context size limits
+
+### Test Case 4: Task Planning with Large Context
+- Create workflow with many documents
+- Test task planning functionality
+- Check for prompt size limits
+
+## Monitoring Recommendations
+
+1. **Log Content Sizes**: Track the size of content sent to AI functions
+2. **Monitor API Errors**: Watch for 400 errors indicating content too large
+3. **Performance Metrics**: Track processing times for large content
+4. **User Feedback**: Monitor for incomplete or failed operations
+5. **Cost Tracking**: Monitor AI API costs for large requests
+
+## Implementation Priority
+
+1. **Immediate**: Add content size checks to extractContentFromDocument
+2. **High**: Implement chunking for large document processing
+3. **Medium**: Add content filtering to task planning prompts
+4. **Low**: Implement caching for processed content
+
+This analysis should help identify and mitigate the risk of sending oversized content to AI functions.
diff --git a/test_ai_fallback.py b/test_ai_fallback.py
new file mode 100644
index 00000000..fc320229
--- /dev/null
+++ b/test_ai_fallback.py
@@ -0,0 +1,103 @@
+#!/usr/bin/env python3
+"""
+Test script to verify AI fallback mechanism from Basic to Advanced when context length is exceeded.
+"""
+
+import asyncio
+import logging
+from modules.interfaces.interfaceAiCalls import AiCalls
+from modules.connectors.connectorAiOpenai import ContextLengthExceededException
+
+# Configure logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+
+async def test_context_length_fallback():
+    """Call callAiTextBasic with an oversized context; return True if it returns, False if it raises."""
+    
+    # Create AI calls instance
+    ai_calls = AiCalls()
+    
+    # Build a context intended to exceed the Basic model's context limit
+    large_context = "This is a test context. " * 10000  # 240,000 characters
+    prompt = "Please summarize this context in one sentence."
+    
+    logger.info("Testing AI Basic with large context (should trigger fallback)...")
+    
+    try:
+        # NOTE(review): any non-raising return counts as a pass; whether a fallback really happened is not checked
+        result = await ai_calls.callAiTextBasic(prompt, large_context)
+        logger.info(f"✅ Fallback successful! Result: {result[:100]}...")
+        return True
+    except Exception as e:
+        logger.error(f"❌ Test failed: {str(e)}")
+        return False
+
+async def test_direct_context_length_exception():
+    """Return True only if AiOpenai.callAiBasic raises ContextLengthExceededException for a huge message."""
+    
+    from modules.connectors.connectorAiOpenai import AiOpenai
+    
+    logger.info("Testing direct ContextLengthExceededException...")
+    
+    try:
+        # Create OpenAI connector
+        openai_connector = AiOpenai()
+        
+        # One user message of 700,000 characters, intended to exceed the model's context length
+        large_messages = [
+            {"role": "user", "content": "Test message. " * 50000}  # Very large message
+        ]
+        
+        # Reaching the lines after this call means no exception was raised, which is a failure
+        await openai_connector.callAiBasic(large_messages)
+        logger.error("❌ Expected ContextLengthExceededException but none was raised")
+        return False
+        
+    except ContextLengthExceededException as e:
+        logger.info(f"✅ ContextLengthExceededException properly raised: {str(e)}")
+        return True
+    except Exception as e:
+        logger.error(f"❌ Unexpected exception: {str(e)}")
+        return False
+
+async def main():
+    """Run every fallback check in sequence and log a pass/fail summary."""
+    logger.info("Starting AI fallback mechanism tests...")
+
+    # (display name, coroutine function) pairs, executed in this order
+    checks = (
+        ("Context Length Fallback", test_context_length_fallback),
+        ("Direct Exception Test", test_direct_context_length_exception),
+    )
+
+    outcomes = []
+    for label, check in checks:
+        logger.info(f"\n--- Running {label} ---")
+        try:
+            outcome = await check()
+        except Exception as exc:
+            # A crashing check is recorded as a failure instead of aborting the run
+            logger.error(f"Test {label} crashed: {str(exc)}")
+            outcome = False
+        outcomes.append((label, outcome))
+
+    # Summary banner
+    divider = "=" * 50
+    logger.info("\n" + divider)
+    logger.info("TEST SUMMARY")
+    logger.info(divider)
+
+    for label, outcome in outcomes:
+        logger.info(f"{label}: {'✅ PASSED' if outcome else '❌ FAILED'}")
+    passed = sum(1 for _, outcome in outcomes if outcome)
+    total = len(outcomes)
+    logger.info(f"\nTotal: {passed}/{total} tests passed")
+
+    if passed != total:
+        logger.warning("⚠️  Some tests failed. Please check the implementation.")
+    else:
+        logger.info("🎉 All tests passed! Fallback mechanism is working correctly.")
+
+if __name__ == "__main__":
+    asyncio.run(main())
diff --git a/test_methodWeb.py b/test_methodWeb.py
new file mode 100644
index 00000000..a4578418
--- /dev/null
+++ b/test_methodWeb.py
@@ -0,0 +1,658 @@
+#!/usr/bin/env python3
+"""
+Test script for MethodWeb class.
+Tests all web actions: search, crawl, and scrape with various parameter sets.
+
+Features:
+- Tests web search functionality with different queries
+- Tests web crawling with URL lists
+- Tests web scraping (search + crawl combined)
+- Detailed logging and progress tracking
+- Error handling and validation testing
+- Configuration validation
+
+Usage:
+- Interactive mode: python test_methodWeb.py
+- Automated mode: python test_methodWeb.py --auto
+- Verbose mode: python test_methodWeb.py --verbose
+"""
+
+import os
+import asyncio
+import logging
+import sys
+import argparse
+import json
+from pathlib import Path
+from typing import List, Optional, Dict, Any
+from datetime import datetime, UTC
+
+# Configure logging
+logging.basicConfig(
+    level=logging.INFO,
+    format='%(asctime)s - %(levelname)s - %(message)s'
+)
+logger = logging.getLogger(__name__)
+
+# Filter out specific unwanted log messages
+class LogFilter(logging.Filter):
+    """Drop noisy HTTP client log lines (Tavily POST requests and 200 OK responses)."""
+
+    def filter(self, record):
+        """Return False to suppress *record*, True to let it through."""
+        message = record.getMessage()
+
+        # Request lines for POST calls to the Tavily API
+        is_tavily_request = "HTTP Request:" in message and "POST https://api.tavily.com" in message
+        # Status lines of successful responses
+        is_ok_response = "HTTP/1.1 200 OK" in message
+
+        return not (is_tavily_request or is_ok_response)
+
+root_logger = logging.getLogger()
+for _root_handler in root_logger.handlers:  # handler filters also see records propagated from child loggers
+    _root_handler.addFilter(LogFilter())
+
+def check_dependencies():
+    """Return True when every third-party package the tests need can be imported.
+
+    Each package is really imported (not merely located), so an install whose
+    import raises ImportError is reported as missing; hints are logged on failure.
+    """
+    required = (("tavily", "tavily-python"), ("httpx", "httpx"))  # (module, pip name)
+    missing_deps = []
+
+    for module_name, package_name in required:
+        try:
+            __import__(module_name)
+        except ImportError:
+            missing_deps.append(package_name)
+            logger.error(f"{package_name} is missing")
+        else:
+            logger.info(f"{package_name} is available")
+
+    if not missing_deps:
+        logger.info("All required dependencies are available!")
+        return True
+
+    banner = "=" * 60
+    logger.error("\n" + banner)
+    logger.error("MISSING DEPENDENCIES DETECTED!")
+    logger.error(banner)
+    logger.error("The following packages are required but not installed:")
+    for dep in missing_deps:
+        logger.error(f"  - {dep}")
+    logger.error("\nTo install all dependencies, run:")
+    logger.error("pip install -r requirements.txt")
+    logger.error(banner)
+    return False
+
+def check_module_imports():
+    """Return True if the project modules used by this script can be imported, False otherwise."""
+    try:
+        # Appends the directory three levels above this file to sys.path (presumably the gateway root — TODO confirm)
+        sys.path.append(os.path.join(os.path.dirname(__file__), '..', '..', '..'))
+        
+        from modules.methods.methodWeb import MethodWeb
+        from modules.chat.serviceCenter import ServiceCenter
+        from modules.interfaces.interfaceAppModel import User, UserConnection, UserPrivilege, AuthAuthority
+        from modules.interfaces.interfaceChatModel import ChatWorkflow, TaskItem, TaskStatus
+        from modules.shared.configuration import APP_CONFIG
+        
+        logger.info("All required modules imported successfully")
+        return True
+    except ImportError as e:
+        logger.error(f"Failed to import required modules: {e}")
+        logger.error("Make sure you're running this script from the gateway directory")
+        return False
+    except Exception as e:
+        logger.error(f"Unexpected error importing modules: {e}")
+        return False
+
+def check_configuration():
+    """Validate the Tavily API key and log the optional web settings.
+
+    Returns False when the key is missing/placeholder or the configuration cannot be read.
+    """
+    placeholder_key = "your_tavily_api_key_here"
+    # Optional settings: a missing one only produces a warning
+    optional_settings = (
+        "Web_Search_MAX_QUERY_LENGTH",
+        "Web_Search_MAX_RESULTS",
+        "Web_Search_MIN_RESULTS",
+        "Web_Crawl_TIMEOUT",
+        "Web_Crawl_MAX_RETRIES",
+        "Web_Crawl_RETRY_DELAY",
+    )
+
+    try:
+        from modules.shared.configuration import APP_CONFIG
+        api_key = APP_CONFIG.get("Connector_WebTavily_API_KEY")
+        key_is_set = bool(api_key) and api_key != placeholder_key
+        if not key_is_set:
+            logger.error("Tavily API key not configured!")
+            logger.error("Please set Connector_WebTavily_API_KEY in config.ini")
+            return False
+        logger.info("Tavily API key is configured")
+
+        for name in optional_settings:
+            setting = APP_CONFIG.get(name)
+            if not setting:
+                logger.warning(f"Configuration {name} not set, using default")
+                continue
+            logger.info(f"Configuration {name}: {setting}")
+        return True
+    except Exception as exc:
+        logger.error(f"Failed to check configuration: {exc}")
+        return False
+
+def create_mock_service_center():
+    """Build a ServiceCenter from a hard-coded test user and workflow; return None if that fails."""
+    try:
+        from modules.chat.serviceCenter import ServiceCenter
+        from modules.interfaces.interfaceAppModel import User, UserPrivilege, AuthAuthority
+        from modules.interfaces.interfaceChatModel import ChatWorkflow, TaskItem, TaskStatus
+        from modules.interfaces.interfaceChatModel import ChatLog, ChatMessage, ChatStat
+        
+        # Test user populated with fixed literal values
+        mock_user = User(
+            id="test_user_web_001",
+            username="testuser_web",
+            email="testweb@example.com",
+            fullName="Test Web User",
+            language="en",
+            enabled=True,
+            privilege=UserPrivilege.USER,
+            authenticationAuthority=AuthAuthority.LOCAL,
+            mandateId="test_mandate_web_001"
+        )
+        
+        # Workflow with empty logs/messages/tasks; both timestamps are the current UTC epoch time
+        current_time = datetime.now(UTC).timestamp()
+        mock_workflow = ChatWorkflow(
+            id="test_workflow_web_001",
+            mandateId="test_mandate_web_001",
+            status="active",
+            name="Test Web Method Workflow",
+            currentRound=1,
+            lastActivity=current_time,
+            startedAt=current_time,
+            logs=[],
+            messages=[],
+            stats=None,
+            tasks=[]
+        )
+        
+        # ServiceCenter is constructed from the user and workflow built above
+        service_center = ServiceCenter(mock_user, mock_workflow)
+        logger.info("ServiceCenter created successfully for web testing")
+        return service_center
+        
+    except Exception as e:
+        logger.error(f"Failed to create ServiceCenter: {e}")
+        return None
+
+class MethodWebTester:
+    """Test class for MethodWeb functionality."""
+    
+    def __init__(self):
+        """Set up empty state; method_web and service_center are filled in by initialize_method_web."""
+        self.method_web = None
+        self.service_center = None
+        
+        # Result dicts appended by run_all_tests and reported by print_test_summary
+        self.test_results = []
+        
+        # Queries for the search and scrape tests; test_urls below feeds the crawl test
+        self.test_queries = [
+            "Python programming tutorial",
+            "FastAPI documentation",
+            "machine learning basics",
+            "web scraping best practices"
+        ]
+        
+        self.test_urls = [
+            "https://docs.python.org/3/tutorial/",
+            "https://fastapi.tiangolo.com/",
+            "https://scikit-learn.org/stable/",
+            "https://requests.readthedocs.io/en/latest/"
+        ]
+    
+    def initialize_method_web(self):
+        """Create the ServiceCenter and MethodWeb instances; return True on success, False otherwise."""
+        try:
+            # create_mock_service_center returns None on failure, which is handled just below
+            self.service_center = create_mock_service_center()
+            if not self.service_center:
+                logger.error("Failed to create ServiceCenter!")
+                return False
+            
+            # Imported here rather than at module level; MethodWeb receives the service center
+            from modules.methods.methodWeb import MethodWeb
+            self.method_web = MethodWeb(self.service_center)
+            logger.info("MethodWeb initialized successfully with ServiceCenter")
+            return True
+        except Exception as e:
+            logger.error(f"Failed to initialize MethodWeb: {e}")
+            return False
+    
+    async def test_search_action(self, query: str, max_results: int = 5) -> Dict[str, Any]:
+        """Run MethodWeb.search for *query* and condense the outcome into a result dict.
+
+        Returns the dict (action, query, max_results, success, error, documents_count,
+        result_label). Any exception raised along the way is caught and reported as a
+        failed result.
+        """
+        logger.info(f"Testing search action with query: '{query}', max_results: {max_results}")
+
+        # Keys shared by the regular result and the exception result
+        base = {"action": "search", "query": query, "max_results": max_results}
+
+        try:
+            parameters = {"query": query, "maxResults": max_results}
+            result = await self.method_web.search(parameters)
+
+            test_result = {
+                **base,
+                "success": result.success,
+                "error": None if result.success else result.error,
+                "documents_count": len(result.documents) if result.documents else 0,
+                "result_label": getattr(result, 'resultLabel', None),
+            }
+
+            if not result.success:
+                logger.error(f"❌ Search failed: {result.error}")
+                return test_result
+
+            logger.info(f"✅ Search successful: {test_result['documents_count']} documents returned")
+            # `or []` keeps the loop a no-op when no documents were returned
+            for number, doc in enumerate(result.documents or [], start=1):
+                logger.info(f"   Document {number}: {doc.documentName}")
+                if hasattr(doc, 'documentData') and hasattr(doc.documentData, 'results'):
+                    logger.info(f"   Results count: {len(doc.documentData.results)}")
+            return test_result
+
+        except Exception as exc:
+            message = str(exc)
+            logger.error(f"❌ Search action exception: {message}")
+            return {
+                **base,
+                "success": False,
+                "error": f"Exception: {message}",
+                "documents_count": 0,
+                "result_label": None,
+            }
+    
+    async def test_crawl_action(self, urls: List[str]) -> Dict[str, Any]:
+        """Run MethodWeb.crawl against a stubbed document list that contains *urls*.
+
+        The two service lookups are stubbed for the duration of the call and restored
+        afterwards so they cannot leak into later tests; exceptions become a failed result.
+        """
+        logger.info(f"Testing crawl action with {len(urls)} URLs")
+
+        unset = object()  # marks an attribute the service did not have before patching
+        service, saved = None, {}
+        try:
+            # Stand-in chat document exposing only the two attributes set below
+            class _MockDoc:
+                def __init__(self, fileId: str, fileName: str = "mock_search_results.json"):
+                    self.fileId = fileId
+                    self.fileName = fileName
+
+            def _mock_get_docs(_doc_ids):
+                return [_MockDoc(fileId="mock_file_id", fileName="mock_search_results.json")]
+
+            # Build minimal JSON structure expected by methodWeb.crawl
+            mock_payload = {"documentData": {"results": [{"url": u} for u in urls]}}
+
+            def _mock_get_file_data(_file_id):
+                return json.dumps(mock_payload).encode("utf-8")
+
+            # Swap in the stubs, remembering what each one replaces
+            service = self.method_web.service
+            stubs = {"getChatDocumentsFromDocumentList": _mock_get_docs, "getFileData": _mock_get_file_data}
+            for name, stub in stubs.items():
+                saved[name] = getattr(service, name, unset)
+                setattr(service, name, stub)
+
+            # Use any string as the document list reference; service is mocked
+            result = await self.method_web.crawl({"documentList": "mock_document_list_ref"})
+
+            test_result = {
+                "action": "crawl",
+                "urls_count": len(urls),
+                "success": result.success,
+                "error": result.error if not result.success else None,
+                "documents_count": len(result.documents) if result.documents else 0,
+                "result_label": result.resultLabel if hasattr(result, 'resultLabel') else None
+            }
+
+            if result.success:
+                logger.info(f"✅ Crawl successful: {test_result['documents_count']} documents returned")
+                for i, doc in enumerate(result.documents or []):
+                    logger.info(f"   Document {i+1}: {doc.documentName}")
+            else:
+                logger.error(f"❌ Crawl failed: {result.error}")
+
+            return test_result
+        except Exception as e:
+            logger.error(f"❌ Crawl action exception: {e}")
+            return {"action": "crawl", "urls_count": len(urls), "success": False,
+                    "error": f"Exception: {e}", "documents_count": 0, "result_label": None}
+        finally:
+            for name, original in saved.items():
+                if original is unset:
+                    delattr(service, name)
+                else:
+                    setattr(service, name, original)
+    
+    async def test_scrape_action(self, query: str, max_results: int = 3) -> Dict[str, Any]:
+        """Run MethodWeb.scrape for *query* and condense the outcome into a result dict.
+
+        Returns the dict (action, query, max_results, success, error, documents_count,
+        result_label). Any exception raised along the way is caught and reported as a
+        failed result.
+        """
+        logger.info(f"Testing scrape action with query: '{query}', max_results: {max_results}")
+
+        # Keys shared by the regular result and the exception result
+        base = {"action": "scrape", "query": query, "max_results": max_results}
+
+        try:
+            parameters = {"query": query, "maxResults": max_results}
+            result = await self.method_web.scrape(parameters)
+
+            test_result = {
+                **base,
+                "success": result.success,
+                "error": None if result.success else result.error,
+                "documents_count": len(result.documents) if result.documents else 0,
+                "result_label": getattr(result, 'resultLabel', None),
+            }
+
+            if not result.success:
+                logger.error(f"❌ Scrape failed: {result.error}")
+                return test_result
+
+            logger.info(f"✅ Scrape successful: {test_result['documents_count']} documents returned")
+            # `or []` keeps the loop a no-op when no documents were returned
+            for number, doc in enumerate(result.documents or [], start=1):
+                logger.info(f"   Document {number}: {doc.documentName}")
+                if hasattr(doc, 'documentData') and hasattr(doc.documentData, 'results'):
+                    logger.info(f"   Results count: {len(doc.documentData.results)}")
+            return test_result
+
+        except Exception as exc:
+            message = str(exc)
+            logger.error(f"❌ Scrape action exception: {message}")
+            return {
+                **base,
+                "success": False,
+                "error": f"Exception: {message}",
+                "documents_count": 0,
+                "result_label": None,
+            }
+    
+    async def test_parameter_validation(self) -> List[Dict[str, Any]]:
+        """Send four invalid search requests and check that each one is rejected.
+
+        A case passes (``success`` is rewritten to True) only when the search fails with
+        a message containing "validation error". A request that is unexpectedly accepted
+        is recorded as a failed validation test; any other failure is returned unchanged.
+
+        Returns:
+            One result dict per case, in the order the cases are listed below.
+        """
+        logger.info("Testing parameter validation with invalid inputs")
+
+        # (log label, query, max_results, expected behavior, subject used in log messages)
+        cases = [
+            ("Test 1: Empty query", "", 5,
+             "Correctly rejected empty query", "Empty query"),
+            ("Test 2: Query too long", "a" * 500, 5,  # over 400 characters
+             "Correctly rejected overly long query", "Long query"),
+            ("Test 3: Max results too high", "test", 25,
+             "Correctly rejected excessive max results", "High max results"),
+            ("Test 4: Max results too low", "test", 0,
+             "Correctly rejected zero max results", "Zero max results"),
+        ]
+
+        validation_tests = []
+        for label, query, max_results, expected_behavior, subject in cases:
+            logger.info(label)
+            result = await self.test_search_action(query, max_results)
+
+            # "error" may be present but None, so normalise it before lowercasing
+            error_text = (result.get("error") or "").lower()
+
+            if result["success"]:
+                # The invalid request was accepted: validation did not do its job
+                result["success"] = False
+                result["validation_test"] = True
+                result["expected_behavior"] = f"{subject} should have been rejected"
+                result["error"] = "Invalid input was accepted without a validation error"
+                logger.error(f"❌ Validation test FAILED: {subject} was not rejected")
+            elif "validation error" in error_text:
+                # Rejected for the expected reason
+                result["success"] = True  # Mark as successful validation test
+                result["validation_test"] = True
+                result["expected_behavior"] = expected_behavior
+                logger.info(f"✅ Validation test PASSED: {subject} correctly rejected")
+
+            validation_tests.append(result)
+
+        return validation_tests
+    
+    async def run_all_tests(self) -> None:
+        """Run the search, scrape, validation and crawl tests in that order, then log the summary."""
+        logger.info("Starting MethodWeb comprehensive tests")
+        logger.info("=" * 60)
+        
+        # Nothing can run without a MethodWeb instance, so bail out early
+        if not self.initialize_method_web():
+            logger.error("Cannot proceed without MethodWeb!")
+            return
+        
+        # Test 1: one search per entry in self.test_queries, 3 results each
+        logger.info("\n" + "=" * 60)
+        logger.info("TEST 1: SEARCH ACTIONS")
+        logger.info("=" * 60)
+        
+        for i, query in enumerate(self.test_queries):
+            logger.info(f"\nSearch test {i+1}/{len(self.test_queries)}")
+            result = await self.test_search_action(query, 3)
+            self.test_results.append(result)
+            await asyncio.sleep(1)  # Rate limiting
+        
+        # Test 2: Scrape actions (search + crawl combined)
+        logger.info("\n" + "=" * 60)
+        logger.info("TEST 2: SCRAPE ACTIONS")
+        logger.info("=" * 60)
+        
+        scrape_queries = self.test_queries[:2]  # Use first 2 queries for scraping
+        for i, query in enumerate(scrape_queries):
+            logger.info(f"\nScrape test {i+1}/{len(scrape_queries)}")
+            result = await self.test_scrape_action(query, 2)
+            self.test_results.append(result)
+            await asyncio.sleep(2)  # Rate limiting for scraping
+        
+        # Test 3: Parameter validation
+        logger.info("\n" + "=" * 60)
+        logger.info("TEST 3: PARAMETER VALIDATION")
+        logger.info("=" * 60)
+        
+        validation_results = await self.test_parameter_validation()
+        self.test_results.extend(validation_results)
+        
+        # Test 4: Crawl action using the first two entries of self.test_urls
+        logger.info("\n" + "=" * 60)
+        logger.info("TEST 4: CRAWL ACTIONS")
+        logger.info("=" * 60)
+        
+        logger.info("Testing crawl with sample URLs")
+        result = await self.test_crawl_action(self.test_urls[:2])
+        self.test_results.append(result)
+        
+        # Print comprehensive summary
+        self.print_test_summary()
+    
+    def print_test_summary(self):
+        """Log totals, per-action results and the web configuration for the collected test results."""
+        logger.info("\n" + "=" * 80)
+        logger.info("COMPREHENSIVE TEST SUMMARY")
+        logger.info("=" * 80)
+        
+        total_tests = len(self.test_results)
+        successful_tests = sum(1 for result in self.test_results if result["success"])
+        failed_tests = total_tests - successful_tests
+        # The rate is guarded so an empty result list reports 0.0% instead of raising ZeroDivisionError
+        logger.info(f"Total tests run: {total_tests}")
+        logger.info(f"Successful: {successful_tests}")
+        logger.info(f"Failed: {failed_tests}")
+        logger.info(f"Success rate: {(successful_tests / total_tests * 100) if total_tests else 0.0:.1f}%")
+        
+        # Group results by action type
+        action_groups = {}
+        for result in self.test_results:
+            action = result["action"]
+            if action not in action_groups:
+                action_groups[action] = []
+            action_groups[action].append(result)
+        
+        logger.info("\n" + "-" * 80)
+        logger.info("RESULTS BY ACTION TYPE:")
+        logger.info("-" * 80)
+        
+        for action, results in action_groups.items():
+            action_successful = sum(1 for r in results if r["success"])
+            action_total = len(results)
+            logger.info(f"\n{action.upper()} ACTIONS:")
+            logger.info(f"  Total: {action_total}, Successful: {action_successful}, Failed: {action_total - action_successful}")
+            
+            for i, result in enumerate(results):
+                status_icon = "✅" if result["success"] else "❌"
+                
+                # Validation tests carry their own description and error text
+                if result.get("validation_test", False):
+                    logger.info(f"  {status_icon} Validation Test {i+1}: {result.get('expected_behavior', 'Validation working correctly')}")
+                    if result.get("error"):
+                        logger.info(f"      Validation Error: {result['error']}")
+                elif action == "search":
+                    logger.info(f"  {status_icon} Test {i+1}: '{result['query']}' -> {result['documents_count']} docs")
+                elif action == "scrape":
+                    logger.info(f"  {status_icon} Test {i+1}: '{result['query']}' -> {result['documents_count']} docs")
+                elif action == "crawl":
+                    logger.info(f"  {status_icon} Test {i+1}: {result['urls_count']} URLs -> {result['documents_count']} docs")
+                
+                if not result["success"] and not result.get("validation_test", False):
+                    logger.info(f"      Error: {result['error']}")
+        
+        logger.info("\n" + "-" * 80)
+        logger.info("CONFIGURATION STATUS:")
+        logger.info("-" * 80)
+        
+        try:
+            from modules.shared.configuration import APP_CONFIG
+            tavily_key = APP_CONFIG.get("Connector_WebTavily_API_KEY")
+            if tavily_key and tavily_key != "your_tavily_api_key_here":
+                logger.info("✅ Tavily API key: Configured")
+            else:
+                logger.info("❌ Tavily API key: Not configured")
+            
+            web_configs = [
+                ("Web_Search_MAX_QUERY_LENGTH", "400"),
+                ("Web_Search_MAX_RESULTS", "20"),
+                ("Web_Search_MIN_RESULTS", "1"),
+                ("Web_Crawl_TIMEOUT", "30"),
+                ("Web_Crawl_MAX_RETRIES", "3"),
+                ("Web_Crawl_RETRY_DELAY", "2")
+            ]
+            
+            for config_key, default_value in web_configs:
+                value = APP_CONFIG.get(config_key, default_value)
+                logger.info(f"✅ {config_key}: {value}")
+                
+        except Exception as e:
+            logger.error(f"❌ Configuration check failed: {e}")
+        
+        logger.info("=" * 80)
+
+def parse_arguments():
+    """Parse the command line: --auto, --verbose/-v and --quick are all boolean switches."""
+    cli = argparse.ArgumentParser(description='MethodWeb Test Script')
+    switches = (
+        (('--auto',), 'Run tests automatically without user interaction'),
+        (('--verbose', '-v'), 'Enable verbose logging'),
+        (('--quick',), 'Run quick tests with fewer queries'),
+    )
+    for flags, help_text in switches:
+        cli.add_argument(*flags, action='store_true', help=help_text)
+    return cli.parse_args()
+
+async def main():
+    """Parse the CLI, run the pre-flight checks, optionally ask for confirmation, then run all tests."""
+    # Parse command line arguments
+    args = parse_arguments()
+    
+    # --verbose switches the root logger to DEBUG; otherwise it is (re)set to INFO
+    if args.verbose:
+        logging.getLogger().setLevel(logging.DEBUG)
+    else:
+        logging.getLogger().setLevel(logging.INFO)
+    
+    logger.info("MethodWeb Test Script")
+    logger.info("=" * 50)
+    
+    # Pre-flight check 1: third-party packages
+    if not check_dependencies():
+        logger.error("Please install missing dependencies before running tests.")
+        return
+    
+    # Pre-flight check 2: project modules
+    if not check_module_imports():
+        logger.error("Cannot import required modules. Please check your setup.")
+        return
+    
+    # Pre-flight check 3: configuration values
+    if not check_configuration():
+        logger.error("Configuration check failed. Please check your config.ini file.")
+        return
+    
+    # --auto skips the confirmation prompt
+    if args.auto:
+        logger.info("Running in automated mode")
+    else:
+        # Interactive mode: ask user for confirmation
+        print("\n" + "=" * 50)
+        print("METHODWEB TEST SCRIPT")
+        print("=" * 50)
+        print("This script will test the MethodWeb functionality including:")
+        print("- Web search actions")
+        print("- Web scraping actions") 
+        print("- Web crawling actions")
+        print("- Parameter validation")
+        print("=" * 50)
+        
+        try:
+            choice = input("Do you want to proceed? (y/N): ").strip().lower()
+            if choice not in ['y', 'yes']:
+                logger.info("Test cancelled by user")
+                return
+        except (EOFError, KeyboardInterrupt):
+            logger.info("Test cancelled by user")
+            return
+    
+    # Create tester and run tests
+    tester = MethodWebTester()
+    
+    # --quick trims the query list before the run starts
+    if args.quick:
+        tester.test_queries = tester.test_queries[:2]  # Use only first 2 queries
+        logger.info("Running in quick mode with reduced test set")
+    
+    await tester.run_all_tests()
+
+if __name__ == "__main__":
+    # Run the tests
+    asyncio.run(main())
diff --git a/test_web_csv_functionality.py b/test_web_csv_functionality.py
new file mode 100644
index 00000000..7242c497
--- /dev/null
+++ b/test_web_csv_functionality.py
@@ -0,0 +1,207 @@
+#!/usr/bin/env python3
+"""
+Test script for web CSV functionality
+Tests both CSV output generation and CSV input reading
+"""
+
+import sys
+import os
+import asyncio
+from typing import Dict, Any
+
+# Add the gateway directory to the Python path
+sys.path.insert(0, os.path.join(os.path.dirname(__file__)))
+
+from modules.methods.methodWeb import MethodWeb
+from modules.interfaces.interfaceWebModel import WebSearchResultItem, WebSearchDocumentData, WebSearchActionDocument, WebSearchActionResult
+from pydantic import HttpUrl
+
+
+def create_mock_web_search_result() -> WebSearchActionResult:
+    """Build a successful WebSearchActionResult holding one JSON document with five hard-coded search hits."""
+    
+    # Five fixed (title, url) search hits; every URL is https and has a non-empty path
+    results = [
+        WebSearchResultItem(
+            title="Switzerland Market Analysis :: Fitch Solutions",
+            url=HttpUrl("https://www.fitchsolutions.com/bmi/region/switzerland")
+        ),
+        WebSearchResultItem(
+            title="OECD Economic Outlook, Volume 2024 Issue 2: Switzerland",
+            url=HttpUrl("https://www.oecd.org/en/publications/2024/12/oecd-economic-outlook-volume-2024-issue-2_67bb8fac/full-report/switzerland_605fd31f.html")
+        ),
+        WebSearchResultItem(
+            title="The economic context of Switzerland - International Trade Portal",
+            url=HttpUrl("https://www.lloydsbanktrade.com/en/market-potential/switzerland/economical-context")
+        ),
+        WebSearchResultItem(
+            title="Switzerland: Country File, Economic Risk Analysis | Coface",
+            url=HttpUrl("https://www.coface.com/news-economy-and-insights/business-risk-dashboard/country-risk-files/switzerland")
+        ),
+        WebSearchResultItem(
+            title="Swiss Economic Outlook 2025 - Roland Berger",
+            url=HttpUrl("https://www.rolandberger.com/en/Insights/Publications/Swiss-Economic-Outlook-2025.html")
+        )
+    ]
+    
+    # Wrap the hits together with the originating query; total_count is derived from the list length
+    document_data = WebSearchDocumentData(
+        query="current market trends Switzerland business economy 2024 analysis report",
+        results=results,
+        total_count=len(results)
+    )
+    
+    # Single output document carrying the search payload, labelled as JSON
+    action_document = WebSearchActionDocument(
+        documentName="test_search_results.json",
+        documentData=document_data,
+        mimeType="application/json"
+    )
+    
+    # Successful action result containing just that one document
+    action_result = WebSearchActionResult(
+        success=True,
+        documents=[action_document]
+    )
+    
+    return action_result
+
+
+def test_csv_output_generation():
+    """Check that MethodWeb renders the mock search results as 'url;title' CSV, one row per hit; returns the CSV text."""
+    print("Testing CSV output generation...")
+    
+    # Create method instance (None is passed in place of a service center)
+    method = MethodWeb(None)
+    
+    # Create mock search result
+    mock_result = create_mock_web_search_result()
+    
+    # Convert to CSV
+    csv_content = method._convert_search_results_to_csv(mock_result)
+    
+    print("Generated CSV content:")
+    print(csv_content)
+    print()
+    
+    # Verify CSV format; splitlines() accepts "\n" and "\r\n" row terminators, so no stray "\r" reaches the checks
+    lines = csv_content.strip().splitlines()
+    assert len(lines) == 6, f"Expected 6 lines (header + 5 results), got {len(lines)}"
+    
+    # Check header
+    assert lines[0] == "url;title", f"Expected header 'url;title', got '{lines[0]}'"
+    
+    # Check every data row: exactly two ';'-separated fields, an https URL and a non-empty title
+    for i, line in enumerate(lines[1:], 1):
+        parts = line.split(';')
+        assert len(parts) == 2, f"Line {i} should have 2 parts separated by ';', got {len(parts)}"
+        url, title = parts
+        assert url.startswith('https://'), f"Line {i} URL should start with 'https://', got '{url}'"
+        assert title, f"Line {i} should have a title, got empty title"
+    
+    print("✓ CSV output generation test passed!")
+    return csv_content
+
+
+def test_csv_input_reading():
+    """Check that MethodWeb._read_csv_with_urls extracts URLs from semicolon-, comma- and upper-case-header CSV text."""
+    print("Testing CSV input reading...")
+    
+    # Create method instance (None is passed as the constructor argument)
+    method = MethodWeb(None)
+    
+    # Semicolon-separated CSV: header plus three data rows
+    semicolon_csv = """url;title
+https://www.fitchsolutions.com/bmi/region/switzerland;Switzerland Market Analysis :: Fitch Solutions
+https://www.oecd.org/en/publications/2024/12/oecd-economic-outlook-volume-2024-issue-2_67bb8fac/full-report/switzerland_605fd31f.html;OECD Economic Outlook, Volume 2024 Issue 2: Switzerland
+https://www.lloydsbanktrade.com/en/market-potential/switzerland/economical-context;The economic context of Switzerland - International Trade Portal"""
+    
+    urls_semicolon = method._read_csv_with_urls(semicolon_csv)
+    print(f"Extracted {len(urls_semicolon)} URLs from semicolon CSV:")
+    for url in urls_semicolon:
+        print(f"  - {url}")
+    
+    assert len(urls_semicolon) == 3, f"Expected 3 URLs, got {len(urls_semicolon)}"
+    assert all(url.startswith('https://') for url in urls_semicolon), "All URLs should start with https://"
+    
+    print("✓ Semicolon CSV reading test passed!")
+    
+    # Comma-separated CSV: header plus two rows. NOTE(review): the 2nd title holds an unquoted comma, so that row has three fields - confirm intended
+    comma_csv = """url,title
+https://www.fitchsolutions.com/bmi/region/switzerland,Switzerland Market Analysis :: Fitch Solutions
+https://www.oecd.org/en/publications/2024/12/oecd-economic-outlook-volume-2024-issue-2_67bb8fac/full-report/switzerland_605fd31f.html,OECD Economic Outlook, Volume 2024 Issue 2: Switzerland"""
+    
+    urls_comma = method._read_csv_with_urls(comma_csv)
+    print(f"Extracted {len(urls_comma)} URLs from comma CSV:")
+    for url in urls_comma:
+        print(f"  - {url}")
+    
+    assert len(urls_comma) == 2, f"Expected 2 URLs, got {len(urls_comma)}"
+    assert all(url.startswith('https://') for url in urls_comma), "All URLs should start with https://"
+    
+    print("✓ Comma CSV reading test passed!")
+    
+    # Header spelled "URL;Title" to check that column-name matching ignores case
+    case_insensitive_csv = """URL;Title
+https://example.com/test;Test Title"""
+    
+    urls_case = method._read_csv_with_urls(case_insensitive_csv)
+    assert len(urls_case) == 1, f"Expected 1 URL, got {len(urls_case)}"
+    assert urls_case[0] == "https://example.com/test", f"Expected 'https://example.com/test', got '{urls_case[0]}'"
+    
+    print("✓ Case-insensitive CSV reading test passed!")
+
+
+def test_integration():
+    """Round-trip check: the CSV generated from the mock results must yield the same URLs, in order, when read back."""
+    print("Testing integration: generate CSV and read it back...")
+    
+    method = MethodWeb(None)
+    
+    # Generate CSV from mock data
+    mock_result = create_mock_web_search_result()
+    csv_content = method._convert_search_results_to_csv(mock_result)
+    
+    # Read URLs back from the generated CSV
+    extracted_urls = method._read_csv_with_urls(csv_content)
+    
+    print(f"Generated CSV with {len(mock_result.documents[0].documentData.results)} results")
+    print(f"Extracted {len(extracted_urls)} URLs from generated CSV")
+    
+    # Verify we got the same number of URLs (this also keeps the zip() below from silently truncating)
+    assert len(extracted_urls) == len(mock_result.documents[0].documentData.results), \
+        f"Expected {len(mock_result.documents[0].documentData.results)} URLs, got {len(extracted_urls)}"
+    
+    # Verify URLs match position by position; the original url objects are compared via str()
+    original_urls = [str(result.url) for result in mock_result.documents[0].documentData.results]
+    for i, (original, extracted) in enumerate(zip(original_urls, extracted_urls)):
+        assert original == extracted, f"URL {i} mismatch: expected '{original}', got '{extracted}'"
+    
+    print("✓ Integration test passed!")
+
+
+if __name__ == "__main__":
+    print("Running Web CSV Functionality Tests")
+    print("=" * 50)
+    
+    try:
+        # Test CSV output generation (the returned CSV text is not used further here)
+        csv_content = test_csv_output_generation()
+        print()
+        
+        # Test CSV input reading
+        test_csv_input_reading()
+        print()
+        
+        # Test integration (CSV is generated and then parsed back)
+        test_integration()
+        print()
+        
+        print("=" * 50)
+        print("🎉 All tests passed successfully!")
+        
+    except Exception as e:
+        print(f"❌ Test failed: {e}")
+        import traceback
+        traceback.print_exc()
+        sys.exit(1)
diff --git a/tests/connectors/test_connector_tavily.py b/tests/connectors/test_connector_tavily.py
index 81ce64c3..23253cba 100644
--- a/tests/connectors/test_connector_tavily.py
+++ b/tests/connectors/test_connector_tavily.py
@@ -4,12 +4,12 @@ import pytest
 import logging
 
 from modules.interfaces.interfaceChatModel import ActionResult
-from modules.interfaces.interface_web_model import (
+from modules.interfaces.interfaceWebModel import (
     WebSearchRequest,
     WebCrawlRequest,
     WebScrapeRequest,
 )
-from modules.connectors.connector_tavily import ConnectorTavily
+from modules.connectors.connectorWebTavily import ConnectorTavily
 
 logger = logging.getLogger(__name__)
 
@@ -23,10 +23,10 @@ async def test_tavily_connector_search_test_live_api():
     request = WebSearchRequest(query="How old is the Earth?", max_results=5)
 
     # Tavily instance
-    connector_tavily = await ConnectorTavily.create()
+    connectorWebTavily = await ConnectorTavily.create()
 
     # Search test
-    action_result = await connector_tavily.search_urls(request=request)
+    action_result = await connectorWebTavily.search_urls(request=request)
 
     # Check results
     assert isinstance(action_result, ActionResult)
@@ -57,10 +57,10 @@ async def test_tavily_connector_crawl_test_live_api():
     request = WebCrawlRequest(urls=urls)
 
     # Tavily instance
-    connector_tavily = await ConnectorTavily.create()
+    connectorWebTavily = await ConnectorTavily.create()
 
     # Crawl test
-    action_result = await connector_tavily.crawl_urls(request=request)
+    action_result = await connectorWebTavily.crawl_urls(request=request)
 
     # Check results
     assert isinstance(action_result, ActionResult)
@@ -87,10 +87,10 @@ async def test_tavily_connector_scrape_test_live_api():
     request = WebScrapeRequest(query="How old is the Earth?", max_results=3)
 
     # Tavily instance
-    connector_tavily = await ConnectorTavily.create()
+    connectorWebTavily = await ConnectorTavily.create()
 
     # Scrape test
-    action_result = await connector_tavily.scrape(request=request)
+    action_result = await connectorWebTavily.scrape(request=request)
 
     # Check results
     assert isinstance(action_result, ActionResult)
diff --git a/tests/methods/test_method_web.py b/tests/methods/test_method_web.py
index 2d9305a2..27344ab3 100644
--- a/tests/methods/test_method_web.py
+++ b/tests/methods/test_method_web.py
@@ -5,7 +5,7 @@ import logging
 
 import pytest
 from unittest.mock import patch
-from modules.methods.method_web import MethodWeb
+from modules.methods.methodWeb import MethodWeb
 from tests.fixtures.tavily_responses import (
     RESPONSE_SEARCH_HOW_OLD_IS_EARTH_NO_ANSWER,
     RESPONSE_EXTRACT_HOW_OLD_IS_EARTH_NO_ANSWER,
@@ -101,14 +101,14 @@ async def test_method_web_crawl_live():
     # Mock the service center methods
     with patch.object(method_web, "service") as mock_service:
         mock_service.getChatDocumentsFromDocumentList.return_value = [
-            type("MockDoc", (), {"fileId": "test-file-id"})()
+            type("MockDoc", (), {"fileId": "test-file-id", "fileName": "test-search-results.json"})()
         ]
         mock_service.getFileData.return_value = json.dumps(search_results_json).encode(
             "utf-8"
         )
 
         # Actual request
-        action_result = await method_web.crawl({"document": "test-document-ref"})
+        action_result = await method_web.crawl({"documentList": "test-document-list-ref"})
 
     # Evaluate results
     assert action_result.success
@@ -153,13 +153,13 @@ async def test_method_web_crawl_dummy():
         ) as mock_client,
     ):
         mock_service.getChatDocumentsFromDocumentList.return_value = [
-            type("MockDoc", (), {"fileId": "test-file-id"})()
+            type("MockDoc", (), {"fileId": "test-file-id", "fileName": "test-search-results.json"})()
         ]
         mock_service.getFileData.return_value = json.dumps(search_results_json).encode(
             "utf-8"
         )
 
-        action_result = await method_web.crawl({"document": "test-document-ref"})
+        action_result = await method_web.crawl({"documentList": "test-document-list-ref"})
         mock_client.assert_called_once()
 
     # Evaluate results

From 8726cd4fb8302902cd8ee6088a913e31d6c5a555 Mon Sep 17 00:00:00 2001
From: ValueOn AG <p.motsch@valueon.ch>
Date: Tue, 2 Sep 2025 21:11:32 +0200
Subject: [PATCH 15/17] Centralized AI

---
 AI_ENGINE_MIGRATION_PLAN.md             | 276 ------------
 modules/chat/serviceCenter_ai_engine.py | 266 ------------
 modules/engines/aiEngine.py             | 544 ------------------------
 modules/interfaces/interfaceAiCalls.py  | 543 +++++++++++++++++++----
 modules/interfaces/interfaceAiEngine.py | 115 -----
 5 files changed, 459 insertions(+), 1285 deletions(-)
 delete mode 100644 AI_ENGINE_MIGRATION_PLAN.md
 delete mode 100644 modules/chat/serviceCenter_ai_engine.py
 delete mode 100644 modules/engines/aiEngine.py
 delete mode 100644 modules/interfaces/interfaceAiEngine.py

diff --git a/AI_ENGINE_MIGRATION_PLAN.md b/AI_ENGINE_MIGRATION_PLAN.md
deleted file mode 100644
index 71077e6f..00000000
--- a/AI_ENGINE_MIGRATION_PLAN.md
+++ /dev/null
@@ -1,276 +0,0 @@
-# AI Engine Migration Plan
-
-## Overview
-This document outlines the migration strategy from the current AI call system to the new Smart AI Engine architecture.
-
-## Benefits of the New Architecture
-
-### 1. **Separation of Concerns**
-- Applications no longer need to worry about content size limits
-- Centralized AI model selection and failover
-- Intelligent content reduction strategies
-
-### 2. **Improved Reliability**
-- Automatic handling of "content too large" errors
-- Multiple fallback strategies
-- Model-specific optimization
-
-### 3. **Better Performance**
-- Optimal model selection based on content characteristics
-- Intelligent chunking and processing strategies
-- Reduced API costs through smart model selection
-
-### 4. **Enhanced Maintainability**
-- Single point of AI logic
-- Easy to add new models and strategies
-- Consistent error handling
-
-## Migration Phases
-
-### Phase 1: Infrastructure Setup (Week 1-2)
-1. **Create AI Engine Interface**
-   - ✅ `interfaceAiEngine.py` - Core interfaces and data structures
-   - ✅ `aiEngine.py` - Smart AI Engine implementation
-   - ✅ `serviceCenter_ai_engine.py` - ServiceCenter integration
-
-2. **Update Dependencies**
-   - Add new imports to existing modules
-   - Update configuration for AI model selection
-   - Add logging for AI engine operations
-
-### Phase 2: ServiceCenter Integration (Week 3)
-1. **Update ServiceCenter Class**
-   ```python
-   # Add to ServiceCenter.__init__
-   self.ai_engine = ServiceCenterAIEngine(self)
-   
-   # Replace existing AI methods
-   async def callAiTextAdvanced(self, prompt: str, context: str = None) -> str:
-       return await self.ai_engine.callAiTextAdvanced(prompt, context)
-   
-   async def callAiTextBasic(self, prompt: str, context: str = None) -> str:
-       return await self.ai_engine.callAiTextBasic(prompt, context)
-   
-   async def extractContentFromDocument(self, prompt: str, document: ChatDocument) -> str:
-       return await self.ai_engine.extractContentFromDocument(prompt, document)
-   
-   async def summarizeChat(self, messages: List[ChatMessage]) -> str:
-       return await self.ai_engine.summarizeChat(messages)
-   ```
-
-2. **Add New Document-Aware Methods**
-   ```python
-   async def callAiWithDocuments(
-       self,
-       prompt: str,
-       documents: List[ChatDocument] = None,
-       operation_type: str = "general"
-   ) -> str:
-       return await self.ai_engine.callAiWithDocuments(
-           prompt, documents, operation_type=operation_type
-       )
-   ```
-
-### Phase 3: Method Updates (Week 4-5)
-1. **Update MethodWeb.py**
-   ```python
-   # Before
-   web_scrape_result = await web_interface.scrape(web_scrape_request)
-   
-   # After - no changes needed, but can be enhanced
-   # The AI engine will automatically handle large content
-   ```
-
-2. **Update MethodDocument.py**
-   ```python
-   # Before
-   formatted_content = await self.service.callAiTextBasic(ai_prompt, content)
-   
-   # After
-   formatted_content = await self.service.callAiForReportGeneration(
-       prompt=ai_prompt,
-       documents=chat_documents
-   )
-   ```
-
-3. **Update MethodAi.py**
-   ```python
-   # Before
-   result = await self.service.callAiTextAdvanced(enhanced_prompt, context)
-   
-   # After
-   result = await self.service.callAiWithDocuments(
-       prompt=enhanced_prompt,
-       documents=document_list,
-       operation_type="ai_processing"
-   )
-   ```
-
-4. **Update MethodOutlook.py**
-   ```python
-   # Before
-   composed_email = await self.service.interfaceAiCalls.callAiTextAdvanced(ai_prompt)
-   
-   # After
-   composed_email = await self.service.callAiForEmailComposition(
-       prompt=ai_prompt,
-       documents=attached_documents
-   )
-   ```
-
-### Phase 4: Task Handling Updates (Week 6)
-1. **Update handlingTasks.py**
-   ```python
-   # Before
-   prompt = await self.service.callAiTextAdvanced(task_planning_prompt)
-   
-   # After
-   prompt = await self.service.callAiForTaskPlanning(
-       prompt=task_planning_prompt,
-       documents=available_documents,
-       context=workflow_context
-   )
-   ```
-
-2. **Update promptFactory.py**
-   ```python
-   # Before
-   messageSummary = await service.summarizeChat(context.workflow.messages)
-   
-   # After - no changes needed, method signature stays the same
-   # But internally uses the new AI engine
-   ```
-
-### Phase 5: Testing and Optimization (Week 7-8)
-1. **Unit Tests**
-   - Test AI engine with various content sizes
-   - Test fallback strategies
-   - Test model selection logic
-
-2. **Integration Tests**
-   - Test with real documents of various sizes
-   - Test error scenarios
-   - Test performance improvements
-
-3. **Performance Monitoring**
-   - Monitor AI call success rates
-   - Monitor processing times
-   - Monitor cost savings
-
-## Code Changes Required
-
-### 1. ServiceCenter Updates
-```python
-# Add to ServiceCenter.__init__
-from modules.chat.serviceCenter_ai_engine import ServiceCenterAIEngine
-self.ai_engine_wrapper = ServiceCenterAIEngine(self)
-
-# Update existing methods to use AI engine
-async def callAiTextAdvanced(self, prompt: str, context: str = None) -> str:
-    return await self.ai_engine_wrapper.callAiTextAdvanced(prompt, context)
-
-async def callAiTextBasic(self, prompt: str, context: str = None) -> str:
-    return await self.ai_engine_wrapper.callAiTextBasic(prompt, context)
-
-async def extractContentFromDocument(self, prompt: str, document: ChatDocument) -> str:
-    return await self.ai_engine_wrapper.extractContentFromDocument(prompt, document)
-
-async def summarizeChat(self, messages: List[ChatMessage]) -> str:
-    return await self.ai_engine_wrapper.summarizeChat(messages)
-```
-
-### 2. Method Updates (Optional Enhancements)
-```python
-# Enhanced method calls with document awareness
-async def process_documents_with_ai(self, prompt: str, documents: List[ChatDocument]):
-    return await self.service.callAiWithDocuments(
-        prompt=prompt,
-        documents=documents,
-        operation_type="document_processing"
-    )
-```
-
-### 3. Configuration Updates
-```ini
-# Add to config.ini
-[AI_ENGINE]
-DEFAULT_MODEL=anthropic_claude
-FALLBACK_MODEL=openai_gpt35
-MAX_CONTENT_SIZE=100000
-ENABLE_CONTENT_REDUCTION=true
-CONTENT_REDUCTION_THRESHOLD=0.8
-```
-
-## Backward Compatibility
-
-### 1. **Method Signatures**
-- All existing method signatures remain unchanged
-- Internal implementation uses new AI engine
-- No breaking changes for existing code
-
-### 2. **Error Handling**
-- Same error types and messages
-- Enhanced error recovery with fallback strategies
-- Better error reporting with processing details
-
-### 3. **Performance**
-- Same or better performance
-- Automatic optimization based on content
-- Reduced API costs through smart model selection
-
-## Risk Mitigation
-
-### 1. **Gradual Rollout**
-- Deploy with feature flags
-- A/B testing with subset of users
-- Rollback capability
-
-### 2. **Monitoring**
-- Comprehensive logging of AI engine operations
-- Performance metrics tracking
-- Error rate monitoring
-
-### 3. **Fallback Strategy**
-- Keep original AI call methods as backup
-- Automatic fallback to original methods on errors
-- Manual override capability
-
-## Expected Benefits
-
-### 1. **Immediate Benefits**
-- Elimination of "content too large" errors
-- Better handling of large documents
-- Improved user experience
-
-### 2. **Long-term Benefits**
-- Easier addition of new AI models
-- Better cost optimization
-- Enhanced content processing capabilities
-- Improved system reliability
-
-### 3. **Developer Benefits**
-- Simplified AI integration
-- No need to worry about content size limits
-- Consistent AI behavior across the system
-- Better debugging and monitoring
-
-## Success Metrics
-
-### 1. **Error Reduction**
-- 90% reduction in "content too large" errors
-- 50% reduction in AI call failures
-- 95% success rate for document processing
-
-### 2. **Performance Improvement**
-- 20% faster processing for large documents
-- 30% reduction in API costs
-- 50% reduction in retry attempts
-
-### 3. **User Experience**
-- Faster response times
-- More reliable document processing
-- Better content extraction quality
-
-## Conclusion
-
-The new AI Engine architecture provides a robust, scalable solution for handling AI calls with large content. The migration can be done gradually with full backward compatibility, ensuring minimal risk while providing significant benefits in reliability, performance, and maintainability.
diff --git a/modules/chat/serviceCenter_ai_engine.py b/modules/chat/serviceCenter_ai_engine.py
deleted file mode 100644
index a33a5813..00000000
--- a/modules/chat/serviceCenter_ai_engine.py
+++ /dev/null
@@ -1,266 +0,0 @@
-"""
-ServiceCenter integration with Smart AI Engine
-"""
-
-import logging
-from typing import List, Dict, Any, Optional
-from modules.interfaces.interfaceChatModel import ChatDocument
-from modules.interfaces.interfaceAiEngine import (
-    AIRequest, AIResponse, AIModelType, ProcessingStrategy, 
-    ContentReductionStrategy
-)
-from modules.engines.aiEngine import SmartAIEngine
-
-logger = logging.getLogger(__name__)
-
-
-class ServiceCenterAIEngine:
-    """ServiceCenter integration with Smart AI Engine"""
-    
-    def __init__(self, service_center):
-        self.service_center = service_center
-        self.ai_engine = SmartAIEngine(service_center)
-    
-    async def callAiWithDocuments(
-        self,
-        prompt: str,
-        documents: List[ChatDocument] = None,
-        context: str = None,
-        preferred_model: AIModelType = None,
-        operation_type: str = "general",
-        processing_strategy: ProcessingStrategy = None,
-        reduction_strategy: ContentReductionStrategy = None,
-        **kwargs
-    ) -> str:
-        """
-        Unified AI call method that handles documents and prompts separately
-        
-        Args:
-            prompt: The AI prompt
-            documents: List of documents to process
-            context: Additional context
-            preferred_model: Preferred AI model
-            operation_type: Type of operation (for strategy selection)
-            processing_strategy: Explicit processing strategy
-            reduction_strategy: Explicit content reduction strategy
-            **kwargs: Additional parameters
-            
-        Returns:
-            AI response content
-        """
-        try:
-            # Create AI request
-            request = AIRequest(
-                prompt=prompt,
-                documents=documents or [],
-                context=context,
-                preferred_model=preferred_model,
-                processing_strategy=processing_strategy,
-                reduction_strategy=reduction_strategy,
-                metadata={
-                    "operation_type": operation_type,
-                    **kwargs
-                }
-            )
-            
-            # Process request
-            response = await self.ai_engine.process_request(request)
-            
-            if response.success:
-                return response.content
-            else:
-                raise Exception(f"AI processing failed: {response.error}")
-                
-        except Exception as e:
-            logger.error(f"Error in AI call with documents: {str(e)}")
-            raise e
-    
-    # Convenience methods for different operation types
-    
-    async def callAiForTaskPlanning(
-        self,
-        prompt: str,
-        documents: List[ChatDocument] = None,
-        context: str = None
-    ) -> str:
-        """AI call optimized for task planning"""
-        return await self.callAiWithDocuments(
-            prompt=prompt,
-            documents=documents,
-            context=context,
-            operation_type="task_planning",
-            preferred_model=AIModelType.ANTHROPIC_CLAUDE  # Better for complex planning
-        )
-    
-    async def callAiForActionDefinition(
-        self,
-        prompt: str,
-        documents: List[ChatDocument] = None,
-        context: str = None
-    ) -> str:
-        """AI call optimized for action definition"""
-        return await self.callAiWithDocuments(
-            prompt=prompt,
-            documents=documents,
-            context=context,
-            operation_type="action_definition",
-            preferred_model=AIModelType.ANTHROPIC_CLAUDE
-        )
-    
-    async def callAiForDocumentExtraction(
-        self,
-        prompt: str,
-        documents: List[ChatDocument],
-        context: str = None
-    ) -> str:
-        """AI call optimized for document extraction"""
-        return await self.callAiWithDocuments(
-            prompt=prompt,
-            documents=documents,
-            context=context,
-            operation_type="document_extraction",
-            processing_strategy=ProcessingStrategy.DOCUMENT_BY_DOCUMENT
-        )
-    
-    async def callAiForReportGeneration(
-        self,
-        prompt: str,
-        documents: List[ChatDocument],
-        context: str = None
-    ) -> str:
-        """AI call optimized for report generation"""
-        return await self.callAiWithDocuments(
-            prompt=prompt,
-            documents=documents,
-            context=context,
-            operation_type="report_generation",
-            processing_strategy=ProcessingStrategy.CHUNKED_PROCESSING
-        )
-    
-    async def callAiForEmailComposition(
-        self,
-        prompt: str,
-        documents: List[ChatDocument] = None,
-        context: str = None
-    ) -> str:
-        """AI call optimized for email composition"""
-        return await self.callAiWithDocuments(
-            prompt=prompt,
-            documents=documents,
-            context=context,
-            operation_type="email_composition",
-            preferred_model=AIModelType.OPENAI_GPT4  # Better for creative writing
-        )
-    
-    async def callAiForChatSummarization(
-        self,
-        prompt: str,
-        documents: List[ChatDocument] = None,
-        context: str = None
-    ) -> str:
-        """AI call optimized for chat summarization"""
-        return await self.callAiWithDocuments(
-            prompt=prompt,
-            documents=documents,
-            context=context,
-            operation_type="chat_summarization",
-            processing_strategy=ProcessingStrategy.SUMMARIZED_CONTENT
-        )
-    
-    async def callAiForImageAnalysis(
-        self,
-        prompt: str,
-        documents: List[ChatDocument],
-        context: str = None
-    ) -> str:
-        """AI call optimized for image analysis"""
-        return await self.callAiWithDocuments(
-            prompt=prompt,
-            documents=documents,
-            context=context,
-            operation_type="image_analysis",
-            preferred_model=AIModelType.OPENAI_VISION,
-            requires_vision=True
-        )
-    
-    # Backward compatibility methods
-    
-    async def callAiTextAdvanced(self, prompt: str, context: str = None) -> str:
-        """Backward compatibility method"""
-        return await self.callAiWithDocuments(
-            prompt=prompt,
-            context=context,
-            operation_type="general",
-            preferred_model=AIModelType.ANTHROPIC_CLAUDE
-        )
-    
-    async def callAiTextBasic(self, prompt: str, context: str = None) -> str:
-        """Backward compatibility method"""
-        return await self.callAiWithDocuments(
-            prompt=prompt,
-            context=context,
-            operation_type="general",
-            preferred_model=AIModelType.OPENAI_GPT35
-        )
-    
-    async def callAiImageBasic(self, prompt: str, image_data: str, mime_type: str) -> str:
-        """Backward compatibility method for image processing"""
-        # Create a document from image data
-        image_doc = self.service_center.createDocument(
-            "image_analysis.jpg",
-            mime_type,
-            image_data,
-            base64encoded=True
-        )
-        
-        return await self.callAiForImageAnalysis(
-            prompt=prompt,
-            documents=[image_doc]
-        )
-    
-    async def extractContentFromDocument(self, prompt: str, document: ChatDocument) -> str:
-        """Enhanced document extraction using AI engine"""
-        try:
-            return await self.callAiForDocumentExtraction(
-                prompt=prompt,
-                documents=[document]
-            )
-        except Exception as e:
-            logger.error(f"Error in enhanced document extraction: {str(e)}")
-            # Fall back to original method
-            from modules.interfaces.interfaceChatModel import ExtractedContent
-            extracted = await self.service_center.documentProcessor.processFileData(
-                fileData=self.service_center.getFileData(document.fileId),
-                fileName=document.fileName,
-                mimeType=document.mimeType,
-                prompt=prompt,
-                documentId=document.id
-            )
-            if extracted and extracted.contents:
-                return "\n".join([item.data for item in extracted.contents])
-            return ""
-    
-    async def summarizeChat(self, messages: List) -> str:
-        """Enhanced chat summarization using AI engine"""
-        try:
-            # Convert messages to a simple text format
-            chat_content = "\n".join([f"{msg.role}: {msg.message}" for msg in messages if hasattr(msg, 'message')])
-            
-            # Create a document from chat content
-            chat_doc = self.service_center.createDocument(
-                "chat_history.txt",
-                "text/plain",
-                chat_content,
-                base64encoded=False
-            )
-            
-            return await self.callAiForChatSummarization(
-                prompt="Summarize this chat conversation, focusing on key decisions, outcomes, and next steps.",
-                documents=[chat_doc]
-            )
-        except Exception as e:
-            logger.error(f"Error in enhanced chat summarization: {str(e)}")
-            # Fall back to original method
-            return await self.service_center.callAiTextBasic(
-                f"Summarize this chat conversation: {chat_content}"
-            )
diff --git a/modules/engines/aiEngine.py b/modules/engines/aiEngine.py
deleted file mode 100644
index f2f74c27..00000000
--- a/modules/engines/aiEngine.py
+++ /dev/null
@@ -1,544 +0,0 @@
-"""
-Smart AI Engine with intelligent content management and model selection
-"""
-
-import logging
-import asyncio
-from typing import List, Dict, Any, Optional, Tuple
-from modules.interfaces.interfaceAiEngine import (
-    AIEngine, AIRequest, AIResponse, AIModelType, ProcessingStrategy, 
-    ContentReductionStrategy, ModelCapabilities, ContentReducer
-)
-from modules.interfaces.interfaceChatModel import ChatDocument
-from modules.interfaces.interfaceAiCalls import AiCalls
-from modules.chat.documents.documentExtraction import DocumentExtraction
-from modules.shared.configuration import APP_CONFIG
-
-logger = logging.getLogger(__name__)
-
-
-class SmartAIEngine(AIEngine):
-    """Smart AI Engine with automatic content management and model selection"""
-    
-    def __init__(self, service_center=None):
-        self.service_center = service_center
-        self.ai_calls = AiCalls()
-        self.document_processor = DocumentExtraction(service_center)
-        self.content_reducer = SmartContentReducer(service_center)
-        
-        # Model capabilities mapping
-        self.model_capabilities = {
-            AIModelType.OPENAI_GPT4: ModelCapabilities(
-                max_tokens=8192,
-                max_input_tokens=128000,
-                supports_vision=False,
-                supports_function_calling=True,
-                cost_per_1k_tokens=0.03,
-                processing_speed="medium"
-            ),
-            AIModelType.OPENAI_GPT35: ModelCapabilities(
-                max_tokens=4096,
-                max_input_tokens=16384,
-                supports_vision=False,
-                supports_function_calling=True,
-                cost_per_1k_tokens=0.002,
-                processing_speed="fast"
-            ),
-            AIModelType.ANTHROPIC_CLAUDE: ModelCapabilities(
-                max_tokens=4096,
-                max_input_tokens=200000,
-                supports_vision=False,
-                supports_function_calling=False,
-                cost_per_1k_tokens=0.015,
-                processing_speed="medium"
-            ),
-            AIModelType.OPENAI_VISION: ModelCapabilities(
-                max_tokens=4096,
-                max_input_tokens=128000,
-                supports_vision=True,
-                supports_function_calling=False,
-                cost_per_1k_tokens=0.01,
-                processing_speed="slow"
-            )
-        }
-        
-        # Processing strategy preferences
-        self.strategy_preferences = {
-            "task_planning": ProcessingStrategy.SINGLE_CALL,
-            "action_definition": ProcessingStrategy.SINGLE_CALL,
-            "document_extraction": ProcessingStrategy.DOCUMENT_BY_DOCUMENT,
-            "report_generation": ProcessingStrategy.CHUNKED_PROCESSING,
-            "email_composition": ProcessingStrategy.SINGLE_CALL,
-            "chat_summarization": ProcessingStrategy.SUMMARIZED_CONTENT
-        }
-    
-    async def process_request(self, request: AIRequest) -> AIResponse:
-        """Process AI request with intelligent content management"""
-        try:
-            # Step 1: Determine optimal processing strategy
-            strategy = self._determine_processing_strategy(request)
-            request.processing_strategy = strategy
-            
-            # Step 2: Estimate token usage
-            estimated_tokens = await self.estimate_token_usage(request)
-            
-            # Step 3: Select appropriate model
-            model = self._select_optimal_model(request, estimated_tokens)
-            
-            # Step 4: Process with selected strategy
-            if strategy == ProcessingStrategy.SINGLE_CALL:
-                return await self._process_single_call(request, model)
-            elif strategy == ProcessingStrategy.DOCUMENT_BY_DOCUMENT:
-                return await self._process_document_by_document(request, model)
-            elif strategy == ProcessingStrategy.CHUNKED_PROCESSING:
-                return await self._process_chunked(request, model)
-            elif strategy == ProcessingStrategy.SUMMARIZED_CONTENT:
-                return await self._process_with_summarization(request, model)
-            else:
-                raise ValueError(f"Unknown processing strategy: {strategy}")
-                
-        except Exception as e:
-            logger.error(f"Error processing AI request: {str(e)}")
-            return AIResponse(
-                success=False,
-                content="",
-                model_used=AIModelType.OPENAI_GPT35,
-                processing_strategy=ProcessingStrategy.SINGLE_CALL,
-                error=str(e)
-            )
-    
-    def _determine_processing_strategy(self, request: AIRequest) -> ProcessingStrategy:
-        """Determine the best processing strategy based on request characteristics"""
-        
-        # Use explicit strategy if provided
-        if request.processing_strategy:
-            return request.processing_strategy
-        
-        # Determine based on metadata or content characteristics
-        metadata = request.metadata or {}
-        operation_type = metadata.get("operation_type", "general")
-        
-        # Check if we have a preference for this operation type
-        if operation_type in self.strategy_preferences:
-            return self.strategy_preferences[operation_type]
-        
-        # Auto-determine based on content characteristics
-        num_documents = len(request.documents)
-        prompt_length = len(request.prompt)
-        
-        if num_documents == 0:
-            return ProcessingStrategy.SINGLE_CALL
-        elif num_documents == 1:
-            return ProcessingStrategy.SINGLE_CALL
-        elif num_documents <= 3 and prompt_length < 1000:
-            return ProcessingStrategy.SINGLE_CALL
-        elif num_documents > 5:
-            return ProcessingStrategy.DOCUMENT_BY_DOCUMENT
-        else:
-            return ProcessingStrategy.CHUNKED_PROCESSING
-    
-    def _select_optimal_model(self, request: AIRequest, estimated_tokens: int) -> AIModelType:
-        """Select the optimal AI model based on request characteristics"""
-        
-        # Use preferred model if specified and suitable
-        if request.preferred_model:
-            capabilities = self.get_model_capabilities(request.preferred_model)
-            if estimated_tokens <= capabilities.max_input_tokens:
-                return request.preferred_model
-        
-        # Select model based on requirements
-        metadata = request.metadata or {}
-        requires_vision = metadata.get("requires_vision", False)
-        requires_function_calling = metadata.get("requires_function_calling", False)
-        
-        # Filter models by requirements
-        suitable_models = []
-        for model, capabilities in self.model_capabilities.items():
-            if estimated_tokens <= capabilities.max_input_tokens:
-                if requires_vision and not capabilities.supports_vision:
-                    continue
-                if requires_function_calling and not capabilities.supports_function_calling:
-                    continue
-                suitable_models.append((model, capabilities))
-        
-        if not suitable_models:
-            # If no model can handle the full content, use the one with highest capacity
-            best_model = max(self.model_capabilities.items(), 
-                           key=lambda x: x[1].max_input_tokens)
-            logger.warning(f"No model can handle {estimated_tokens} tokens, using {best_model[0]}")
-            return best_model[0]
-        
-        # Select based on cost and speed preferences
-        # For now, prefer Claude for large content, GPT-4 for complex tasks, GPT-3.5 for simple tasks
-        if estimated_tokens > 50000:
-            return AIModelType.ANTHROPIC_CLAUDE
-        elif metadata.get("complex_task", False):
-            return AIModelType.OPENAI_GPT4
-        else:
-            return AIModelType.OPENAI_GPT35
-    
-    async def _process_single_call(self, request: AIRequest, model: AIModelType) -> AIResponse:
-        """Process request with a single AI call"""
-        try:
-            # Prepare content
-            content = await self._prepare_content_for_single_call(request)
-            
-            # Make AI call
-            if model in [AIModelType.OPENAI_GPT4, AIModelType.OPENAI_GPT35]:
-                response = await self.ai_calls.callAiTextAdvanced(content, request.context)
-            elif model == AIModelType.ANTHROPIC_CLAUDE:
-                response = await self.ai_calls.callAiTextAdvanced(content, request.context)
-            else:
-                raise ValueError(f"Unsupported model for single call: {model}")
-            
-            return AIResponse(
-                success=True,
-                content=response,
-                model_used=model,
-                processing_strategy=ProcessingStrategy.SINGLE_CALL
-            )
-            
-        except Exception as e:
-            # If single call fails due to size, try with content reduction
-            if "too large" in str(e).lower() or "400" in str(e):
-                return await self._process_with_content_reduction(request, model)
-            else:
-                raise e
-    
-    async def _process_document_by_document(self, request: AIRequest, model: AIModelType) -> AIResponse:
-        """Process each document separately and merge results"""
-        try:
-            results = []
-            
-            for i, document in enumerate(request.documents):
-                # Create individual request for each document
-                doc_request = AIRequest(
-                    prompt=request.prompt,
-                    documents=[document],
-                    context=request.context,
-                    preferred_model=model,
-                    metadata=request.metadata
-                )
-                
-                # Process document
-                doc_response = await self._process_single_call(doc_request, model)
-                if doc_response.success:
-                    results.append(f"Document {i+1} ({document.fileName}):\n{doc_response.content}")
-                else:
-                    results.append(f"Document {i+1} ({document.fileName}): Error - {doc_response.error}")
-            
-            # Merge results
-            merged_content = "\n\n".join(results)
-            
-            return AIResponse(
-                success=True,
-                content=merged_content,
-                model_used=model,
-                processing_strategy=ProcessingStrategy.DOCUMENT_BY_DOCUMENT
-            )
-            
-        except Exception as e:
-            logger.error(f"Error in document-by-document processing: {str(e)}")
-            return AIResponse(
-                success=False,
-                content="",
-                model_used=model,
-                processing_strategy=ProcessingStrategy.DOCUMENT_BY_DOCUMENT,
-                error=str(e)
-            )
-    
-    async def _process_chunked(self, request: AIRequest, model: AIModelType) -> AIResponse:
-        """Process content in chunks and merge results"""
-        try:
-            # This would implement chunked processing logic
-            # For now, fall back to document-by-document
-            return await self._process_document_by_document(request, model)
-            
-        except Exception as e:
-            logger.error(f"Error in chunked processing: {str(e)}")
-            return AIResponse(
-                success=False,
-                content="",
-                model_used=model,
-                processing_strategy=ProcessingStrategy.CHUNKED_PROCESSING,
-                error=str(e)
-            )
-    
-    async def _process_with_summarization(self, request: AIRequest, model: AIModelType) -> AIResponse:
-        """Process with content summarization first"""
-        try:
-            # Summarize documents first
-            summarized_docs = []
-            for document in request.documents:
-                summary_doc = await self.content_reducer.summarize_document(
-                    document, 
-                    f"Summarize this document for: {request.prompt}"
-                )
-                summarized_docs.append(summary_doc)
-            
-            # Create new request with summarized documents
-            summary_request = AIRequest(
-                prompt=request.prompt,
-                documents=summarized_docs,
-                context=request.context,
-                preferred_model=model,
-                metadata=request.metadata
-            )
-            
-            # Process with summarized content
-            return await self._process_single_call(summary_request, model)
-            
-        except Exception as e:
-            logger.error(f"Error in summarization processing: {str(e)}")
-            return AIResponse(
-                success=False,
-                content="",
-                model_used=model,
-                processing_strategy=ProcessingStrategy.SUMMARIZED_CONTENT,
-                error=str(e)
-            )
-    
-    async def _process_with_content_reduction(self, request: AIRequest, model: AIModelType) -> AIResponse:
-        """Process with automatic content reduction"""
-        try:
-            # Determine reduction strategy
-            strategy = self._determine_reduction_strategy(request)
-            
-            # Reduce content
-            reduced_docs, reduced_prompt = await self.content_reducer.reduce_content(
-                request.documents,
-                request.prompt,
-                strategy,
-                target_reduction=0.5
-            )
-            
-            # Create new request with reduced content
-            reduced_request = AIRequest(
-                prompt=reduced_prompt,
-                documents=reduced_docs,
-                context=request.context,
-                preferred_model=model,
-                metadata=request.metadata
-            )
-            
-            # Try processing with reduced content
-            return await self._process_single_call(reduced_request, model)
-            
-        except Exception as e:
-            logger.error(f"Error in content reduction processing: {str(e)}")
-            return AIResponse(
-                success=False,
-                content="",
-                model_used=model,
-                processing_strategy=ProcessingStrategy.SINGLE_CALL,
-                error=f"Content reduction failed: {str(e)}"
-            )
-    
-    def _determine_reduction_strategy(self, request: AIRequest) -> ContentReductionStrategy:
-        """Determine the best content reduction strategy"""
-        
-        # Use explicit strategy if provided
-        if request.reduction_strategy:
-            return request.reduction_strategy
-        
-        # Auto-determine based on request characteristics
-        metadata = request.metadata or {}
-        operation_type = metadata.get("operation_type", "general")
-        
-        # Different strategies for different operations
-        if operation_type in ["task_planning", "action_definition"]:
-            # For planning tasks, prompt is crucial
-            return ContentReductionStrategy.REDUCE_DOCUMENTS_ONLY
-        elif operation_type in ["document_extraction", "report_generation"]:
-            # For document processing, documents are crucial
-            return ContentReductionStrategy.REDUCE_PROMPT_AND_DOCS
-        else:
-            # Default: reduce both
-            return ContentReductionStrategy.REDUCE_PROMPT_AND_DOCS
-    
-    async def _prepare_content_for_single_call(self, request: AIRequest) -> str:
-        """Prepare content for a single AI call"""
-        content_parts = [request.prompt]
-        
-        if request.context:
-            content_parts.append(f"Context: {request.context}")
-        
-        # Add document content
-        for i, document in enumerate(request.documents):
-            try:
-                # Extract document content
-                extracted = await self.service_center.extractContentFromDocument(
-                    "Extract all relevant text content",
-                    document
-                )
-                
-                if extracted and extracted.contents:
-                    doc_content = "\n".join([item.data for item in extracted.contents])
-                    content_parts.append(f"Document {i+1} ({document.fileName}):\n{doc_content}")
-                else:
-                    content_parts.append(f"Document {i+1} ({document.fileName}): [No content extracted]")
-                    
-            except Exception as e:
-                logger.warning(f"Could not extract content from document {document.fileName}: {str(e)}")
-                content_parts.append(f"Document {i+1} ({document.fileName}): [Error extracting content]")
-        
-        return "\n\n".join(content_parts)
-    
-    def get_model_capabilities(self, model: AIModelType) -> ModelCapabilities:
-        """Get capabilities for a specific model"""
-        return self.model_capabilities.get(model, self.model_capabilities[AIModelType.OPENAI_GPT35])
-    
-    async def estimate_token_usage(self, request: AIRequest) -> int:
-        """Estimate token usage for a request"""
-        # Simple estimation: ~4 characters per token
-        prompt_tokens = len(request.prompt) // 4
-        context_tokens = len(request.context or "") // 4
-        
-        # Estimate document tokens
-        doc_tokens = 0
-        for document in request.documents:
-            # Rough estimate based on file size
-            doc_tokens += document.fileSize // 4
-        
-        return prompt_tokens + context_tokens + doc_tokens
-
-
-class SmartContentReducer(ContentReducer):
-    """Smart content reducer using document extraction engine"""
-    
-    def __init__(self, service_center):
-        self.service_center = service_center
-        self.document_processor = DocumentExtraction(service_center)
-    
-    async def reduce_content(
-        self, 
-        documents: List[ChatDocument], 
-        prompt: str,
-        strategy: ContentReductionStrategy,
-        target_reduction: float = 0.5
-    ) -> Tuple[List[ChatDocument], str]:
-        """Reduce content size while preserving important information"""
-        
-        reduced_docs = []
-        reduced_prompt = prompt
-        
-        # Sort documents by size (largest first)
-        sorted_docs = sorted(documents, key=lambda d: d.fileSize, reverse=True)
-        
-        for document in sorted_docs:
-            try:
-                # Create reduction prompt based on strategy
-                if strategy == ContentReductionStrategy.REDUCE_DOCUMENTS_ONLY:
-                    reduction_prompt = f"""
-                    Summarize this document to {int(100 * (1 - target_reduction))}% of its original size.
-                    Focus on the most important information relevant to: {prompt}
-                    Preserve key facts, data, and conclusions.
-                    """
-                elif strategy == ContentReductionStrategy.SUMMARIZE_DOCUMENTS:
-                    reduction_prompt = f"""
-                    Create a concise summary of this document focusing on: {prompt}
-                    Include only the most relevant information.
-                    """
-                else:  # REDUCE_PROMPT_AND_DOCS or EXTRACT_KEY_INFO
-                    reduction_prompt = f"""
-                    Extract only the key information from this document that is relevant to: {prompt}
-                    Be very selective and concise.
-                    """
-                
-                # Process document with reduction
-                extracted = await self.service_center.extractContentFromDocument(
-                    reduction_prompt,
-                    document
-                )
-                
-                if extracted and extracted.contents:
-                    # Create new document with reduced content
-                    reduced_content = "\n".join([item.data for item in extracted.contents])
-                    reduced_doc = await self._create_reduced_document(document, reduced_content)
-                    reduced_docs.append(reduced_doc)
-                else:
-                    # If reduction fails, keep original document
-                    reduced_docs.append(document)
-                    
-            except Exception as e:
-                logger.warning(f"Could not reduce document {document.fileName}: {str(e)}")
-                reduced_docs.append(document)
-        
-        # Reduce prompt if strategy requires it
-        if strategy in [ContentReductionStrategy.REDUCE_PROMPT_AND_DOCS]:
-            reduced_prompt = self._reduce_prompt(prompt, target_reduction)
-        
-        return reduced_docs, reduced_prompt
-    
-    async def summarize_document(
-        self, 
-        document: ChatDocument, 
-        focus_prompt: str
-    ) -> ChatDocument:
-        """Create a summary of a document focused on specific aspects"""
-        
-        summary_prompt = f"""
-        Create a comprehensive summary of this document focusing on: {focus_prompt}
-        
-        Include:
-        - Key points and main ideas
-        - Important data and statistics
-        - Conclusions and recommendations
-        - Any relevant details
-        
-        Keep the summary concise but informative.
-        """
-        
-        try:
-            extracted = await self.service_center.extractContentFromDocument(
-                summary_prompt,
-                document
-            )
-            
-            if extracted and extracted.contents:
-                summary_content = "\n".join([item.data for item in extracted.contents])
-                return await self._create_reduced_document(document, summary_content)
-            else:
-                return document
-                
-        except Exception as e:
-            logger.warning(f"Could not summarize document {document.fileName}: {str(e)}")
-            return document
-    
-    async def _create_reduced_document(self, original_doc: ChatDocument, reduced_content: str) -> ChatDocument:
-        """Create a new document with reduced content"""
-        try:
-            # Create new file with reduced content
-            file_id = self.service_center.createFile(
-                f"reduced_{original_doc.fileName}",
-                "text/plain",
-                reduced_content,
-                base64encoded=False
-            )
-            
-            # Create new document
-            return self.service_center.createDocument(
-                f"reduced_{original_doc.fileName}",
-                "text/plain",
-                reduced_content,
-                base64encoded=False,
-                existing_file_id=file_id
-            )
-            
-        except Exception as e:
-            logger.error(f"Could not create reduced document: {str(e)}")
-            return original_doc
-    
-    def _reduce_prompt(self, prompt: str, target_reduction: float) -> str:
-        """Reduce prompt size while preserving essential information"""
-        # Simple prompt reduction - keep first and last parts
-        lines = prompt.split('\n')
-        if len(lines) <= 3:
-            return prompt
-        
-        # Keep first 30% and last 20% of lines
-        keep_start = int(len(lines) * 0.3)
-        keep_end = int(len(lines) * 0.2)
-        
-        reduced_lines = lines[:keep_start] + ["... (content reduced) ..."] + lines[-keep_end:]
-        return '\n'.join(reduced_lines)
diff --git a/modules/interfaces/interfaceAiCalls.py b/modules/interfaces/interfaceAiCalls.py
index fe93105f..f0bb67b4 100644
--- a/modules/interfaces/interfaceAiCalls.py
+++ b/modules/interfaces/interfaceAiCalls.py
@@ -2,19 +2,377 @@ import logging
 from typing import Dict, Any, List, Union, Optional
 from modules.connectors.connectorAiOpenai import AiOpenai, ContextLengthExceededException
 from modules.connectors.connectorAiAnthropic import AiAnthropic
+from modules.chat.documents.documentExtraction import DocumentExtraction
+from modules.interfaces.interfaceChatModel import ChatDocument
 
 logger = logging.getLogger(__name__)
 
+# AI model registry with performance data (cost, speed and quality ratings), keyed by internal model id
+AI_MODELS = {
+    "openai_gpt4o": {
+        "connector": "openai",
+        "max_tokens": 128000,
+        "cost_per_1k_tokens": 0.03,  # Input; read by _estimate_cost and by the "cost"/"balanced" priorities
+        "cost_per_1k_tokens_output": 0.06,  # Output; read by _estimate_cost
+        "speed_rating": 8,  # 1-10; maximized by the "speed" priority
+        "quality_rating": 9,  # 1-10; maximized by the "quality" priority
+        "supports_images": True,  # must be True for operation_type == "image_analysis"
+        "supports_documents": True,
+        "context_length": 128000,  # compared against the UTF-8 byte size of prompt + document content in _select_optimal_model
+        "model_name": "gpt-4o"
+    },
+    "openai_gpt35": {
+        "connector": "openai", 
+        "max_tokens": 16000,
+        "cost_per_1k_tokens": 0.0015,
+        "cost_per_1k_tokens_output": 0.002,
+        "speed_rating": 9,
+        "quality_rating": 7,
+        "supports_images": False,
+        "supports_documents": True,
+        "context_length": 16000,
+        "model_name": "gpt-3.5-turbo"
+    },
+    "anthropic_claude": {
+        "connector": "anthropic",
+        "max_tokens": 200000,
+        "cost_per_1k_tokens": 0.015,
+        "cost_per_1k_tokens_output": 0.075,
+        "speed_rating": 7,
+        "quality_rating": 10,
+        "supports_images": True,
+        "supports_documents": True,
+        "context_length": 200000,
+        "model_name": "claude-3-sonnet-20240229"
+    }
+}
+
 class AiCalls:
-    """Interface for AI service interactions"""
+    """Interface for AI service interactions with centralized call method"""
     
     def __init__(self):
         self.openaiService = AiOpenai()
         self.anthropicService = AiAnthropic()
+        self.document_extractor = DocumentExtraction()  # used by _process_documents_for_ai to extract document content
+    
+    async def callAi(
+        self,
+        prompt: str,
+        documents: List[ChatDocument] = None,
+        operation_type: str = "general",
+        priority: str = "balanced",  # "speed", "quality", "cost", "balanced"
+        compress_prompt: bool = True,
+        compress_documents: bool = True,
+        process_documents_individually: bool = False,
+        max_cost: float = None,
+        max_processing_time: int = None
+    ) -> str:
+        """
+        Central AI call method with intelligent model selection and content processing.
         
+        Args:
+            prompt: The main prompt for the AI
+            documents: List of documents to process
+            operation_type: Kind of operation ("general", "document_analysis", "image_analysis", etc.)
+            priority: Priority for model selection ("speed", "quality", "cost", "balanced")
+            compress_prompt: Whether the prompt should be compressed
+            compress_documents: Whether documents should be compressed
+            process_documents_individually: Whether documents should be processed one by one
+            max_cost: Maximum cost for the call
+            max_processing_time: Maximum processing time in seconds
+            
+        Returns:
+            AI response as a string; on any exception the error is logged and "Error: <message>" is returned instead of raising
+        """
+        try:
+            # 1. Process documents, if any were passed
+            document_content = ""
+            if documents:
+                document_content = await self._process_documents_for_ai(
+                    documents, 
+                    operation_type,
+                    compress_documents,
+                    process_documents_individually
+                )
+            
+            # 2. Select the best model based on priority and content
+            selected_model = self._select_optimal_model(
+                prompt, 
+                document_content, 
+                priority, 
+                operation_type,
+                max_cost,
+                max_processing_time
+            )
+            
+            # 3. Optimize the content for the selected model
+            optimized_prompt, optimized_content = await self._optimize_content_for_model(
+                prompt, 
+                document_content, 
+                selected_model,
+                compress_prompt,
+                compress_documents
+            )
+            
+            # 4. Execute the AI call with failover
+            return await self._execute_ai_call_with_failover(
+                selected_model, 
+                optimized_prompt, 
+                optimized_content
+            )
+            
+        except Exception as e:
+            logger.error(f"Error in centralized AI call: {str(e)}")
+            return f"Error: {str(e)}"
+    
+    def _select_optimal_model(
+        self, 
+        prompt: str, 
+        document_content: str, 
+        priority: str,  # "speed", "quality" or "cost"; any other value selects the balanced score
+        operation_type: str,  # only "image_analysis" affects filtering (requires supports_images)
+        max_cost: float = None,  # None disables the cost filter; 0 is a real limit
+        max_processing_time: int = None  # NOTE(review): accepted but never consulted in this method
+    ) -> str:
+        """Return the AI_MODELS key best matching content size and priority; returns "openai_gpt35" when no model passes the filters."""
+        
+        # Content size in UTF-8 bytes (prompt plus document content)
+        total_content_size = len(prompt.encode('utf-8')) + len(document_content.encode('utf-8'))
+        
+        # Filter the available models
+        available_models = {}
+        for model_name, model_info in AI_MODELS.items():
+            # Skip models too small for the content; NOTE(review): compares bytes with context_length (presumably tokens) — confirm units
+            if total_content_size > model_info["context_length"] * 0.8:  # 80% reserved for content
+                continue
+            
+            # Enforce the cost limit; "is not None" so an explicit max_cost of 0 is honored instead of being read as "no limit"
+            if max_cost is not None:
+                estimated_cost = self._estimate_cost(model_info, total_content_size)
+                if estimated_cost > max_cost:
+                    continue
+            
+            # Check operation-type compatibility
+            if operation_type == "image_analysis" and not model_info["supports_images"]:
+                continue
+                
+            available_models[model_name] = model_info
+        
+        if not available_models:
+            # Fall back to the smallest model
+            return "openai_gpt35"
+        
+        # Pick the model according to the requested priority
+        if priority == "speed":
+            return max(available_models.keys(), key=lambda x: available_models[x]["speed_rating"])
+        elif priority == "quality":
+            return max(available_models.keys(), key=lambda x: available_models[x]["quality_rating"])
+        elif priority == "cost":
+            return min(available_models.keys(), key=lambda x: available_models[x]["cost_per_1k_tokens"])
+        else:  # balanced
+            # Weighted score: 40% quality, 30% speed, 30% cost
+            def balanced_score(model_name):
+                model_info = available_models[model_name]
+                quality_score = model_info["quality_rating"] * 0.4
+                speed_score = model_info["speed_rating"] * 0.3
+                cost_score = (10 - (model_info["cost_per_1k_tokens"] * 1000)) * 0.3  # Lower cost = higher score; NOTE(review): negative once cost exceeds 0.01
+                return quality_score + speed_score + cost_score
+            
+            return max(available_models.keys(), key=balanced_score)
+    
+    def _estimate_cost(self, model_info: Dict, content_size: int) -> float:
+        """Estimate the cost of an AI call from the content size and the model's per-1k-token input/output prices"""
+        # Rough estimate: 1 token ≈ 4 characters
+        estimated_tokens = content_size / 4
+        input_cost = (estimated_tokens / 1000) * model_info["cost_per_1k_tokens"]
+        output_cost = (estimated_tokens / 1000) * model_info["cost_per_1k_tokens_output"] * 0.1  # 10% for output
+        return input_cost + output_cost
+    
+    async def _process_documents_for_ai(
+        self, 
+        documents: List[ChatDocument], 
+        operation_type: str,
+        compress_documents: bool,
+        process_individually: bool  # NOTE(review): not read anywhere in this method body
+    ) -> str:
+        """Extract and combine document content for an AI call using documentExtraction.py; returns "" for no documents"""
+        
+        if not documents:
+            return ""
+        
+        processed_contents = []
+        
+        for doc in documents:
+            try:
+                # Extract content with documentExtraction.py
+                extracted = await self.document_extractor.processFileData(
+                    doc.fileData, 
+                    doc.fileName, 
+                    doc.mimeType,
+                    prompt=f"Extract relevant content for {operation_type}",
+                    documentId=doc.id,
+                    enableAI=True
+                )
+                
+                # Combine all content items, skipping empty or whitespace-only ones
+                doc_content = []
+                for content_item in extracted.contents:
+                    if content_item.data and content_item.data.strip():
+                        doc_content.append(content_item.data)
+                
+                if doc_content:
+                    combined_doc_content = "\n\n".join(doc_content)
+                    
+                    # Compress if requested and the content exceeds the size limit
+                    if compress_documents and len(combined_doc_content.encode('utf-8')) > 10000:  # 10 KB limit (UTF-8 bytes)
+                        combined_doc_content = await self._compress_content(
+                            combined_doc_content, 
+                            10000, 
+                            "document"
+                        )
+                    
+                    processed_contents.append(f"Document: {doc.fileName}\n{combined_doc_content}")
+                
+            except Exception as e:
+                logger.warning(f"Error processing document {doc.fileName}: {str(e)}")
+                processed_contents.append(f"Document: {doc.fileName}\n[Error processing document: {str(e)}]")
+        
+        return "\n\n---\n\n".join(processed_contents)
+    
+    async def _optimize_content_for_model(
+        self, 
+        prompt: str, 
+        document_content: str, 
+        model_name: str,
+        compress_prompt: bool,
+        compress_documents: bool
+    ) -> tuple[str, str]:
+        """Return (prompt, document_content), each compressed when requested and over its size limit."""
+        
+        model_info = AI_MODELS[model_name]
+        max_content_size = model_info["context_length"] * 0.7  # 70% for content; NOTE(review): compared against a UTF-8 byte size below - confirm context_length units
+        
+        optimized_prompt = prompt
+        optimized_content = document_content
+        
+        # Compress the prompt if requested
+        if compress_prompt and len(prompt.encode('utf-8')) > 2000:  # 2KB limit for the prompt
+            optimized_prompt = await self._compress_content(prompt, 2000, "prompt")
+        
+        # Compress the document content if requested
+        if compress_documents and document_content:
+            content_size = len(document_content.encode('utf-8'))
+            if content_size > max_content_size:
+                optimized_content = await self._compress_content(
+                    document_content, 
+                    int(max_content_size), 
+                    "document"
+                )
+        
+        return optimized_prompt, optimized_content
+    
+    async def _compress_content(self, content: str, target_size: int, content_type: str) -> str:
+        """Shrink content toward target_size via an AI call, truncating if that call fails (content_type only labels the prompt)."""
+        
+        if len(content.encode('utf-8')) <= target_size:
+            return content
+        
+        try:
+            # Ask an AI model to compress the content
+            compression_prompt = f"""
+            Komprimiere den folgenden {content_type} auf maximal {target_size} Zeichen, 
+            behalte aber alle wichtigen Informationen bei:
+            
+            {content}
+            
+            Gib nur den komprimierten Inhalt zurück, ohne zusätzliche Erklärungen.
+            """
+            
+            # Fixed model for compression (intended as the fastest available one)
+            compression_model = "openai_gpt35"
+            model_info = AI_MODELS[compression_model]
+            connector = getattr(self, f"{model_info['connector']}Service")
+            
+            messages = [{"role": "user", "content": compression_prompt}]
+            
+            if model_info["connector"] == "openai":
+                compressed = await connector.callAiBasic(messages)
+            else:
+                response = await connector.callAiBasic(messages)
+                compressed = response["choices"][0]["message"]["content"]
+            
+            return compressed
+            
+        except Exception as e:
+            logger.warning(f"AI compression failed, using truncation: {str(e)}")
+            # Fallback: plain truncation. NOTE(review): slices characters (not bytes) and appends a marker, so the result can exceed target_size
+            return content[:target_size] + "... [truncated]"
+    
+    async def _execute_ai_call_with_failover(
+        self, 
+        model_name: str, 
+        prompt: str, 
+        document_content: str
+    ) -> str:
+        """Run the AI call on model_name and fail over to another model on errors.
+
+        On ContextLengthExceededException a model with a larger context is tried;
+        if none exists, prompt and documents are compressed and sent to "openai_gpt35".
+        Any other error falls back to "openai_gpt35"; if that model itself fails,
+        the error is re-raised instead of recursing without end.
+        """
+        
+        fallback_default = "openai_gpt35"
+        try:
+            model_info = AI_MODELS[model_name]
+            connector = getattr(self, f"{model_info['connector']}Service")
+            
+            # Document context goes first as a system message, then the user prompt
+            messages = []
+            if document_content:
+                messages.append({"role": "system", "content": f"Context from documents:\n{document_content}"})
+            messages.append({"role": "user", "content": prompt})
+            
+            # The openai connector's result is returned as-is; other connectors'
+            # responses are unpacked from a chat-completion style dict
+            if model_info["connector"] == "openai":
+                return await connector.callAiBasic(messages)
+            response = await connector.callAiBasic(messages)
+            return response["choices"][0]["message"]["content"]
+                
+        except ContextLengthExceededException:
+            logger.warning(f"Context length exceeded for {model_name}, trying fallback")
+            fallback_model = self._find_fallback_model(model_name)
+            if fallback_model:
+                return await self._execute_ai_call_with_failover(fallback_model, prompt, document_content)
+            # Last resort: no larger model exists, so shrink the content instead
+            compressed_prompt = await self._compress_content(prompt, 1000, "prompt")
+            compressed_content = await self._compress_content(document_content, 5000, "document")
+            return await self._execute_ai_call_with_failover(fallback_default, compressed_prompt, compressed_content)
+        
+        except Exception as e:
+            logger.warning(f"AI call failed with {model_name}: {e}")
+            if model_name == fallback_default:
+                # Already on the fallback model: retrying it would recurse without end
+                raise
+            return await self._execute_ai_call_with_failover(fallback_default, prompt, document_content)
+    
+    def _find_fallback_model(self, current_model: str) -> Optional[str]:
+        """Return the first model in AI_MODELS whose context_length exceeds the current model's, or None."""
+        current_context = AI_MODELS[current_model]["context_length"]
+        
+        # First match in AI_MODELS iteration order wins; it need not be the smallest sufficient model
+        for model_name, model_info in AI_MODELS.items():
+            if model_info["context_length"] > current_context:
+                return model_name
+        
+        return None
+        
+    # Legacy methods
+
     async def callAiTextBasic(self, prompt: str, context: Optional[str] = None) -> str:
         """
-        Basic text processing using OpenAI.
+        Basic text processing - now uses centralized AI call method.
         
         Args:
             prompt: The user prompt to process
@@ -23,100 +381,47 @@ class AiCalls:
         Returns:
             The AI response as text
         """
-        # Prepare messages in OpenAI format
-        messages = []
-        
-        # Add system message if context provided
+        # Combine context with prompt if provided
+        full_prompt = prompt
         if context:
-            messages.append({
-                "role": "system",
-                "content": context
-            })
+            full_prompt = f"Context: {context}\n\nUser Request: {prompt}"
         
-        # Add user message
-        messages.append({
-            "role": "user",
-            "content": prompt
-        })
-        
-        # Add language instruction for user-facing responses
-        if hasattr(self, 'userLanguage') and self.userLanguage:
-            ltext = f"Please respond in '{self.userLanguage}' language."
-            if messages and messages[0]["role"] == "system":
-                if "language" not in messages[0]["content"].lower():
-                    messages[0]["content"] = f"{ltext} {messages[0]['content']}"
-            else:
-                messages.insert(0, {
-                    "role": "system", 
-                    "content": ltext
-                })
-        
-        try:
-            return await self.openaiService.callAiBasic(messages)
-        except ContextLengthExceededException as e:
-            logger.warning(f"OpenAI context length exceeded, falling back to Anthropic: {str(e)}")
-            # Fallback to Anthropic (AI Advanced) when context length is exceeded
-            return await self.callAiTextAdvanced(prompt, context, _is_fallback=True)
-        except Exception as e:
-            logger.error(f"Error in OpenAI call: {str(e)}")
-            return f"Error: {str(e)}"
+        # Use centralized AI call with speed priority for basic calls
+        return await self.callAi(
+            prompt=full_prompt,
+            priority="speed",
+            compress_prompt=True,
+            compress_documents=False
+        )
 
     async def callAiTextAdvanced(self, prompt: str, context: Optional[str] = None, _is_fallback: bool = False) -> str:
         """
-        Advanced text processing using Anthropic.
-        Fallback to OpenAI if Anthropic is overloaded or rate-limited.
+        Advanced text processing - now uses centralized AI call method.
         
         Args:
             prompt: The user prompt to process
             context: Optional system context/prompt
-            _is_fallback: Internal flag to prevent infinite recursion
+            _is_fallback: Internal flag (kept for compatibility)
+            
+        Returns:
+            The AI response as text
         """
-        # For Anthropic, we need to handle system content differently
-        # Anthropic expects system content in a top-level parameter, not as a message role
-        try:
-            # Create messages without system role for Anthropic
-            anthropic_messages = []
-            if hasattr(self, 'userLanguage') and self.userLanguage:
-                ltext = f"Please respond in '{self.userLanguage}' language."
-                if context:
-                    # Combine context and language instruction
-                    full_context = f"{ltext}\n\n{context}"
-                else:
-                    full_context = ltext
-            else:
-                full_context = context
-            
-            # Add user message
-            anthropic_messages.append({
-                "role": "user",
-                "content": prompt
-            })
-            
-            # Call Anthropic - let the connector handle system content conversion
-            if full_context:
-                # Send context as part of the user message for Anthropic
-                enhanced_prompt = f"Context:\n{full_context}\n\nUser Request:\n{prompt}"
-                response = await self.anthropicService.callAiBasic([
-                    {"role": "user", "content": enhanced_prompt}
-                ])
-            else:
-                response = await self.anthropicService.callAiBasic(anthropic_messages)
-            
-            return response["choices"][0]["message"]["content"]
-        except Exception as e:
-            err_str = str(e)
-            logger.warning(f"[UI NOTICE] Advanced AI failed, falling back to Basic AI (OpenAI). Reason: {err_str}")
-            # Fallback to OpenAI basic, but only if we're not already in a fallback
-            if not _is_fallback:
-                return await self.callAiTextBasic(prompt, context)
-            else:
-                # If we're already in a fallback, return error to prevent infinite recursion
-                logger.error("Both AI services failed, cannot provide fallback")
-                return f"Error: Both AI services failed. Anthropic error: {err_str}"
+        # Combine context with prompt if provided
+        full_prompt = prompt
+        if context:
+            full_prompt = f"Context: {context}\n\nUser Request: {prompt}"
+        
+        # Use centralized AI call with quality priority for advanced calls
+        return await self.callAi(
+            prompt=full_prompt,
+            priority="quality",
+            compress_prompt=False,
+            compress_documents=False
+        )
 
     async def callAiImageBasic(self, prompt: str, imageData: Union[str, bytes], mimeType: str = None) -> str:
         """
-        Basic image processing using OpenAI.
+        Basic image processing - now uses centralized AI call method.
         
         Args:
             prompt: The prompt for image analysis
@@ -127,6 +432,8 @@ class AiCalls:
             The AI response as text
         """
         try:
+            # For image processing, use the original connector directly
+            # as the centralized method doesn't handle images yet
             return await self.openaiService.callAiImage(prompt, imageData, mimeType)
         except Exception as e:
             logger.error(f"Error in OpenAI image call: {str(e)}")
@@ -134,7 +441,7 @@ class AiCalls:
 
     async def callAiImageAdvanced(self, prompt: str, imageData: Union[str, bytes], mimeType: str = None) -> str:
         """
-        Advanced image processing using Anthropic.
+        Advanced image processing - now uses centralized AI call method.
         
         Args:
             prompt: The prompt for image analysis
@@ -145,8 +452,76 @@ class AiCalls:
             The AI response as text
         """
         try:
+            # For image processing, use the original connector directly
+            # as the centralized method doesn't handle images yet
             return await self.anthropicService.callAiImage(prompt, imageData, mimeType)
         except Exception as e:
             logger.error(f"Error in Anthropic image call: {str(e)}")
             return f"Error: {str(e)}"
+    
+    # Convenience methods for common use cases
+
+    async def callAiForDocumentAnalysis(
+        self, 
+        prompt: str, 
+        documents: List[ChatDocument],
+        priority: str = "balanced"
+    ) -> str:
+        """Call callAi with operation_type "document_analysis": documents compressed, not processed individually."""
+        return await self.callAi(
+            prompt=prompt,
+            documents=documents,
+            operation_type="document_analysis",
+            priority=priority,
+            compress_documents=True,
+            process_documents_individually=False
+        )
+    
+    async def callAiForReportGeneration(
+        self, 
+        prompt: str, 
+        documents: List[ChatDocument],
+        priority: str = "quality"
+    ) -> str:
+        """Call callAi with operation_type "report_generation": documents compressed and processed individually."""
+        return await self.callAi(
+            prompt=prompt,
+            documents=documents,
+            operation_type="report_generation",
+            priority=priority,
+            compress_documents=True,
+            process_documents_individually=True
+        )
+    
+    async def callAiForEmailComposition(
+        self, 
+        prompt: str, 
+        documents: Optional[List[ChatDocument]] = None,
+        priority: str = "speed"
+    ) -> str:
+        """Call callAi with operation_type "email_composition": both prompt and documents compressed."""
+        return await self.callAi(
+            prompt=prompt,
+            documents=documents,
+            operation_type="email_composition",
+            priority=priority,
+            compress_prompt=True,
+            compress_documents=True
+        )
+    
+    async def callAiForTaskPlanning(
+        self, 
+        prompt: str, 
+        documents: Optional[List[ChatDocument]] = None,
+        priority: str = "balanced"
+    ) -> str:
+        """Call callAi with operation_type "task_planning": prompt kept as-is, documents compressed."""
+        return await self.callAi(
+            prompt=prompt,
+            documents=documents,
+            operation_type="task_planning",
+            priority=priority,
+            compress_prompt=False,
+            compress_documents=True
+        )
 
diff --git a/modules/interfaces/interfaceAiEngine.py b/modules/interfaces/interfaceAiEngine.py
deleted file mode 100644
index 2ccdd70e..00000000
--- a/modules/interfaces/interfaceAiEngine.py
+++ /dev/null
@@ -1,115 +0,0 @@
-"""
-Centralized AI Engine Interface for intelligent content processing
-"""
-
-from abc import ABC, abstractmethod
-from typing import List, Dict, Any, Optional, Union, Tuple
-from enum import Enum
-from dataclasses import dataclass
-from modules.interfaces.interfaceChatModel import ChatDocument, ExtractedContent
-
-
-class AIModelType(Enum):
-    """Available AI model types"""
-    OPENAI_GPT4 = "openai_gpt4"
-    OPENAI_GPT35 = "openai_gpt35"
-    ANTHROPIC_CLAUDE = "anthropic_claude"
-    OPENAI_VISION = "openai_vision"
-    ANTHROPIC_VISION = "anthropic_vision"
-
-
-class ProcessingStrategy(Enum):
-    """Content processing strategies"""
-    SINGLE_CALL = "single_call"           # One AI call with full content
-    DOCUMENT_BY_DOCUMENT = "doc_by_doc"   # One call per document, merge results
-    CHUNKED_PROCESSING = "chunked"        # Process in chunks, merge results
-    SUMMARIZED_CONTENT = "summarized"     # Summarize content first, then process
-
-
-class ContentReductionStrategy(Enum):
-    """Content reduction strategies"""
-    REDUCE_DOCUMENTS_ONLY = "reduce_docs"      # Keep prompt, reduce documents
-    REDUCE_PROMPT_AND_DOCS = "reduce_both"     # Reduce both prompt and documents
-    SUMMARIZE_DOCUMENTS = "summarize_docs"     # Summarize documents to key points
-    EXTRACT_KEY_INFO = "extract_key"           # Extract only relevant information
-
-
-@dataclass
-class AIRequest:
-    """Standardized AI request structure"""
-    prompt: str
-    documents: List[ChatDocument]
-    context: Optional[str] = None
-    preferred_model: Optional[AIModelType] = None
-    max_tokens: Optional[int] = None
-    temperature: Optional[float] = None
-    processing_strategy: Optional[ProcessingStrategy] = None
-    reduction_strategy: Optional[ContentReductionStrategy] = None
-    metadata: Optional[Dict[str, Any]] = None
-
-
-@dataclass
-class AIResponse:
-    """Standardized AI response structure"""
-    success: bool
-    content: str
-    model_used: AIModelType
-    processing_strategy: ProcessingStrategy
-    tokens_used: Optional[int] = None
-    processing_time: Optional[float] = None
-    error: Optional[str] = None
-    metadata: Optional[Dict[str, Any]] = None
-
-
-@dataclass
-class ModelCapabilities:
-    """AI model capabilities and limits"""
-    max_tokens: int
-    max_input_tokens: int
-    supports_vision: bool
-    supports_function_calling: bool
-    cost_per_1k_tokens: float
-    processing_speed: str  # "fast", "medium", "slow"
-
-
-class AIEngine(ABC):
-    """Abstract AI Engine interface"""
-    
-    @abstractmethod
-    async def process_request(self, request: AIRequest) -> AIResponse:
-        """Process an AI request with intelligent content management"""
-        pass
-    
-    @abstractmethod
-    def get_model_capabilities(self, model: AIModelType) -> ModelCapabilities:
-        """Get capabilities and limits for a specific model"""
-        pass
-    
-    @abstractmethod
-    async def estimate_token_usage(self, request: AIRequest) -> int:
-        """Estimate token usage for a request"""
-        pass
-
-
-class ContentReducer(ABC):
-    """Abstract content reduction interface"""
-    
-    @abstractmethod
-    async def reduce_content(
-        self, 
-        documents: List[ChatDocument], 
-        prompt: str,
-        strategy: ContentReductionStrategy,
-        target_reduction: float = 0.5
-    ) -> Tuple[List[ChatDocument], str]:
-        """Reduce content size while preserving important information"""
-        pass
-    
-    @abstractmethod
-    async def summarize_document(
-        self, 
-        document: ChatDocument, 
-        focus_prompt: str
-    ) -> ChatDocument:
-        """Create a summary of a document focused on specific aspects"""
-        pass

From 5e00b4bd0765877e29ade14e3c428a814ed33a94 Mon Sep 17 00:00:00 2001
From: ValueOn AG <p.motsch@valueon.ch>
Date: Thu, 4 Sep 2025 01:01:21 +0200
Subject: [PATCH 16/17] sharepoint implemented

---
 modules/chat/documents/documentExtraction.py |  12 +-
 modules/chat/documents/documentGeneration.py |  18 +-
 modules/chat/documents/documentUtility.py    | 147 ++-
 modules/chat/handling/handlingTasks.py       |  12 +-
 modules/chat/handling/methodOutlook.py       |   3 -
 modules/chat/handling/promptFactory.py       |   4 +-
 modules/chat/serviceCenter.py                | 762 ++++++--------
 modules/interfaces/interfaceChatModel.py     |   6 +-
 modules/methods/methodOutlook.py             |   8 +-
 modules/methods/methodSharepoint.py          | 930 ++++++++++-------
 modules/workflow/managerWorkflow.py          |   2 +-
 notes/changelog.txt                          |   4 +-
 notes/management_summary.html                | 128 ---
 notes/methodbased_arch.html                  | 129 ---
 notes/methodbased_specification.md           | 999 -------------------
 test_ai_calls.md                             | 235 -----
 test_ai_fallback.py                          | 103 --
 test_documentExtraction.py                   | 855 ----------------
 test_excel_processing.py                     | 189 ----
 test_methodWeb.py                            | 658 ------------
 test_outlook_filters.py                      |  51 -
 test_outlook_filters_fixed.py                |  70 --
 test_pydantic_compat.py                      | 100 --
 test_web_csv_functionality.py                | 207 ----
 24 files changed, 1024 insertions(+), 4608 deletions(-)
 delete mode 100644 modules/chat/handling/methodOutlook.py
 delete mode 100644 notes/management_summary.html
 delete mode 100644 notes/methodbased_arch.html
 delete mode 100644 notes/methodbased_specification.md
 delete mode 100644 test_ai_calls.md
 delete mode 100644 test_ai_fallback.py
 delete mode 100644 test_documentExtraction.py
 delete mode 100644 test_excel_processing.py
 delete mode 100644 test_methodWeb.py
 delete mode 100644 test_outlook_filters.py
 delete mode 100644 test_outlook_filters_fixed.py
 delete mode 100644 test_pydantic_compat.py
 delete mode 100644 test_web_csv_functionality.py

diff --git a/modules/chat/documents/documentExtraction.py b/modules/chat/documents/documentExtraction.py
index ea96289d..a304cbe3 100644
--- a/modules/chat/documents/documentExtraction.py
+++ b/modules/chat/documents/documentExtraction.py
@@ -341,7 +341,7 @@ class DocumentExtraction:
 
             
             # Use documentUtility for mime type
-            mime_type = getMimeTypeFromExtension(getFileExtension(fileName), self._serviceCenter)
+            mime_type = getMimeTypeFromExtension(getFileExtension(fileName))
             return [ContentItem(
                 label="main",
                 data=content,
@@ -360,7 +360,7 @@ class DocumentExtraction:
         """Process CSV document with robust encoding detection"""
         try:
             content = self._robustTextDecode(fileData, fileName)
-            mime_type = getMimeTypeFromExtension(getFileExtension(fileName), self._serviceCenter)
+            mime_type = getMimeTypeFromExtension(getFileExtension(fileName))
             return [ContentItem(
                 label="main",
                 data=content,
@@ -380,7 +380,7 @@ class DocumentExtraction:
         try:
             content = self._robustTextDecode(fileData, fileName)
             jsonData = json.loads(content)
-            mime_type = getMimeTypeFromExtension(getFileExtension(fileName), self._serviceCenter)
+            mime_type = getMimeTypeFromExtension(getFileExtension(fileName))
             return [ContentItem(
                 label="main",
                 data=content,
@@ -399,7 +399,7 @@ class DocumentExtraction:
         """Process XML document with robust encoding detection"""
         try:
             content = self._robustTextDecode(fileData, fileName)
-            mime_type = getMimeTypeFromExtension(getFileExtension(fileName), self._serviceCenter)
+            mime_type = getMimeTypeFromExtension(getFileExtension(fileName))
             return [ContentItem(
                 label="main",
                 data=content,
@@ -418,7 +418,7 @@ class DocumentExtraction:
         """Process HTML document with robust encoding detection"""
         try:
             content = self._robustTextDecode(fileData, fileName)
-            mime_type = getMimeTypeFromExtension(getFileExtension(fileName), self._serviceCenter)
+            mime_type = getMimeTypeFromExtension(getFileExtension(fileName))
             return [ContentItem(
                 label="main",
                 data=content,
@@ -512,7 +512,7 @@ class DocumentExtraction:
             # Combine all meaningful content
             final_content = "\n".join(meaningful_content)
             
-            mime_type = getMimeTypeFromExtension(getFileExtension(fileName), self._serviceCenter)
+            mime_type = getMimeTypeFromExtension(getFileExtension(fileName))
             return [ContentItem(
                 label="svg_content",
                 data=final_content,
diff --git a/modules/chat/documents/documentGeneration.py b/modules/chat/documents/documentGeneration.py
index 5534462a..dfe10918 100644
--- a/modules/chat/documents/documentGeneration.py
+++ b/modules/chat/documents/documentGeneration.py
@@ -98,26 +98,12 @@ class DocumentGenerator:
                     
                     logger.info(f"Document {document_name} has content: {len(content)} characters")
                     
-                    # Create file in system
-                    file_id = self.service.createFile(
-                        fileName=document_name,
-                        mimeType=mime_type,
-                        content=content,
-                        base64encoded=False
-                    )
-                    if not file_id:
-                        logger.error(f"Failed to create file for document {document_name}")
-                        continue
-                    
-                    logger.info(f"Created file with ID: {file_id}")
-                    
-                    # Create document object using existing file ID
+                    # Create document with file in one step
                     document = self.service.createDocument(
                         fileName=document_name,
                         mimeType=mime_type,
                         content=content,
-                        base64encoded=False,
-                        existing_file_id=file_id
+                        base64encoded=False
                     )
                     if document:
                         # Set workflow context on the document if possible
diff --git a/modules/chat/documents/documentUtility.py b/modules/chat/documents/documentUtility.py
index 3d674720..5b0a612c 100644
--- a/modules/chat/documents/documentUtility.py
+++ b/modules/chat/documents/documentUtility.py
@@ -1,51 +1,160 @@
 import json
 import logging
+import os
 from typing import Any, Dict
 
 logger = logging.getLogger(__name__)
 
 def getFileExtension(fileName: str) -> str:
-    """Extract file extension from fileName"""
+    """Extract file extension from fileName (without dot, lowercased)."""
     if '.' in fileName:
         return fileName.rsplit('.', 1)[-1].lower()
     return ''
 
-def getMimeTypeFromExtension(extension: str, service=None) -> str:
-    """Get MIME type based on file extension. Optionally use a service for mapping."""
-    if service:
-        return service.getMimeTypeFromExtension(extension)
-    # Fallback mapping
-    mapping = {
+def getMimeTypeFromExtension(extension: str) -> str:
+    """
+    Get MIME type based on file extension.
+    This method consolidates MIME type detection from extension.
+    
+    Args:
+        extension: File extension (with or without dot)
+        
+    Returns:
+        str: MIME type for the extension
+    """
+    # Normalize extension (remove dot if present)
+    if extension.startswith('.'):
+        extension = extension[1:]
+    
+    # Map extensions to MIME types
+    mime_types = {
         'txt': 'text/plain',
-        'md': 'text/markdown',
-        'html': 'text/html',
-        'css': 'text/css',
-        'js': 'application/javascript',
         'json': 'application/json',
-        'csv': 'text/csv',
         'xml': 'application/xml',
+        'csv': 'text/csv',
+        'html': 'text/html',
+        'htm': 'text/html',
+        'md': 'text/markdown',
         'py': 'text/x-python',
+        'js': 'application/javascript',
+        'css': 'text/css',
         'pdf': 'application/pdf',
+        'doc': 'application/msword',
         'docx': 'application/vnd.openxmlformats-officedocument.wordprocessingml.document',
+        'xls': 'application/vnd.ms-excel',
         'xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
-        'png': 'image/png',
+        'ppt': 'application/vnd.ms-powerpoint',
+        'pptx': 'application/vnd.openxmlformats-officedocument.presentationml.presentation',
+        'svg': 'image/svg+xml',
         'jpg': 'image/jpeg',
         'jpeg': 'image/jpeg',
+        'png': 'image/png',
         'gif': 'image/gif',
-        'svg': 'image/svg+xml',
+        'bmp': 'image/bmp',
+        'webp': 'image/webp',
+        'zip': 'application/zip',
+        'rar': 'application/x-rar-compressed',
+        '7z': 'application/x-7z-compressed',
+        'tar': 'application/x-tar',
+        'gz': 'application/gzip'
     }
-    return mapping.get(extension.lower(), 'application/octet-stream')
+    return mime_types.get(extension.lower(), 'application/octet-stream')
+
+def detectContentTypeFromData(fileData: bytes, fileName: str) -> str:
+    """
+    Detect content type from file data and fileName.
+    A known file extension wins; otherwise the leading bytes of fileData are inspected.
+    
+    Args:
+        fileData: Raw file data as bytes
+        fileName: Name of the file
+        
+    Returns:
+        str: Detected MIME type, or 'application/octet-stream' if unknown or on error
+    """
+    try:
+        # Check file extension first
+        ext = os.path.splitext(fileName)[1].lower()
+        if ext:
+            # NOTE(review): '.py' maps to 'application/x-python' here but getMimeTypeFromExtension uses 'text/x-python' - confirm which is intended
+            extToMime = {
+                '.txt': 'text/plain',
+                '.md': 'text/markdown',
+                '.csv': 'text/csv',
+                '.json': 'application/json',
+                '.xml': 'application/xml',
+                '.js': 'application/javascript',
+                '.py': 'application/x-python',
+                '.svg': 'image/svg+xml',
+                '.jpg': 'image/jpeg',
+                '.jpeg': 'image/jpeg',
+                '.png': 'image/png',
+                '.gif': 'image/gif',
+                '.bmp': 'image/bmp',
+                '.webp': 'image/webp',
+                '.pdf': 'application/pdf',
+                '.docx': 'application/vnd.openxmlformats-officedocument.wordprocessingml.document',
+                '.doc': 'application/msword',
+                '.xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
+                '.xls': 'application/vnd.ms-excel',
+                '.pptx': 'application/vnd.openxmlformats-officedocument.presentationml.presentation',
+                '.ppt': 'application/vnd.ms-powerpoint',
+                '.html': 'text/html',
+                '.htm': 'text/html',
+                '.css': 'text/css',
+                '.zip': 'application/zip',
+                '.rar': 'application/x-rar-compressed',
+                '.7z': 'application/x-7z-compressed',
+                '.tar': 'application/x-tar',
+                '.gz': 'application/gzip'
+            }
+            if ext in extToMime:
+                return extToMime[ext]
+        
+        # Unknown or missing extension: fall back to magic-byte detection
+        if fileData.startswith(b'%PDF'):
+            return 'application/pdf'
+        elif fileData.startswith(b'PK\x03\x04'):
+            # ZIP container; docx/xlsx/pptx without a known extension are reported as plain zip
+            return 'application/zip'
+        elif fileData.startswith(b'<'):
+            # Markup: tell SVG and HTML apart from generic XML.
+            # errors='ignore' means the decode cannot fail on bad bytes, so no inner
+            # try/except is needed; anything unexpected reaches the handler below.
+            text = fileData.decode('utf-8', errors='ignore')
+            lowered = text.lower()
+            if '<svg' in lowered:
+                return 'image/svg+xml'
+            elif '<html' in lowered:
+                return 'text/html'
+            else:
+                return 'application/xml'
+        elif fileData.startswith(b'\x89PNG\r\n\x1a\n'):
+            return 'image/png'
+        elif fileData.startswith(b'\xff\xd8\xff'):
+            return 'image/jpeg'
+        elif fileData.startswith(b'GIF87a') or fileData.startswith(b'GIF89a'):
+            return 'image/gif'
+        elif fileData.startswith(b'BM'):
+            return 'image/bmp'
+        elif fileData.startswith(b'RIFF') and fileData[8:12] == b'WEBP':
+            return 'image/webp'
+        
+        return 'application/octet-stream'
+        
+    except Exception as e:
+        logger.error(f"Error detecting content type from data: {str(e)}")
+        return 'application/octet-stream'
 
 def detectMimeTypeFromData(file_bytes: bytes, fileName: str, service=None) -> str:
     """Detect MIME type from file bytes and fileName using a service if provided."""
     try:
-        if service:
+        if service and hasattr(service, 'detectContentTypeFromData'):
             detected = service.detectContentTypeFromData(file_bytes, fileName)
             if detected and detected != 'application/octet-stream':
                 return detected
-        # Fallback: guess from extension
-        ext = getFileExtension(fileName)
-        return getMimeTypeFromExtension(ext, service)
+        # Fallback: use our consolidated function
+        return detectContentTypeFromData(file_bytes, fileName)
     except Exception as e:
         logger.warning(f"Error in MIME type detection for {fileName}: {str(e)}")
         return 'application/octet-stream'
diff --git a/modules/chat/handling/handlingTasks.py b/modules/chat/handling/handlingTasks.py
index d99521f2..88465b0e 100644
--- a/modules/chat/handling/handlingTasks.py
+++ b/modules/chat/handling/handlingTasks.py
@@ -108,7 +108,7 @@ class HandlingTasks:
             # Log the full task planning prompt being sent to AI for debugging
             logger.info("=== TASK PLANNING PROMPT SENT TO AI ===")
             logger.info(f"User Input: {userInput}")
-            logger.info(f"Available Documents: {len(available_docs) if available_docs else 0}")
+            logger.info(f"Available Documents: {available_docs}")
             logger.info("=== FULL TASK PLANNING PROMPT ===")
             logger.info(task_planning_prompt)
             logger.info("=== END TASK PLANNING PROMPT ===")
@@ -312,12 +312,8 @@ class HandlingTasks:
 
             # Log available resources for debugging
             logger.info("=== AVAILABLE RESOURCES FOR ACTION GENERATION ===")
-            logger.info(f"Available Documents: {len(available_docs) if available_docs else 0}")
-            if available_docs:
-                for i, doc in enumerate(available_docs[:5]):  # Show first 5
-                    logger.info(f"  Doc {i+1}: {doc}")
-                if len(available_docs) > 5:
-                    logger.info(f"  ... and {len(available_docs) - 5} more documents")
+            logger.info(f"Available Documents: {available_docs}")
+            # Note: available_docs is now a string description, not a list
             logger.info(f"Available Connections: {len(available_connections) if available_connections else 0}")
             if available_connections:
                 for i, conn in enumerate(available_connections[:5]):  # Show first 5
@@ -376,7 +372,7 @@ class HandlingTasks:
             logger.info(f"Task Step ID: {action_context.task_step.id if action_context.task_step else 'None'}")
             logger.info(f"Task Step Objective: {action_context.task_step.objective if action_context.task_step else 'None'}")
             logger.info(f"Workflow ID: {action_context.workflow_id}")
-            logger.info(f"Available Documents Count: {len(action_context.available_documents) if action_context.available_documents else 0}")
+            logger.info(f"Available Documents: {action_context.available_documents or 'No documents available'}")
             logger.info(f"Available Connections Count: {len(action_context.available_connections) if action_context.available_connections else 0}")
             logger.info(f"Previous Results Count: {len(action_context.previous_results) if action_context.previous_results else 0}")
             logger.info(f"Retry Count: {action_context.retry_count}")
diff --git a/modules/chat/handling/methodOutlook.py b/modules/chat/handling/methodOutlook.py
deleted file mode 100644
index b28b04f6..00000000
--- a/modules/chat/handling/methodOutlook.py
+++ /dev/null
@@ -1,3 +0,0 @@
-
-
-
diff --git a/modules/chat/handling/promptFactory.py b/modules/chat/handling/promptFactory.py
index 4587cce4..9faa06b3 100644
--- a/modules/chat/handling/promptFactory.py
+++ b/modules/chat/handling/promptFactory.py
@@ -20,13 +20,13 @@ def createTaskPlanningPrompt(context: TaskContext, service) -> str:
     user_request = context.task_step.objective if context.task_step else 'No request specified'
     
     # Extract available documents from context - use Pydantic model directly
-    available_documents = context.available_documents or []
+    available_documents = context.available_documents or "No documents available"
     
     return f"""You are a task planning AI that analyzes user requests and creates structured task plans with user-friendly feedback messages.
 
 USER REQUEST: {user_request}
 
-AVAILABLE DOCUMENTS: {', '.join(available_documents)}
+AVAILABLE DOCUMENTS: {available_documents}
 
 INSTRUCTIONS:
 1. Analyze the user request and available documents
diff --git a/modules/chat/serviceCenter.py b/modules/chat/serviceCenter.py
index 703531f0..cef1555b 100644
--- a/modules/chat/serviceCenter.py
+++ b/modules/chat/serviceCenter.py
@@ -14,6 +14,7 @@ from modules.interfaces.interfaceChatModel import ActionResult
 from modules.interfaces.interfaceComponentObjects import getInterface as getComponentObjects
 from modules.interfaces.interfaceAppObjects import getInterface as getAppObjects
 from modules.chat.documents.documentExtraction import DocumentExtraction
+from modules.chat.documents.documentUtility import getFileExtension, getMimeTypeFromExtension, detectContentTypeFromData
 from modules.chat.methodBase import MethodBase
 from modules.shared.timezoneUtils import get_utc_timestamp
 import uuid
@@ -111,165 +112,9 @@ class ServiceCenter:
         except Exception as e:
             logger.error(f"Error discovering methods: {str(e)}")
 
-    def detectContentTypeFromData(self, fileData: bytes, fileName: str) -> str:
-        """
-        Detect content type from file data and fileName.
-        This method makes the MIME type detection function accessible through the service center.
-        
-        Args:
-            fileData: Raw file data as bytes
-            fileName: Name of the file
-            
-        Returns:
-            str: Detected MIME type
-        """
-        try:
-            # Check file extension first
-            ext = os.path.splitext(fileName)[1].lower()
-            if ext:
-                # Map common extensions to MIME types
-                extToMime = {
-                    '.txt': 'text/plain',
-                    '.md': 'text/markdown',
-                    '.csv': 'text/csv',
-                    '.json': 'application/json',
-                    '.xml': 'application/xml',
-                    '.js': 'application/javascript',
-                    '.py': 'application/x-python',
-                    '.svg': 'image/svg+xml',
-                    '.jpg': 'image/jpeg',
-                    '.jpeg': 'image/jpeg',
-                    '.png': 'image/png',
-                    '.gif': 'image/gif',
-                    '.bmp': 'image/bmp',
-                    '.webp': 'image/webp',
-                    '.pdf': 'application/pdf',
-                    '.docx': 'application/vnd.openxmlformats-officedocument.wordprocessingml.document',
-                    '.doc': 'application/msword',
-                    '.xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
-                    '.xls': 'application/vnd.ms-excel',
-                    '.pptx': 'application/vnd.openxmlformats-officedocument.presentationml.presentation',
-                    '.ppt': 'application/vnd.ms-powerpoint',
-                    '.html': 'text/html',
-                    '.htm': 'text/html',
-                    '.css': 'text/css',
-                    '.zip': 'application/zip',
-                    '.rar': 'application/x-rar-compressed',
-                    '.7z': 'application/x-7z-compressed',
-                    '.tar': 'application/x-tar',
-                    '.gz': 'application/gzip'
-                }
-                if ext in extToMime:
-                    return extToMime[ext]
-            
-            # Try to detect from content
-            if fileData.startswith(b'%PDF'):
-                return 'application/pdf'
-            elif fileData.startswith(b'PK\x03\x04'):
-                # ZIP-based formats (docx, xlsx, pptx)
-                return 'application/zip'
-            elif fileData.startswith(b'<'):
-                # XML-based formats
-                try:
-                    text = fileData.decode('utf-8', errors='ignore')
-                    if '<svg' in text.lower():
-                        return 'image/svg+xml'
-                    elif '<html' in text.lower():
-                        return 'text/html'
-                    else:
-                        return 'application/xml'
-                except:
-                    pass
-            elif fileData.startswith(b'\x89PNG\r\n\x1a\n'):
-                return 'image/png'
-            elif fileData.startswith(b'\xff\xd8\xff'):
-                return 'image/jpeg'
-            elif fileData.startswith(b'GIF87a') or fileData.startswith(b'GIF89a'):
-                return 'image/gif'
-            elif fileData.startswith(b'BM'):
-                return 'image/bmp'
-            elif fileData.startswith(b'RIFF') and fileData[8:12] == b'WEBP':
-                return 'image/webp'
-            
-            return 'application/octet-stream'
-            
-        except Exception as e:
-            logger.error(f"Error detecting content type from data: {str(e)}")
-            return 'application/octet-stream'
 
-    def getMimeTypeFromExtension(self, extension: str) -> str:
-        """
-        Get MIME type based on file extension.
-        This method consolidates MIME type detection from extension.
-        
-        Args:
-            extension: File extension (with or without dot)
-            
-        Returns:
-            str: MIME type for the extension
-        """
-        # Normalize extension (remove dot if present)
-        if extension.startswith('.'):
-            extension = extension[1:]
-        
-        # Map extensions to MIME types
-        mime_types = {
-            'txt': 'text/plain',
-            'json': 'application/json',
-            'xml': 'application/xml',
-            'csv': 'text/csv',
-            'html': 'text/html',
-            'htm': 'text/html',
-            'md': 'text/markdown',
-            'py': 'text/x-python',
-            'js': 'application/javascript',
-            'css': 'text/css',
-            'pdf': 'application/pdf',
-            'doc': 'application/msword',
-            'docx': 'application/vnd.openxmlformats-officedocument.wordprocessingml.document',
-            'xls': 'application/vnd.ms-excel',
-            'xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
-            'ppt': 'application/vnd.ms-powerpoint',
-            'pptx': 'application/vnd.openxmlformats-officedocument.presentationml.presentation',
-            'svg': 'image/svg+xml',
-            'jpg': 'image/jpeg',
-            'jpeg': 'image/jpeg',
-            'png': 'image/png',
-            'gif': 'image/gif',
-            'bmp': 'image/bmp',
-            'webp': 'image/webp',
-            'zip': 'application/zip',
-            'rar': 'application/x-rar-compressed',
-            '7z': 'application/x-7z-compressed',
-            'tar': 'application/x-tar',
-            'gz': 'application/gzip'
-        }
-        return mime_types.get(extension.lower(), 'application/octet-stream')
 
-    def getFileExtension(self, fileName: str) -> str:
-        """
-        Extract file extension from fileName.
-        
-        Args:
-            fileName: Name of the file
-            
-        Returns:
-            str: File extension (without dot)
-        """
-        if '.' in fileName:
-            return fileName.split('.')[-1].lower()
-        return "txt"  # Default to text
-
-    def getFileExtension(self, fileName):
-        """
-        Extract file extension from fileName (without dot, lowercased).
-        Returns empty string if no extension is found.
-        """
-        if '.' in fileName:
-            return fileName.rsplit('.', 1)[-1].lower()
-        return ''
-
-    # ===== Functions =====
+    # ===== Functions for Prompts: Context =====
             
     def getMethodsList(self) -> List[str]:
         """Get list of available methods with their signatures in the required format"""
@@ -283,157 +128,48 @@ class ServiceCenter:
                     methodList.append(signature)
         return methodList
 
-    def generateDocumentLabel(self, document: ChatDocument, message: ChatMessage) -> str:
-        """Generate new document label: round+task+action+filename.extension"""
+    async def summarizeChat(self, messages: List[ChatMessage]) -> str:
+        """
+        Summarize chat messages from last to first message with status="first"
+        
+        Args:
+            messages: List of chat messages to summarize
+            
+        Returns:
+            str: Summary of the chat in user's language
+        """
         try:
-            # Get workflow context from message
-            round_num = message.roundNumber if hasattr(message, 'roundNumber') else 1
-            task_num = message.taskNumber if hasattr(message, 'taskNumber') else 0
-            action_num = message.actionNumber if hasattr(message, 'actionNumber') else 0
+            # Get messages from last to first, stopping at first message with status="first"
+            relevantMessages = []
+            for msg in reversed(messages):
+                relevantMessages.append(msg)
+                if msg.status == "first":
+                    break
             
-            # Get file extension from document's fileName property
-            try:
-                file_extension = self.getFileExtension(document.fileName)
-                filename = document.fileName
-            except Exception as e:
-                # Try to diagnose and recover the issue
-                diagnosis = self.diagnoseDocumentAccess(document)
-                logger.error(f"Critical error: Cannot access document fileName for document {document.id}. Diagnosis: {diagnosis}")
-                
-                # Attempt recovery
-                if self.recoverDocumentAccess(document):
-                    try:
-                        file_extension = self.getFileExtension(document.fileName)
-                        filename = document.fileName
-                        logger.info(f"Document access recovered for {document.id}")
-                    except Exception as recovery_error:
-                        logger.error(f"Recovery failed for document {document.id}: {str(recovery_error)}")
-                        raise RuntimeError(f"Document {document.id} is permanently inaccessible after recovery attempt: {str(recovery_error)}")
-                else:
-                    # Recovery failed - don't continue with invalid data
-                    raise RuntimeError(f"Document {document.id} is inaccessible and recovery failed. Diagnosis: {diagnosis}")
-            
-            # Construct label: round1_task2_action3_filename.ext
-            if file_extension:
-                label = f"round{round_num}_task{task_num}_action{action_num}_{filename}"
-            else:
-                label = f"round{round_num}_task{task_num}_action{action_num}_{filename}"
-            
-            return label
-        except Exception as e:
-            logger.error(f"Critical error generating document label for document {document.id}: {str(e)}")
-            # Re-raise the error to prevent workflow from continuing with invalid data
-            raise
+            # Create prompt for AI
+            prompt = f"""You are an AI assistant providing a summary of a chat conversation.
+Please respond in '{self.user.language}' language.
 
-    def getDocumentReferenceList(self) -> Dict[str, List[DocumentExchange]]:
-        """Get list of document exchanges with new labeling format, sorted by recency"""
-        # Collect all documents first and refresh their attributes
-        all_documents = []
-        for message in self.workflow.messages:
-            if message.documents:
-                all_documents.extend(message.documents)
-        
-        # Refresh file attributes for all documents
-        if all_documents:
-            self.refreshDocumentFileAttributes(all_documents)
-        
-        chat_exchanges = []
-        history_exchanges = []
-        
-        # Process messages in reverse order; "first" marks boundary
-        in_current_round = True
-        for message in reversed(self.workflow.messages):
-            is_first = message.status == "first" if hasattr(message, 'status') else False
+Chat History:
+{chr(10).join(f"- {msg.message}" for msg in reversed(relevantMessages))}
+
+Instructions:
+1. Summarize the conversation's key points and outcomes
+2. Be concise but informative
+3. Use a professional but friendly tone
+4. Focus on important decisions and next steps if any
+
+Please provide a comprehensive summary of this conversation."""
             
-            # Build a DocumentExchange if message has documents
-            doc_exchange = None
-            if message.documents:
-                if message.actionId and message.documentsLabel:
-                    # Validate that we use the same label as in the message
-                    validated_label = self._validateDocumentLabelConsistency(message)
-                    
-                    # Use the message's actual documentsLabel
-                    doc_refs = []
-                    for doc in message.documents:
-                        doc_ref = self.getDocumentReferenceFromChatDocument(doc, message)
-                        doc_refs.append(doc_ref)
-                    
-                    doc_exchange = DocumentExchange(
-                        documentsLabel=validated_label,
-                        documents=doc_refs
-                    )
-                else:
-                    # Generate new labels for documents without explicit labels
-                    doc_refs = []
-                    for doc in message.documents:
-                        doc_ref = self.getDocumentReferenceFromChatDocument(doc, message)
-                        doc_refs.append(doc_ref)
-                    
-                    if doc_refs:
-                        # Create a label based on message context
-                        round_num = message.roundNumber if hasattr(message, 'roundNumber') else 1
-                        task_num = message.taskNumber if hasattr(message, 'taskNumber') else 0
-                        action_num = message.actionNumber if hasattr(message, 'actionNumber') else 0
-                        context_label = f"round{round_num}_task{task_num}_action{action_num}_context"
-                        
-                        doc_exchange = DocumentExchange(
-                            documentsLabel=context_label,
-                            documents=doc_refs
-                        )
+            # Get summary using AI
+            return await self.callAiTextBasic(prompt)
             
-            # Append to appropriate container based on boundary
-            if doc_exchange:
-                if in_current_round:
-                    chat_exchanges.append(doc_exchange)
-                else:
-                    history_exchanges.append(doc_exchange)
-            
-            # Flip boundary after including the "first" message in chat
-            if in_current_round and is_first:
-                in_current_round = False
-        
-        # Sort by recency: most recent first, then current round, then earlier rounds
-        # Sort chat exchanges by message sequence number (most recent first)
-        chat_exchanges.sort(key=lambda x: self._getMessageSequenceForExchange(x), reverse=True)
-        # Sort history exchanges by message sequence number (most recent first)
-        history_exchanges.sort(key=lambda x: self._getMessageSequenceForExchange(x), reverse=True)
-        
-        return {
-            "chat": chat_exchanges,
-            "history": history_exchanges
-        }
+        except Exception as e:
+            logger.error(f"Error summarizing chat: {str(e)}")
+            return f"Error summarizing chat: {str(e)}"
+
+    # ===== Functions for Prompts + Actions: Document References generation and resolution =====
     
-    def _getMessageSequenceForExchange(self, exchange: DocumentExchange) -> int:
-        """Get message sequence number for sorting exchanges by recency"""
-        try:
-            # Extract message ID from the first document reference
-            if exchange.documents and len(exchange.documents) > 0:
-                first_doc_ref = exchange.documents[0]
-                if first_doc_ref.startswith("docItem:"):
-                    # docItem:<id>:<label> - extract ID
-                    parts = first_doc_ref.split(':')
-                    if len(parts) >= 2:
-                        doc_id = parts[1]
-                        # Find the message containing this document
-                        for message in self.workflow.messages:
-                            if message.documents:
-                                for doc in message.documents:
-                                    if doc.id == doc_id:
-                                        return message.sequenceNr if hasattr(message, 'sequenceNr') else 0
-                elif first_doc_ref.startswith("docList:"):
-                    # docList:<message_id>:<label> - extract message ID
-                    parts = first_doc_ref.split(':')
-                    if len(parts) >= 2:
-                        message_id = parts[1]
-                        # Find the message by ID
-                        for message in self.workflow.messages:
-                            if str(message.id) == message_id:
-                                return message.sequenceNr if hasattr(message, 'sequenceNr') else 0
-            return 0
-        except Exception as e:
-            logger.error(f"Error getting message sequence for exchange: {str(e)}")
-            return 0
-
     def getEnhancedDocumentContext(self) -> str:
         """Get enhanced document context formatted for action planning prompts with proper docList and docItem references"""
         try:
@@ -509,6 +245,144 @@ class ServiceCenter:
             logger.error(f"Error generating enhanced document context: {str(e)}")
             return "NO DOCUMENTS AVAILABLE - Error generating document context."
 
+    def getDocumentReferenceList(self) -> Dict[str, List[DocumentExchange]]:
+        """Get list of document exchanges with new labeling format, sorted by recency"""
+        # Collect all documents first and refresh their attributes
+        all_documents = []
+        for message in self.workflow.messages:
+            if message.documents:
+                all_documents.extend(message.documents)
+        
+        # Refresh file attributes for all documents
+        if all_documents:
+            self._refreshDocumentFileAttributes(all_documents)
+        
+        chat_exchanges = []
+        history_exchanges = []
+        
+        # Process messages in reverse order; "first" marks boundary
+        in_current_round = True
+        for message in reversed(self.workflow.messages):
+            is_first = message.status == "first" if hasattr(message, 'status') else False
+            
+            # Build a DocumentExchange if message has documents
+            doc_exchange = None
+            if message.documents:
+                if message.actionId and message.documentsLabel:
+                    # Validate that we use the same label as in the message
+                    validated_label = self._validateDocumentLabelConsistency(message)
+                    
+                    # Use the message's actual documentsLabel
+                    doc_refs = []
+                    for doc in message.documents:
+                        doc_ref = self._getDocumentReferenceFromChatDocument(doc, message)
+                        doc_refs.append(doc_ref)
+                    
+                    doc_exchange = DocumentExchange(
+                        documentsLabel=validated_label,
+                        documents=doc_refs
+                    )
+                else:
+                    # Generate new labels for documents without explicit labels
+                    doc_refs = []
+                    for doc in message.documents:
+                        doc_ref = self._getDocumentReferenceFromChatDocument(doc, message)
+                        doc_refs.append(doc_ref)
+                    
+                    if doc_refs:
+                        # Create a label based on message context
+                        context_prefix = self._generateWorkflowContextPrefix(message)
+                        context_label = f"{context_prefix}_context"
+                        
+                        doc_exchange = DocumentExchange(
+                            documentsLabel=context_label,
+                            documents=doc_refs
+                        )
+            
+            # Append to appropriate container based on boundary
+            if doc_exchange:
+                if in_current_round:
+                    chat_exchanges.append(doc_exchange)
+                else:
+                    history_exchanges.append(doc_exchange)
+            
+            # Flip boundary after including the "first" message in chat
+            if in_current_round and is_first:
+                in_current_round = False
+        
+        # Sort by recency: most recent first, then current round, then earlier rounds
+        # Sort chat exchanges by message sequence number (most recent first)
+        chat_exchanges.sort(key=lambda x: self._getMessageSequenceForExchange(x), reverse=True)
+        # Sort history exchanges by message sequence number (most recent first)
+        history_exchanges.sort(key=lambda x: self._getMessageSequenceForExchange(x), reverse=True)
+        
+        return {
+            "chat": chat_exchanges,
+            "history": history_exchanges
+        }
+            
+    def _refreshDocumentFileAttributes(self, documents: List[ChatDocument]) -> None:
+        """Update file attributes (fileName, fileSize, mimeType) for documents"""
+        for doc in documents:
+            try:
+                file_item = self.interfaceComponent.getFile(doc.fileId)
+                if file_item:
+                    doc.fileName = file_item.fileName
+                    doc.fileSize = file_item.fileSize
+                    doc.mimeType = file_item.mimeType
+                else:
+                    logger.warning(f"File not found for document {doc.id}, fileId: {doc.fileId}")
+            except Exception as e:
+                logger.error(f"Error refreshing file attributes for document {doc.id}: {e}")
+
+    def _generateWorkflowContextPrefix(self, message: ChatMessage) -> str:
+        """Generate workflow context prefix: round{num}_task{num}_action{num}"""
+        round_num = message.roundNumber if hasattr(message, 'roundNumber') else 1
+        task_num = message.taskNumber if hasattr(message, 'taskNumber') else 0
+        action_num = message.actionNumber if hasattr(message, 'actionNumber') else 0
+        return f"round{round_num}_task{task_num}_action{action_num}"
+
+    def _getDocumentReferenceFromChatDocument(self, document: ChatDocument, message: ChatMessage) -> str:
+        """Get document reference using document ID and filename."""
+        try:
+            # Use document ID and filename for simple reference
+            return f"docItem:{document.id}:{document.fileName}"
+        except Exception as e:
+            logger.error(f"Critical error creating document reference for document {document.id}: {str(e)}")
+            # Re-raise the error to prevent workflow from continuing with invalid data
+            raise
+
+    def _getMessageSequenceForExchange(self, exchange: DocumentExchange) -> int:
+        """Get message sequence number for sorting exchanges by recency"""
+        try:
+            # Extract message ID from the first document reference
+            if exchange.documents and len(exchange.documents) > 0:
+                first_doc_ref = exchange.documents[0]
+                if first_doc_ref.startswith("docItem:"):
+                    # docItem:<id>:<label> - extract ID
+                    parts = first_doc_ref.split(':')
+                    if len(parts) >= 2:
+                        doc_id = parts[1]
+                        # Find the message containing this document
+                        for message in self.workflow.messages:
+                            if message.documents:
+                                for doc in message.documents:
+                                    if doc.id == doc_id:
+                                        return message.sequenceNr if hasattr(message, 'sequenceNr') else 0
+                elif first_doc_ref.startswith("docList:"):
+                    # docList:<message_id>:<label> - extract message ID
+                    parts = first_doc_ref.split(':')
+                    if len(parts) >= 2:
+                        message_id = parts[1]
+                        # Find the message by ID
+                        for message in self.workflow.messages:
+                            if str(message.id) == message_id:
+                                return message.sequenceNr if hasattr(message, 'sequenceNr') else 0
+            return 0
+        except Exception as e:
+            logger.error(f"Error getting message sequence for exchange: {str(e)}")
+            return 0
+
     def _validateDocumentLabelConsistency(self, message) -> str:
         """Validate that the document label used for references matches the message's actual label"""
         if not hasattr(message, 'documentsLabel') or not message.documentsLabel:
@@ -571,27 +445,6 @@ class ServiceCenter:
             logger.error(f"Error extracting document info from reference: {str(e)}")
             return None
 
-    def getDocumentReferenceFromChatDocument(self, document: ChatDocument, message: ChatMessage) -> str:
-        """Get document reference using document ID and filename."""
-        try:
-            # Use document ID and filename for simple reference
-            return f"docItem:{document.id}:{document.fileName}"
-        except Exception as e:
-            logger.error(f"Critical error creating document reference for document {document.id}: {str(e)}")
-            # Re-raise the error to prevent workflow from continuing with invalid data
-            raise
-    
-    def getDocumentListReferenceFromChatMessage(self, message: ChatMessage) -> str:
-        """Get document list reference using message ID and label."""
-        try:
-            # Use message ID and documentsLabel for document list reference
-            label = getattr(message, 'documentsLabel', f"message_{message.id}")
-            return f"docList:{message.id}:{label}"
-        except Exception as e:
-            logger.error(f"Critical error creating document list reference for message {message.id}: {str(e)}")
-            # Re-raise the error to prevent workflow from continuing with invalid data
-            raise
-    
     def getChatDocumentsFromDocumentList(self, documentList: List[str]) -> List[ChatDocument]:
         """Get ChatDocuments from a list of document references using all three formats."""
         try:
@@ -731,6 +584,8 @@ class ServiceCenter:
             logger.error(f"Error getting documents from document list: {str(e)}")
             return []
     
+    # ===== Functions for Prompts + Actions: Connection References generation and resolution =====
+            
     def getConnectionReferenceList(self) -> List[str]:
         """Get list of all UserConnection objects as references with enhanced state information"""
         connections = []
@@ -827,46 +682,8 @@ class ServiceCenter:
             logger.error(f"Error parsing connection reference: {str(e)}")
             return None
 
-    async def summarizeChat(self, messages: List[ChatMessage]) -> str:
-        """
-        Summarize chat messages from last to first message with status="first"
-        
-        Args:
-            messages: List of chat messages to summarize
+    # ===== Functions for Actions: AI calls =====
             
-        Returns:
-            str: Summary of the chat in user's language
-        """
-        try:
-            # Get messages from last to first, stopping at first message with status="first"
-            relevantMessages = []
-            for msg in reversed(messages):
-                relevantMessages.append(msg)
-                if msg.status == "first":
-                    break
-            
-            # Create prompt for AI
-            prompt = f"""You are an AI assistant providing a summary of a chat conversation.
-Please respond in '{self.user.language}' language.
-
-Chat History:
-{chr(10).join(f"- {msg.message}" for msg in reversed(relevantMessages))}
-
-Instructions:
-1. Summarize the conversation's key points and outcomes
-2. Be concise but informative
-3. Use a professional but friendly tone
-4. Focus on important decisions and next steps if any
-
-Please provide a comprehensive summary of this conversation."""
-            
-            # Get summary using AI
-            return await self.callAiTextBasic(prompt)
-            
-        except Exception as e:
-            logger.error(f"Error summarizing chat: {str(e)}")
-            return f"Error summarizing chat: {str(e)}"
-
     async def callAiTextAdvanced(self, prompt: str, context: str = None) -> str:
         """Advanced text processing using Anthropic, with fallback to OpenAI basic if advanced fails."""
         max_retries = 3
@@ -959,6 +776,8 @@ Please provide a comprehensive summary of this conversation."""
         
         return response
 
+    # ===== Functions for Actions: Data management =====
+            
     def getFileInfo(self, fileId: str) -> Dict[str, Any]:
         """Get file information"""
         file_item = self.interfaceComponent.getFile(fileId)
@@ -997,11 +816,11 @@ Please provide a comprehensive summary of this conversation."""
                 mimeType = document.mimeType
             except Exception as e:
                 # Try to diagnose and recover the issue
-                diagnosis = self.diagnoseDocumentAccess(document)
+                diagnosis = self._diagnoseDocumentAccess(document)
                 logger.error(f"Critical error: Cannot access document properties for document {document.id}. Diagnosis: {diagnosis}")
                 
                 # Attempt recovery
-                if self.recoverDocumentAccess(document):
+                if self._recoverDocumentAccess(document):
                     try:
                         fileName = document.fileName
                         mimeType = document.mimeType
@@ -1031,9 +850,78 @@ Please provide a comprehensive summary of this conversation."""
         except Exception as e:
             logger.error(f"Error extracting from document: {str(e)}")
             raise
-    
-    def createFile(self, fileName: str, mimeType: str, content: str, base64encoded: bool = False) -> str:
-        """Create new file and return its ID"""
+       
+    def _diagnoseDocumentAccess(self, document: ChatDocument) -> Dict[str, Any]:
+        """
+        Collect ids, component-interface state and a direct file lookup into a diagnosis dict.
+        Exceptions raised while diagnosing are caught and reported under 'error_details'.
+        """
+        try:
+            diagnosis = {
+                'document_id': document.id,
+                'file_id': document.fileId,
+                'has_component_interface': document._componentInterface is not None,
+                'component_interface_type': type(document._componentInterface).__name__ if document._componentInterface else None,
+                'file_exists': False,
+                'file_info': None,
+                'error_details': None
+            }
+            
+            # Without a component interface on the document, report that and skip the file lookup
+            if not document._componentInterface:
+                diagnosis['error_details'] = "Component interface not set - document cannot access file system"
+                return diagnosis
+            
+            # Look the file up through this service's interfaceComponent, not the document's own interface
+            try:
+                file_info = self.interfaceComponent.getFile(document.fileId)
+                if file_info:
+                    diagnosis['file_exists'] = True
+                    diagnosis['file_info'] = {
+                        'fileName': file_info.fileName if hasattr(file_info, 'fileName') else 'N/A',
+                        'fileSize': file_info.fileSize if hasattr(file_info, 'fileSize') else 'N/A',
+                        'mimeType': file_info.mimeType if hasattr(file_info, 'mimeType') else 'N/A'
+                    }
+                else:
+                    diagnosis['error_details'] = f"File with ID {document.fileId} not found in component interface"
+            except Exception as e:
+                diagnosis['error_details'] = f"Error accessing file {document.fileId}: {str(e)}"
+            
+            return diagnosis
+            
+        except Exception as e:
+            return {
+                'document_id': document.id if hasattr(document, 'id') else 'unknown',
+                'file_id': document.fileId if hasattr(document, 'fileId') else 'unknown',
+                'error_details': f"Error during diagnosis: {str(e)}"
+            }
+
+    def _recoverDocumentAccess(self, document: ChatDocument) -> bool:
+        """
+        Re-attach self.interfaceComponent to the document, then read document.fileName as a probe.
+        Returns True if the probe succeeds; caught failures are logged and return False.
+        """
+        try:
+            logger.info(f"Attempting to recover document access for document {document.id}")
+            
+            # Re-set the component interface
+            document.setComponentInterface(self.interfaceComponent)
+            
+            # Probe: reading fileName is the access that failed in the caller
+            try:
+                test_fileName = document.fileName
+                logger.info(f"Document access recovered for {document.id} -> {test_fileName}")
+                return True
+            except Exception as e:
+                logger.error(f"Document access recovery failed for {document.id}: {str(e)}")
+                return False
+                
+        except Exception as e:
+            logger.error(f"Error during document access recovery for {document.id}: {str(e)}")
+            return False
+
+    def createDocument(self, fileName: str, mimeType: str, content: str, base64encoded: bool = True) -> ChatDocument:
+        """Create document with file in one step - handles file creation internally"""
         # Convert content to bytes based on base64 flag
         if base64encoded:
             import base64
@@ -1051,27 +939,16 @@ Please provide a comprehensive summary of this conversation."""
         # Then store the file data
         self.interfaceComponent.createFileData(file_item.id, content_bytes)
         
-        return file_item.id
-    
-    def createDocument(self, fileName: str, mimeType: str, content: str, base64encoded: bool = True, existing_file_id: str = None) -> ChatDocument:
-        """Create document AND file from file data object created by AI call"""
-        # Use existing file ID if provided, otherwise create new file
-        if existing_file_id:
-            file_id = existing_file_id
-        else:
-            # First create the file and get its ID
-            file_id = self.createFile(fileName, mimeType, content, base64encoded)
-        
         # Get file info to copy attributes
-        file_info = self.getFileInfo(file_id)
+        file_info = self.getFileInfo(file_item.id)
         if not file_info:
-            logger.error(f"Could not get file info for fileId: {file_id}")
-            raise ValueError(f"File info not found for fileId: {file_id}")
+            logger.error(f"Could not get file info for fileId: {file_item.id}")
+            raise ValueError(f"File info not found for fileId: {file_item.id}")
         
         # Create document with all file attributes copied
         document = ChatDocument(
             id=str(uuid.uuid4()),
-            fileId=file_id,
+            fileId=file_item.id,
             fileName=file_info.get("fileName", fileName),
             fileSize=file_info.get("size", 0),
             mimeType=file_info.get("mimeType", mimeType)
@@ -1079,6 +956,8 @@ Please provide a comprehensive summary of this conversation."""
         
         return document
 
+    # ===== Internal public helper functions =====
+            
     def updateWorkflowStats(self, eventLabel: str = None, bytesSent: int = 0, bytesReceived: int = 0, tokenCount: int = 0) -> None:
         """
         Centralized function to update workflow statistics in database and running workflow.
@@ -1128,24 +1007,40 @@ Please provide a comprehensive summary of this conversation."""
             logger.error(f"Error calculating object size: {str(e)}")
             return 0
 
-    def getAvailableDocuments(self, workflow) -> List[str]:
+    def getAvailableDocuments(self, workflow) -> str:
         """
-        Get list of available document fileNames from workflow with new labeling format.
+        Summarize the workflow's documents as a count plus sorted, upper-cased file extensions.
         
         Args:
             workflow: ChatWorkflow object
             
         Returns:
-            List[str]: List of document labels in new format
+            str: "No documents available" or "<n> document(s) available[ (<EXT, ...> files)]"
         """
-        documents = []
+        total_documents = 0
+        document_types = set()
+        
         for message in workflow.messages:
-            for doc in message.documents:
-                # Generate new label format
-                label = self.generateDocumentLabel(doc, message)
-                documents.append(label)
-        return documents
+            if message.documents:
+                total_documents += len(message.documents)
+                for doc in message.documents:
+                    try:
+                        file_extension = getFileExtension(doc.fileName)
+                        if file_extension:
+                            document_types.add(file_extension.upper())
+                    except Exception:
+                        pass  # best effort: the count above still includes this document
+        
+        if total_documents == 0:
+            return "No documents available"
+        elif len(document_types) == 0:
+            return f"{total_documents} document(s) available"
+        else:
+            types_str = ", ".join(sorted(document_types))
+            return f"{total_documents} document(s) available ({types_str} files)"
 
+    # ===== Functions for Manager: Execution Tools =====
+            
     async def executeAction(self, methodName: str, actionName: str, parameters: Dict[str, Any]) -> ActionResult:
         """Execute a method action"""
         try:
@@ -1193,6 +1088,8 @@ Please provide a comprehensive summary of this conversation."""
         """Set user language for the service center"""
         self.user.language = language
 
+    # ===== Functions for Manager: Workflow Tools =====
+            
     def setWorkflowContext(self, round_number: int = None, task_number: int = None, action_number: int = None):
         """Set current workflow context for document generation and routing"""
         try:
@@ -1287,88 +1184,5 @@ Please provide a comprehensive summary of this conversation."""
                 'workflowId': 'unknown'
             }
 
-    def refreshDocumentFileAttributes(self, documents: List[ChatDocument]) -> None:
-        """Update file attributes (fileName, fileSize, mimeType) for documents"""
-        for doc in documents:
-            try:
-                file_item = self.interfaceComponent.getFile(doc.fileId)
-                if file_item:
-                    doc.fileName = file_item.fileName
-                    doc.fileSize = file_item.fileSize
-                    doc.mimeType = file_item.mimeType
-                else:
-                    logger.warning(f"File not found for document {doc.id}, fileId: {doc.fileId}")
-            except Exception as e:
-                logger.error(f"Error refreshing file attributes for document {doc.id}: {e}")
-
-    def diagnoseDocumentAccess(self, document: ChatDocument) -> Dict[str, Any]:
-        """
-        Diagnose document access issues and provide recovery information.
-        This method helps identify why document properties are inaccessible.
-        """
-        try:
-            diagnosis = {
-                'document_id': document.id,
-                'file_id': document.fileId,
-                'has_component_interface': document._componentInterface is not None,
-                'component_interface_type': type(document._componentInterface).__name__ if document._componentInterface else None,
-                'file_exists': False,
-                'file_info': None,
-                'error_details': None
-            }
-            
-            # Check if component interface is set
-            if not document._componentInterface:
-                diagnosis['error_details'] = "Component interface not set - document cannot access file system"
-                return diagnosis
-            
-            # Try to access the file directly
-            try:
-                file_info = self.interfaceComponent.getFile(document.fileId)
-                if file_info:
-                    diagnosis['file_exists'] = True
-                    diagnosis['file_info'] = {
-                        'fileName': file_info.fileName if hasattr(file_info, 'fileName') else 'N/A',
-                        'fileSize': file_info.fileSize if hasattr(file_info, 'fileSize') else 'N/A',
-                        'mimeType': file_info.mimeType if hasattr(file_info, 'mimeType') else 'N/A'
-                    }
-                else:
-                    diagnosis['error_details'] = f"File with ID {document.fileId} not found in component interface"
-            except Exception as e:
-                diagnosis['error_details'] = f"Error accessing file {document.fileId}: {str(e)}"
-            
-            return diagnosis
-            
-        except Exception as e:
-            return {
-                'document_id': document.id if hasattr(document, 'id') else 'unknown',
-                'file_id': document.fileId if hasattr(document, 'fileId') else 'unknown',
-                'error_details': f"Error during diagnosis: {str(e)}"
-            }
-
-    def recoverDocumentAccess(self, document: ChatDocument) -> bool:
-        """
-        Attempt to recover document access by re-setting the component interface.
-        Returns True if recovery was successful.
-        """
-        try:
-            logger.info(f"Attempting to recover document access for document {document.id}")
-            
-            # Re-set the component interface
-            document.setComponentInterface(self.interfaceComponent)
-            
-            # Test if we can now access the fileName
-            try:
-                test_fileName = document.fileName
-                logger.info(f"Document access recovered for {document.id} -> {test_fileName}")
-                return True
-            except Exception as e:
-                logger.error(f"Document access recovery failed for {document.id}: {str(e)}")
-                return False
-                
-        except Exception as e:
-            logger.error(f"Error during document access recovery for {document.id}: {str(e)}")
-            return False
-
 # Create singleton instance
 serviceObject = None
diff --git a/modules/interfaces/interfaceChatModel.py b/modules/interfaces/interfaceChatModel.py
index ddf68edf..769e94c9 100644
--- a/modules/interfaces/interfaceChatModel.py
+++ b/modules/interfaces/interfaceChatModel.py
@@ -732,7 +732,7 @@ class TaskContext(BaseModel, ModelMixin):
     workflow_id: Optional[str] = None
     
     # Available resources
-    available_documents: Optional[list[str]] = []
+    available_documents: Optional[str] = "No documents available"
     available_connections: Optional[list[str]] = []
     
     # Previous execution state
@@ -755,8 +755,8 @@ class TaskContext(BaseModel, ModelMixin):
     criteria_progress: Optional[dict] = None
     
     def getDocumentReferences(self) -> List[str]:
-        """Get all available document references"""
-        docs = self.available_documents or []
+        """Get all available document references from previous handover"""
+        docs = []
         if self.previous_handover:
             for doc_exchange in self.previous_handover.inputDocuments:
                 docs.extend(doc_exchange.documents)
diff --git a/modules/methods/methodOutlook.py b/modules/methods/methodOutlook.py
index 1c9872c3..2c2c90ce 100644
--- a/modules/methods/methodOutlook.py
+++ b/modules/methods/methodOutlook.py
@@ -731,8 +731,6 @@ class MethodOutlook(MethodBase):
                         attachment_docs = self.service.getChatDocumentsFromDocumentList([attachment_ref])
                         if attachment_docs:
                             for doc in attachment_docs:
-                
-                                
                                 # Get the actual file content using fileId
                                 file_id = getattr(doc, 'fileId', None)
                                 if file_id:
@@ -757,15 +755,15 @@ class MethodOutlook(MethodBase):
                                                 "contentBytes": base64_content
                                             }
                                             message["attachments"].append(attachment)
-                            
+                                        
                                         else:
                                             logger.warning(f"No content found for attachment: {doc.fileName}")
                                     except Exception as e:
                                         logger.error(f"Error reading attachment file {doc.fileName}: {str(e)}")
                                 else:
                                     logger.warning(f"Attachment document has no fileId: {doc.fileName}")
-                            else:
-                                logger.warning(f"No attachment documents found for reference: {attachment_ref}")
+                        else:
+                            logger.warning(f"No attachment documents found for reference: {attachment_ref}")
                 
                 # Create the draft message
                 # First, get the Drafts folder ID to ensure the draft is created there
diff --git a/modules/methods/methodSharepoint.py b/modules/methods/methodSharepoint.py
index 3e808645..12af28d6 100644
--- a/modules/methods/methodSharepoint.py
+++ b/modules/methods/methodSharepoint.py
@@ -65,6 +65,7 @@ class MethodSharepoint(MethodBase):
             
             return {
                 "id": userConnection.id,
+                "userConnection": userConnection,
                 "accessToken": token.tokenAccess,
                 "refreshToken": token.tokenRefresh,
                 "scopes": ["Sites.ReadWrite.All", "Files.ReadWrite.All", "User.Read"]  # SharePoint scopes
@@ -73,6 +74,183 @@ class MethodSharepoint(MethodBase):
             logger.error(f"Error getting Microsoft connection: {str(e)}")
             return None
     
+    async def _discoverSharePointSites(self, access_token: str) -> List[Dict[str, Any]]:
+        """
+        Discover all SharePoint sites accessible to the user via Microsoft Graph API
+        
+        Parameters:
+            access_token (str): Microsoft Graph access token
+            
+        Returns:
+            List[Dict[str, Any]]: List of SharePoint site information (empty list on any error)
+        """
+        try:
+            # NOTE(review): only result["value"] of this one response is used - paging, if any, is not followed
+            endpoint = "sites?search=*"
+            result = await self._makeGraphApiCall(access_token, endpoint)
+            
+            if "error" in result:
+                logger.error(f"Error discovering SharePoint sites: {result['error']}")
+                return []
+            
+            sites = result.get("value", [])
+            logger.info(f"Discovered {len(sites)} SharePoint sites")
+            
+            # Project each raw site onto a fixed set of keys (keys missing from the response become None)
+            processed_sites = []
+            for site in sites:
+                site_info = {
+                    "id": site.get("id"),
+                    "displayName": site.get("displayName"),
+                    "name": site.get("name"),
+                    "webUrl": site.get("webUrl"),
+                    "description": site.get("description"),
+                    "createdDateTime": site.get("createdDateTime"),
+                    "lastModifiedDateTime": site.get("lastModifiedDateTime")
+                }
+                processed_sites.append(site_info)
+                logger.debug(f"Site: {site_info['displayName']} - {site_info['webUrl']}")
+            
+            return processed_sites
+            
+        except Exception as e:
+            logger.error(f"Error discovering SharePoint sites: {str(e)}")
+            return []
+    
+    def _parseSearchQuery(self, searchQuery: str) -> tuple[str, str, str, dict]:
+        """
+        Parse searchQuery to extract path, search terms, search type, and search options.
+        
+        Parameters:
+            searchQuery (str): "[type:][mode:][path:]terms" - prefixes are consumed in that order:
+                - "budget" -> pathQuery="*", fileQuery="budget", searchType="all", options={}
+                - "/Documents:budget" -> pathQuery="/Documents", fileQuery="budget", searchType="all", options={}
+                - "files:budget" -> pathQuery="*", fileQuery="budget", searchType="files", options={}
+                - "folders:DELTA" -> pathQuery="*", fileQuery="DELTA", searchType="folders", options={}
+                - "exact:\"Operations 2025\"" -> exact phrase matching
+                - "regex:^Operations.*2025$" -> regex pattern matching
+                - "case:DELTA" -> case-sensitive search
+                - "and:DELTA AND 2025 Mars AND Group" -> all AND terms must be present
+        
+        Returns:
+            tuple[str, str, str, dict]: (pathQuery, fileQuery, searchType, searchOptions); ("*", "*", "all", {}) on error
+        """
+        try:
+            if not searchQuery or not searchQuery.strip() or searchQuery.strip() == "*":
+                return "*", "*", "all", {}
+            
+            searchQuery = searchQuery.strip()
+            searchOptions = {}
+            
+            # Check for search type specification (files:, folders:, all:)
+            searchType = "all"  # Default
+            if searchQuery.startswith(("files:", "folders:", "all:")):
+                type_parts = searchQuery.split(':', 1)
+                searchType = type_parts[0].strip()
+                searchQuery = type_parts[1].strip()
+            
+            # Check for search mode specification (exact:, regex:, case:, and:)
+            if searchQuery.startswith(("exact:", "regex:", "case:", "and:")):
+                mode_parts = searchQuery.split(':', 1)
+                mode = mode_parts[0].strip()
+                searchQuery = mode_parts[1].strip()
+                
+                if mode == "exact":
+                    searchOptions["exact_match"] = True
+                    # Remove quotes if present
+                    if searchQuery.startswith('"') and searchQuery.endswith('"'):
+                        searchQuery = searchQuery[1:-1]
+                elif mode == "regex":
+                    searchOptions["regex_match"] = True
+                elif mode == "case":
+                    searchOptions["case_sensitive"] = True
+                elif mode == "and":
+                    searchOptions["and_terms"] = True
+            
+            # Any remaining ':' means path:search (NOTE(review): also splits exact:/regex: text that contains ':')
+            if ':' in searchQuery:
+                parts = searchQuery.split(':', 1)  # Split only on first colon
+                path_part = parts[0].strip()
+                search_part = parts[1].strip()
+                
+                # Handle path part
+                if not path_part or path_part == "*":
+                    pathQuery = "*"
+                elif path_part.startswith('/'):
+                    pathQuery = path_part
+                else:
+                    pathQuery = f"/Documents/{path_part}"  # relative path: rooted at /Documents
+                
+                # Handle search part
+                if not search_part or search_part == "*":
+                    fileQuery = "*"
+                else:
+                    fileQuery = search_part
+                
+                return pathQuery, fileQuery, searchType, searchOptions
+            
+            # No colon - check if it looks like a path
+            elif searchQuery.startswith('/'):
+                # It's a path only
+                return searchQuery, "*", searchType, searchOptions
+            
+            else:
+                # It's a search term only
+                return "*", searchQuery, searchType, searchOptions
+                
+        except Exception as e:
+            logger.error(f"Error parsing searchQuery '{searchQuery}': {str(e)}")
+            return "*", "*", "all", {}
+    
+    def _resolvePathQuery(self, pathQuery: str) -> List[str]:
+        """
+        Resolve pathQuery into a list of search paths for SharePoint operations.
+        
+        Parameters:
+            pathQuery (str): Query string that can contain:
+                - Direct paths (e.g., "/Documents/Project1")
+                - Wildcards (e.g., "/Documents/*")
+                - Multiple paths separated by semicolons (e.g., "/Docs; /Files")
+                - Relative paths (e.g., "Project1" -> "/Documents/Project1")
+                - Empty string or "*" for global search
+        
+        Returns:
+            List[str]: De-duplicated paths in input order; ["*"] for global search or on error
+        """
+        try:
+            if not pathQuery or not pathQuery.strip() or pathQuery.strip() == "*":
+                return ["*"]  # Global search across all sites
+            
+            # Split by semicolon to handle multiple paths
+            raw_paths = [path.strip() for path in pathQuery.split(';') if path.strip()]
+            resolved_paths = []
+            
+            for raw_path in raw_paths:
+                # Any path containing '*' is kept as-is (checked first, so relative ones get no /Documents prefix)
+                if '*' in raw_path:
+                    resolved_paths.append(raw_path)
+                # Handle absolute paths
+                elif raw_path.startswith('/'):
+                    resolved_paths.append(raw_path)
+                # Handle relative paths - prepend default folder
+                else:
+                    resolved_paths.append(f"/Documents/{raw_path}")
+            
+            # Remove duplicates while preserving order
+            seen = set()
+            unique_paths = []
+            for path in resolved_paths:
+                if path not in seen:
+                    seen.add(path)
+                    unique_paths.append(path)
+            
+            logger.info(f"Resolved pathQuery '{pathQuery}' to {len(unique_paths)} paths: {unique_paths}")
+            return unique_paths
+            
+        except Exception as e:
+            logger.error(f"Error resolving pathQuery '{pathQuery}': {str(e)}")
+            return ["*"]  # Fallback to global search
+    
     def _parseSiteUrl(self, siteUrl: str) -> Dict[str, str]:
         """Parse SharePoint site URL to extract hostname and site path"""
         try:
@@ -167,99 +345,157 @@ class MethodSharepoint(MethodBase):
     @action
     async def findDocumentPath(self, parameters: Dict[str, Any]) -> ActionResult:
         """
-        Find document path based on query/description
+        Find files and folders across all accessible SharePoint sites; non-wildcard queries are matched against item names
         
         Parameters:
             connectionReference (str): Reference to the Microsoft connection
-            siteUrl (str): SharePoint site URL
-            query (str): Query or description to find document
-            searchScope (str, optional): Search scope (default: "all")
+            searchQuery (str): [path:][type:][mode:]query - Enhanced search syntax:
+                - "budget", "/Documents:budget", "files:budget", "folders:DELTA", "*"
+                - "exact:\"Operations 2025\"" - exact phrase matching
+                - "regex:^Operations.*2025$" - regex pattern matching  
+                - "case:DELTA" - case-sensitive search
+                - "and:DELTA AND 2025 Mars AND Group" - all terms must be present
+                - "folders:and:DELTA AND 2025 Mars AND Group" - combined options
+                Note: For storage locations, use "folders:" prefix. All search terms must be present by default.
+            searchScope (str, optional): Search scope - options: "all" (default), "documents" (files only), "pages" (SharePoint pages only)
+            maxResults (int, optional): Maximum number of results to return (default: 100)
             expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
         """
         try:
             connectionReference = parameters.get("connectionReference")
-            siteUrl = parameters.get("siteUrl")
-            query = parameters.get("query")
+            searchQuery = parameters.get("searchQuery", "*")
             searchScope = parameters.get("searchScope", "all")
+            maxResults = parameters.get("maxResults", 100)
             expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
             
-            if not connectionReference or not siteUrl or not query:
-                return ActionResult.isFailure(error="Connection reference, site URL, and query are required")
+            if not connectionReference:
+                return ActionResult.isFailure(error="Connection reference is required")
+            
+            # Parse searchQuery to extract path, search terms, search type, and options
+            pathQuery, fileQuery, searchType, searchOptions = self._parseSearchQuery(searchQuery)
             
             connection = self._getMicrosoftConnection(connectionReference)
             if not connection:
                 return ActionResult.isFailure(error="No valid Microsoft connection found for the provided connection reference")
             
-            # Parse site URL to get hostname and site path
-            site_info = self._parseSiteUrl(siteUrl)
-            if not site_info["hostname"] or not site_info["sitePath"]:
-                return ActionResult.isFailure(error=f"Invalid SharePoint site URL: {siteUrl}")
+            # Discover all SharePoint sites accessible to the user
+            sites = await self._discoverSharePointSites(connection["accessToken"])
+            if not sites:
+                return ActionResult.isFailure(error="No SharePoint sites found or accessible")
             
-            # Get site ID
-            site_id = await self._getSiteId(connection["accessToken"], site_info["hostname"], site_info["sitePath"])
-            if not site_id:
-                return ActionResult.isFailure(error="Failed to get SharePoint site ID")
+            # Resolve path query into search paths
+            search_paths = self._resolvePathQuery(pathQuery)
             
             try:
-                # Use Microsoft Graph search API
-                search_query = query.replace("'", "''")  # Escape single quotes for OData
-                endpoint = f"sites/{site_id}/drive/root/search(q='{search_query}')"
-                
-                # Make the search API call
-                search_result = await self._makeGraphApiCall(connection["accessToken"], endpoint)
-                
-                if "error" in search_result:
-                    return ActionResult.isFailure(error=f"Search failed: {search_result['error']}")
-                
-                # Process search results
-                items = search_result.get("value", [])
+                # Search across all discovered sites
                 found_documents = []
+                all_sites_searched = []
                 
-                for item in items:
-                    # Filter by search scope if specified
-                    if searchScope == "documents" and "folder" in item:
-                        continue
-                    elif searchScope == "pages" and "file" in item and not item["file"].get("mimeType", "").startswith("text/html"):
+                for site in sites:
+                    site_id = site["id"]
+                    site_name = site["displayName"]
+                    site_url = site["webUrl"]
+                    
+                    logger.info(f"Searching in site: {site_name} ({site_url})")
+                    
+                    # Use Microsoft Graph search API for this specific site
+                    # Handle empty or wildcard queries
+                    if not fileQuery or fileQuery.strip() == "" or fileQuery.strip() == "*":
+                        # For wildcard/empty queries, list all items in the drive
+                        endpoint = f"sites/{site_id}/drive/root/children"
+                    else:
+                        # For specific queries, use search API
+                        search_query = fileQuery.replace("'", "''")  # Escape single quotes for OData
+                        endpoint = f"sites/{site_id}/drive/root/search(q='{search_query}')"
+                    
+                    # Make the search API call
+                    search_result = await self._makeGraphApiCall(connection["accessToken"], endpoint)
+                    
+                    if "error" in search_result:
+                        logger.warning(f"Search failed for site {site_name}: {search_result['error']}")
                         continue
                     
-                    doc_info = {
-                        "id": item.get("id"),
-                        "name": item.get("name"),
-                        "path": item.get("parentReference", {}).get("path", "") + "/" + item.get("name", ""),
-                        "size": item.get("size", 0),
-                        "createdDateTime": item.get("createdDateTime"),
-                        "lastModifiedDateTime": item.get("lastModifiedDateTime"),
-                        "webUrl": item.get("webUrl"),
-                        "type": "folder" if "folder" in item else "file"
-                    }
+                    # Process search results for this site
+                    items = search_result.get("value", [])
+                    site_documents = []
                     
-                    # Add file-specific information
-                    if "file" in item:
-                        doc_info.update({
-                            "mimeType": item["file"].get("mimeType"),
-                            "downloadUrl": item.get("@microsoft.graph.downloadUrl")
-                        })
+                    for item in items:
+                        # Filter by search scope if specified
+                        if searchScope == "documents" and "folder" in item:
+                            continue
+                        elif searchScope == "pages" and "file" in item and not item["file"].get("mimeType", "").startswith("text/html"):
+                            continue
+                        
+                        # Filter by search type (files, folders, all)
+                        if searchType == "files" and "folder" in item:
+                            continue
+                        elif searchType == "folders" and "file" in item:
+                            continue
+                        
+                        # Enhanced post-filtering based on search options
+                        item_name = item.get("name", "")
+                        if fileQuery != "*" and fileQuery.strip():
+                            # Apply different filtering based on search options
+                            if searchOptions.get("exact_match"):
+                                # Exact phrase matching
+                                if searchOptions.get("case_sensitive"):
+                                    if fileQuery not in item_name:
+                                        continue
+                                else:
+                                    if fileQuery.lower() not in item_name.lower():
+                                        continue
+                            elif searchOptions.get("regex_match"):
+                                # Regex pattern matching
+                                import re
+                                flags = 0 if searchOptions.get("case_sensitive") else re.IGNORECASE
+                                if not re.search(fileQuery, item_name, flags):
+                                    continue
+                            elif searchOptions.get("and_terms"):
+                                # AND terms mode: Split by " AND " and ensure ALL terms are present
+                                search_name = item_name.lower() if not searchOptions.get("case_sensitive") else item_name
+                                and_terms = [term.strip() for term in fileQuery.split(" AND ") if term.strip()]
+                                and_terms = [term.lower() if not searchOptions.get("case_sensitive") else term for term in and_terms]
+                                if not all(term in search_name for term in and_terms):
+                                    continue  # Skip this item if not all AND terms match
+                            else:
+                                # Default: ALL search terms must be present (space-separated)
+                                search_name = item_name.lower() if not searchOptions.get("case_sensitive") else item_name
+                                search_terms = [term.strip().lower() if not searchOptions.get("case_sensitive") else term.strip() 
+                                              for term in fileQuery.split() if term.strip()]
+                                if not all(term in search_name for term in search_terms):
+                                    continue  # Skip this item if not all terms match
+                        
+                        # Create minimal result with only essential reference information
+                        doc_info = {
+                            "id": item.get("id"),
+                            "name": item.get("name"),
+                            "type": "folder" if "folder" in item else "file",
+                            "siteName": site_name,
+                            "siteId": site_id
+                        }
+                        
+                        site_documents.append(doc_info)
                     
-                    # Add folder-specific information
-                    if "folder" in item:
-                        doc_info.update({
-                            "childCount": item["folder"].get("childCount", 0)
-                        })
+                    found_documents.extend(site_documents)
+                    all_sites_searched.append({
+                        "siteName": site_name,
+                        "siteUrl": site_url,
+                        "siteId": site_id,
+                        "documentsFound": len(site_documents)
+                    })
                     
-                    found_documents.append(doc_info)
+                    logger.info(f"Found {len(site_documents)} documents in site {site_name}")
+                
+                # Limit total results to maxResults
+                if len(found_documents) > maxResults:
+                    found_documents = found_documents[:maxResults]
+                    logger.info(f"Limited results to {maxResults} items")
                 
                 result_data = {
-                    "connectionReference": connectionReference,
-                    "siteUrl": siteUrl,
-                    "query": query,
-                    "searchScope": searchScope,
+                    "searchQuery": searchQuery,
                     "totalResults": len(found_documents),
+                    "maxResults": maxResults,
                     "foundDocuments": found_documents,
-                    "connection": {
-                        "id": connection["id"],
-                        "authority": "microsoft",
-                        "reference": connectionReference
-                    },
                     "timestamp": get_utc_timestamp()
                 }
                 
@@ -296,46 +532,32 @@ class MethodSharepoint(MethodBase):
             return ActionResult.isFailure(error=str(e))
     
     @action
-    async def readDocument(self, parameters: Dict[str, Any]) -> ActionResult:
+    async def readDocuments(self, parameters: Dict[str, Any]) -> ActionResult:
         """
-        Read documents from SharePoint
+        Read documents from SharePoint across all accessible sites
         
         Parameters:
             documentList (str): Reference to the document list to read
             connectionReference (str): Reference to the Microsoft connection
-            siteUrl (str): SharePoint site URL
-            documentPaths (List[str]): List of paths to the documents in SharePoint
+            pathQuery (str): Path query to locate documents (e.g., "/Documents/Project1", "*" for all sites)
             includeMetadata (bool, optional): Whether to include metadata (default: True)
             expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
         """
         try:
             documentList = parameters.get("documentList")
             connectionReference = parameters.get("connectionReference")
-            siteUrl = parameters.get("siteUrl")
-            documentPaths = parameters.get("documentPaths")
+            pathQuery = parameters.get("pathQuery", "*")
             includeMetadata = parameters.get("includeMetadata", True)
             expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
             
-            if not documentList or not connectionReference or not siteUrl or not documentPaths:
-                return ActionResult.isFailure(error="Document list reference, connection reference, site URL, and document paths are required")
+            if not documentList or not connectionReference:
+                return ActionResult.isFailure(error="Document list reference and connection reference are required")
             
             # Get documents from reference - ensure documentList is a list, not a string
             if isinstance(documentList, str):
                 documentList = [documentList]  # Convert string to list
             chatDocuments = self.service.getChatDocumentsFromDocumentList(documentList)
             
-            # For testing: if no chat documents found, create mock documents based on document paths
-            if not chatDocuments and documentPaths:
-                logger.info("No chat documents found, creating mock documents for testing based on document paths")
-                chatDocuments = []
-                for i, path in enumerate(documentPaths):
-                    mock_doc = type('MockChatDocument', (), {
-                        'fileId': f'mock_file_id_{i}',
-                        'fileName': path.split('/')[-1] if '/' in path else path
-                    })()
-                    chatDocuments.append(mock_doc)
-                logger.info(f"Created {len(chatDocuments)} mock documents for testing")
-            
             if not chatDocuments:
                 return ActionResult.isFailure(error="No documents found for the provided reference")
             
@@ -343,111 +565,128 @@ class MethodSharepoint(MethodBase):
             if not connection:
                 return ActionResult.isFailure(error="No valid Microsoft connection found for the provided connection reference")
             
-            # Parse site URL to get hostname and site path
-            site_info = self._parseSiteUrl(siteUrl)
-            if not site_info["hostname"] or not site_info["sitePath"]:
-                return ActionResult.isFailure(error=f"Invalid SharePoint site URL: {siteUrl}")
+            # Discover all SharePoint sites accessible to the user
+            sites = await self._discoverSharePointSites(connection["accessToken"])
+            if not sites:
+                return ActionResult.isFailure(error="No SharePoint sites found or accessible")
             
-            # Get site ID
-            site_id = await self._getSiteId(connection["accessToken"], site_info["hostname"], site_info["sitePath"])
-            if not site_id:
-                return ActionResult.isFailure(error="Failed to get SharePoint site ID")
+            # Resolve path query into search paths
+            search_paths = self._resolvePathQuery(pathQuery)
             
-            # Process each document path
+            # Process each chat document across all sites
             read_results = []
             
-            for i, documentPath in enumerate(documentPaths):
+            for i, chatDocument in enumerate(chatDocuments):
                 try:
-                    # Check if documentPath is actually a file ID (starts with 016GRP6V)
-                    if documentPath.startswith('016GRP6V'):
-                        # Use file ID directly
-                        file_endpoint = f"sites/{site_id}/drive/items/{documentPath}"
-                        logger.info(f"Reading file by ID: {documentPath}")
-                    else:
-                        # First, find the file by its path
-                        path_clean = documentPath.lstrip('/')
-                        file_endpoint = f"sites/{site_id}/drive/root:/{path_clean}"
-                        logger.info(f"Reading file by path: {path_clean}")
+                    fileId = chatDocument.fileId
+                    fileName = chatDocument.fileName
                     
-                    # Get file metadata
-                    file_info_result = await self._makeGraphApiCall(connection["accessToken"], file_endpoint)
+                    # Search for this file across all sites
+                    file_found = False
                     
-                    if "error" in file_info_result:
-                        read_results.append({
-                            "documentPath": documentPath,
-                            "error": f"File not found: {file_info_result['error']}",
-                            "content": None
-                        })
-                        continue
-                    
-                    file_id = file_info_result.get("id")
-                    if not file_id:
-                        read_results.append({
-                            "documentPath": documentPath,
-                            "error": "Could not get file ID",
-                            "content": None
-                        })
-                        continue
-                    
-                    # Build result with metadata
-                    result_item = {
-                        "documentPath": documentPath,
-                        "fileId": file_id,
-                        "fileName": file_info_result.get("name"),
-                        "size": file_info_result.get("size", 0),
-                        "createdDateTime": file_info_result.get("createdDateTime"),
-                        "lastModifiedDateTime": file_info_result.get("lastModifiedDateTime"),
-                        "webUrl": file_info_result.get("webUrl")
-                    }
-                    
-                    # Add metadata if requested
-                    if includeMetadata:
-                        result_item["metadata"] = {
-                            "mimeType": file_info_result.get("file", {}).get("mimeType"),
-                            "downloadUrl": file_info_result.get("@microsoft.graph.downloadUrl"),
-                            "createdBy": file_info_result.get("createdBy", {}),
-                            "lastModifiedBy": file_info_result.get("lastModifiedBy", {}),
-                            "parentReference": file_info_result.get("parentReference", {})
-                        }
-                    
-                    # Get file content if it's a readable format
-                    mime_type = file_info_result.get("file", {}).get("mimeType", "")
-                    if mime_type.startswith("text/") or mime_type in [
-                        "application/json", "application/xml", "application/javascript"
-                    ]:
-                        # Download the file content
-                        content_endpoint = f"sites/{site_id}/drive/items/{file_id}/content"
+                    for site in sites:
+                        site_id = site["id"]
+                        site_name = site["displayName"]
+                        site_url = site["webUrl"]
                         
-                        # For content download, we need to handle binary data
-                        try:
-                            async with aiohttp.ClientSession() as session:
-                                headers = {"Authorization": f"Bearer {connection['accessToken']}"}
-                                async with session.get(f"https://graph.microsoft.com/v1.0/{content_endpoint}", headers=headers) as response:
-                                    if response.status == 200:
-                                        content = await response.text()
-                                        result_item["content"] = content
-                                    else:
-                                        result_item["content"] = f"Could not download content: HTTP {response.status}"
-                        except Exception as e:
-                            result_item["content"] = f"Error downloading content: {str(e)}"
-                    else:
-                        result_item["content"] = f"Binary file type ({mime_type}) - content not retrieved"
+                        # Try to find the file by name in this site
+                        search_query = fileName.replace("'", "''")  # Escape single quotes for OData
+                        endpoint = f"sites/{site_id}/drive/root/search(q='{search_query}')"
+                        
+                        search_result = await self._makeGraphApiCall(connection["accessToken"], endpoint)
+                        
+                        if "error" in search_result:
+                            continue
+                        
+                        items = search_result.get("value", [])
+                        for item in items:
+                            if item.get("name") == fileName:
+                                # Found the file, get its details
+                                file_id = item.get("id")
+                                file_endpoint = f"sites/{site_id}/drive/items/{file_id}"
+                                
+                                # Get file metadata
+                                file_info_result = await self._makeGraphApiCall(connection["accessToken"], file_endpoint)
+                                
+                                if "error" in file_info_result:
+                                    continue
+                                
+                                # Build result with metadata
+                                result_item = {
+                                    "fileId": fileId,
+                                    "fileName": fileName,
+                                    "sharepointFileId": file_id,
+                                    "siteName": site_name,
+                                    "siteUrl": site_url,
+                                    "size": file_info_result.get("size", 0),
+                                    "createdDateTime": file_info_result.get("createdDateTime"),
+                                    "lastModifiedDateTime": file_info_result.get("lastModifiedDateTime"),
+                                    "webUrl": file_info_result.get("webUrl")
+                                }
+                                
+                                # Add metadata if requested
+                                if includeMetadata:
+                                    result_item["metadata"] = {
+                                        "mimeType": file_info_result.get("file", {}).get("mimeType"),
+                                        "downloadUrl": file_info_result.get("@microsoft.graph.downloadUrl"),
+                                        "createdBy": file_info_result.get("createdBy", {}),
+                                        "lastModifiedBy": file_info_result.get("lastModifiedBy", {}),
+                                        "parentReference": file_info_result.get("parentReference", {})
+                                    }
+                                
+                                # Get file content if it's a readable format
+                                mime_type = file_info_result.get("file", {}).get("mimeType", "")
+                                if mime_type.startswith("text/") or mime_type in [
+                                    "application/json", "application/xml", "application/javascript"
+                                ]:
+                                    # Download the file content
+                                    content_endpoint = f"sites/{site_id}/drive/items/{file_id}/content"
+                                    
+                                    # Only text-like MIME types reach this branch, so the body is decoded as text
+                                    try:
+                                        async with aiohttp.ClientSession() as session:
+                                            headers = {"Authorization": f"Bearer {connection['accessToken']}"}
+                                            async with session.get(f"https://graph.microsoft.com/v1.0/{content_endpoint}", headers=headers) as response:
+                                                if response.status == 200:
+                                                    content = await response.text()
+                                                    result_item["content"] = content
+                                                else:
+                                                    result_item["content"] = f"Could not download content: HTTP {response.status}"
+                                    except Exception as e:
+                                        result_item["content"] = f"Error downloading content: {str(e)}"
+                                else:
+                                    result_item["content"] = f"Binary file type ({mime_type}) - content not retrieved"
+                                
+                                read_results.append(result_item)
+                                file_found = True
+                                break
+                        
+                        if file_found:
+                            break
                     
-                    read_results.append(result_item)
+                    if not file_found:
+                        read_results.append({
+                            "fileId": fileId,
+                            "fileName": fileName,
+                            "error": "File not found in any accessible SharePoint site",
+                            "content": None
+                        })
                     
                 except Exception as e:
-                    logger.error(f"Error reading document {documentPath}: {str(e)}")
+                    logger.error(f"Error reading document {chatDocument.fileName}: {str(e)}")
                     read_results.append({
-                        "documentPath": documentPath,
+                        "fileId": chatDocument.fileId,
+                        "fileName": chatDocument.fileName,
                         "error": str(e),
                         "content": None
                     })
             
             result_data = {
                 "connectionReference": connectionReference,
-                "siteUrl": siteUrl,
-                "documentPaths": documentPaths,
+                "pathQuery": pathQuery,
+                "documentList": documentList,
                 "includeMetadata": includeMetadata,
+                "sitesSearched": len(sites),
                 "readResults": read_results,
                 "connection": {
                     "id": connection["id"],
@@ -490,26 +729,24 @@ class MethodSharepoint(MethodBase):
     @action
     async def uploadDocument(self, parameters: Dict[str, Any]) -> ActionResult:
         """
-        Upload documents to SharePoint
+        Upload documents to SharePoint across accessible sites
         
         Parameters:
             connectionReference (str): Reference to the Microsoft connection
-            siteUrl (str): SharePoint site URL
-            documentPaths (List[str]): List of paths where to upload the documents
+            pathQuery (str): Path query where to upload documents (e.g., "/Documents/Project1", "*" for default location)
             documentList (str): Reference to the document list to upload
             fileNames (List[str]): List of names for the uploaded files
             expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
         """
         try:
             connectionReference = parameters.get("connectionReference")
-            siteUrl = parameters.get("siteUrl")
-            documentPaths = parameters.get("documentPaths")
+            pathQuery = parameters.get("pathQuery", "/Documents")
             documentList = parameters.get("documentList")
             fileNames = parameters.get("fileNames")
             expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
             
-            if not connectionReference or not siteUrl or not documentPaths or not documentList or not fileNames:
-                return ActionResult.isFailure(error="Connection reference, site URL, document paths, document list, and file names are required")
+            if not connectionReference or not documentList or not fileNames:
+                return ActionResult.isFailure(error="Connection reference, document list, and file names are required")
             
             # Get Microsoft connection
             connection = self._getMicrosoftConnection(connectionReference)
@@ -523,39 +760,43 @@ class MethodSharepoint(MethodBase):
             if not chatDocuments:
                 return ActionResult.isFailure(error="No documents found for the provided reference")
             
-            # Parse site URL to get hostname and site path
-            site_info = self._parseSiteUrl(siteUrl)
-            if not site_info["hostname"] or not site_info["sitePath"]:
-                return ActionResult.isFailure(error=f"Invalid SharePoint site URL: {siteUrl}")
+            # Discover all SharePoint sites accessible to the user
+            sites = await self._discoverSharePointSites(connection["accessToken"])
+            if not sites:
+                return ActionResult.isFailure(error="No SharePoint sites found or accessible")
             
-            # Get site ID
-            site_id = await self._getSiteId(connection["accessToken"], site_info["hostname"], site_info["sitePath"])
-            if not site_id:
-                return ActionResult.isFailure(error="Failed to get SharePoint site ID")
+            # Resolve path query into upload paths
+            upload_paths = self._resolvePathQuery(pathQuery)
             
             # Process each document upload
             upload_results = []
             
-            for i, (documentPath, fileName) in enumerate(zip(documentPaths, fileNames)):
+            for i, (chatDocument, fileName) in enumerate(zip(chatDocuments, fileNames)):
                 try:
-                    if i < len(chatDocuments):
-                        chatDocument = chatDocuments[i]
-                        fileId = chatDocument.fileId
-                        file_data = self.service.getFileData(fileId)
+                    fileId = chatDocument.fileId
+                    file_data = self.service.getFileData(fileId)
+                    
+                    if not file_data:
+                        logger.warning(f"File data not found for fileId: {fileId}")
+                        upload_results.append({
+                            "fileName": fileName,
+                            "fileId": fileId,
+                            "error": "File data not found",
+                            "uploadStatus": "failed"
+                        })
+                        continue
+                    
+                    # Try each discovered site in order and stop at the first successful upload
+                    upload_successful = False
+                    
+                    for site in sites:
+                        site_id = site["id"]
+                        site_name = site["displayName"]
+                        site_url = site["webUrl"]
                         
-                        if not file_data:
-                            logger.warning(f"File data not found for fileId: {fileId}")
-                            upload_results.append({
-                                "documentPath": documentPath,
-                                "fileName": fileName,
-                                "fileId": fileId,
-                                "error": "File data not found",
-                                "uploadStatus": "failed"
-                            })
-                            continue
-                        
-                        # Prepare upload path
-                        upload_path = documentPath.rstrip('/') + '/' + fileName
+                        # Use the first upload path or default to Documents
+                        upload_path = upload_paths[0] if upload_paths else "/Documents"
+                        upload_path = upload_path.rstrip('/') + '/' + fileName
                         upload_path_clean = upload_path.lstrip('/')
                         
                         # Upload endpoint for small files (< 4MB)
@@ -570,50 +811,41 @@ class MethodSharepoint(MethodBase):
                                 data=file_data
                             )
                             
-                            if "error" in upload_result:
+                            if "error" not in upload_result:
                                 upload_results.append({
-                                    "documentPath": documentPath,
-                                    "fileName": fileName,
-                                    "fileId": fileId,
-                                    "error": upload_result["error"],
-                                    "uploadStatus": "failed"
-                                })
-                            else:
-                                upload_results.append({
-                                    "documentPath": documentPath,
                                     "fileName": fileName,
                                     "fileId": fileId,
                                     "uploadStatus": "success",
+                                    "siteName": site_name,
+                                    "siteUrl": site_url,
+                                    "uploadPath": upload_path,
                                     "sharepointFileId": upload_result.get("id"),
                                     "webUrl": upload_result.get("webUrl"),
                                     "size": upload_result.get("size"),
                                     "createdDateTime": upload_result.get("createdDateTime")
                                 })
+                                upload_successful = True
+                                break
+                            else:
+                                logger.warning(f"Upload failed to site {site_name}: {upload_result['error']}")
                         else:
                             # For large files, we would need to implement resumable upload
-                            # For now, return an error for large files
-                            upload_results.append({
-                                "documentPath": documentPath,
-                                "fileName": fileName,
-                                "fileId": fileId,
-                                "error": f"File too large ({len(file_data)} bytes). Files larger than 4MB require resumable upload (not implemented).",
-                                "uploadStatus": "failed"
-                            })
-                    else:
+                            logger.warning(f"File too large ({len(file_data)} bytes) for site {site_name}")
+                            continue
+                    
+                    if not upload_successful:
                         upload_results.append({
-                            "documentPath": documentPath,
                             "fileName": fileName,
-                            "fileId": None,
-                            "error": "No corresponding chat document found",
+                            "fileId": fileId,
+                            "error": f"File too large ({len(file_data)} bytes) or upload failed to all sites. Files larger than 4MB require resumable upload (not implemented).",
                             "uploadStatus": "failed"
                         })
                         
                 except Exception as e:
                     logger.error(f"Error uploading document {fileName}: {str(e)}")
                     upload_results.append({
-                        "documentPath": documentPath,
                         "fileName": fileName,
-                        "fileId": fileId if i < len(chatDocuments) else None,
+                        "fileId": fileId,
                         "error": str(e),
                         "uploadStatus": "failed"
                     })
@@ -621,10 +853,10 @@ class MethodSharepoint(MethodBase):
             # Create result data
             result_data = {
                 "connectionReference": connectionReference,
-                "siteUrl": siteUrl,
-                "documentPaths": documentPaths,
+                "pathQuery": pathQuery,
                 "documentList": documentList,
                 "fileNames": fileNames,
+                "sitesAvailable": len(sites),
                 "uploadResults": upload_results,
                 "connection": {
                     "id": connection["id"],
@@ -668,155 +900,161 @@ class MethodSharepoint(MethodBase):
     @action
     async def listDocuments(self, parameters: Dict[str, Any]) -> ActionResult:
         """
-        List documents in SharePoint folder
+        List documents in SharePoint folders across accessible sites
         
         Parameters:
             connectionReference (str): Reference to the Microsoft connection
-            siteUrl (str): SharePoint site URL
-            folderPaths (List[str]): List of paths to the folders to list
+            pathQuery (str): Path query to list folders (e.g., "/Documents", "/Shared Documents/Project1", "*" for all sites)
             includeSubfolders (bool, optional): Whether to include subfolders (default: False)
             expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
         """
         try:
             connectionReference = parameters.get("connectionReference")
-            siteUrl = parameters.get("siteUrl")
-            folderPaths = parameters.get("folderPaths")
+            pathQuery = parameters.get("pathQuery", "*")
             includeSubfolders = parameters.get("includeSubfolders", False)  # Default to False for better UX
             expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
             
-            if not connectionReference or not siteUrl or not folderPaths:
-                return ActionResult.isFailure(error="Connection reference, site URL, and folder paths are required")
+            if not connectionReference:
+                return ActionResult.isFailure(error="Connection reference is required")
             
             # Get Microsoft connection
             connection = self._getMicrosoftConnection(connectionReference)
             if not connection:
                 return ActionResult.isFailure(error="No valid Microsoft connection found for the provided connection reference")
             
-            logger.info(f"Starting SharePoint listDocuments for site: {siteUrl}")
+            logger.info(f"Starting SharePoint listDocuments for pathQuery: {pathQuery}")
             logger.debug(f"Connection ID: {connection['id']}")
-            logger.debug(f"Folder paths: {folderPaths}")
             
-            # Parse site URL to get hostname and site path
-            site_info = self._parseSiteUrl(siteUrl)
-            logger.info(f"Parsed site info - hostname: {site_info['hostname']}, sitePath: {site_info['sitePath']}")
+            # Discover all SharePoint sites accessible to the user
+            sites = await self._discoverSharePointSites(connection["accessToken"])
+            if not sites:
+                return ActionResult.isFailure(error="No SharePoint sites found or accessible")
             
-            if not site_info["hostname"] or not site_info["sitePath"]:
-                logger.error(f"Failed to parse site URL: {siteUrl}")
-                return ActionResult.isFailure(error=f"Invalid SharePoint site URL: {siteUrl}")
+            # Resolve path query into folder paths
+            folder_paths = self._resolvePathQuery(pathQuery)
+            logger.info(f"Resolved folder paths: {folder_paths}")
             
-            # Get site ID
-            logger.info(f"Getting site ID for hostname: {site_info['hostname']}, path: {site_info['sitePath']}")
-            site_id = await self._getSiteId(connection["accessToken"], site_info["hostname"], site_info["sitePath"])
-            logger.info(f"Site ID result: {site_id}")
-            
-            if not site_id:
-                return ActionResult.isFailure(error="Failed to get SharePoint site ID")
-            
-            # Process each folder path
+            # Process each folder path across all sites
             list_results = []
             
-            for folderPath in folderPaths:
+            for folderPath in folder_paths:
                 try:
-                    # Determine the endpoint based on folder path
-                    if folderPath in ["/", ""]:
-                        # Root folder
-                        endpoint = f"sites/{site_id}/drive/root/children"
-                    else:
-                        # Specific folder - remove leading slash if present
-                        folder_path_clean = folderPath.lstrip('/')
-                        endpoint = f"sites/{site_id}/drive/root:/{folder_path_clean}:/children"
+                    folder_results = []
                     
-                    # Make the API call to list folder contents
-                    api_result = await self._makeGraphApiCall(connection["accessToken"], endpoint)
-                    
-                    if "error" in api_result:
-                        list_results.append({
-                            "folderPath": folderPath,
-                            "error": api_result["error"],
-                            "items": []
-                        })
-                        continue
-                    
-                    # Process the results
-                    items = api_result.get("value", [])
-                    processed_items = []
-                    
-                    for item in items:
-                        item_info = {
-                            "id": item.get("id"),
-                            "name": item.get("name"),
-                            "size": item.get("size", 0),
-                            "createdDateTime": item.get("createdDateTime"),
-                            "lastModifiedDateTime": item.get("lastModifiedDateTime"),
-                            "webUrl": item.get("webUrl"),
-                            "type": "folder" if "folder" in item else "file"
-                        }
+                    for site in sites:
+                        site_id = site["id"]
+                        site_name = site["displayName"]
+                        site_url = site["webUrl"]
                         
-                        # Add file-specific information
-                        if "file" in item:
-                            item_info.update({
-                                "mimeType": item["file"].get("mimeType"),
-                                "downloadUrl": item.get("@microsoft.graph.downloadUrl")
-                            })
+                        logger.info(f"Listing folder {folderPath} in site: {site_name}")
                         
-                        # Add folder-specific information
-                        if "folder" in item:
-                            item_info.update({
-                                "childCount": item["folder"].get("childCount", 0)
-                            })
+                        # Determine the endpoint based on folder path
+                        if folderPath in ["/", ""] or folderPath == "*":
+                            # Root folder
+                            endpoint = f"sites/{site_id}/drive/root/children"
+                        else:
+                            # Specific folder - remove leading slash if present
+                            folder_path_clean = folderPath.lstrip('/')
+                            endpoint = f"sites/{site_id}/drive/root:/{folder_path_clean}:/children"
                         
-                        processed_items.append(item_info)
-                    
-                    # If include subfolders is enabled, get ONLY direct subfolder contents (1 level deep only)
-                    if includeSubfolders:
-                        logger.info(f"Including subfolders - processing {len([item for item in processed_items if item['type'] == 'folder'])} folders")
-                        subfolder_count = 0
-                        max_subfolders = 10  # Limit to prevent infinite loops
+                        # Make the API call to list folder contents
+                        api_result = await self._makeGraphApiCall(connection["accessToken"], endpoint)
                         
-                        for item in processed_items[:]:  # Use slice to avoid modifying list during iteration
-                            if item["type"] == "folder" and subfolder_count < max_subfolders:
-                                subfolder_count += 1
-                                subfolder_path = f"{folderPath.rstrip('/')}/{item['name']}"
-                                subfolder_endpoint = f"sites/{site_id}/drive/items/{item['id']}/children"
-                                
-                                logger.debug(f"Getting contents of subfolder: {item['name']}")
-                                subfolder_result = await self._makeGraphApiCall(connection["accessToken"], subfolder_endpoint)
-                                if "error" not in subfolder_result:
-                                    subfolder_items = subfolder_result.get("value", [])
-                                    logger.debug(f"Found {len(subfolder_items)} items in subfolder {item['name']}")
+                        if "error" in api_result:
+                            logger.warning(f"Failed to list folder {folderPath} in site {site_name}: {api_result['error']}")
+                            continue
+                        
+                        # Process the results
+                        items = api_result.get("value", [])
+                        processed_items = []
+                        
+                        for item in items:
+                            item_info = {
+                                "id": item.get("id"),
+                                "name": item.get("name"),
+                                "size": item.get("size", 0),
+                                "createdDateTime": item.get("createdDateTime"),
+                                "lastModifiedDateTime": item.get("lastModifiedDateTime"),
+                                "webUrl": item.get("webUrl"),
+                                "type": "folder" if "folder" in item else "file",
+                                "siteName": site_name,
+                                "siteUrl": site_url
+                            }
+                            
+                            # Add file-specific information
+                            if "file" in item:
+                                item_info.update({
+                                    "mimeType": item["file"].get("mimeType"),
+                                    "downloadUrl": item.get("@microsoft.graph.downloadUrl")
+                                })
+                            
+                            # Add folder-specific information
+                            if "folder" in item:
+                                item_info.update({
+                                    "childCount": item["folder"].get("childCount", 0)
+                                })
+                            
+                            processed_items.append(item_info)
+                        
+                        # If include subfolders is enabled, get ONLY direct subfolder contents (1 level deep only)
+                        if includeSubfolders:
+                            logger.info(f"Including subfolders - processing {len([item for item in processed_items if item['type'] == 'folder'])} folders")
+                            subfolder_count = 0
+                            max_subfolders = 10  # Cap on subfolders expanded per listing (one Graph API call each)
+                            
+                            for item in processed_items[:]:  # Use slice to avoid modifying list during iteration
+                                if item["type"] == "folder" and subfolder_count < max_subfolders:
+                                    subfolder_count += 1
+                                    subfolder_path = f"{folderPath.rstrip('/')}/{item['name']}"
+                                    subfolder_endpoint = f"sites/{site_id}/drive/items/{item['id']}/children"
                                     
-                                    for subfolder_item in subfolder_items:
-                                        # Only add files and direct subfolders, NO RECURSION
-                                        subfolder_item_info = {
-                                            "id": subfolder_item.get("id"),
-                                            "name": subfolder_item.get("name"),
-                                            "size": subfolder_item.get("size", 0),
-                                            "createdDateTime": subfolder_item.get("createdDateTime"),
-                                            "lastModifiedDateTime": subfolder_item.get("lastModifiedDateTime"),
-                                            "webUrl": subfolder_item.get("webUrl"),
-                                            "type": "folder" if "folder" in subfolder_item else "file",
-                                            "parentPath": subfolder_path
-                                        }
+                                    logger.debug(f"Getting contents of subfolder: {item['name']}")
+                                    subfolder_result = await self._makeGraphApiCall(connection["accessToken"], subfolder_endpoint)
+                                    if "error" not in subfolder_result:
+                                        subfolder_items = subfolder_result.get("value", [])
+                                        logger.debug(f"Found {len(subfolder_items)} items in subfolder {item['name']}")
                                         
-                                        if "file" in subfolder_item:
-                                            subfolder_item_info.update({
-                                                "mimeType": subfolder_item["file"].get("mimeType"),
-                                                "downloadUrl": subfolder_item.get("@microsoft.graph.downloadUrl")
-                                            })
-                                        
-                                        processed_items.append(subfolder_item_info)
-                                else:
-                                    logger.warning(f"Failed to get contents of subfolder {item['name']}: {subfolder_result.get('error')}")
-                            elif subfolder_count >= max_subfolders:
-                                logger.warning(f"Reached maximum subfolder limit ({max_subfolders}), skipping remaining folders")
-                                break
+                                        for subfolder_item in subfolder_items:
+                                            # Only add files and direct subfolders, NO RECURSION
+                                            subfolder_item_info = {
+                                                "id": subfolder_item.get("id"),
+                                                "name": subfolder_item.get("name"),
+                                                "size": subfolder_item.get("size", 0),
+                                                "createdDateTime": subfolder_item.get("createdDateTime"),
+                                                "lastModifiedDateTime": subfolder_item.get("lastModifiedDateTime"),
+                                                "webUrl": subfolder_item.get("webUrl"),
+                                                "type": "folder" if "folder" in subfolder_item else "file",
+                                                "parentPath": subfolder_path,
+                                                "siteName": site_name,
+                                                "siteUrl": site_url
+                                            }
+                                            
+                                            if "file" in subfolder_item:
+                                                subfolder_item_info.update({
+                                                    "mimeType": subfolder_item["file"].get("mimeType"),
+                                                    "downloadUrl": subfolder_item.get("@microsoft.graph.downloadUrl")
+                                                })
+                                            
+                                            processed_items.append(subfolder_item_info)
+                                    else:
+                                        logger.warning(f"Failed to get contents of subfolder {item['name']}: {subfolder_result.get('error')}")
+                                elif subfolder_count >= max_subfolders:
+                                    logger.warning(f"Reached maximum subfolder limit ({max_subfolders}), skipping remaining folders")
+                                    break
+                            
+                            logger.info(f"Processed {subfolder_count} subfolders, total items: {len(processed_items)}")
                         
-                        logger.info(f"Processed {subfolder_count} subfolders, total items: {len(processed_items)}")
+                        folder_results.append({
+                            "siteName": site_name,
+                            "siteUrl": site_url,
+                            "itemCount": len(processed_items),
+                            "items": processed_items
+                        })
                     
                     list_results.append({
                         "folderPath": folderPath,
-                        "itemCount": len(processed_items),
-                        "items": processed_items
+                        "sitesProcessed": len(folder_results),
+                        "siteResults": folder_results
                     })
                     
                 except Exception as e:
@@ -824,15 +1062,15 @@ class MethodSharepoint(MethodBase):
                     list_results.append({
                         "folderPath": folderPath,
                         "error": str(e),
-                        "items": []
+                        "siteResults": []
                     })
             
             # Create result data
             result_data = {
                 "connectionReference": connectionReference,
-                "siteUrl": siteUrl,
-                "folderPaths": folderPaths,
+                "pathQuery": pathQuery,
                 "includeSubfolders": includeSubfolders,
+                "sitesSearched": len(sites),
                 "listResults": list_results,
                 "connection": {
                     "id": connection["id"],
diff --git a/modules/workflow/managerWorkflow.py b/modules/workflow/managerWorkflow.py
index 59aa338a..ce7a2366 100644
--- a/modules/workflow/managerWorkflow.py
+++ b/modules/workflow/managerWorkflow.py
@@ -141,7 +141,7 @@ class WorkflowManager:
             self.chatManager.handlingTasks._checkWorkflowStopped()
             
             # Create initial message using interface
-            # Generate the correct documentsLabel that matches what getDocumentReferenceList() will create
+            # Generate the correct documentsLabel that matches what getDocumentReferenceString will create
             round_num = workflow.currentRound
             task_num = 0
             action_num = 0
diff --git a/notes/changelog.txt b/notes/changelog.txt
index fca700df..affd7a3d 100644
--- a/notes/changelog.txt
+++ b/notes/changelog.txt
@@ -2,7 +2,9 @@
 TODO
 
 # System
-- web
+- sharepoint to fix
+- document handling centralized
+- ai handling centralized
 - neutralizer to activate AND put back placeholders to the returned data
 
 # Tests
diff --git a/notes/management_summary.html b/notes/management_summary.html
deleted file mode 100644
index 58ca722f..00000000
--- a/notes/management_summary.html
+++ /dev/null
@@ -1,128 +0,0 @@
-<!DOCTYPE html>
-<html lang="de">
-<head>
-    <meta charset="UTF-8">
-    <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>Management Summary: Methoden-basierte Chat-Architektur</title>
-    <style>
-        body {
-            font-family: Arial, sans-serif;
-            line-height: 1.6;
-            max-width: 800px;
-            margin: 0 auto;
-            padding: 20px;
-            color: #333;
-        }
-        h1 {
-            color: #2c3e50;
-            border-bottom: 2px solid #3498db;
-            padding-bottom: 10px;
-        }
-        h2 {
-            color: #2c3e50;
-            margin-top: 30px;
-        }
-        .example {
-            background-color: #f8f9fa;
-            border-left: 4px solid #3498db;
-            padding: 15px;
-            margin: 20px 0;
-        }
-        .old-arch, .new-arch {
-            margin: 15px 0;
-            padding: 15px;
-            border-radius: 5px;
-        }
-        .old-arch {
-            background-color: #fff3cd;
-            border: 1px solid #ffeeba;
-        }
-        .new-arch {
-            background-color: #d4edda;
-            border: 1px solid #c3e6cb;
-        }
-        .benefits {
-            background-color: #e8f4f8;
-            padding: 15px;
-            border-radius: 5px;
-            margin: 20px 0;
-        }
-        .benefits ul {
-            margin: 10px 0;
-            padding-left: 20px;
-        }
-        .benefits li {
-            margin: 5px 0;
-        }
-    </style>
-</head>
-<body>
-    <h1>Management Summary: Methoden-basierte Chat-Architektur</h1>
-
-    <p>Die Umstellung von einer Agenten-basierten auf eine Methoden-basierte Chat-Architektur stellt einen fundamentalen Paradigmenwechsel dar. Während die Mehrheit der KI-Chat-Systeme weiterhin auf Agenten-Architekturen setzt, ermöglicht unser methoden-basierter Ansatz eine präzisere Kontrolle und effizientere Integration.</p>
-
-    <p>Der methoden-basierte Ansatz definiert klare, selbstbeschreibende Operationen mit festgelegten Parametern und Ergebnissen. Im Gegensatz zu Agenten, die als Blackbox-Operationen fungieren, bieten Methoden eine transparente, validierbare und vorhersehbare Ausführung. Diese Struktur ermöglicht eine präzise Fehlerbehandlung und Retry-Logik auf Aktions-Ebene, anstatt auf Agenten-Ebene.</p>
-
-    <p>Die Integration mit Benutzerdaten erfolgt direkt über definierte Authentifizierungspfade, was die Sicherheit erhöht und die Komplexität reduziert. Jede Methode ist selbstbeschreibend und enthält ihre eigenen Validierungsregeln, was die Wartbarkeit verbessert und die Entwicklung neuer Funktionen beschleunigt.</p>
-
-    <p>Der methoden-basierte Ansatz reduziert die KI-Abhängigkeit bei der Ausführung von Operationen, während die KI weiterhin für die Planung und Koordination der Methoden eingesetzt wird. Diese Trennung von Planung und Ausführung führt zu zuverlässigeren Ergebnissen und besserer Nachvollziehbarkeit.</p>
-
-    <p>Die Architektur ermöglicht eine präzise Dokumentation und Validierung jeder Operation, was in einer regulierten Umgebung von besonderem Wert ist. Die klare Struktur erleichtert die Integration neuer Dienste und die Erweiterung bestehender Funktionalitäten.</p>
-
-    <h2>Praktisches Beispiel: Dokumentenverarbeitung und E-Mail-Versand</h2>
-
-    <div class="example">
-        <div class="old-arch">
-            <strong>Alte Agenten-basierte Architektur:</strong><br>
-            <pre>
-Benutzer: "Suche nach Verträgen im SharePoint und sende mir eine Zusammenfassung per E-Mail"
-
-Agent SharePoint:
-- Sucht nach Verträgen
-- Extrahiert Inhalte
-- Speichert Ergebnisse
-
-Agent Outlook:
-- Liest Ergebnisse
-- Erstellt E-Mail
-- Sendet E-Mail</pre>
-        </div>
-
-        <div class="new-arch">
-            <strong>Neue Methoden-basierte Architektur:</strong><br>
-            <pre>
-Benutzer: "Suche nach Verträgen im SharePoint und sende mir eine Zusammenfassung per E-Mail"
-
-Methoden-Katalog:
-1. SharePoint.searchDocuments
-   - Parameter: {query: "Verträge", site: "valueon"}
-   - Retry: 3x bei Netzwerkfehler
-   - Auth: MSFT
-
-2. Document.extractContent
-   - Parameter: {documents: [...], sections: ["Zusammenfassung"]}
-   - Retry: 2x bei Extraktionsfehler
-   - Auth: LOCAL
-
-3. Outlook.sendMail
-   - Parameter: {to: ["user@example.com"], subject: "Vertragszusammenfassung"}
-   - Retry: 1x bei SMTP-Fehler
-   - Auth: MSFT</pre>
-        </div>
-
-        <div class="benefits">
-            <strong>Vorteile im Beispiel:</strong>
-            <ul>
-                <li>Jede Operation ist klar definiert und validierbar</li>
-                <li>Retry-Logik ist spezifisch für jede Operation</li>
-                <li>Authentifizierung ist explizit definiert</li>
-                <li>Fehler können präzise zugeordnet werden</li>
-                <li>Operationen können unabhängig voneinander getestet werden</li>
-                <li>Neue Operationen können einfach hinzugefügt werden</li>
-            </ul>
-        </div>
-    </div>
-
-    <p>Die KI plant die Ausführung dieser Methoden, aber die eigentliche Ausführung erfolgt durch die definierten Methoden mit klaren Parametern und Ergebnissen. Dies führt zu einer zuverlässigeren und besser nachvollziehbaren Ausführung.</p>
-</body>
-</html> 
\ No newline at end of file
diff --git a/notes/methodbased_arch.html b/notes/methodbased_arch.html
deleted file mode 100644
index 70d0a6ea..00000000
--- a/notes/methodbased_arch.html
+++ /dev/null
@@ -1,129 +0,0 @@
-
-<!DOCTYPE html>
-<html lang="de">
-<head>
-    <meta charset="UTF-8">
-    <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>Management Summary: Methoden-basierte Chat-Architektur</title>
-    <style>
-        body {
-            font-family: Arial, sans-serif;
-            line-height: 1.6;
-            max-width: 800px;
-            margin: 0 auto;
-            padding: 20px;
-            color: #333;
-        }
-        h1 {
-            color: #2c3e50;
-            border-bottom: 2px solid #3498db;
-            padding-bottom: 10px;
-        }
-        h2 {
-            color: #2c3e50;
-            margin-top: 30px;
-        }
-        .example {
-            background-color: #f8f9fa;
-            border-left: 4px solid #3498db;
-            padding: 15px;
-            margin: 20px 0;
-        }
-        .old-arch, .new-arch {
-            margin: 15px 0;
-            padding: 15px;
-            border-radius: 5px;
-        }
-        .old-arch {
-            background-color: #fff3cd;
-            border: 1px solid #ffeeba;
-        }
-        .new-arch {
-            background-color: #d4edda;
-            border: 1px solid #c3e6cb;
-        }
-        .benefits {
-            background-color: #e8f4f8;
-            padding: 15px;
-            border-radius: 5px;
-            margin: 20px 0;
-        }
-        .benefits ul {
-            margin: 10px 0;
-            padding-left: 20px;
-        }
-        .benefits li {
-            margin: 5px 0;
-        }
-    </style>
-</head>
-<body>
-    <h1>Management Summary: Methoden-basierte Chat-Architektur</h1>
-
-    <p>Die Umstellung von einer Agenten-basierten auf eine Methoden-basierte Chat-Architektur stellt einen fundamentalen Paradigmenwechsel dar. Während die Mehrheit der KI-Chat-Systeme weiterhin auf Agenten-Architekturen setzt, ermöglicht unser methoden-basierter Ansatz eine präzisere Kontrolle und effizientere Integration.</p>
-
-    <p>Der methoden-basierte Ansatz definiert klare, selbstbeschreibende Operationen mit festgelegten Parametern und Ergebnissen. Im Gegensatz zu Agenten, die als Blackbox-Operationen fungieren, bieten Methoden eine transparente, validierbare und vorhersehbare Ausführung. Diese Struktur ermöglicht eine präzise Fehlerbehandlung und Retry-Logik auf Aktions-Ebene, anstatt auf Agenten-Ebene.</p>
-
-    <p>Die Integration mit Benutzerdaten erfolgt direkt über definierte Authentifizierungspfade, was die Sicherheit erhöht und die Komplexität reduziert. Jede Methode ist selbstbeschreibend und enthält ihre eigenen Validierungsregeln, was die Wartbarkeit verbessert und die Entwicklung neuer Funktionen beschleunigt.</p>
-
-    <p>Der methoden-basierte Ansatz reduziert die KI-Abhängigkeit bei der Ausführung von Operationen, während die KI weiterhin für die Planung und Koordination der Methoden eingesetzt wird. Diese Trennung von Planung und Ausführung führt zu zuverlässigeren Ergebnissen und besserer Nachvollziehbarkeit.</p>
-
-    <p>Die Architektur ermöglicht eine präzise Dokumentation und Validierung jeder Operation, was in einer regulierten Umgebung von besonderem Wert ist. Die klare Struktur erleichtert die Integration neuer Dienste und die Erweiterung bestehender Funktionalitäten.</p>
-
-    <h2>Praktisches Beispiel: Dokumentenverarbeitung und E-Mail-Versand</h2>
-
-    <div class="example">
-        <div class="old-arch">
-            <strong>Alte Agenten-basierte Architektur:</strong><br>
-            <pre>
-Benutzer: "Suche nach Verträgen im SharePoint und sende mir eine Zusammenfassung per E-Mail"
-
-Agent SharePoint:
-- Sucht nach Verträgen
-- Extrahiert Inhalte
-- Speichert Ergebnisse
-
-Agent Outlook:
-- Liest Ergebnisse
-- Erstellt E-Mail
-- Sendet E-Mail</pre>
-        </div>
-
-        <div class="new-arch">
-            <strong>Neue Methoden-basierte Architektur:</strong><br>
-            <pre>
-Benutzer: "Suche nach Verträgen im SharePoint und sende mir eine Zusammenfassung per E-Mail"
-
-Methoden-Katalog:
-1. SharePoint.searchDocuments
-   - Parameter: {query: "Verträge", site: "valueon"}
-   - Retry: 3x bei Netzwerkfehler
-   - Auth: MSFT
-
-2. Document.extractContent
-   - Parameter: {documents: [...], sections: ["Zusammenfassung"]}
-   - Retry: 2x bei Extraktionsfehler
-   - Auth: LOCAL
-
-3. Outlook.sendMail
-   - Parameter: {to: ["user@example.com"], subject: "Vertragszusammenfassung"}
-   - Retry: 1x bei SMTP-Fehler
-   - Auth: MSFT</pre>
-        </div>
-
-        <div class="benefits">
-            <strong>Vorteile im Beispiel:</strong>
-            <ul>
-                <li>Jede Operation ist klar definiert und validierbar</li>
-                <li>Retry-Logik ist spezifisch für jede Operation</li>
-                <li>Authentifizierung ist explizit definiert</li>
-                <li>Fehler können präzise zugeordnet werden</li>
-                <li>Operationen können unabhängig voneinander getestet werden</li>
-                <li>Neue Operationen können einfach hinzugefügt werden</li>
-            </ul>
-        </div>
-    </div>
-
-    <p>Die KI plant die Ausführung dieser Methoden, aber die eigentliche Ausführung erfolgt durch die definierten Methoden mit klaren Parametern und Ergebnissen. Dies führt zu einer zuverlässigeren und besser nachvollziehbaren Ausführung.</p>
-</body>
-</html>
\ No newline at end of file
diff --git a/notes/methodbased_specification.md b/notes/methodbased_specification.md
deleted file mode 100644
index 6aa273c7..00000000
--- a/notes/methodbased_specification.md
+++ /dev/null
@@ -1,999 +0,0 @@
-# Chat System Process Flow Specification
-
-## 1. System Overview
-
-### 1.1 Core Components
-- **WorkflowManager**: Orchestrates the overall workflow process
-- **ChatManager**: Manages chat interactions and task execution
-- **ServiceCenter**: Central state and context management
-- **AgentTask**: Core data object for task execution
-
-### 1.2 Service center Structure
-```python
-from enum import Enum
-from typing import Dict, List, Optional, Any, Literal
-from datetime import datetime, UTC
-from pydantic import BaseModel, Field
-
-class TaskStatus(str, Enum):
-    PENDING = "pending"
-    SUCCESS = "success"
-    FAILED = "failed"
-    RETRY = "retry"
-    TIMEOUT = "timeout"
-    ROLLBACK = "rollback"
-
-class ActionStatus(str, Enum):
-    PENDING = "pending"
-    SUCCESS = "success"
-    FAILED = "failed"
-    RETRY = "retry"
-    TIMEOUT = "timeout"
-    SKIPPED = "skipped"
-    DEPENDENCY_FAILED = "dependency_failed"
-
-class AuthSource(str, Enum):
-    LOCAL = "local"
-    MSFT = "msft"
-    GOOGLE = "google"
-    # Add more auth sources as needed
-
-class MethodParameter(BaseModel):
-    """Model for method parameters"""
-    name: str
-    type: str
-    required: bool
-    validation: Optional[callable] = None
-    description: str
-
-class ActionResult(BaseModel):
-    """Model for method results"""
-    success: bool
-    data: Dict[str, Any]
-    metadata: Dict[str, Any]
-    validation: List[str]
-
-class MethodBase:
-    """Base class for all methods"""
-    
-    def __init__(self, service):
-        self.service = service
-        self.name: str
-        self.description: str
-        self.auth_source: AuthSource = AuthSource.LOCAL  # Default to local auth
-        
-    @property
-    def actions(self) -> Dict[str, Dict[str, Any]]:
-        """Available actions and their parameters"""
-        raise NotImplementedError
-        
-    async def execute(self, action: str, parameters: Dict[str, Any], auth_data: Optional[Dict[str, Any]] = None) -> ActionResult:
-        """Execute method action with authentication data"""
-        raise NotImplementedError
-        
-    async def validate_parameters(self, action: str, parameters: Dict[str, Any]) -> bool:
-        """Validate action parameters"""
-        if action not in self.actions:
-            return False
-            
-        action_def = self.actions[action]
-        required_params = {k for k, v in action_def['parameters'].items() if v['required']}
-        return all(param in parameters for param in required_params)
-        
-    async def rollback(self, action: str, parameters: Dict[str, Any], auth_data: Optional[Dict[str, Any]] = None) -> None:
-        """Rollback action if needed"""
-        pass
-
-class Action(BaseModel):
-    """Action model with validation"""
-    method: str
-    action: str
-    parameters: Dict[str, Any]
-    retryCount: int = 0
-    retryMax: int
-    status: ActionStatus = ActionStatus.PENDING
-    timeout: Optional[int] = None
-    dependencies: List[str] = []
-    rollback_on_failure: bool = False
-    auth_source: Optional[AuthSource] = None  # Auth source for this action
-    
-    class Config:
-        use_enum_values = True
-
-class AgentTask(BaseModel):
-    """Task model with validation"""
-    id: str
-    workflowId: str
-    status: TaskStatus = TaskStatus.PENDING
-    userInput: str
-    dataList: List[Dict[str, str]]  # List of available connections
-    actionList: List[Action]
-    chatHistory: str
-    taskHistory: str
-    previousTaskFeedback: Optional[str]
-    thisTaskFeedback: Optional[str]
-    result: Optional[Dict[str, Any]]
-    documentsInput: List[Dict]
-    documentsOutput: List[Dict]
-    startedAt: str
-    finishedAt: Optional[str]
-    error: Optional[str]
-    dependencies: List[str] = []
-    requiredOutputs: List[str] = []
-    
-    class Config:
-        use_enum_values = True
-        
-    def get_auth_data(self, auth_source: AuthSource) -> Optional[Dict[str, Any]]:
-        """Get authentication data for the specified source"""
-        return next(
-            (conn for conn in self.dataList if conn.get('source') == auth_source),
-            None
-        )
-        
-    def get_action_by_id(self, action_id: str) -> Optional[Action]:
-        """Get action by its ID (method:action)"""
-        return next((a for a in self.actionList if f"{a.method}:{a.action}" == action_id), None)
-        
-    def can_execute_action(self, action: Action) -> bool:
-        """Check if action can be executed based on dependencies and auth"""
-        # Check dependencies
-        if action.dependencies:
-            if not all(
-                self.get_action_by_id(dep).status == ActionStatus.SUCCESS
-                for dep in action.dependencies
-            ):
-                return False
-                
-        # Check authentication
-        if action.auth_source and action.auth_source != AuthSource.LOCAL:
-            if not self.get_auth_data(action.auth_source):
-                return False
-                
-        return True
-        
-    def is_complete(self) -> bool:
-        """Check if all actions are complete"""
-        return all(a.status in [ActionStatus.SUCCESS, ActionStatus.SKIPPED] 
-                  for a in self.actionList)
-        
-    def has_failed(self) -> bool:
-        """Check if any action has failed"""
-        return any(a.status == ActionStatus.FAILED for a in self.actionList)
-
-class ServiceCenter:
-    """Service center with improved state management"""
-    
-    def __init__(self):
-        self.state = {
-            'status': TaskStatus.PENDING,
-            'retryCount': 0,
-            'retryMax': 3,
-            'timeout': 300,  # 5 minutes
-            'lastError': None,
-            'lastErrorTime': None
-        }
-        self.methods: Dict[str, MethodBase] = {}
-        self.tasks: Dict[str, AgentTask] = {}
-        self.promptManager = AIPromptManager()
-        self.taskStateManager = TaskStateManager()
-        self.documentProcessor = DocumentExtraction()
-        
-    async def execute_task(self, task: AgentTask) -> None:
-        """Execute task with improved error handling and timeout"""
-        try:
-            # Check for timeout
-            if (datetime.now(UTC) - datetime.fromisoformat(task.startedAt)).seconds > self.state['timeout']:
-                task.status = TaskStatus.TIMEOUT
-                return
-                
-            # Execute actions
-            for action in task.actionList:
-                if not task.can_execute_action(action):
-                    if not task.get_auth_data(action.auth_source):
-                        action.status = ActionStatus.FAILED
-                        task.error = f"Missing authentication for {action.auth_source}"
-                    else:
-                        action.status = ActionStatus.DEPENDENCY_FAILED
-                    continue
-                    
-                try:
-                    # Get method
-                    method = self.methods.get(action.method)
-                    if not method:
-                        raise ValueError(f"Unknown method: {action.method}")
-                        
-                    # Validate parameters
-                    if not await method.validate_parameters(action.action, action.parameters):
-                        raise ValueError(f"Invalid parameters for {action.method}:{action.action}")
-                        
-                    # Get auth data if needed
-                    auth_data = None
-                    if action.auth_source and action.auth_source != AuthSource.LOCAL:
-                        auth_data = task.get_auth_data(action.auth_source)
-                        if not auth_data:
-                            raise ValueError(f"Missing authentication data for {action.auth_source}")
-                        
-                    # Execute with timeout
-                    result = await asyncio.wait_for(
-                        method.execute(action.action, action.parameters, auth_data),
-                        timeout=action.timeout or 60
-                    )
-                    
-                    if result.success:
-                        action.status = ActionStatus.SUCCESS
-                    else:
-                        if self._should_retry(result.data.get('error')):
-                            action.retryCount += 1
-                            if action.retryCount > action.retryMax:
-                                action.status = ActionStatus.FAILED
-                                if action.rollback_on_failure:
-                                    await method.rollback(action.action, action.parameters, auth_data)
-                            else:
-                                action.status = ActionStatus.RETRY
-                        else:
-                            action.status = ActionStatus.FAILED
-                            if action.rollback_on_failure:
-                                await method.rollback(action.action, action.parameters, auth_data)
-                                
-                except asyncio.TimeoutError:
-                    action.status = ActionStatus.TIMEOUT
-                except Exception as e:
-                    action.status = ActionStatus.FAILED
-                    if action.rollback_on_failure:
-                        await method.rollback(action.action, action.parameters, auth_data)
-                        
-            # Update task status
-            if task.has_failed():
-                task.status = TaskStatus.FAILED
-            elif task.is_complete():
-                task.status = TaskStatus.SUCCESS
-                task.finishedAt = datetime.now(UTC).isoformat()
-                
-        except Exception as e:
-            task.status = TaskStatus.FAILED
-            task.error = str(e)
-
-class AIPromptManager:
-    """Manages AI prompts and response validation"""
-    
-    def generatePrompt(self, context: Dict[str, Any], examples: List[Dict]) -> str:
-        """Generate a context-aware prompt with few-shot examples"""
-        prompt = (
-            f"Task: {context['task']}\n"
-            f"Document: {context['document']['name']} ({context['document']['type']})\n"
-            "Examples:\n"
-        )
-        for ex in examples:
-            prompt += f"- {ex['input']} => {ex['output']}\n"
-        prompt += "Extract the most relevant information for the task above."
-        return prompt
-
-    def validateResponse(self, response: str, schema: Dict) -> bool:
-        """Validate AI response against a schema"""
-        import jsonschema
-        try:
-            jsonschema.validate(instance=response, schema=schema)
-            return True
-        except jsonschema.ValidationError:
-            return False
-
-class TaskStateManager:
-    """Manages task state and retry tracking"""
-    
-    def __init__(self):
-        self.taskStates = {}
-
-    def trackState(self, task: AgentTask):
-        """Track task state"""
-        self.taskStates[task.id] = {
-            "status": task.status,
-            "retryState": getattr(task, "retryState", {}),
-            "history": getattr(task, "history", [])
-        }
-
-    def canRetry(self, task: AgentTask, method: str) -> bool:
-        """Check if task can be retried"""
-        retryState = self.taskStates[task.id].get("retryState", {})
-        return retryState.get(method, 0) < getattr(task, "retryMax", 3)
-
-class DocumentContext(BaseModel):
-    """Model for document context"""
-    id: str
-    extractionHistory: List[Dict]
-    relevantSections: List[str]
-    processingStatus: Dict[str, str]
-
-class DocumentExtraction:
-    """Processes documents with context awareness"""
-    
-    def process_with_context(self, doc: Dict, context: DocumentContext) -> Dict:
-        """Process document with context"""
-        extracted = {}
-        for section in context.relevantSections:
-            extracted[section] = doc.get(section)
-        return extracted
-
-    def track_extraction(self, doc: Dict, extraction: Dict):
-        """Track document extraction"""
-        if 'extractionHistory' not in doc:
-            doc['extractionHistory'] = []
-        doc['extractionHistory'].append(extraction)
-
-class ErrorRecovery(BaseModel):
-    """Model for error recovery strategies"""
-    strategy: str  # e.g., "retry", "fallback", "skip"
-    fallbackActions: List[str]
-    contextPreservation: bool
-
-### 1.3 Method-Based Module Structure
-```python
-# Example: methodSharepoint.py
-class MethodSharepoint:
-    """SharePoint method implementation"""
-    
-    def __init__(self, service):
-        self.service = service
-        self.name = "sharepoint"
-        self.description = "Search and process SharePoint documents"
-        self.auth_source = AuthSource.MSFT  # Requires Microsoft authentication
-        
-    @property
-    def actions(self) -> Dict[str, Dict[str, Any]]:
-        """Available actions and their parameters"""
-        return {
-            "search": {
-                "description": "Search SharePoint documents",
-                "retryMax": 3,
-                "timeout": 30,
-                "parameters": {
-                    "query": {"type": "string", "required": True},
-                    "site": {"type": "string", "required": False},
-                    "folder": {"type": "string", "required": False},
-                    "maxResults": {"type": "number", "required": False}
-                }
-            }
-        }
-    
-    async def execute(self, action: str, parameters: Dict[str, Any], auth_data: Optional[Dict[str, Any]] = None) -> Dict[str, Any]:
-        """Execute SharePoint method"""
-        if not auth_data:
-            return {"success": False, "error": "Missing Microsoft authentication"}
-            
-        if action == "search":
-            return await self._searchDocuments(parameters, auth_data)
-        return {"success": False, "error": f"Unknown action: {action}"}
-    
-    async def _searchDocuments(self, parameters: Dict[str, Any], auth_data: Dict[str, Any]) -> Dict[str, Any]:
-        """Search SharePoint documents"""
-        # Implementation using existing SharePoint agent functionality
-        pass
-
-# Example: methodOutlook.py
-class MethodOutlook:
-    """Outlook method implementation"""
-    
-    def __init__(self, service):
-        self.service = service
-        self.name = "outlook"
-        self.description = "Handle Outlook email operations"
-        
-    @property
-    def actions(self) -> Dict[str, Dict[str, Any]]:
-        """Available actions and their parameters"""
-        return {
-            "readMails": {
-                "description": "Read emails from specified folder",
-                "retryMax": 2,  # Action-specific retry limit
-                "parameters": {
-                    "folder": {"type": "string", "required": False},
-                    "unreadOnly": {"type": "boolean", "required": False},
-                    "fromAddress": {"type": "string", "required": False},
-                    "maxResults": {"type": "number", "required": False}
-                }
-            },
-            "sendMail": {
-                "description": "Send an email",
-                "retryMax": 1,  # Action-specific retry limit
-                "parameters": {
-                    "to": {"type": "array", "items": "string", "required": True},
-                    "subject": {"type": "string", "required": True},
-                    "body": {"type": "string", "required": True},
-                    "attachments": {"type": "array", "items": "FileRef", "required": False}
-                }
-            }
-        }
-    
-    async def execute(self, action: str, parameters: Dict[str, Any]) -> Dict[str, Any]:
-        """Execute Outlook method"""
-        if action == "readMails":
-            return await self._readMails(parameters)
-        elif action == "sendMail":
-            return await self._sendMail(parameters)
-        return {"success": False, "error": f"Unknown action: {action}"}
-```
-
-### 1.4 Key Data Objects
-```python
-class ChatWorkflow:
-    id: str
-    mandateId: str
-    status: str
-    name: Optional[str]
-    currentRound: int
-    lastActivity: str
-    startedAt: str
-    logs: List[ChatLog]
-    messages: List[ChatMessage]
-    stats: Optional[ChatStat]
-    tasks: List[Task]
-
-class AgentTask:
-    id: str
-    workflowId: str
-    status: str  # pending, success, failed, retry
-    userInput: str  # AI-processed summary
-    dataList: List[Dict[str, str]]  # User connections
-    actionList: List[Dict[str, Any]]  # Actions to execute, e.g.:
-    # [
-    #     {
-    #         "method": "sharepoint",
-    #         "action": "search",
-    #         "parameters": {
-    #             "query": "offerings",
-    #             "site": "valueon"
-    #         },
-    #         "retryCount": 0,
-    #         "retryMax": 3,
-    #         "status": "pending"  # pending, success, failed, retry
-    #     },
-    #     {
-    #         "method": "outlook",
-    #         "action": "sendMail",
-    #         "parameters": {
-    #             "to": ["user@example.com"],
-    #             "subject": "Offer Summary",
-    #             "body": "..."
-    #         },
-    #         "retryCount": 0,
-    #         "retryMax": 1,
-    #         "status": "pending"
-    #     }
-    # ]
-    chatHistory: str  # Summary of previous messages
-    taskHistory: str  # Summary of previous tasks
-    previousTaskFeedback: Optional[str]
-    thisTaskFeedback: Optional[str]
-    result: Optional[ChatMessage]
-    documentsInput: List[Dict]
-    documentsOutput: List[Dict]
-    startedAt: str
-    finishedAt: Optional[str]
-    error: Optional[str]
-    dependencies: List[str] = []     # Task dependencies
-    requiredOutputs: List[str] = []  # Required outputs from dependencies
-```
-
-## 2. Process Flow
-
-### 2.1 Initialization Phase
-```mermaid
-graph TD
-    A[User Input] --> B[WorkflowManager.workflowProcess]
-    B --> C[ChatManager.initialize]
-    C --> D[Create ServiceCenter]
-    D --> E[Create Initial Task]
-```
-
-1. **WorkflowManager.workflowProcess**
-   - Receives user input and workflow
-   - Initializes chat manager
-   - Starts task processing loop
-
-2. **ChatManager.initialize**
-   - Creates ServiceCenter with all required components
-   - Initializes service interfaces
-   - Sets up task and state management
-
-### 2.2 Task Creation Phase
-
-1. **Create Initial Task**
-   ```python
-   def createInitialTask(self, userInput: UserInputRequest) -> AgentTask:
-       # 1. Get available methods and their actions
-       available_methods = self._getAvailableMethods()
-       method_catalog = {
-           method.name: {
-               "description": method.description,
-               "actions": method.actions
-           }
-           for method in available_methods
-       }
-       
-       # 2. Process user input with AI including document analysis
-       processedInput = await self.service.model['callAiBasic'](
-           f"""Analyze user request and documents:
-           User Prompt: {userInput.prompt}
-           Documents: {userInput.listFileId}
-           
-           Available Methods:
-           {json.dumps(method_catalog, indent=2)}
-           
-           Please provide:
-           1. Main objective
-           2. Required actions (using available methods and their actions)
-           3. Required data sources
-           4. Document processing requirements
-           5. Expected output format
-           
-           Format your response as JSON:
-           {{
-               "objective": "string",
-               "actions": [
-                   {{
-                       "method": "string",
-                       "action": "string",
-                       "parameters": {{
-                           "param1": "value1",
-                           "param2": "value2"
-                       }}
-                   }}
-               ],
-               "dataSources": ["string"],
-               "documentRequirements": ["string"],
-               "outputFormat": "string"
-           }}
-           """
-       )
-       
-       # 3. Create task with processed input and initialize action states
-       actions = []
-       for action in processedInput['actions']:
-           method = next(m for m in available_methods if m.name == action['method'])
-           action_info = method.actions[action['action']]
-           actions.append({
-               **action,
-               "retryCount": 0,
-               "retryMax": action_info['retryMax'],
-               "status": "pending"
-           })
-       
-       task = AgentTask(
-           workflowId=self.service.workflow.id,
-           userInput=processedInput,
-           dataList=self.service.context['dataConnections'],
-           actionList=actions,
-           chatHistory=await self.workflowSummarize(userInput),
-           startedAt=datetime.now(UTC).isoformat()
-       )
-       
-       # 4. Store in service
-       self.service.tasks['current'] = task
-       return task
-   ```
-
-### 2.3 Task Execution Phase
-
-1. **Execute Task**
-   ```python
-   async def executeTask(self, task: AgentTask) -> None:
-       """Execute task actions in sequence"""
-       for action in task.actionList:
-           if action['status'] == 'pending':
-               try:
-                   # Get method instance
-                   method = self.service.methods[action['method']]
-                   
-                   # Execute action
-                   result = await method.execute(
-                       action['action'],
-                       action['parameters']
-                   )
-                   
-                   if result['success']:
-                       action['status'] = 'success'
-                   else:
-                       if self._shouldRetry(result['error']):
-                           action['retryCount'] += 1
-                           if action['retryCount'] > action['retryMax']:
-                               action['status'] = 'failed'
-                               task.status = 'failed'
-                               task.error = "Maximum retries exceeded"
-                           else:
-                               action['status'] = 'retry'
-                               task.status = 'retry'
-                       else:
-                           action['status'] = 'failed'
-                           task.status = 'failed'
-                           task.error = result['error']
-                   
-               except Exception as e:
-                   action['status'] = 'failed'
-                   task.status = 'failed'
-                   task.error = str(e)
-                   
-               # Update task status based on action status
-               if action['status'] == 'failed':
-                   break
-               
-       # Mark task as complete if all actions succeeded
-       if all(a['status'] == 'success' for a in task.actionList):
-           task.status = 'success'
-           task.finishedAt = datetime.now(UTC).isoformat()
-   ```
-
-### 2.4 Task Analysis Phase
-
-1. **Define Next Task**
-   ```python
-   def defineNextTask(self, currentTask: AgentTask) -> Optional[AgentTask]:
-       try:
-           # 1. Analyze current task results using basic AI
-           analysis = await self.service.model['callAiBasic'](
-               f"""Analyze task results and determine next steps:
-               Previous Feedback: {currentTask.previousTaskFeedback}
-               Current Feedback: {currentTask.thisTaskFeedback}
-               User Input: {currentTask.userInput}
-               Current Documents: {currentTask.documentsOutput}
-               
-               Please provide:
-               1. Task completion status
-               2. Next required actions
-               3. Required documents
-               4. Method recommendations
-               
-               Format your response as JSON:
-               {{
-                   "isComplete": boolean,
-                   "nextActions": ["string"],
-                   "requiredDocuments": ["string"],
-                   "recommendedMethods": ["string"]
-               }}
-               """
-           )
-           
-           # 2. Parse and validate AI response
-           analysis_data = json.loads(analysis)
-           
-           # 3. Determine if next task needed
-           if not analysis_data["isComplete"]:
-               # 4. Create next task
-               nextTask = self._createNextTask(currentTask, analysis_data)
-               self.service.tasks['previous'] = currentTask
-               self.service.tasks['current'] = nextTask
-               return nextTask
-           
-           return None
-           
-       except Exception as e:
-           logger.error(f"Error defining next task: {str(e)}")
-           return None
-   ```
-
-## 3. Method Integration
-
-### 3.1 Method Registration
-```python
-def _registerMethods(self):
-    """Register available methods in service center"""
-    self.service.methods = {
-        "sharepoint": MethodSharepoint(self.service),
-        "outlook": MethodOutlook(self.service),
-        "web": MethodWeb(self.service),
-        "document": MethodDocument(self.service)
-    }
-```
-
-### 3.2 Method Execution
-```python
-def _executeMethod(self, method: str, parameters: Dict[str, Any]) -> Dict[str, Any]:
-    """Execute a method with parameters"""
-    try:
-        # Get method implementation
-        method_impl = self.service.methods.get(method)
-        if not method_impl:
-            return {"success": False, "error": f"Unknown method: {method}"}
-        
-        # Execute method
-        return await method_impl.execute(parameters)
-        
-    except Exception as e:
-        return {"success": False, "error": str(e)}
-```
-
-## 4. Error Handling
-
-### 4.1 Error Types
-1. **AI Errors**
-   - Model unavailable
-   - Invalid response
-   - Timeout
-
-2. **Method Errors**
-   - Invalid method
-   - Execution failure
-   - Resource unavailable
-
-3. **Task Errors**
-   - Invalid state
-   - Missing data
-   - Timeout
-
-### 4.2 Retry Logic
-```python
-def _shouldRetry(self, error: str) -> bool:
-    """Determine if error is retryable"""
-    retryable_errors = [
-        "AI down",
-        "Document not found",
-        "Content extraction failed"
-    ]
-    return any(err in error for err in retryable_errors)
-
-def _shouldCreateNextTask(self, analysis: Dict[str, Any]) -> bool:
-    """Determine if next task is needed based on AI analysis"""
-    return not analysis.get("isComplete", True)
-```
-
-## 5. AI Integration Points
-
-### 5.1 User Input Processing
-```python
-async def _processUserInput(self, input: str, documents: List[str]) -> str:
-    """Process user input including document analysis"""
-    context = {
-        "task": "Process user input",
-        "document": {"name": "User Input", "type": "text"}
-    }
-    examples = [
-        {"input": "Search documents", "output": "Extract relevant information"}
-    ]
-    prompt = self.service.promptManager.generatePrompt(context, examples)
-    
-    return await self.service.model['callAiBasic'](
-        f"""Analyze user request and documents:
-        User Input: {input}
-        Documents: {documents}
-        
-        {prompt}
-        
-        Please provide:
-        1. Main objective
-        2. Required actions
-        3. Required data sources
-        4. Document processing requirements
-        5. Expected output format
-        
-        Format your response as JSON:
-        {{
-            "objective": "string",
-            "actions": ["string"],
-            "dataSources": ["string"],
-            "documentRequirements": ["string"],
-            "outputFormat": "string"
-        }}
-        """
-    )
-```
-
-### 5.2 Task Analysis
-```python
-async def _analyzeTaskResults(self, task: AgentTask) -> str:
-    """Analyze task results and determine next steps"""
-    context = {
-        "task": "Analyze task results",
-        "document": {"name": "Task Results", "type": "json"}
-    }
-    examples = [
-        {"input": "Task completed", "output": "Generate next steps"}
-    ]
-    prompt = self.service.promptManager.generatePrompt(context, examples)
-    
-    return await self.service.model['callAiBasic'](
-        f"""Analyze task results and determine next steps:
-        Task Input: {task.userInput}
-        Previous Feedback: {task.previousTaskFeedback}
-        Current Feedback: {task.thisTaskFeedback}
-        Current Documents: {task.documentsOutput}
-        
-        {prompt}
-        
-        Please provide:
-        1. Task completion status
-        2. Next required actions
-        3. Required documents
-        4. Method recommendations
-        
-        Format your response as JSON:
-        {{
-            "isComplete": boolean,
-            "nextActions": ["string"],
-            "requiredDocuments": ["string"],
-            "recommendedMethods": ["string"]
-        }}
-        """
-    )
-```
-
-### 5.3 Result Processing
-```python
-async def _processTaskResults(self, task: AgentTask) -> str:
-    """Process task results and generate feedback"""
-    context = {
-        "task": "Process task results",
-        "document": {"name": "Task Results", "type": "json"}
-    }
-    examples = [
-        {"input": "Task results", "output": "Generate summary"}
-    ]
-    prompt = self.service.promptManager.generatePrompt(context, examples)
-    
-    return await self.service.model['callAiBasic'](
-        f"""Process task results and generate feedback:
-        Task Input: {task.userInput}
-        Method Results: {task.result}
-        Generated Documents: {task.documentsOutput}
-        
-        {prompt}
-        
-        Please provide:
-        1. Summary of completed actions
-        2. Generated document descriptions
-        3. Next steps or completion status
-        
-        Format your response as JSON:
-        {{
-            "summary": "string",
-            "documents": ["string"],
-            "nextSteps": ["string"]
-        }}
-        """
-    )
-```
-
-## 6. File Structure and Implementation Plan
-
-### 6.1 File Structure
-```
-gateway/
-├── modules/
-│   ├── workflow/
-│   │   ├── managerWorkflow.py      # Workflow management and state machine
-│   │   ├── managerChat.py          # Chat management and AI response validation
-│   │   ├── managerPrompt.py        # AI prompt generation and management
-│   │   ├── methodBase.py           # Base method class with result validation
-│   │   └── documentExtraction.py    # Document content extraction
-│   │
-│   ├── agents/                     # To be refactored into methods
-│   │   ├── agentSharepoint.py      → methods/methodSharepoint.py
-│   │   ├── agentOutlook.py         → methods/methodOutlook.py
-│   │   ├── agentWebcrawler.py      → methods/methodWeb.py
-│   │   ├── agentDocument.py        → methods/methodDocument.py
-│   │   └── agentCoder.py          → methods/methodCoder.py
-│   │
-│   ├── methods/                    # New directory for method implementations
-│   │   ├── methodSharepoint.py     # SharePoint operations
-│   │   ├── methodOutlook.py        # Outlook operations
-│   │   ├── methodWeb.py           # Web operations
-│   │   ├── methodDocument.py       # Document operations
-│   │   ├── methodCoder.py         # Code generation operations
-│   │   └── methodPowerpoint.py     # PowerPoint operations
-│   │
-│   └── interfaces/
-│       ├── interfaceChatModel.py     # Chat system models and enums
-│       └── interfaceAppModel.py      # Application models including UserConnection
-```
-
-### 6.2 Implementation Plan
-
-#### Phase 1: Core Structure Setup
-1. **File Renaming and Organization**
-   - Rename manager files to follow `manager*.py` pattern
-   - Move document processor to `documentExtraction.py`
-   - Create new `methods` directory
-
-2. **Model Updates**
-   - Update `interfaceChatModel.py` with new enums and models
-   - Integrate `UserConnection` from `interfaceAppModel.py`
-   - Update validation logic in respective modules
-
-#### Phase 2: Method Migration
-1. **Base Method Implementation**
-   - Implement `methodBase.py` with core functionality
-   - Add method result validation
-   - Set up authentication handling
-
-2. **Agent to Method Conversion**
-   - Convert each agent to its method implementation
-   - Migrate functionality while maintaining existing behavior
-   - Add method-specific validation
-
-3. **New Method Implementation**
-   - Implement `methodPowerpoint.py`
-   - Add PowerPoint-specific operations
-   - Integrate with document processing
-
-#### Phase 3: Manager Updates
-1. **Chat Manager Enhancement**
-   - Integrate AI response validation
-   - Update service center structure
-   - Improve error handling
-
-2. **Document Manager Integration**
-   - Update document operations for new method structure
-   - Enhance content extraction capabilities
-   - Improve file handling
-
-3. **Workflow Manager Updates**
-   - Update state machine for method-based approach
-   - Improve task management
-   - Enhance error recovery
-
-#### Phase 4: Testing and Validation
-1. **Unit Testing**
-   - Test each method implementation
-   - Validate error handling
-   - Verify authentication flow
-
-2. **Integration Testing**
-   - Test method interactions
-   - Validate document processing
-   - Verify workflow execution
-
-3. **Performance Testing**
-   - Measure response times
-   - Validate resource usage
-   - Test concurrent operations
-
-#### Phase 5: Documentation and Cleanup
-1. **Documentation**
-   - Update API documentation
-   - Document method implementations
-   - Add usage examples
-
-2. **Code Cleanup**
-   - Remove deprecated code
-   - Clean up old agent files
-   - Optimize imports
-
-3. **Final Review**
-   - Code review
-   - Security audit
-   - Performance optimization
-
-### 6.3 Migration Strategy
-1. **Incremental Migration**
-   - Migrate one agent at a time
-   - Maintain backward compatibility
-   - Use feature flags for gradual rollout
-
-2. **Testing Strategy**
-   - Unit tests for each method
-   - Integration tests for workflows
-   - End-to-end tests for complete scenarios
-
-3. **Rollback Plan**
-   - Keep old agent implementations until stable
-   - Maintain version control
-   - Document rollback procedures
-
-### 6.4 Success Criteria
-1. **Functionality**
-   - All existing features working
-   - New method-based structure operational
-   - Improved error handling
-
-2. **Performance**
-   - Equal or better response times
-   - Reduced resource usage
-   - Improved scalability
-
-3. **Maintainability**
-   - Clear code structure
-   - Comprehensive documentation
-   - Easy to extend
-
-4. **Security**
-   - Proper authentication handling
-   - Secure data processing
-   - Access control implementation
\ No newline at end of file
diff --git a/test_ai_calls.md b/test_ai_calls.md
deleted file mode 100644
index 75ed3310..00000000
--- a/test_ai_calls.md
+++ /dev/null
@@ -1,235 +0,0 @@
-# AI Call Functions Test and Content Size Analysis
-
-## Overview
-This file documents the ServiceCenter AI functions that have risk of delivering too big content,
-along with their usage patterns and potential size issues.
-
-## High-Risk AI Functions
-
-### 1. summarizeChat() -> callAiTextBasic()
-**Location**: gateway/modules/chat/handling/promptFactory.py:122
-**Risk Level**: MEDIUM
-**Content**: Entire workflow message history
-**Usage**:
-```python
-messageSummary = await service.summarizeChat(context.workflow.messages) if context.workflow else ""
-```
-**Potential Issues**:
-- Long conversations can generate very large summaries
-- Includes all previous messages in workflow
-- No size limits or truncation
-
-### 2. callAiTextAdvanced() -> interfaceAiCalls.callAiTextAdvanced()
-**Risk Level**: HIGH
-**Multiple Usage Points**:
-
-#### A. Task Planning (handlingTasks.py:116)
-```python
-prompt = await self.service.callAiTextAdvanced(task_planning_prompt)
-```
-**Content**: User input + document context + connection context + previous results
-**Risk**: VERY HIGH - includes all available documents and context
-
-#### B. Action Definition (handlingTasks.py:388)
-```python
-prompt = await self.service.callAiTextAdvanced(action_prompt)
-```
-**Content**: Task context + available documents + connections + previous results
-**Risk**: HIGH - comprehensive context for action planning
-
-#### C. Result Review (handlingTasks.py:894)
-```python
-response = await self.service.callAiTextAdvanced(prompt)
-```
-**Content**: Action results + success criteria + context
-**Risk**: MEDIUM-HIGH - depends on result size
-
-#### D. Email Composition (methodOutlook.py:1609)
-```python
-composed_email = await self.service.interfaceAiCalls.callAiTextAdvanced(ai_prompt)
-```
-**Content**: Document content + email requirements
-**Risk**: MEDIUM - depends on document size
-
-#### E. AI Processing (methodAi.py:175)
-```python
-result = await self.service.callAiTextAdvanced(enhanced_prompt, context)
-```
-**Content**: User prompt + extracted document content
-**Risk**: HIGH - includes full document content
-
-### 3. callAiTextBasic() -> interfaceAiCalls.callAiTextBasic()
-**Risk Level**: MEDIUM
-**Multiple Usage Points**:
-
-#### A. Document Format Conversion (methodDocument.py:429)
-```python
-formatted_content = await self.service.callAiTextBasic(ai_prompt, content)
-```
-**Content**: Document content + format requirements
-**Risk**: MEDIUM - depends on document size
-
-#### B. HTML Report Generation (methodDocument.py:642)
-```python
-aiReport = await self.service.callAiTextBasic(aiPrompt, combinedContent)
-```
-**Content**: Combined content from multiple documents
-**Risk**: HIGH - combines multiple documents
-
-#### C. AI Processing Fallback (methodAi.py:177)
-```python
-result = await self.service.callAiTextBasic(enhanced_prompt, context)
-```
-**Content**: User prompt + document context
-**Risk**: MEDIUM - includes document content
-
-#### D. Document Content Processing (documentExtraction.py:1459)
-```python
-processedContent = await self._serviceCenter.callAiTextBasic(aiPrompt, contentToProcess)
-```
-**Content**: Document chunks + AI prompt
-**Risk**: MEDIUM - processes document chunks
-
-### 4. extractContentFromDocument() -> documentProcessor.processFileData()
-**Risk Level**: HIGH
-**Multiple Usage Points**:
-
-#### A. Document Content Extraction (methodDocument.py:74)
-```python
-extracted_content = await self.service.extractContentFromDocument(
-    prompt=aiPrompt,
-    document=chatDocument
-)
-```
-**Content**: Full document + extraction prompt
-**Risk**: HIGH - processes entire documents
-
-#### B. HTML Report Generation (methodDocument.py:581)
-```python
-extracted_content = await self.service.extractContentFromDocument(
-    prompt="Extract readable text content for HTML report generation", 
-    document=doc
-)
-```
-**Content**: Full document content
-**Risk**: HIGH - processes documents for reports
-
-#### C. Email Composition (methodOutlook.py:1510)
-```python
-extracted_content = await self.service.extractContentFromDocument(
-    prompt="Extract readable text content for email composition", 
-    document=doc
-)
-```
-**Content**: Full document content
-**Risk**: HIGH - processes documents for emails
-
-#### D. AI Processing (methodAi.py:94)
-```python
-extracted_content = await self.service.extractContentFromDocument(
-    prompt=extraction_prompt.strip(), 
-    document=doc
-)
-```
-**Content**: Full document content
-**Risk**: HIGH - processes documents for AI analysis
-
-## Risk Assessment Summary
-
-### CRITICAL RISK (Immediate Attention Required)
-1. **Task Planning** (handlingTasks.py:116) - Entire workflow context
-2. **Action Definition** (handlingTasks.py:388) - Comprehensive context
-3. **Document Processing** (all extractContentFromDocument calls) - Full documents
-4. **AI Method Processing** (methodAi.py:175) - Document content + context
-5. **Report Generation** (methodDocument.py:642) - Multiple documents combined
-
-### HIGH RISK (Monitor Closely)
-1. **Chat Summarization** (promptFactory.py:122) - Message history
-2. **Document Format Conversion** (methodDocument.py:429) - Single documents
-3. **Email Composition** (methodOutlook.py:1609) - Document content
-
-## Potential Issues
-
-### Content Size Problems
-- Large documents (PDFs, Word docs, Excel files) can exceed AI model limits
-- Combined document content in reports can be massive
-- Long conversation histories in chat summarization
-- Full workflow context in task planning
-
-### Performance Issues
-- Timeout errors for large content
-- Memory issues with large document processing
-- API rate limiting with large requests
-- Cost implications for large AI calls
-
-### Error Scenarios
-- OpenAI API 400 errors (content too large)
-- Timeout errors (processing too slow)
-- Memory exhaustion (large document processing)
-- Incomplete processing (truncated content)
-
-## Recommended Solutions
-
-### 1. Content Size Limits
-- Implement maximum content size checks before AI calls
-- Truncate large content with appropriate warnings
-- Split large documents into chunks
-
-### 2. Content Filtering
-- Remove unnecessary context from prompts
-- Filter out large binary content
-- Use document summaries instead of full content
-
-### 3. Chunking Strategy
-- Process large documents in smaller chunks
-- Implement progressive processing
-- Use streaming for large responses
-
-### 4. Caching and Optimization
-- Cache processed document content
-- Reuse extracted content across operations
-- Implement smart content selection
-
-### 5. Error Handling
-- Graceful degradation for oversized content
-- Fallback strategies for failed AI calls
-- User notifications for content size issues
-
-## Test Scenarios
-
-### Test Case 1: Large Document Processing
-- Upload a 10MB PDF document
-- Try to extract content for AI processing
-- Monitor for size limit errors
-
-### Test Case 2: Multiple Document Reports
-- Upload 5+ large documents
-- Generate HTML report
-- Check for combined content size issues
-
-### Test Case 3: Long Conversation History
-- Create workflow with 50+ messages
-- Test chat summarization
-- Monitor for context size limits
-
-### Test Case 4: Task Planning with Large Context
-- Create workflow with many documents
-- Test task planning functionality
-- Check for prompt size limits
-
-## Monitoring Recommendations
-
-1. **Log Content Sizes**: Track the size of content sent to AI functions
-2. **Monitor API Errors**: Watch for 400 errors indicating content too large
-3. **Performance Metrics**: Track processing times for large content
-4. **User Feedback**: Monitor for incomplete or failed operations
-5. **Cost Tracking**: Monitor AI API costs for large requests
-
-## Implementation Priority
-
-1. **Immediate**: Add content size checks to extractContentFromDocument
-2. **High**: Implement chunking for large document processing
-3. **Medium**: Add content filtering to task planning prompts
-4. **Low**: Implement caching for processed content
-
-This analysis should help identify and mitigate the risks of delivering too big content to AI functions.
diff --git a/test_ai_fallback.py b/test_ai_fallback.py
deleted file mode 100644
index fc320229..00000000
--- a/test_ai_fallback.py
+++ /dev/null
@@ -1,103 +0,0 @@
-#!/usr/bin/env python3
-"""
-Test script to verify AI fallback mechanism from Basic to Advanced when context length is exceeded.
-"""
-
-import asyncio
-import logging
-from modules.interfaces.interfaceAiCalls import AiCalls
-from modules.connectors.connectorAiOpenai import ContextLengthExceededException
-
-# Configure logging
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-
-async def test_context_length_fallback():
-    """Test the fallback mechanism when context length is exceeded"""
-    
-    # Create AI calls instance
-    ai_calls = AiCalls()
-    
-    # Create a very large context that would exceed OpenAI's context limit
-    large_context = "This is a test context. " * 10000  # Create a large context
-    prompt = "Please summarize this context in one sentence."
-    
-    logger.info("Testing AI Basic with large context (should trigger fallback)...")
-    
-    try:
-        # This should trigger the context length exceeded error and fallback to Advanced
-        result = await ai_calls.callAiTextBasic(prompt, large_context)
-        logger.info(f"✅ Fallback successful! Result: {result[:100]}...")
-        return True
-    except Exception as e:
-        logger.error(f"❌ Test failed: {str(e)}")
-        return False
-
-async def test_direct_context_length_exception():
-    """Test that the ContextLengthExceededException is properly raised"""
-    
-    from modules.connectors.connectorAiOpenai import AiOpenai
-    
-    logger.info("Testing direct ContextLengthExceededException...")
-    
-    try:
-        # Create OpenAI connector
-        openai_connector = AiOpenai()
-        
-        # Create messages that would exceed context length
-        large_messages = [
-            {"role": "user", "content": "Test message. " * 50000}  # Very large message
-        ]
-        
-        # This should raise ContextLengthExceededException
-        await openai_connector.callAiBasic(large_messages)
-        logger.error("❌ Expected ContextLengthExceededException but none was raised")
-        return False
-        
-    except ContextLengthExceededException as e:
-        logger.info(f"✅ ContextLengthExceededException properly raised: {str(e)}")
-        return True
-    except Exception as e:
-        logger.error(f"❌ Unexpected exception: {str(e)}")
-        return False
-
-async def main():
-    """Run all tests"""
-    logger.info("Starting AI fallback mechanism tests...")
-    
-    tests = [
-        ("Context Length Fallback", test_context_length_fallback),
-        ("Direct Exception Test", test_direct_context_length_exception),
-    ]
-    
-    results = []
-    for test_name, test_func in tests:
-        logger.info(f"\n--- Running {test_name} ---")
-        try:
-            result = await test_func()
-            results.append((test_name, result))
-        except Exception as e:
-            logger.error(f"Test {test_name} crashed: {str(e)}")
-            results.append((test_name, False))
-    
-    # Summary
-    logger.info("\n" + "="*50)
-    logger.info("TEST SUMMARY")
-    logger.info("="*50)
-    
-    passed = 0
-    for test_name, result in results:
-        status = "✅ PASSED" if result else "❌ FAILED"
-        logger.info(f"{test_name}: {status}")
-        if result:
-            passed += 1
-    
-    logger.info(f"\nTotal: {passed}/{len(results)} tests passed")
-    
-    if passed == len(results):
-        logger.info("🎉 All tests passed! Fallback mechanism is working correctly.")
-    else:
-        logger.warning("⚠️  Some tests failed. Please check the implementation.")
-
-if __name__ == "__main__":
-    asyncio.run(main())
diff --git a/test_documentExtraction.py b/test_documentExtraction.py
deleted file mode 100644
index 25324725..00000000
--- a/test_documentExtraction.py
+++ /dev/null
@@ -1,855 +0,0 @@
-#!/usr/bin/env python3
-"""
-Test script for DocumentExtraction class.
-Processes all files in d:/temp folder and stores extracted content in d:/temp/extracted.
-
-Features:
-- Option to extract content WITH AI processing (default)
-- Option to extract content WITHOUT AI processing (content-only mode)
-- Supports all document types: text, images, PDFs, Office documents, etc.
-- Detailed logging and progress tracking
-- Separate output directories for AI vs content-only modes
-
-Usage:
-- Interactive mode: python test_documentExtraction.py
-- Content-only mode: python test_documentExtraction.py --no-ai
-- Content-only mode: python test_documentExtraction.py --content-only
-- Specify custom input/output: python test_documentExtraction.py --input-dir /path/to/input --output-dir /path/to/output --no-ai
-"""
-
-import os
-import asyncio
-import logging
-import sys
-import argparse
-from pathlib import Path
-from typing import List, Optional
-from datetime import datetime, UTC
-
-# Configure logging
-logging.basicConfig(
-    level=logging.DEBUG,  # Changed from INFO to DEBUG
-    format='%(asctime)s - %(levelname)s - %(message)s'
-)
-logger = logging.getLogger(__name__)
-
-# Filter out specific unwanted log messages
-class LogFilter(logging.Filter):
-    """Filter to hide specific unwanted log messages."""
-    
-    def filter(self, record):
-        # Hide workflow stats update errors
-        if "Workflow" in record.getMessage() and "not found for stats update" in record.getMessage():
-            return False
-        
-        # Hide HTTP request info messages
-        if "HTTP Request:" in record.getMessage() and "POST https://api.openai.com" in record.getMessage():
-            return False
-        
-        # Hide HTTP response info messages
-        if "HTTP/1.1 200 OK" in record.getMessage():
-            return False
-        
-        return True
-
-# Apply the filter to the root logger
-root_logger = logging.getLogger()
-root_logger.addFilter(LogFilter())
-
-def check_dependencies():
-    """Check if required dependencies are available and provide installation instructions."""
-    missing_deps = []
-    
-    # Check for required dependencies
-    try:
-        import bs4
-        logger.info("beautifulsoup4 is available")
-    except ImportError:
-        missing_deps.append("beautifulsoup4")
-        logger.error("beautifulsoup4 is missing")
-    
-    try:
-        import PyPDF2
-        logger.info("PyPDF2 is available")
-    except ImportError:
-        missing_deps.append("PyPDF2")
-        logger.error("PyPDF2 is missing")
-    
-    try:
-        import fitz
-        logger.info("PyMuPDF (fitz) is available")
-    except ImportError:
-        missing_deps.append("PyMuPDF")
-        logger.error("PyMuPDF (fitz) is missing")
-    
-    try:
-        import docx
-        logger.info("python-docx is available")
-    except ImportError:
-        missing_deps.append("python-docx")
-        logger.error("python-docx is missing")
-    
-    try:
-        import openpyxl
-        logger.info("openpyxl is available")
-    except ImportError:
-        missing_deps.append("openpyxl")
-        logger.error("openpyxl is missing")
-    
-    try:
-        import pptx
-        logger.info("python-pptx is available")
-    except ImportError:
-        missing_deps.append("python-pptx")
-        logger.error("python-pptx is missing")
-    
-    try:
-        from PIL import Image
-        logger.info("Pillow (PIL) is available")
-    except ImportError:
-        missing_deps.append("Pillow")
-        logger.error("Pillow (PIL) is missing")
-    
-    if missing_deps:
-        logger.error("\n" + "="*60)
-        logger.error("MISSING DEPENDENCIES DETECTED!")
-        logger.error("="*60)
-        logger.error("The following packages are required but not installed:")
-        for dep in missing_deps:
-            logger.error(f"  - {dep}")
-        logger.error("\nTo install all dependencies, run:")
-        logger.error("pip install -r requirements.txt")
-        logger.error("\nOr install individual packages:")
-        for dep in missing_deps:
-            if dep == "beautifulsoup4":
-                logger.error(f"  pip install {dep}")
-            elif dep == "PyMuPDF":
-                logger.error(f"  pip install {dep}")
-            elif dep == "Pillow":
-                logger.error(f"  pip install {dep}")
-            else:
-                logger.error(f"  pip install {dep}")
-        logger.error("="*60)
-        return False
-    
-    logger.info("All required dependencies are available!")
-    return True
-
-def check_module_imports():
-    """Check if we can import the required modules."""
-    try:
-        # Add the gateway directory to the path so we can import our modules
-        sys.path.append(os.path.join(os.path.dirname(__file__), '..', '..', '..'))
-        
-        from modules.chat.documents.documentExtraction import DocumentExtraction
-        from modules.chat.serviceCenter import ServiceCenter
-        from modules.interfaces.interfaceAppModel import User, UserConnection
-        from modules.interfaces.interfaceChatModel import ChatWorkflow, TaskItem
-        
-        logger.info("All required modules imported successfully")
-        return True
-    except ImportError as e:
-        logger.error(f"Failed to import required modules: {e}")
-        logger.error("Make sure you're running this script from the gateway directory")
-        return False
-    except Exception as e:
-        logger.error(f"Unexpected error importing modules: {e}")
-        return False
-
-def create_mock_service_center():
-    """Create a proper ServiceCenter for testing purposes with all required fields."""
-    try:
-        from modules.chat.serviceCenter import ServiceCenter
-        from modules.interfaces.interfaceAppModel import User, UserPrivilege, AuthAuthority
-        from modules.interfaces.interfaceChatModel import ChatWorkflow, TaskItem, TaskStatus
-        from modules.interfaces.interfaceChatModel import ChatLog, ChatMessage, ChatStat
-        
-        # Create proper user with all required fields
-        mock_user = User(
-            id="test_user_001",
-            username="testuser",
-            email="test@example.com",
-            fullName="Test User",
-            language="en",
-            enabled=True,
-            privilege=UserPrivilege.USER,
-            authenticationAuthority=AuthAuthority.LOCAL,
-            mandateId="test_mandate_001"
-        )
-        
-        # Create proper workflow with all required fields
-        current_time = datetime.now(UTC).isoformat()
-        mock_workflow = ChatWorkflow(
-            id="test_workflow_001",
-            mandateId="test_mandate_001",
-            status="active",
-            name="Test Document Extraction Workflow",
-            currentRound=1,
-            lastActivity=current_time,
-            startedAt=current_time,
-            logs=[],
-            messages=[],
-            stats=None,
-            tasks=[]
-        )
-        
-        # Create service center
-        service_center = ServiceCenter(mock_user, mock_workflow)
-        logger.info("ServiceCenter created successfully with proper objects")
-        return service_center
-        
-    except Exception as e:
-        logger.error(f"Failed to create ServiceCenter: {e}")
-        return None
-
-class DocumentExtractionTester:
-    """Test class for DocumentExtraction functionality."""
-    
-    def __init__(self, input_dir: str = "d:/temp/test-extraction", output_dir: str = None, enable_ai: bool = True):
-        """
-        Initialize the tester.
-        
-        Args:
-            input_dir: Directory containing files to process
-            output_dir: Directory to store extracted content (auto-generated if None)
-            enable_ai: Whether to enable AI processing (default: True)
-        """
-        self.input_dir = Path(input_dir)
-        
-        # Auto-generate output directory if not specified
-        if output_dir is None:
-            if enable_ai:
-                self.output_dir = Path(input_dir) / "extracted"
-            else:
-                self.output_dir = Path(input_dir) / "extracted-raw"
-        else:
-            self.output_dir = Path(output_dir)
-            
-        self.extractor = None
-        self.service_center = None
-        self.enable_ai = enable_ai
-        
-        if enable_ai:
-            self.prompt = "Make a summary of each sentence for each page or chapter of the document"
-        else:
-            self.prompt = None  # No prompt needed for content-only extraction
-        
-        # Track processing results for summary
-        self.processing_results = []
-        
-        # Ensure output directory exists
-        logger.info(f"Creating output directory: {self.output_dir}")
-        self.output_dir.mkdir(parents=True, exist_ok=True)
-        
-        # Verify directory was created
-        if self.output_dir.exists():
-            logger.info(f"Output directory created/verified: {self.output_dir}")
-            logger.info(f"Output directory absolute path: {self.output_dir.absolute()}")
-        else:
-            logger.error(f"Failed to create output directory: {self.output_dir}")
-        
-        # Log configuration
-        logger.info(f"Configuration: AI processing = {'ENABLED' if self.enable_ai else 'DISABLED'}")
-        logger.info(f"Input directory: {self.input_dir}")
-        logger.info(f"Output directory: {self.output_dir}")
-        
-        # Test basic file writing capability
-        test_file = self.output_dir / "test_write_capability.txt"
-        try:
-            logger.info(f"Testing file write capability to: {test_file}")
-            logger.info(f"Absolute path: {test_file.absolute()}")
-            
-            with open(test_file, 'w', encoding='utf-8') as f:
-                f.write("Test file to verify write capability")
-            
-            if test_file.exists():
-                actual_size = test_file.stat().st_size
-                logger.info(f"Basic file writing test passed: {test_file} (size: {actual_size} bytes)")
-                
-                # Test reading the file back
-                with open(test_file, 'r', encoding='utf-8') as f:
-                    content = f.read()
-                logger.info(f"File read test passed: content length = {len(content)}")
-                
-                # Clean up test file
-                test_file.unlink()
-                logger.info("Test file cleaned up")
-            else:
-                logger.error(f"Basic file writing test failed: {test_file}")
-        except Exception as e:
-            logger.error(f"Basic file writing test failed with error: {e}")
-            import traceback
-            traceback.print_exc()
-        
-        # Supported file extensions for content extraction
-        self.supported_extensions = {
-            # Text and data files
-            '.txt', '.csv', '.json', '.xml', '.html', '.htm', '.svg',
-            '.md', '.markdown', '.rst', '.log', '.ini', '.cfg', '.conf',
-            
-            # Programming languages
-            '.js', '.ts', '.jsx', '.tsx', '.py', '.java', '.c', '.cpp', '.cc', '.cxx',
-            '.h', '.hpp', '.cs', '.php', '.rb', '.go', '.rs', '.swift', '.kt', '.scala',
-            '.r', '.m', '.pl', '.sh', '.bash', '.zsh', '.fish', '.ps1', '.bat', '.cmd',
-            '.vbs', '.lua', '.sql', '.r', '.dart', '.elm', '.clj', '.hs', '.fs', '.ml',
-            
-            # Web technologies
-            '.css', '.scss', '.sass', '.less', '.vue', '.svelte', '.astro',
-            
-            # Configuration and build files
-            '.yaml', '.yml', '.toml', '.env', '.gitignore', '.dockerfile', '.dockerignore',
-            '.makefile', '.cmake', '.gradle', '.maven', '.pom', '.sln', '.vcxproj',
-            '.csproj', '.fsproj', '.vbproj', '.xcodeproj', '.pbxproj',
-            
-            # Documentation and markup
-            '.tex', '.bib', '.adoc', '.asciidoc', '.wiki', '.creole',
-            
-            # Images
-            '.jpg', '.jpeg', '.png', '.gif', '.webp', '.bmp', '.tiff', '.ico',
-            
-            # Documents
-            '.pdf', '.docx', '.xlsx', '.pptx', '.odt', '.ods', '.odp',
-            
-            # Legacy Office formats
-            '.doc', '.xls', '.ppt',
-            
-            # Archives and binaries
-            '.zip', '.tar', '.gz', '.7z', '.rar', '.exe', '.dll', '.so', '.dylib'
-        }
-    
-    def initialize_extractor(self):
-        """Initialize the DocumentExtraction instance with a proper ServiceCenter."""
-        try:
-            # First create the service center
-            self.service_center = create_mock_service_center()
-            if not self.service_center:
-                logger.error("Failed to create ServiceCenter!")
-                return False
-            
-            # Now create DocumentExtraction with the service center
-            from modules.chat.documents.documentExtraction import DocumentExtraction
-            self.extractor = DocumentExtraction(self.service_center)
-            logger.info("DocumentExtraction initialized successfully with ServiceCenter")
-            return True
-        except Exception as e:
-            logger.error(f"Failed to initialize DocumentExtraction: {e}")
-            return False
-    
-    def get_files_to_process(self) -> List[Path]:
-        """Get list of files to process from input directory."""
-        if not self.input_dir.exists():
-            logger.error(f"Input directory {self.input_dir} does not exist!")
-            logger.info("Creating input directory and adding a test file...")
-            self.input_dir.mkdir(parents=True, exist_ok=True)
-            
-            # Create a test file if none exist
-            test_file = self.input_dir / "test.txt"
-            with open(test_file, 'w') as f:
-                f.write("This is a test file for document extraction.\nIt contains multiple lines.\nAnd some special characters: äöüß")
-            logger.info(f"Created test file: {test_file}")
-        
-        files = []
-        all_files = list(self.input_dir.iterdir())
-        logger.info(f"All files in directory: {[f.name for f in all_files]}")
-        
-        for file_path in all_files:
-            if file_path.is_file():
-                logger.debug(f"Checking file: {file_path.name} (extension: {file_path.suffix})")
-                if file_path.suffix.lower() in self.supported_extensions:
-                    files.append(file_path)
-                    logger.debug(f"Added file: {file_path.name}")
-                else:
-                    logger.debug(f"Skipped file: {file_path.name} (unsupported extension)")
-        
-        logger.info(f"Found {len(files)} supported files to process")
-        if files:
-            logger.info(f"Files to process: {[f.name for f in files]}")
-        return files
-    
-    async def process_single_file(self, file_path: Path) -> bool:
-        """
-        Process a single file and extract its content.
-        
-        Args:
-            file_path: Path to the file to process
-            
-        Returns:
-            True if successful, False otherwise
-        """
-        if not self.extractor:
-            logger.error("DocumentExtraction not initialized!")
-            return False
-            
-        try:
-            logger.info(f"Processing file: {file_path.name}")
-            
-            # Read file data
-            with open(file_path, 'rb') as f:
-                file_data = f.read()
-            
-            logger.debug(f"File size: {len(file_data)} bytes")
-            
-            # Determine MIME type based on extension
-            mime_type = self._get_mime_type(file_path.suffix)
-            logger.debug(f"MIME type: {mime_type}")
-            
-            # Process the file with or without AI based on configuration
-            extracted_content = await self.extractor.processFileData(
-                fileData=file_data,
-                fileName=file_path.name,
-                mimeType=mime_type,
-                base64Encoded=False,
-                prompt=self.prompt,
-                enableAI=self.enable_ai
-            )
-            
-            logger.debug(f"Extracted {len(extracted_content.contents)} content items")
-            
-            # Debug: Show content details
-            for i, content_item in enumerate(extracted_content.contents):
-                logger.debug(f"Content item {i+1}: label='{content_item.label}', has_data={content_item.data is not None}, data_length={len(content_item.data) if content_item.data else 0}")
-            
-            # Special logging for JavaScript files
-            if mime_type == "application/javascript":
-                logger.debug(f"JavaScript file detected: {file_path.name}")
-                logger.debug(f"Original file size: {len(file_data)} bytes")
-                for i, content_item in enumerate(extracted_content.contents):
-                    if content_item.data:
-                        content_size = len(content_item.data.encode('utf-8'))
-                        logger.debug(f"JavaScript content item {i+1}: {content_size} bytes")
-                        # Check if content was truncated
-                        if content_size < len(file_data) * 0.9:  # If less than 90% of original
-                            logger.warning(f"JavaScript content may be truncated: {content_size} bytes vs {len(file_data)} bytes original")
-            
-            # Track processing result
-            result = {
-                'fileName': file_path.name,
-                'status': 'OK',
-                'content_items': 0,
-                'output_files': [],
-                'total_content_size': 0
-            }
-            
-            # Save each content item as a separate file
-            if extracted_content.contents:
-                for i, content_item in enumerate(extracted_content.contents):
-                    if content_item.data:
-                        content_size = len(content_item.data.encode('utf-8'))
-                        result['total_content_size'] += content_size
-                        logger.debug(f"Content item {i+1}: {content_item.label}, size: {content_size} bytes")
-                        
-                        # Generate fileName with new naming convention
-                        if len(extracted_content.contents) == 1:
-                            # Single content item
-                            output_fileName = f"{file_path.stem} - {content_item.label} 1.txt"
-                        else:
-                            # Multiple content items - add sequence number
-                            output_fileName = f"{file_path.stem} - {content_item.label} {i+1}.txt"
-                        
-                        output_file = self.output_dir / output_fileName
-                        
-                        # Write only the raw extracted content
-                        logger.debug(f"Attempting to write to: {output_file}")
-                        try:
-                            with open(output_file, 'w', encoding='utf-8') as f:
-                                f.write(content_item.data)
-                            
-                            # Verify file was created
-                            if output_file.exists():
-                                actual_size = output_file.stat().st_size
-                                logger.info(f"File created successfully: {output_fileName} (expected: {content_size} bytes, actual: {actual_size} bytes)")
-                            else:
-                                logger.error(f"File was not created: {output_file}")
-                            
-                            result['output_files'].append(output_fileName)
-                            result['content_items'] += 1
-                        except Exception as write_error:
-                            logger.error(f"Error writing file {output_fileName}: {write_error}")
-                            import traceback
-                            traceback.print_exc()
-                    else:
-                        logger.warning(f"Content item {i+1} has no data, skipping")
-            else:
-                logger.warning(f"No content extracted from {file_path.name}")
-                result['status'] = 'FAIL'
-                result['error'] = 'No content extracted'
-            
-            # Add result to tracking list
-            self.processing_results.append(result)
-            
-            logger.info(f"Successfully processed {file_path.name} - Total content: {result['total_content_size']} bytes")
-            return True
-            
-        except Exception as e:
-            error_msg = str(e)
-            logger.error(f"Error processing {file_path.name}: {error_msg}")
-            
-            # Track failed result
-            result = {
-                'fileName': file_path.name,
-                'status': 'FAIL',
-                'content_items': 0,
-                'output_files': [],
-                'error': error_msg,
-                'total_content_size': 0
-            }
-            self.processing_results.append(result)
-            
-            return False
-    
-    def _get_mime_type(self, extension: str) -> str:
-        """Get MIME type based on file extension."""
-        mime_types = {
-            # Text and data files
-            '.txt': 'text/plain',
-            '.csv': 'text/csv',
-            '.json': 'application/json',
-            '.xml': 'application/xml',
-            '.html': 'text/html',
-            '.htm': 'text/html',
-            '.svg': 'image/svg+xml',
-            '.md': 'text/markdown',
-            '.markdown': 'text/markdown',
-            '.rst': 'text/x-rst',
-            '.log': 'text/plain',
-            '.ini': 'text/plain',
-            '.cfg': 'text/plain',
-            '.conf': 'text/plain',
-            
-            # Programming languages
-            '.js': 'application/javascript',
-            '.ts': 'application/typescript',
-            '.jsx': 'text/jsx',
-            '.tsx': 'text/tsx',
-            '.py': 'text/x-python',
-            '.java': 'text/x-java-source',
-            '.c': 'text/x-c',
-            '.cpp': 'text/x-c++src',
-            '.cc': 'text/x-c++src',
-            '.cxx': 'text/x-c++src',
-            '.h': 'text/x-c',
-            '.hpp': 'text/x-c++hdr',
-            '.cs': 'text/x-csharp',
-            '.php': 'application/x-httpd-php',
-            '.rb': 'text/x-ruby',
-            '.go': 'text/x-go',
-            '.rs': 'text/x-rust',
-            '.swift': 'text/x-swift',
-            '.kt': 'text/x-kotlin',
-            '.scala': 'text/x-scala',
-            '.r': 'text/x-r',
-            '.m': 'text/x-matlab',
-            '.pl': 'text/x-perl',
-            '.sh': 'application/x-sh',
-            '.bash': 'application/x-sh',
-            '.zsh': 'application/x-sh',
-            '.fish': 'application/x-sh',
-            '.ps1': 'application/x-powershell',
-            '.bat': 'application/x-msdos-program',
-            '.cmd': 'application/x-msdos-program',
-            '.vbs': 'text/vbscript',
-            '.lua': 'text/x-lua',
-            '.sql': 'application/sql',
-            '.dart': 'application/dart',
-            '.elm': 'text/x-elm',
-            '.clj': 'text/x-clojure',
-            '.hs': 'text/x-haskell',
-            '.fs': 'text/x-fsharp',
-            '.ml': 'text/x-ocaml',
-            
-            # Web technologies
-            '.css': 'text/css',
-            '.scss': 'text/x-scss',
-            '.sass': 'text/x-sass',
-            '.less': 'text/x-less',
-            '.vue': 'text/x-vue',
-            '.svelte': 'text/x-svelte',
-            '.astro': 'text/x-astro',
-            
-            # Configuration and build files
-            '.yaml': 'application/x-yaml',
-            '.yml': 'application/x-yaml',
-            '.toml': 'application/toml',
-            '.env': 'text/plain',
-            '.gitignore': 'text/plain',
-            '.dockerfile': 'text/x-dockerfile',
-            '.dockerignore': 'text/plain',
-            '.makefile': 'text/x-makefile',
-            '.cmake': 'text/x-cmake',
-            '.gradle': 'text/x-gradle',
-            '.maven': 'text/x-maven',
-            '.pom': 'application/xml',
-            '.sln': 'text/plain',
-            '.vcxproj': 'application/xml',
-            '.csproj': 'application/xml',
-            '.fsproj': 'application/xml',
-            '.vbproj': 'application/xml',
-            '.xcodeproj': 'text/plain',
-            '.pbxproj': 'text/plain',
-            
-            # Documentation and markup
-            '.tex': 'application/x-tex',
-            '.bib': 'text/x-bibtex',
-            '.adoc': 'text/asciidoc',
-            '.asciidoc': 'text/asciidoc',
-            '.wiki': 'text/x-wiki',
-            '.creole': 'text/x-wiki',
-            
-            # Images
-            '.jpg': 'image/jpeg',
-            '.jpeg': 'image/jpeg',
-            '.png': 'image/png',
-            '.gif': 'image/gif',
-            '.webp': 'image/webp',
-            '.bmp': 'image/bmp',
-            '.tiff': 'image/tiff',
-            '.ico': 'image/x-icon',
-            
-            # Documents
-            '.pdf': 'application/pdf',
-            '.docx': 'application/vnd.openxmlformats-officedocument.wordprocessingml.document',
-            '.xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
-            '.pptx': 'application/vnd.openxmlformats-officedocument.presentationml.presentation',
-            '.odt': 'application/vnd.oasis.opendocument.text',
-            '.ods': 'application/vnd.oasis.opendocument.spreadsheet',
-            '.odp': 'application/vnd.oasis.opendocument.presentation',
-            
-            # Legacy Office formats
-            '.doc': 'application/msword',
-            '.xls': 'application/vnd.ms-excel',
-            '.ppt': 'application/vnd.ms-powerpoint',
-            
-            # Archives and binaries (will be processed as binary)
-            '.zip': 'application/zip',
-            '.tar': 'application/x-tar',
-            '.gz': 'application/gzip',
-            '.7z': 'application/x-7z-compressed',
-            '.rar': 'application/vnd.rar',
-            '.exe': 'application/x-msdownload',
-            '.dll': 'application/x-msdownload',
-            '.so': 'application/x-sharedlib',
-            '.dylib': 'application/x-mach-binary'
-        }
-        return mime_types.get(extension.lower(), 'application/octet-stream')
-    
-    async def run_tests(self) -> None:
-        """Run the document extraction tests on all files."""
-        mode = "WITH AI" if self.enable_ai else "CONTENT ONLY (No AI)"
-        logger.info(f"Starting document extraction tests - {mode}")
-        logger.info(f"Input directory: {self.input_dir}")
-        logger.info(f"Output directory: {self.output_dir}")
-        if self.enable_ai:
-            logger.info(f"Processing prompt: {self.prompt}")
-        else:
-            logger.info("AI processing: DISABLED - Raw content extraction only")
-        
-        # Initialize the extractor
-        if not self.initialize_extractor():
-            logger.error("Cannot proceed without DocumentExtraction!")
-            return
-        
-        # Get files to process
-        files = self.get_files_to_process()
-        
-        if not files:
-            logger.warning("No files found to process!")
-            return
-        
-        # Process each file
-        successful = 0
-        failed = 0
-        
-        logger.info(f"Starting to process {len(files)} files...")
-        for i, file_path in enumerate(files):
-            logger.info(f"Processing file {i+1}/{len(files)}: {file_path.name}")
-            try:
-                if await self.process_single_file(file_path):
-                    successful += 1
-                    logger.info(f"File {i+1} processed successfully")
-                else:
-                    failed += 1
-                    logger.error(f"File {i+1} processing failed")
-            except Exception as e:
-                failed += 1
-                logger.error(f"Exception processing file {i+1}: {e}")
-                import traceback
-                traceback.print_exc()
-        
-        # Print detailed summary
-        mode = "WITH AI" if self.enable_ai else "CONTENT ONLY (No AI)"
-        logger.info("\n" + "=" * 80)
-        logger.info(f"DETAILED TEST SUMMARY - {mode}")
-        logger.info("=" * 80)
-        logger.info(f"Total files processed: {len(files)}")
-        logger.info(f"Successful: {successful}")
-        logger.info(f"Failed: {failed}")
-        logger.info(f"Output directory: {self.output_dir}")
-        if self.enable_ai:
-            logger.info("AI processing: ENABLED")
-        else:
-            logger.info("AI processing: DISABLED")
-        logger.info("=" * 80)
-        
-        # List all processed documents with results
-        logger.info("\nPROCESSING RESULTS:")
-        logger.info("-" * 80)
-        
-        for result in self.processing_results:
-            status_icon = "✅" if result['status'] == 'OK' else "❌"
-            logger.info(f"{status_icon} {result['fileName']} - {result['status']}")
-            
-            if result['status'] == 'OK':
-                if result['content_items'] == 1:
-                    logger.info(f"   └─ Generated: {result['output_files'][0]} ({result['total_content_size']} bytes)")
-                else:
-                    logger.info(f"   └─ Generated {result['content_items']} files ({result['total_content_size']} total bytes):")
-                    for output_file in result['output_files']:
-                        logger.info(f"      └─ {output_file}")
-            else:
-                error_msg = result.get('error', 'Unknown error')
-                logger.info(f"   └─ Error: {error_msg}")
-        
-        logger.info("-" * 80)
-        logger.info("=" * 80)
-
-def parse_arguments():
-    """Parse command line arguments."""
-    parser = argparse.ArgumentParser(description='Document Extraction Test Script')
-    parser.add_argument('--no-ai', '--content-only', action='store_true', 
-                       help='Run in content-only mode without AI processing')
-    parser.add_argument('--input-dir', type=str, default='d:/temp/test-extraction',
-                       help='Input directory containing files to process (default: d:/temp/test-extraction)')
-    parser.add_argument('--output-dir', type=str, 
-                       help='Output directory for extracted content (auto-generated if not specified)')
-    parser.add_argument('--verbose', '-v', action='store_true',
-                       help='Enable verbose logging')
-    
-    return parser.parse_args()
-
-async def main():
-    """Main function to run the tests."""
-    # Parse command line arguments
-    args = parse_arguments()
-    
-    # Set logging level based on verbosity
-    if args.verbose:
-        logging.getLogger().setLevel(logging.DEBUG)
-    else:
-        logging.getLogger().setLevel(logging.INFO)
-    
-    logger.info("DocumentExtraction Test Script")
-    logger.info("=" * 50)
-    logger.info(f"Source: {args.input_dir}")
-    
-    # Determine output directory
-    if args.output_dir:
-        output_dir = args.output_dir
-    else:
-        if args.no_ai:
-            output_dir = f"{args.input_dir}/extracted-raw"
-        else:
-            output_dir = f"{args.input_dir}/extracted"
-    
-    logger.info(f"Output: {output_dir}")
-    logger.info("=" * 50)
-    
-    # Check dependencies first
-    if not check_dependencies():
-        logger.error("Please install missing dependencies before running tests.")
-        return
-    
-    # Check module imports
-    if not check_module_imports():
-        logger.error("Cannot import required modules. Please check your setup.")
-        return
-    
-    # Determine mode based on command line arguments
-    if args.no_ai:
-        enable_ai = False
-        logger.info("Running in CONTENT ONLY mode (no AI processing)")
-    else:
-        # Interactive mode: ask user for choice
-        print("\n" + "=" * 50)
-        print("SELECT EXTRACTION MODE:")
-        print("=" * 50)
-        print("1. With AI processing (default)")
-        print("2. Content only (no AI processing)")
-        print("=" * 50)
-        
-        try:
-            choice = input("Enter your choice (1 or 2, default is 1): ").strip()
-            if choice == "2":
-                enable_ai = False
-                output_dir = f"{args.input_dir}/extracted-raw"
-                logger.info("Selected: Content only mode (no AI processing)")
-            else:
-                enable_ai = True
-                output_dir = f"{args.input_dir}/extracted"
-                logger.info("Selected: AI processing mode")
-        except (EOFError, KeyboardInterrupt):
-            # Default to AI mode if input fails
-            enable_ai = True
-            output_dir = f"{args.input_dir}/extracted"
-            logger.info("Defaulting to AI processing mode")
-    
-    # Run tests with selected mode
-    tester = DocumentExtractionTester(
-        input_dir=args.input_dir,
-        output_dir=output_dir,
-        enable_ai=enable_ai
-    )
-    await tester.run_tests()
-
-if __name__ == "__main__":
-    # Check if command line arguments are provided for automated testing
-    if len(sys.argv) > 1:
-        # Parse arguments and run directly
-        asyncio.run(main())
-    else:
-        # Interactive mode: ask user for choice
-        asyncio.run(main())
-
-# Convenience function for easy content-only extraction
-async def extract_documents_content_only(input_folder: str, output_folder: str = None):
-    """
-    Convenience function to extract documents without AI processing.
-    
-    Args:
-        input_folder: Path to folder containing documents to extract
-        output_folder: Path to folder where extracted content will be stored (optional)
-    
-    Example:
-        # Extract from d:/temp to d:/temp/extracted-raw
-        asyncio.run(extract_documents_content_only("d:/temp"))
-        
-        # Extract from custom folders
-        asyncio.run(extract_documents_content_only("c:/my_docs", "c:/my_docs/extracted"))
-    """
-    if output_folder is None:
-        output_folder = f"{input_folder}/extracted-raw"
-    
-    logger.info(f"Running content-only extraction from {input_folder} to {output_folder}")
-    
-    # Check dependencies and imports
-    if not check_dependencies():
-        logger.error("Missing dependencies. Please install required packages.")
-        return False
-    
-    if not check_module_imports():
-        logger.error("Cannot import required modules. Please check your setup.")
-        return False
-    
-    # Create tester and run
-    tester = DocumentExtractionTester(
-        input_dir=input_folder,
-        output_dir=output_folder,
-        enable_ai=False
-    )
-    
-    await tester.run_tests()
-    return True
-
-# Example usage (uncomment to use):
-# if __name__ == "__main__":
-#     # For content-only extraction from d:/temp to d:/temp/extracted-raw
-#     asyncio.run(extract_documents_content_only("d:/temp"))
diff --git a/test_excel_processing.py b/test_excel_processing.py
deleted file mode 100644
index 3e39b324..00000000
--- a/test_excel_processing.py
+++ /dev/null
@@ -1,189 +0,0 @@
-#!/usr/bin/env python3
-"""
-Simple test script for enhanced Excel processing functionality.
-This script tests the DocumentExtraction class with Excel files.
-"""
-
-import os
-import sys
-import asyncio
-import logging
-from pathlib import Path
-
-# Configure logging
-logging.basicConfig(
-    level=logging.DEBUG,
-    format='%(asctime)s - %(levelname)s - %(message)s'
-)
-logger = logging.getLogger(__name__)
-
-# Add the gateway directory to the path
-sys.path.append(os.path.join(os.path.dirname(__file__), '..', '..', '..'))
-
-async def test_excel_processing():
-    """Test Excel processing functionality."""
-    try:
-        # Import required modules
-        from modules.chat.documents.documentExtraction import DocumentExtraction
-        from modules.chat.serviceCenter import ServiceCenter
-        from modules.interfaces.interfaceAppModel import User, UserPrivilege, AuthAuthority
-        from modules.interfaces.interfaceChatModel import ChatWorkflow
-        from datetime import datetime, UTC
-        
-        logger.info("Testing Excel processing functionality...")
-        
-        # Create mock service center
-        mock_user = User(
-            id="test_user_001",
-            username="testuser",
-            email="test@example.com",
-            fullName="Test User",
-            language="en",
-            enabled=True,
-            privilege=UserPrivilege.USER,
-            authenticationAuthority=AuthAuthority.LOCAL,
-            mandateId="test_mandate_001"
-        )
-        
-        current_time = datetime.now(UTC).isoformat()
-        mock_workflow = ChatWorkflow(
-            id="test_workflow_001",
-            mandateId="test_mandate_001",
-            status="active",
-            name="Test Excel Processing Workflow",
-            currentRound=1,
-            lastActivity=current_time,
-            startedAt=current_time,
-            logs=[],
-            messages=[],
-            stats=None,
-            tasks=[]
-        )
-        
-        service_center = ServiceCenter(mock_user, mock_workflow)
-        logger.info("ServiceCenter created successfully")
-        
-        # Create DocumentExtraction instance
-        extractor = DocumentExtraction(service_center)
-        logger.info("DocumentExtraction created successfully")
-        
-        # Test with a sample Excel file if available
-        test_file_path = "d:/temp/test-extraction/test.xlsx"
-        
-        if os.path.exists(test_file_path):
-            logger.info(f"Found test file: {test_file_path}")
-            
-            # Read the file
-            with open(test_file_path, 'rb') as f:
-                file_data = f.read()
-            
-            logger.info(f"File size: {len(file_data)} bytes")
-            
-            # Process the Excel file
-            logger.info("Processing Excel file...")
-            result = await extractor.processFileData(
-                fileData=file_data,
-                fileName="test.xlsx",
-                mimeType="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-                base64Encoded=False,
-                prompt=None,
-                enableAI=False
-            )
-            
-            logger.info(f"Excel processing completed successfully!")
-            logger.info(f"Generated {len(result.contents)} content items:")
-            
-            for i, content_item in enumerate(result.contents):
-                logger.info(f"  Item {i+1}: {content_item.label}")
-                logger.info(f"    MIME type: {content_item.metadata.mimeType}")
-                logger.info(f"    Size: {content_item.metadata.size} bytes")
-                if content_item.data:
-                    logger.info(f"    Data preview: {content_item.data[:100]}...")
-                else:
-                    logger.info(f"    Data: None")
-            
-        else:
-            logger.info("No test Excel file found. Creating a simple test...")
-            
-            # Test the openpyxl library directly
-            try:
-                import openpyxl
-                from openpyxl import Workbook
-                
-                # Create a test workbook
-                wb = Workbook()
-                ws = wb.active
-                ws.title = "Test Sheet"
-                
-                # Add some test data
-                ws['A1'] = "Name"
-                ws['B1'] = "Age"
-                ws['C1'] = "City"
-                ws['A2'] = "John Doe"
-                ws['B2'] = 30
-                ws['C2'] = "New York"
-                ws['A3'] = "Jane Smith"
-                ws['B3'] = 25
-                ws['C3'] = "Los Angeles"
-                
-                # Test properties
-                wb.properties.title = "Test Workbook"
-                wb.properties.creator = "Test User"
-                wb.properties.subject = "Test Subject"
-                
-                logger.info("Test workbook created successfully")
-                logger.info(f"  Title: {wb.properties.title}")
-                logger.info(f"  Creator: {wb.properties.creator}")
-                logger.info(f"  Subject: {wb.properties.subject}")
-                logger.info(f"  Sheets: {wb.sheetnames}")
-                
-                # Test the DocumentExtraction with this workbook
-                from io import BytesIO
-                
-                # Save to bytes
-                buffer = BytesIO()
-                wb.save(buffer)
-                buffer.seek(0)
-                file_data = buffer.getvalue()
-                
-                logger.info(f"Test workbook size: {len(file_data)} bytes")
-                
-                # Process with DocumentExtraction
-                result = await extractor.processFileData(
-                    fileData=file_data,
-                    fileName="test_workbook.xlsx",
-                    mimeType="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
-                    base64Encoded=False,
-                    prompt=None,
-                    enableAI=False
-                )
-                
-                logger.info(f"Test workbook processing completed successfully!")
-                logger.info(f"Generated {len(result.contents)} content items:")
-                
-                for i, content_item in enumerate(result.contents):
-                    logger.info(f"  Item {i+1}: {content_item.label}")
-                    logger.info(f"    MIME type: {content_item.metadata.mimeType}")
-                    logger.info(f"    Size: {content_item.metadata.size} bytes")
-                    if content_item.data:
-                        logger.info(f"    Data preview: {content_item.data[:200]}...")
-                    else:
-                        logger.info(f"    Data: None")
-                
-            except ImportError as e:
-                logger.error(f"openpyxl not available: {e}")
-            except Exception as e:
-                logger.error(f"Error testing Excel functionality: {e}")
-        
-        logger.info("Excel processing test completed!")
-        
-    except ImportError as e:
-        logger.error(f"Failed to import required modules: {e}")
-        logger.error("Make sure you're running this script from the gateway directory")
-    except Exception as e:
-        logger.error(f"Unexpected error: {e}")
-        import traceback
-        traceback.print_exc()
-
-if __name__ == "__main__":
-    asyncio.run(test_excel_processing())
diff --git a/test_methodWeb.py b/test_methodWeb.py
deleted file mode 100644
index a4578418..00000000
--- a/test_methodWeb.py
+++ /dev/null
@@ -1,658 +0,0 @@
-#!/usr/bin/env python3
-"""
-Test script for MethodWeb class.
-Tests all web actions: search, crawl, and scrape with various parameter sets.
-
-Features:
-- Tests web search functionality with different queries
-- Tests web crawling with URL lists
-- Tests web scraping (search + crawl combined)
-- Detailed logging and progress tracking
-- Error handling and validation testing
-- Configuration validation
-
-Usage:
-- Interactive mode: python test_methodWeb.py
-- Automated mode: python test_methodWeb.py --auto
-- Verbose mode: python test_methodWeb.py --verbose
-"""
-
-import os
-import asyncio
-import logging
-import sys
-import argparse
-import json
-from pathlib import Path
-from typing import List, Optional, Dict, Any
-from datetime import datetime, UTC
-
-# Configure logging
-logging.basicConfig(
-    level=logging.INFO,
-    format='%(asctime)s - %(levelname)s - %(message)s'
-)
-logger = logging.getLogger(__name__)
-
-# Filter out specific unwanted log messages
-class LogFilter(logging.Filter):
-    """Filter to hide specific unwanted log messages."""
-    
-    def filter(self, record):
-        # Hide HTTP request info messages
-        if "HTTP Request:" in record.getMessage() and "POST https://api.tavily.com" in record.getMessage():
-            return False
-        
-        # Hide HTTP response info messages
-        if "HTTP/1.1 200 OK" in record.getMessage():
-            return False
-        
-        return True
-
-# Apply the filter to the root logger
-root_logger = logging.getLogger()
-root_logger.addFilter(LogFilter())
-
-def check_dependencies():
-    """Check if required dependencies are available."""
-    missing_deps = []
-    
-    # Check for required dependencies
-    try:
-        import tavily
-        logger.info("tavily-python is available")
-    except ImportError:
-        missing_deps.append("tavily-python")
-        logger.error("tavily-python is missing")
-    
-    try:
-        import httpx
-        logger.info("httpx is available")
-    except ImportError:
-        missing_deps.append("httpx")
-        logger.error("httpx is missing")
-    
-    if missing_deps:
-        logger.error("\n" + "="*60)
-        logger.error("MISSING DEPENDENCIES DETECTED!")
-        logger.error("="*60)
-        logger.error("The following packages are required but not installed:")
-        for dep in missing_deps:
-            logger.error(f"  - {dep}")
-        logger.error("\nTo install all dependencies, run:")
-        logger.error("pip install -r requirements.txt")
-        logger.error("="*60)
-        return False
-    
-    logger.info("All required dependencies are available!")
-    return True
-
-def check_module_imports():
-    """Check if we can import the required modules."""
-    try:
-        # Add the gateway directory to the path so we can import our modules
-        sys.path.append(os.path.join(os.path.dirname(__file__), '..', '..', '..'))
-        
-        from modules.methods.methodWeb import MethodWeb
-        from modules.chat.serviceCenter import ServiceCenter
-        from modules.interfaces.interfaceAppModel import User, UserConnection, UserPrivilege, AuthAuthority
-        from modules.interfaces.interfaceChatModel import ChatWorkflow, TaskItem, TaskStatus
-        from modules.shared.configuration import APP_CONFIG
-        
-        logger.info("All required modules imported successfully")
-        return True
-    except ImportError as e:
-        logger.error(f"Failed to import required modules: {e}")
-        logger.error("Make sure you're running this script from the gateway directory")
-        return False
-    except Exception as e:
-        logger.error(f"Unexpected error importing modules: {e}")
-        return False
-
-def check_configuration():
-    """Check if required configuration is available."""
-    try:
-        from modules.shared.configuration import APP_CONFIG
-        
-        # Check Tavily API key
-        tavily_api_key = APP_CONFIG.get("Connector_WebTavily_API_KEY")
-        if not tavily_api_key or tavily_api_key == "your_tavily_api_key_here":
-            logger.error("Tavily API key not configured!")
-            logger.error("Please set Connector_WebTavily_API_KEY in config.ini")
-            return False
-        
-        logger.info("Tavily API key is configured")
-        
-        # Check other web configuration
-        web_configs = [
-            "Web_Search_MAX_QUERY_LENGTH",
-            "Web_Search_MAX_RESULTS", 
-            "Web_Search_MIN_RESULTS",
-            "Web_Crawl_TIMEOUT",
-            "Web_Crawl_MAX_RETRIES",
-            "Web_Crawl_RETRY_DELAY"
-        ]
-        
-        for config_key in web_configs:
-            value = APP_CONFIG.get(config_key)
-            if value:
-                logger.info(f"Configuration {config_key}: {value}")
-            else:
-                logger.warning(f"Configuration {config_key} not set, using default")
-        
-        return True
-        
-    except Exception as e:
-        logger.error(f"Failed to check configuration: {e}")
-        return False
-
-def create_mock_service_center():
-    """Create a proper ServiceCenter for testing purposes."""
-    try:
-        from modules.chat.serviceCenter import ServiceCenter
-        from modules.interfaces.interfaceAppModel import User, UserPrivilege, AuthAuthority
-        from modules.interfaces.interfaceChatModel import ChatWorkflow, TaskItem, TaskStatus
-        from modules.interfaces.interfaceChatModel import ChatLog, ChatMessage, ChatStat
-        
-        # Create proper user with all required fields
-        mock_user = User(
-            id="test_user_web_001",
-            username="testuser_web",
-            email="testweb@example.com",
-            fullName="Test Web User",
-            language="en",
-            enabled=True,
-            privilege=UserPrivilege.USER,
-            authenticationAuthority=AuthAuthority.LOCAL,
-            mandateId="test_mandate_web_001"
-        )
-        
-        # Create proper workflow with all required fields
-        current_time = datetime.now(UTC).timestamp()
-        mock_workflow = ChatWorkflow(
-            id="test_workflow_web_001",
-            mandateId="test_mandate_web_001",
-            status="active",
-            name="Test Web Method Workflow",
-            currentRound=1,
-            lastActivity=current_time,
-            startedAt=current_time,
-            logs=[],
-            messages=[],
-            stats=None,
-            tasks=[]
-        )
-        
-        # Create service center
-        service_center = ServiceCenter(mock_user, mock_workflow)
-        logger.info("ServiceCenter created successfully for web testing")
-        return service_center
-        
-    except Exception as e:
-        logger.error(f"Failed to create ServiceCenter: {e}")
-        return None
-
-class MethodWebTester:
-    """Test class for MethodWeb functionality."""
-    
-    def __init__(self):
-        """Initialize the tester."""
-        self.method_web = None
-        self.service_center = None
-        
-        # Test results tracking
-        self.test_results = []
-        
-        # Test parameter sets
-        self.test_queries = [
-            "Python programming tutorial",
-            "FastAPI documentation",
-            "machine learning basics",
-            "web scraping best practices"
-        ]
-        
-        self.test_urls = [
-            "https://docs.python.org/3/tutorial/",
-            "https://fastapi.tiangolo.com/",
-            "https://scikit-learn.org/stable/",
-            "https://requests.readthedocs.io/en/latest/"
-        ]
-    
-    def initialize_method_web(self):
-        """Initialize the MethodWeb instance with a proper ServiceCenter."""
-        try:
-            # First create the service center
-            self.service_center = create_mock_service_center()
-            if not self.service_center:
-                logger.error("Failed to create ServiceCenter!")
-                return False
-            
-            # Now create MethodWeb with the service center
-            from modules.methods.methodWeb import MethodWeb
-            self.method_web = MethodWeb(self.service_center)
-            logger.info("MethodWeb initialized successfully with ServiceCenter")
-            return True
-        except Exception as e:
-            logger.error(f"Failed to initialize MethodWeb: {e}")
-            return False
-    
-    async def test_search_action(self, query: str, max_results: int = 5) -> Dict[str, Any]:
-        """Test the search action with given parameters."""
-        logger.info(f"Testing search action with query: '{query}', max_results: {max_results}")
-        
-        try:
-            parameters = {
-                "query": query,
-                "maxResults": max_results
-            }
-            
-            result = await self.method_web.search(parameters)
-            
-            test_result = {
-                "action": "search",
-                "query": query,
-                "max_results": max_results,
-                "success": result.success,
-                "error": result.error if not result.success else None,
-                "documents_count": len(result.documents) if result.documents else 0,
-                "result_label": result.resultLabel if hasattr(result, 'resultLabel') else None
-            }
-            
-            if result.success:
-                logger.info(f"✅ Search successful: {test_result['documents_count']} documents returned")
-                if result.documents:
-                    for i, doc in enumerate(result.documents):
-                        logger.info(f"   Document {i+1}: {doc.documentName}")
-                        if hasattr(doc, 'documentData') and hasattr(doc.documentData, 'results'):
-                            logger.info(f"   Results count: {len(doc.documentData.results)}")
-            else:
-                logger.error(f"❌ Search failed: {result.error}")
-            
-            return test_result
-            
-        except Exception as e:
-            error_msg = str(e)
-            logger.error(f"❌ Search action exception: {error_msg}")
-            return {
-                "action": "search",
-                "query": query,
-                "max_results": max_results,
-                "success": False,
-                "error": f"Exception: {error_msg}",
-                "documents_count": 0,
-                "result_label": None
-            }
-    
-    async def test_crawl_action(self, urls: List[str]) -> Dict[str, Any]:
-        """Test the crawl action with given URLs."""
-        logger.info(f"Testing crawl action with {len(urls)} URLs")
-        
-        try:
-            # Monkeypatch the service to return a mock document and file data
-            class _MockDoc:
-                def __init__(self, fileId: str, fileName: str = "mock_search_results.json"):
-                    self.fileId = fileId
-                    self.fileName = fileName
-
-            def _mock_get_docs(_doc_ids):
-                return [_MockDoc(fileId="mock_file_id", fileName="mock_search_results.json")]
-
-            # Build minimal JSON structure expected by methodWeb.crawl
-            mock_payload = {
-                "documentData": {
-                    "results": [{"url": u} for u in urls]
-                }
-            }
-
-            def _mock_get_file_data(_file_id):
-                return json.dumps(mock_payload).encode("utf-8")
-
-            # Apply monkeypatches to the method's service
-            self.method_web.service.getChatDocumentsFromDocumentList = _mock_get_docs
-            self.method_web.service.getFileData = _mock_get_file_data
-
-            # Use any string as the document list reference; service is mocked
-            parameters = {"documentList": "mock_document_list_ref"}
-            
-            result = await self.method_web.crawl(parameters)
-            
-            test_result = {
-                "action": "crawl",
-                "urls_count": len(urls),
-                "success": result.success,
-                "error": result.error if not result.success else None,
-                "documents_count": len(result.documents) if result.documents else 0,
-                "result_label": result.resultLabel if hasattr(result, 'resultLabel') else None
-            }
-            
-            if result.success:
-                logger.info(f"✅ Crawl successful: {test_result['documents_count']} documents returned")
-                if result.documents:
-                    for i, doc in enumerate(result.documents):
-                        logger.info(f"   Document {i+1}: {doc.documentName}")
-            else:
-                logger.error(f"❌ Crawl failed: {result.error}")
-            
-            return test_result
-            
-        except Exception as e:
-            error_msg = str(e)
-            logger.error(f"❌ Crawl action exception: {error_msg}")
-            return {
-                "action": "crawl",
-                "urls_count": len(urls),
-                "success": False,
-                "error": f"Exception: {error_msg}",
-                "documents_count": 0,
-                "result_label": None
-            }
-    
-    async def test_scrape_action(self, query: str, max_results: int = 3) -> Dict[str, Any]:
-        """Test the scrape action (search + crawl combined) with given parameters."""
-        logger.info(f"Testing scrape action with query: '{query}', max_results: {max_results}")
-        
-        try:
-            parameters = {
-                "query": query,
-                "maxResults": max_results
-            }
-            
-            result = await self.method_web.scrape(parameters)
-            
-            test_result = {
-                "action": "scrape",
-                "query": query,
-                "max_results": max_results,
-                "success": result.success,
-                "error": result.error if not result.success else None,
-                "documents_count": len(result.documents) if result.documents else 0,
-                "result_label": result.resultLabel if hasattr(result, 'resultLabel') else None
-            }
-            
-            if result.success:
-                logger.info(f"✅ Scrape successful: {test_result['documents_count']} documents returned")
-                if result.documents:
-                    for i, doc in enumerate(result.documents):
-                        logger.info(f"   Document {i+1}: {doc.documentName}")
-                        if hasattr(doc, 'documentData') and hasattr(doc.documentData, 'results'):
-                            logger.info(f"   Results count: {len(doc.documentData.results)}")
-            else:
-                logger.error(f"❌ Scrape failed: {result.error}")
-            
-            return test_result
-            
-        except Exception as e:
-            error_msg = str(e)
-            logger.error(f"❌ Scrape action exception: {error_msg}")
-            return {
-                "action": "scrape",
-                "query": query,
-                "max_results": max_results,
-                "success": False,
-                "error": f"Exception: {error_msg}",
-                "documents_count": 0,
-                "result_label": None
-            }
-    
-    async def test_parameter_validation(self) -> List[Dict[str, Any]]:
-        """Test parameter validation with invalid inputs."""
-        logger.info("Testing parameter validation with invalid inputs")
-        
-        validation_tests = []
-        
-        # Test 1: Empty query
-        logger.info("Test 1: Empty query")
-        result = await self.test_search_action("", 5)
-        # For validation tests, we expect the request to fail with validation error
-        if not result["success"] and "validation error" in result.get("error", "").lower():
-            result["success"] = True  # Mark as successful validation test
-            result["validation_test"] = True
-            result["expected_behavior"] = "Correctly rejected empty query"
-            logger.info("✅ Validation test PASSED: Empty query correctly rejected")
-        validation_tests.append(result)
-        
-        # Test 2: Query too long (over 400 characters)
-        long_query = "a" * 500
-        logger.info("Test 2: Query too long")
-        result = await self.test_search_action(long_query, 5)
-        if not result["success"] and "validation error" in result.get("error", "").lower():
-            result["success"] = True  # Mark as successful validation test
-            result["validation_test"] = True
-            result["expected_behavior"] = "Correctly rejected overly long query"
-            logger.info("✅ Validation test PASSED: Long query correctly rejected")
-        validation_tests.append(result)
-        
-        # Test 3: Max results too high
-        logger.info("Test 3: Max results too high")
-        result = await self.test_search_action("test", 25)
-        if not result["success"] and "validation error" in result.get("error", "").lower():
-            result["success"] = True  # Mark as successful validation test
-            result["validation_test"] = True
-            result["expected_behavior"] = "Correctly rejected excessive max results"
-            logger.info("✅ Validation test PASSED: High max results correctly rejected")
-        validation_tests.append(result)
-        
-        # Test 4: Max results too low
-        logger.info("Test 4: Max results too low")
-        result = await self.test_search_action("test", 0)
-        if not result["success"] and "validation error" in result.get("error", "").lower():
-            result["success"] = True  # Mark as successful validation test
-            result["validation_test"] = True
-            result["expected_behavior"] = "Correctly rejected zero max results"
-            logger.info("✅ Validation test PASSED: Zero max results correctly rejected")
-        validation_tests.append(result)
-        
-        return validation_tests
-    
-    async def run_all_tests(self) -> None:
-        """Run all web method tests."""
-        logger.info("Starting MethodWeb comprehensive tests")
-        logger.info("=" * 60)
-        
-        # Initialize the method
-        if not self.initialize_method_web():
-            logger.error("Cannot proceed without MethodWeb!")
-            return
-        
-        # Test 1: Search actions with different queries
-        logger.info("\n" + "=" * 60)
-        logger.info("TEST 1: SEARCH ACTIONS")
-        logger.info("=" * 60)
-        
-        for i, query in enumerate(self.test_queries):
-            logger.info(f"\nSearch test {i+1}/{len(self.test_queries)}")
-            result = await self.test_search_action(query, 3)
-            self.test_results.append(result)
-            await asyncio.sleep(1)  # Rate limiting
-        
-        # Test 2: Scrape actions (search + crawl combined)
-        logger.info("\n" + "=" * 60)
-        logger.info("TEST 2: SCRAPE ACTIONS")
-        logger.info("=" * 60)
-        
-        scrape_queries = self.test_queries[:2]  # Use first 2 queries for scraping
-        for i, query in enumerate(scrape_queries):
-            logger.info(f"\nScrape test {i+1}/{len(scrape_queries)}")
-            result = await self.test_scrape_action(query, 2)
-            self.test_results.append(result)
-            await asyncio.sleep(2)  # Rate limiting for scraping
-        
-        # Test 3: Parameter validation
-        logger.info("\n" + "=" * 60)
-        logger.info("TEST 3: PARAMETER VALIDATION")
-        logger.info("=" * 60)
-        
-        validation_results = await self.test_parameter_validation()
-        self.test_results.extend(validation_results)
-        
-        # Test 4: Crawl action (if we have search results)
-        logger.info("\n" + "=" * 60)
-        logger.info("TEST 4: CRAWL ACTIONS")
-        logger.info("=" * 60)
-        
-        logger.info("Testing crawl with sample URLs")
-        result = await self.test_crawl_action(self.test_urls[:2])
-        self.test_results.append(result)
-        
-        # Print comprehensive summary
-        self.print_test_summary()
-    
-    def print_test_summary(self):
-        """Print comprehensive test summary."""
-        logger.info("\n" + "=" * 80)
-        logger.info("COMPREHENSIVE TEST SUMMARY")
-        logger.info("=" * 80)
-        
-        total_tests = len(self.test_results)
-        successful_tests = sum(1 for result in self.test_results if result["success"])
-        failed_tests = total_tests - successful_tests
-        
-        logger.info(f"Total tests run: {total_tests}")
-        logger.info(f"Successful: {successful_tests}")
-        logger.info(f"Failed: {failed_tests}")
-        logger.info(f"Success rate: {(successful_tests/total_tests)*100:.1f}%")
-        
-        # Group results by action type
-        action_groups = {}
-        for result in self.test_results:
-            action = result["action"]
-            if action not in action_groups:
-                action_groups[action] = []
-            action_groups[action].append(result)
-        
-        logger.info("\n" + "-" * 80)
-        logger.info("RESULTS BY ACTION TYPE:")
-        logger.info("-" * 80)
-        
-        for action, results in action_groups.items():
-            action_successful = sum(1 for r in results if r["success"])
-            action_total = len(results)
-            logger.info(f"\n{action.upper()} ACTIONS:")
-            logger.info(f"  Total: {action_total}, Successful: {action_successful}, Failed: {action_total - action_successful}")
-            
-            for i, result in enumerate(results):
-                status_icon = "✅" if result["success"] else "❌"
-                
-                # Handle validation tests specially
-                if result.get("validation_test", False):
-                    logger.info(f"  {status_icon} Validation Test {i+1}: {result.get('expected_behavior', 'Validation working correctly')}")
-                    if result.get("error"):
-                        logger.info(f"      Validation Error: {result['error']}")
-                elif action == "search":
-                    logger.info(f"  {status_icon} Test {i+1}: '{result['query']}' -> {result['documents_count']} docs")
-                elif action == "scrape":
-                    logger.info(f"  {status_icon} Test {i+1}: '{result['query']}' -> {result['documents_count']} docs")
-                elif action == "crawl":
-                    logger.info(f"  {status_icon} Test {i+1}: {result['urls_count']} URLs -> {result['documents_count']} docs")
-                
-                if not result["success"] and not result.get("validation_test", False):
-                    logger.info(f"      Error: {result['error']}")
-        
-        logger.info("\n" + "-" * 80)
-        logger.info("CONFIGURATION STATUS:")
-        logger.info("-" * 80)
-        
-        try:
-            from modules.shared.configuration import APP_CONFIG
-            tavily_key = APP_CONFIG.get("Connector_WebTavily_API_KEY")
-            if tavily_key and tavily_key != "your_tavily_api_key_here":
-                logger.info("✅ Tavily API key: Configured")
-            else:
-                logger.info("❌ Tavily API key: Not configured")
-            
-            web_configs = [
-                ("Web_Search_MAX_QUERY_LENGTH", "400"),
-                ("Web_Search_MAX_RESULTS", "20"),
-                ("Web_Search_MIN_RESULTS", "1"),
-                ("Web_Crawl_TIMEOUT", "30"),
-                ("Web_Crawl_MAX_RETRIES", "3"),
-                ("Web_Crawl_RETRY_DELAY", "2")
-            ]
-            
-            for config_key, default_value in web_configs:
-                value = APP_CONFIG.get(config_key, default_value)
-                logger.info(f"✅ {config_key}: {value}")
-                
-        except Exception as e:
-            logger.error(f"❌ Configuration check failed: {e}")
-        
-        logger.info("=" * 80)
-
-def parse_arguments():
-    """Parse command line arguments."""
-    parser = argparse.ArgumentParser(description='MethodWeb Test Script')
-    parser.add_argument('--auto', action='store_true', 
-                       help='Run tests automatically without user interaction')
-    parser.add_argument('--verbose', '-v', action='store_true',
-                       help='Enable verbose logging')
-    parser.add_argument('--quick', action='store_true',
-                       help='Run quick tests with fewer queries')
-    
-    return parser.parse_args()
-
-async def main():
-    """Main function to run the tests."""
-    # Parse command line arguments
-    args = parse_arguments()
-    
-    # Set logging level based on verbosity
-    if args.verbose:
-        logging.getLogger().setLevel(logging.DEBUG)
-    else:
-        logging.getLogger().setLevel(logging.INFO)
-    
-    logger.info("MethodWeb Test Script")
-    logger.info("=" * 50)
-    
-    # Check dependencies first
-    if not check_dependencies():
-        logger.error("Please install missing dependencies before running tests.")
-        return
-    
-    # Check module imports
-    if not check_module_imports():
-        logger.error("Cannot import required modules. Please check your setup.")
-        return
-    
-    # Check configuration
-    if not check_configuration():
-        logger.error("Configuration check failed. Please check your config.ini file.")
-        return
-    
-    # Determine test mode
-    if args.auto:
-        logger.info("Running in automated mode")
-    else:
-        # Interactive mode: ask user for confirmation
-        print("\n" + "=" * 50)
-        print("METHODWEB TEST SCRIPT")
-        print("=" * 50)
-        print("This script will test the MethodWeb functionality including:")
-        print("- Web search actions")
-        print("- Web scraping actions") 
-        print("- Web crawling actions")
-        print("- Parameter validation")
-        print("=" * 50)
-        
-        try:
-            choice = input("Do you want to proceed? (y/N): ").strip().lower()
-            if choice not in ['y', 'yes']:
-                logger.info("Test cancelled by user")
-                return
-        except (EOFError, KeyboardInterrupt):
-            logger.info("Test cancelled by user")
-            return
-    
-    # Create tester and run tests
-    tester = MethodWebTester()
-    
-    # Modify test queries for quick mode
-    if args.quick:
-        tester.test_queries = tester.test_queries[:2]  # Use only first 2 queries
-        logger.info("Running in quick mode with reduced test set")
-    
-    await tester.run_all_tests()
-
-if __name__ == "__main__":
-    # Run the tests
-    asyncio.run(main())
diff --git a/test_outlook_filters.py b/test_outlook_filters.py
deleted file mode 100644
index 4a7c0a8b..00000000
--- a/test_outlook_filters.py
+++ /dev/null
@@ -1,51 +0,0 @@
-#!/usr/bin/env python3
-"""
-Test script for Outlook filter logic
-"""
-
-def test_build_graph_filter():
-    """Test the filter building logic"""
-    
-    # Mock the _buildGraphFilter method
-    def _buildGraphFilter(filter_text):
-        if not filter_text:
-            return {}
-            
-        filter_text = filter_text.strip()
-        
-        # Handle email address filters
-        if '@' in filter_text and '.' in filter_text and ' ' not in filter_text:
-            return {"$filter": f"from/fromAddress/address eq '{filter_text}'"}
-        
-        # Handle search queries (from:, to:, subject:, etc.)
-        if any(filter_text.startswith(prefix) for prefix in ['from:', 'to:', 'subject:', 'received:', 'hasattachment:']):
-            return {"$search": f'"{filter_text}"'}
-        
-        # Handle text content - search in subject
-        return {"$filter": f"contains(subject,'{filter_text}')"}
-    
-    # Test cases
-    test_cases = [
-        ("peter.muster@domain.com", {"$filter": "from/fromAddress/address eq 'peter.muster@domain.com'"}),
-        ("from:user@example.com", {"$search": '"from:user@example.com"'}),
-        ("subject:meeting", {"$search": '"subject:meeting"'}),
-        ("project update", {"$filter": "contains(subject,'project update')"}),
-        ("", {}),
-        ("  hello world  ", {"$filter": "contains(subject,'hello world')"}),
-    ]
-    
-    print("Testing Outlook filter logic:")
-    print("=" * 50)
-    
-    for test_input, expected_output in test_cases:
-        result = _buildGraphFilter(test_input)
-        status = "✓ PASS" if result == expected_output else "✗ FAIL"
-        print(f"{status} | Input: '{test_input}'")
-        print(f"      | Expected: {expected_output}")
-        print(f"      | Got:      {result}")
-        print()
-    
-    print("Test completed!")
-
-if __name__ == "__main__":
-    test_build_graph_filter()
diff --git a/test_outlook_filters_fixed.py b/test_outlook_filters_fixed.py
deleted file mode 100644
index ef9663f3..00000000
--- a/test_outlook_filters_fixed.py
+++ /dev/null
@@ -1,70 +0,0 @@
-#!/usr/bin/env python3
-"""
-Test script for fixed Outlook filter logic
-"""
-
-def test_build_graph_filter():
-    """Test the corrected filter building logic"""
-    
-    # Mock the corrected _buildGraphFilter method
-    def _buildGraphFilter(filter_text):
-        if not filter_text:
-            return {}
-            
-        filter_text = filter_text.strip()
-        
-        # Handle search queries (from:, to:, subject:, etc.) - check this FIRST
-        if any(filter_text.startswith(prefix) for prefix in ['from:', 'to:', 'subject:', 'received:', 'hasattachment:']):
-            return {"$search": f'"{filter_text}"'}
-        
-        # Handle email address filters (only if it's NOT a search query)
-        if '@' in filter_text and '.' in filter_text and ' ' not in filter_text and not filter_text.startswith('from:'):
-            return {"$filter": f"from/fromAddress/address eq '{filter_text}'"}
-        
-        # Handle text content - search in subject
-        return {"$filter": f"contains(subject,'{filter_text}')"}
-    
-    # Test cases
-    test_cases = [
-        ("peter.muster@domain.com", {"$filter": "from/fromAddress/address eq 'peter.muster@domain.com'"}),
-        ("from:user@example.com", {"$search": '"from:user@example.com"'}),
-        ("subject:meeting", {"$search": '"subject:meeting"'}),
-        ("project update", {"$filter": "contains(subject,'project update')"}),
-        ("", {}),
-        ("  hello world  ", {"$filter": "contains(subject,'hello world')"}),
-        # Additional edge cases
-        ("to:manager@company.com", {"$search": '"to:manager@company.com"'}),
-        ("received:today", {"$search": '"received:today"'}),
-        ("hasattachment:true", {"$search": '"hasattachment:true"'}),
-        ("user@domain.com", {"$filter": "from/fromAddress/address eq 'user@domain.com'"}),
-        ("from:user@domain.com subject:budget", {"$search": '"from:user@domain.com subject:budget"'}),
-    ]
-    
-    print("Testing FIXED Outlook filter logic:")
-    print("=" * 50)
-    
-    passed = 0
-    failed = 0
-    
-    for test_input, expected_output in test_cases:
-        result = _buildGraphFilter(test_input)
-        status = "✓ PASS" if result == expected_output else "✗ FAIL"
-        if result == expected_output:
-            passed += 1
-        else:
-            failed += 1
-            
-        print(f"{status} | Input: '{test_input}'")
-        print(f"      | Expected: {expected_output}")
-        print(f"      | Got:      {result}")
-        print()
-    
-    print(f"Test completed! {passed} passed, {failed} failed")
-    
-    if failed == 0:
-        print("🎉 All tests passed!")
-    else:
-        print("❌ Some tests failed. Please check the logic.")
-
-if __name__ == "__main__":
-    test_build_graph_filter()
diff --git a/test_pydantic_compat.py b/test_pydantic_compat.py
deleted file mode 100644
index be25ab8a..00000000
--- a/test_pydantic_compat.py
+++ /dev/null
@@ -1,100 +0,0 @@
-#!/usr/bin/env python3
-"""
-Test script for Pydantic compatibility module.
-This script tests the version-aware functionality for both Pydantic v1 and v2.
-"""
-
-import sys
-import os
-
-# Add the modules directory to the path
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), 'modules'))
-
-def test_compatibility_module():
-    """Test the Pydantic compatibility module"""
-    try:
-        from shared.pydanticCompat import (
-            PYDANTIC_VERSION, 
-            create_private_field, 
-            create_model_config,
-            model_to_dict,
-            model_from_dict,
-            get_version_info
-        )
-        
-        print(f"✅ Successfully imported Pydantic compatibility module")
-        print(f"📊 Pydantic version detected: {PYDANTIC_VERSION}")
-        
-        # Test version info
-        version_info = get_version_info()
-        print(f"🔍 Version info: {version_info}")
-        
-        # Test field creation
-        private_field = create_private_field(default="test")
-        print(f"✅ Private field created: {type(private_field)}")
-        
-        # Test model config
-        config = create_model_config(validate_assignment=True)
-        print(f"✅ Model config created: {type(config)}")
-        
-        return True
-        
-    except Exception as e:
-        print(f"❌ Error testing compatibility module: {e}")
-        return False
-
-def test_chat_document_model():
-    """Test the ChatDocument model with compatibility"""
-    try:
-        from interfaces.interfaceChatModel import ChatDocument
-        
-        print(f"✅ Successfully imported ChatDocument model")
-        
-        # Test creating a document
-        doc = ChatDocument(fileId="test-file-123")
-        print(f"✅ ChatDocument created: {doc.id}")
-        
-        # Test setting component interface
-        doc.setComponentInterface("mock_interface")
-        print(f"✅ Component interface set")
-        
-        # Test serialization
-        doc_dict = doc.to_dict()
-        print(f"✅ Document serialized: {doc_dict}")
-        
-        # Test validation
-        is_valid = doc.validate_component_interface()
-        print(f"✅ Component interface validation: {is_valid}")
-        
-        return True
-        
-    except Exception as e:
-        print(f"❌ Error testing ChatDocument model: {e}")
-        import traceback
-        traceback.print_exc()
-        return False
-
-def main():
-    """Main test function"""
-    print("🧪 Testing Pydantic Compatibility Module")
-    print("=" * 50)
-    
-    # Test compatibility module
-    compat_ok = test_compatibility_module()
-    print()
-    
-    # Test ChatDocument model
-    model_ok = test_chat_document_model()
-    print()
-    
-    # Summary
-    print("=" * 50)
-    if compat_ok and model_ok:
-        print("🎉 All tests passed! Pydantic compatibility is working correctly.")
-        return 0
-    else:
-        print("💥 Some tests failed. Check the errors above.")
-        return 1
-
-if __name__ == "__main__":
-    sys.exit(main())
diff --git a/test_web_csv_functionality.py b/test_web_csv_functionality.py
deleted file mode 100644
index 7242c497..00000000
--- a/test_web_csv_functionality.py
+++ /dev/null
@@ -1,207 +0,0 @@
-#!/usr/bin/env python3
-"""
-Test script for web CSV functionality
-Tests both CSV output generation and CSV input reading
-"""
-
-import sys
-import os
-import asyncio
-from typing import Dict, Any
-
-# Add the gateway directory to the Python path
-sys.path.insert(0, os.path.join(os.path.dirname(__file__)))
-
-from modules.methods.methodWeb import MethodWeb
-from modules.interfaces.interfaceWebModel import WebSearchResultItem, WebSearchDocumentData, WebSearchActionDocument, WebSearchActionResult
-from pydantic import HttpUrl
-
-
-def create_mock_web_search_result():
-    """Create a mock WebSearchActionResult with the provided example data"""
-    
-    # Create mock search result items based on the provided example
-    results = [
-        WebSearchResultItem(
-            title="Switzerland Market Analysis :: Fitch Solutions",
-            url=HttpUrl("https://www.fitchsolutions.com/bmi/region/switzerland")
-        ),
-        WebSearchResultItem(
-            title="OECD Economic Outlook, Volume 2024 Issue 2: Switzerland",
-            url=HttpUrl("https://www.oecd.org/en/publications/2024/12/oecd-economic-outlook-volume-2024-issue-2_67bb8fac/full-report/switzerland_605fd31f.html")
-        ),
-        WebSearchResultItem(
-            title="The economic context of Switzerland - International Trade Portal",
-            url=HttpUrl("https://www.lloydsbanktrade.com/en/market-potential/switzerland/economical-context")
-        ),
-        WebSearchResultItem(
-            title="Switzerland: Country File, Economic Risk Analysis | Coface",
-            url=HttpUrl("https://www.coface.com/news-economy-and-insights/business-risk-dashboard/country-risk-files/switzerland")
-        ),
-        WebSearchResultItem(
-            title="Swiss Economic Outlook 2025 - Roland Berger",
-            url=HttpUrl("https://www.rolandberger.com/en/Insights/Publications/Swiss-Economic-Outlook-2025.html")
-        )
-    ]
-    
-    # Create document data
-    document_data = WebSearchDocumentData(
-        query="current market trends Switzerland business economy 2024 analysis report",
-        results=results,
-        total_count=len(results)
-    )
-    
-    # Create action document
-    action_document = WebSearchActionDocument(
-        documentName="test_search_results.json",
-        documentData=document_data,
-        mimeType="application/json"
-    )
-    
-    # Create action result
-    action_result = WebSearchActionResult(
-        success=True,
-        documents=[action_document]
-    )
-    
-    return action_result
-
-
-def test_csv_output_generation():
-    """Test CSV output generation from web search results"""
-    print("Testing CSV output generation...")
-    
-    # Create method instance (without service center for testing)
-    method = MethodWeb(None)
-    
-    # Create mock search result
-    mock_result = create_mock_web_search_result()
-    
-    # Convert to CSV
-    csv_content = method._convert_search_results_to_csv(mock_result)
-    
-    print("Generated CSV content:")
-    print(csv_content)
-    print()
-    
-    # Verify CSV format
-    lines = csv_content.strip().split('\n')
-    assert len(lines) == 6, f"Expected 6 lines (header + 5 results), got {len(lines)}"
-    
-    # Check header
-    assert lines[0] == "url;title", f"Expected header 'url;title', got '{lines[0]}'"
-    
-    # Check that URLs are present
-    for i, line in enumerate(lines[1:], 1):
-        parts = line.split(';')
-        assert len(parts) == 2, f"Line {i} should have 2 parts separated by ';', got {len(parts)}"
-        url, title = parts
-        assert url.startswith('https://'), f"Line {i} URL should start with 'https://', got '{url}'"
-        assert title, f"Line {i} should have a title, got empty title"
-    
-    print("✓ CSV output generation test passed!")
-    return csv_content
-
-
-def test_csv_input_reading():
-    """Test CSV input reading functionality"""
-    print("Testing CSV input reading...")
-    
-    # Create method instance
-    method = MethodWeb(None)
-    
-    # Test semicolon-separated CSV
-    semicolon_csv = """url;title
-https://www.fitchsolutions.com/bmi/region/switzerland;Switzerland Market Analysis :: Fitch Solutions
-https://www.oecd.org/en/publications/2024/12/oecd-economic-outlook-volume-2024-issue-2_67bb8fac/full-report/switzerland_605fd31f.html;OECD Economic Outlook, Volume 2024 Issue 2: Switzerland
-https://www.lloydsbanktrade.com/en/market-potential/switzerland/economical-context;The economic context of Switzerland - International Trade Portal"""
-    
-    urls_semicolon = method._read_csv_with_urls(semicolon_csv)
-    print(f"Extracted {len(urls_semicolon)} URLs from semicolon CSV:")
-    for url in urls_semicolon:
-        print(f"  - {url}")
-    
-    assert len(urls_semicolon) == 3, f"Expected 3 URLs, got {len(urls_semicolon)}"
-    assert all(url.startswith('https://') for url in urls_semicolon), "All URLs should start with https://"
-    
-    print("✓ Semicolon CSV reading test passed!")
-    
-    # Test comma-separated CSV
-    comma_csv = """url,title
-https://www.fitchsolutions.com/bmi/region/switzerland,Switzerland Market Analysis :: Fitch Solutions
-https://www.oecd.org/en/publications/2024/12/oecd-economic-outlook-volume-2024-issue-2_67bb8fac/full-report/switzerland_605fd31f.html,OECD Economic Outlook, Volume 2024 Issue 2: Switzerland"""
-    
-    urls_comma = method._read_csv_with_urls(comma_csv)
-    print(f"Extracted {len(urls_comma)} URLs from comma CSV:")
-    for url in urls_comma:
-        print(f"  - {url}")
-    
-    assert len(urls_comma) == 2, f"Expected 2 URLs, got {len(urls_comma)}"
-    assert all(url.startswith('https://') for url in urls_comma), "All URLs should start with https://"
-    
-    print("✓ Comma CSV reading test passed!")
-    
-    # Test case-insensitive column names
-    case_insensitive_csv = """URL;Title
-https://example.com/test;Test Title"""
-    
-    urls_case = method._read_csv_with_urls(case_insensitive_csv)
-    assert len(urls_case) == 1, f"Expected 1 URL, got {len(urls_case)}"
-    assert urls_case[0] == "https://example.com/test", f"Expected 'https://example.com/test', got '{urls_case[0]}'"
-    
-    print("✓ Case-insensitive CSV reading test passed!")
-
-
-def test_integration():
-    """Test the complete integration: generate CSV and then read it back"""
-    print("Testing integration: generate CSV and read it back...")
-    
-    method = MethodWeb(None)
-    
-    # Generate CSV from mock data
-    mock_result = create_mock_web_search_result()
-    csv_content = method._convert_search_results_to_csv(mock_result)
-    
-    # Read URLs back from the generated CSV
-    extracted_urls = method._read_csv_with_urls(csv_content)
-    
-    print(f"Generated CSV with {len(mock_result.documents[0].documentData.results)} results")
-    print(f"Extracted {len(extracted_urls)} URLs from generated CSV")
-    
-    # Verify we got the same number of URLs
-    assert len(extracted_urls) == len(mock_result.documents[0].documentData.results), \
-        f"Expected {len(mock_result.documents[0].documentData.results)} URLs, got {len(extracted_urls)}"
-    
-    # Verify URLs match
-    original_urls = [str(result.url) for result in mock_result.documents[0].documentData.results]
-    for i, (original, extracted) in enumerate(zip(original_urls, extracted_urls)):
-        assert original == extracted, f"URL {i} mismatch: expected '{original}', got '{extracted}'"
-    
-    print("✓ Integration test passed!")
-
-
-if __name__ == "__main__":
-    print("Running Web CSV Functionality Tests")
-    print("=" * 50)
-    
-    try:
-        # Test CSV output generation
-        csv_content = test_csv_output_generation()
-        print()
-        
-        # Test CSV input reading
-        test_csv_input_reading()
-        print()
-        
-        # Test integration
-        test_integration()
-        print()
-        
-        print("=" * 50)
-        print("🎉 All tests passed successfully!")
-        
-    except Exception as e:
-        print(f"❌ Test failed: {e}")
-        import traceback
-        traceback.print_exc()
-        sys.exit(1)

From 9644514e604637ec7f9215008e38628cc5f6f923 Mon Sep 17 00:00:00 2001
From: ValueOn AG <p.motsch@valueon.ch>
Date: Thu, 4 Sep 2025 01:48:00 +0200
Subject: [PATCH 17/17] sharepoint fixed

---
 modules/methods/methodSharepoint.py | 186 +++++++++++++++++++++++++---
 1 file changed, 172 insertions(+), 14 deletions(-)

diff --git a/modules/methods/methodSharepoint.py b/modules/methods/methodSharepoint.py
index 12af28d6..a8257bc3 100644
--- a/modules/methods/methodSharepoint.py
+++ b/modules/methods/methodSharepoint.py
@@ -357,6 +357,7 @@ class MethodSharepoint(MethodBase):
                 - "and:DELTA AND 2025 Mars AND Group" - all terms must be present
                 - "folders:and:DELTA AND 2025 Mars AND Group" - combined options
                 Note: For storage locations, use "folders:" prefix. All search terms must be present by default.
+            resultDocument (str, optional): JSON result document from previous findDocumentPath action to refine search
             searchScope (str, optional): Search scope - options: "all" (default), "documents" (files only), "pages" (SharePoint pages only)
             maxResults (int, optional): Maximum number of results to return (default: 100)
             expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
@@ -364,6 +365,7 @@ class MethodSharepoint(MethodBase):
         try:
             connectionReference = parameters.get("connectionReference")
             searchQuery = parameters.get("searchQuery", "*")
+            resultDocument = parameters.get("resultDocument")
             searchScope = parameters.get("searchScope", "all")
             maxResults = parameters.get("maxResults", 100)
             expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
@@ -371,6 +373,36 @@ class MethodSharepoint(MethodBase):
             if not connectionReference:
                 return ActionResult.isFailure(error="Connection reference is required")
             
+            # If resultDocument is provided, extract site information to refine search
+            if resultDocument:
+                try:
+                    import json
+                    # Resolve the reference label to get the actual document list
+                    document_list = self.service.getChatDocumentsFromDocumentList([resultDocument])
+                    if not document_list or len(document_list) == 0:
+                        return ActionResult.isFailure(error=f"No document list found for reference: {resultDocument}")
+                    
+                    # Get the first document's content (which should be the JSON)
+                    first_document = document_list[0]
+                    file_data = self.service.getFileData(first_document.fileId)
+                    if not file_data:
+                        return ActionResult.isFailure(error=f"No file data found for document: {resultDocument}")
+                    
+                    # Parse the JSON content
+                    result_data = json.loads(file_data)
+                    found_documents = result_data.get("foundDocuments", [])
+                    
+                    # Extract site information from the result for context
+                    if found_documents:
+                        # Use the site information from the previous search to refine current search
+                        # This could be used to limit search to specific sites or add context
+                        logger.info(f"Refining search using {len(found_documents)} documents from previous result")
+                        
+                except json.JSONDecodeError as e:
+                    return ActionResult.isFailure(error=f"Invalid JSON in resultDocument: {str(e)}")
+                except Exception as e:
+                    return ActionResult.isFailure(error=f"Error resolving resultDocument reference: {str(e)}")
+            
             # Parse searchQuery to extract path, search terms, search type, and options
             pathQuery, fileQuery, searchType, searchOptions = self._parseSearchQuery(searchQuery)
             
@@ -540,6 +572,7 @@ class MethodSharepoint(MethodBase):
             documentList (str): Reference to the document list to read
             connectionReference (str): Reference to the Microsoft connection
             pathQuery (str): Path query to locate documents (e.g., "/Documents/Project1", "*" for all sites)
+            resultDocument (str, optional): JSON result document from findDocumentPath action (alternative to pathQuery)
             includeMetadata (bool, optional): Whether to include metadata (default: True)
             expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
         """
@@ -547,12 +580,50 @@ class MethodSharepoint(MethodBase):
             documentList = parameters.get("documentList")
             connectionReference = parameters.get("connectionReference")
             pathQuery = parameters.get("pathQuery", "*")
+            resultDocument = parameters.get("resultDocument")
             includeMetadata = parameters.get("includeMetadata", True)
             expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
             
             if not documentList or not connectionReference:
                 return ActionResult.isFailure(error="Document list reference and connection reference are required")
             
+            # If resultDocument is provided, extract folder IDs from it
+            if resultDocument:
+                try:
+                    import json
+                    # Resolve the reference label to get the actual document list
+                    document_list = self.service.getChatDocumentsFromDocumentList([resultDocument])
+                    if not document_list or len(document_list) == 0:
+                        return ActionResult.isFailure(error=f"No document list found for reference: {resultDocument}")
+                    
+                    # Get the first document's content (which should be the JSON)
+                    first_document = document_list[0]
+                    file_data = self.service.getFileData(first_document.fileId)
+                    if not file_data:
+                        return ActionResult.isFailure(error=f"No file data found for document: {resultDocument}")
+                    
+                    # Parse the JSON content
+                    result_data = json.loads(file_data)
+                    found_documents = result_data.get("foundDocuments", [])
+                    
+                    # Extract folder IDs from the result
+                    folder_ids = []
+                    for doc in found_documents:
+                        if doc.get("type") == "folder":
+                            folder_ids.append(doc.get("id"))
+                    
+                    if folder_ids:
+                        # Use the first folder ID found as pathQuery
+                        pathQuery = folder_ids[0]
+                        logger.info(f"Using folder ID from resultDocument: {pathQuery}")
+                    else:
+                        return ActionResult.isFailure(error="No folders found in resultDocument")
+                        
+                except json.JSONDecodeError as e:
+                    return ActionResult.isFailure(error=f"Invalid JSON in resultDocument: {str(e)}")
+                except Exception as e:
+                    return ActionResult.isFailure(error=f"Error resolving resultDocument reference: {str(e)}")
+            
             # Get documents from reference - ensure documentList is a list, not a string
             if isinstance(documentList, str):
                 documentList = [documentList]  # Convert string to list
@@ -736,6 +807,7 @@ class MethodSharepoint(MethodBase):
             pathQuery (str): Path query where to upload documents (e.g., "/Documents/Project1", "*" for default location)
             documentList (str): Reference to the document list to upload
             fileNames (List[str]): List of names for the uploaded files
+            resultDocument (str, optional): JSON result document from findDocumentPath action (alternative to pathQuery)
             expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
         """
         try:
@@ -743,11 +815,49 @@ class MethodSharepoint(MethodBase):
             pathQuery = parameters.get("pathQuery", "/Documents")
             documentList = parameters.get("documentList")
             fileNames = parameters.get("fileNames")
+            resultDocument = parameters.get("resultDocument")
             expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
             
             if not connectionReference or not documentList or not fileNames:
                 return ActionResult.isFailure(error="Connection reference, document list, and file names are required")
             
+            # If resultDocument is provided, extract folder IDs from it
+            if resultDocument:
+                try:
+                    import json
+                    # Resolve the reference label to get the actual document list
+                    document_list = self.service.getChatDocumentsFromDocumentList([resultDocument])
+                    if not document_list or len(document_list) == 0:
+                        return ActionResult.isFailure(error=f"No document list found for reference: {resultDocument}")
+                    
+                    # Get the first document's content (which should be the JSON)
+                    first_document = document_list[0]
+                    file_data = self.service.getFileData(first_document.fileId)
+                    if not file_data:
+                        return ActionResult.isFailure(error=f"No file data found for document: {resultDocument}")
+                    
+                    # Parse the JSON content
+                    result_data = json.loads(file_data)
+                    found_documents = result_data.get("foundDocuments", [])
+                    
+                    # Extract folder IDs from the result
+                    folder_ids = []
+                    for doc in found_documents:
+                        if doc.get("type") == "folder":
+                            folder_ids.append(doc.get("id"))
+                    
+                    if folder_ids:
+                        # Use the first folder ID found as pathQuery
+                        pathQuery = folder_ids[0]
+                        logger.info(f"Using folder ID from resultDocument: {pathQuery}")
+                    else:
+                        return ActionResult.isFailure(error="No folders found in resultDocument")
+                        
+                except json.JSONDecodeError as e:
+                    return ActionResult.isFailure(error=f"Invalid JSON in resultDocument: {str(e)}")
+                except Exception as e:
+                    return ActionResult.isFailure(error=f"Error resolving resultDocument reference: {str(e)}")
+            
             # Get Microsoft connection
             connection = self._getMicrosoftConnection(connectionReference)
             if not connection:
@@ -904,35 +1014,86 @@ class MethodSharepoint(MethodBase):
         
         Parameters:
             connectionReference (str): Reference to the Microsoft connection
-            pathQuery (str): Path query to list folders (e.g., "/Documents", "/Shared Documents/Project1", "*" for all sites)
+            searchQuery (str): [path:][type:][mode:]query - "Test Plan", "folders:Test Plan", "/Documents", "*"
+                Note: Use "folders:Name" to search for folders anywhere, not "path:/Name" which looks only in root
+            resultDocument (str, optional): JSON result document from findDocumentPath action (alternative to searchQuery)
             includeSubfolders (bool, optional): Whether to include subfolders (default: False)
             expectedDocumentFormats (list, optional): Expected document formats with extension, mimeType, description
         """
         try:
             connectionReference = parameters.get("connectionReference")
-            pathQuery = parameters.get("pathQuery", "*")
+            searchQuery = parameters.get("searchQuery", "*")
+            resultDocument = parameters.get("resultDocument")
             includeSubfolders = parameters.get("includeSubfolders", False)  # Default to False for better UX
             expectedDocumentFormats = parameters.get("expectedDocumentFormats", [])
             
             if not connectionReference:
                 return ActionResult.isFailure(error="Connection reference is required")
             
+            # If resultDocument is provided, resolve the reference and extract folder IDs from it
+            if resultDocument:
+                try:
+                    import json
+                    # Resolve the reference label to get the actual document list
+                    document_list = self.service.getChatDocumentsFromDocumentList([resultDocument])
+                    if not document_list or len(document_list) == 0:
+                        return ActionResult.isFailure(error=f"No document list found for reference: {resultDocument}")
+                    
+                    # Get the first document's content (which should be the JSON)
+                    first_document = document_list[0]
+                    logger.info(f"Document fileId: {first_document.fileId}, fileName: {first_document.fileName}")
+                    file_data = self.service.getFileData(first_document.fileId)
+                    if not file_data:
+                        return ActionResult.isFailure(error=f"No file data found for document: {resultDocument} (fileId: {first_document.fileId})")
+                    logger.info(f"File data length: {len(file_data) if file_data else 0}")
+                    
+                    # Parse the JSON content
+                    result_data = json.loads(file_data)
+                    found_documents = result_data.get("foundDocuments", [])
+                    
+                    # Extract folder IDs from the result
+                    folder_ids = []
+                    for doc in found_documents:
+                        if doc.get("type") == "folder":
+                            folder_ids.append(doc.get("id"))
+                    
+                    if folder_ids:
+                        # Use the first folder ID found
+                        searchQuery = folder_ids[0]
+                        logger.info(f"Using folder ID from resultDocument: {searchQuery}")
+                    else:
+                        return ActionResult.isFailure(error="No folders found in resultDocument")
+                        
+                except json.JSONDecodeError as e:
+                    return ActionResult.isFailure(error=f"Invalid JSON in resultDocument: {str(e)}")
+                except Exception as e:
+                    return ActionResult.isFailure(error=f"Error resolving resultDocument reference: {str(e)}")
+            
             # Get Microsoft connection
             connection = self._getMicrosoftConnection(connectionReference)
             if not connection:
                 return ActionResult.isFailure(error="No valid Microsoft connection found for the provided connection reference")
             
-            logger.info(f"Starting SharePoint listDocuments for pathQuery: {pathQuery}")
+            logger.info(f"Starting SharePoint listDocuments for searchQuery: {searchQuery}")
             logger.debug(f"Connection ID: {connection['id']}")
             
+            # Parse searchQuery to extract path, search terms, search type, and options
+            pathQuery, fileQuery, searchType, searchOptions = self._parseSearchQuery(searchQuery)
+            
             # Discover all SharePoint sites accessible to the user
             sites = await self._discoverSharePointSites(connection["accessToken"])
             if not sites:
                 return ActionResult.isFailure(error="No SharePoint sites found or accessible")
             
-            # Resolve path query into folder paths
-            folder_paths = self._resolvePathQuery(pathQuery)
-            logger.info(f"Resolved folder paths: {folder_paths}")
+            # Check if searchQuery is a folder ID (any value starting with '01', e.g. 01PPXICCB...)
+            if searchQuery.startswith('01PPXICCB') or searchQuery.startswith('01'):
+                # Direct folder ID - use it directly
+                folder_paths = [searchQuery]
+                logger.info(f"Using direct folder ID: {searchQuery}")
+            else:
+                # Resolve path query into folder paths
+                folder_paths = self._resolvePathQuery(pathQuery)
+                logger.info(f"Resolved folder paths: {folder_paths}")
             
             # Process each folder path across all sites
             list_results = []
@@ -952,8 +1113,11 @@ class MethodSharepoint(MethodBase):
                         if folderPath in ["/", ""] or folderPath == "*":
                             # Root folder
                             endpoint = f"sites/{site_id}/drive/root/children"
+                        elif folderPath.startswith('01PPXICCB') or folderPath.startswith('01'):
+                            # Direct folder ID
+                            endpoint = f"sites/{site_id}/drive/items/{folderPath}/children"
                         else:
-                            # Specific folder - remove leading slash if present
+                            # Specific folder path - remove leading slash if present
                             folder_path_clean = folderPath.lstrip('/')
                             endpoint = f"sites/{site_id}/drive/root:/{folder_path_clean}:/children"
                         
@@ -1067,16 +1231,10 @@ class MethodSharepoint(MethodBase):
             
             # Create result data
             result_data = {
-                "connectionReference": connectionReference,
-                "pathQuery": pathQuery,
+                "searchQuery": searchQuery,
                 "includeSubfolders": includeSubfolders,
                 "sitesSearched": len(sites),
                 "listResults": list_results,
-                "connection": {
-                    "id": connection["id"],
-                    "authority": "microsoft",
-                    "reference": connectionReference
-                },
                 "timestamp": get_utc_timestamp()
             }