From e0caad0a75a6ace5e6dfe01ef8549f9f3db918c1 Mon Sep 17 00:00:00 2001
From: ValueOn AG <p.motsch@poweron.swiss>
Date: Mon, 8 Jun 2026 20:45:51 +0200
Subject: [PATCH] import fixes

---
 modules/auth/jwtService.py                    |    2 +-
 .../commcoach/routeFeatureCommcoach.py        |   12 +-
 modules/routes/routeRealEstate.py             | 2339 -----------------
 modules/routes/routeRealEstateScraping.py     |  881 -------
 .../services/serviceAi/subDocumentIntents.py  |    2 +-
 .../serviceAi/subJsonResponseHandling.py      |   12 +-
 .../renderers/rendererPptx.py                 |    5 +-
 .../engine/executors/actionNodeExecutor.py    |    1 -
 .../engine/executors/flowExecutor.py          |    4 +-
 9 files changed, 21 insertions(+), 3237 deletions(-)
 delete mode 100644 modules/routes/routeRealEstate.py
 delete mode 100644 modules/routes/routeRealEstateScraping.py

diff --git a/modules/auth/jwtService.py b/modules/auth/jwtService.py
index 6ea4535d..04071053 100644
--- a/modules/auth/jwtService.py
+++ b/modules/auth/jwtService.py
@@ -5,7 +5,7 @@ JWT Service
 Centralizes local JWT creation and cookie helpers.
 """
 
-from datetime import timedelta
+from datetime import datetime, timedelta
 from typing import Optional, Tuple
 from fastapi import Response
 from jose import jwt
diff --git a/modules/features/commcoach/routeFeatureCommcoach.py b/modules/features/commcoach/routeFeatureCommcoach.py
index a60db504..c7759900 100644
--- a/modules/features/commcoach/routeFeatureCommcoach.py
+++ b/modules/features/commcoach/routeFeatureCommcoach.py
@@ -14,7 +14,7 @@ import uuid
 
 
 from typing import Optional
-from fastapi import APIRouter, HTTPException, Depends, Request, WebSocket, WebSocketDisconnect, Query
+from fastapi import APIRouter, HTTPException, Depends, Request, Query
 from fastapi.responses import StreamingResponse, Response
 
 from modules.auth import limiter, getRequestContext, RequestContext
@@ -27,13 +27,13 @@ from .datamodelCommcoach import (
     TrainingModule, TrainingModuleStatus, CoachingSession, CoachingSessionStatus,
     CoachingMessage, CoachingMessageRole, CoachingMessageContentType,
     CoachingTask, CoachingTaskStatus,
-    CoachingPersona, CoachingBadge, ModulePersonaMapping,
+    CoachingPersona,
     CreateModuleRequest, UpdateModuleRequest,
     SendMessageRequest, CreateTaskRequest, UpdateTaskRequest, UpdateTaskStatusRequest,
     UpdateProfileRequest,
-    StartSessionRequest, CreatePersonaRequest, UpdatePersonaRequest, SetModulePersonasRequest,
+    CreatePersonaRequest, UpdatePersonaRequest, SetModulePersonasRequest,
 )
-from .serviceCommcoach import CommcoachService, emitSessionEvent, getSessionEventQueue, cleanupSessionEvents
+from .serviceCommcoach import CommcoachService, emitSessionEvent, getSessionEventQueue
 from modules.shared.i18nRegistry import apiRouteContext
 routeApiMsg = apiRouteContext("routeFeatureCommcoach")
 logger = logging.getLogger(__name__)
@@ -104,7 +104,7 @@ async def listModules(
     context: RequestContext = Depends(getRequestContext),
 ):
     """List all training modules for the current user."""
-    mandateId = _validateInstanceAccess(instanceId, context)
+    _validateInstanceAccess(instanceId, context)
     interface = _getInterface(context, instanceId)
     userId = str(context.user.id)
     modules = interface.getModules(instanceId, userId, includeArchived=includeArchived)
@@ -349,7 +349,7 @@ async def startSession(
                             yield f"data: {json.dumps({'type': 'ttsAudio', 'data': {'audio': audioB64, 'format': 'mp3'}})}\n\n"
                         else:
                             errorDetail = ttsResult.get("error", "Text-to-Speech failed")
-                            yield f"data: {json.dumps({'type': 'error', 'data': {'message': _buildTtsConfigErrorMessage(language, voiceName, errorDetail), 'detail': errorDetail, 'ttsLanguage': language, 'ttsVoice': voiceName}})}\n\n"
+                            yield f"data: {json.dumps({'type': 'error', 'data': {'message': buildTtsConfigErrorMessage(language, voiceName, errorDetail), 'detail': errorDetail, 'ttsLanguage': language, 'ttsVoice': voiceName}})}\n\n"
                 except Exception as e:
                     logger.warning(f"TTS failed for resumed session: {e}")
                     yield f"data: {json.dumps({'type': 'error', 'data': {'message': 'Die konfigurierte Stimme für diese Sprache ist ungültig oder nicht verfügbar. Bitte passe sie unter Einstellungen > Stimme & Sprache an.', 'detail': str(e)}})}\n\n"
diff --git a/modules/routes/routeRealEstate.py b/modules/routes/routeRealEstate.py
deleted file mode 100644
index 81550de2..00000000
--- a/modules/routes/routeRealEstate.py
+++ /dev/null
@@ -1,2339 +0,0 @@
-"""
-Real Estate routes for the backend API.
-Implements stateless endpoints for real estate database operations with AI-powered natural language processing.
-"""
-
-import logging
-import json
-import re
-import requests
-import aiohttp
-import asyncio
-import ssl
-from urllib.parse import urljoin, urlparse
-from typing import Optional, Dict, Any, List, Union
-from fastapi import APIRouter, HTTPException, Depends, Body, Request, Query, Path, status
-
-# Import auth modules
-from modules.auth import limiter, getCurrentUser
-
-# Import models
-from modules.datamodels.datamodelPagination import (
-    PaginationParams,
-    PaginatedResponse,
-    PaginationMetadata,
-    normalize_pagination_dict,
-)
-from modules.interfaces.interfaceDbApp import getRootInterface
-from modules.interfaces.interfaceFeatures import getFeatureInterface
-from modules.features.realEstate.datamodelFeatureRealEstate import (
-    Projekt,
-    Parzelle,
-    Dokument,
-    Gemeinde,
-    Kanton,
-    Land,
-    Kontext,
-    StatusProzess,
-    DokumentTyp,
-)
-
-# Import interfaces
-from modules.interfaces.interfaceDbRealEstateObjects import getInterface as getRealEstateInterface
-from modules.interfaces.interfaceDbComponentObjects import getInterface as getComponentInterface
-
-# Import feature logic for AI-powered commands
-from modules.features.realEstate.mainRealEstate import (
-    processNaturalLanguageCommand,
-    create_project_with_parcel_data,
-    extract_bzo_information,
-)
-
-# Import Swiss Topo MapServer connector for testing
-from modules.connectors.connectorSwissTopoMapServer import SwissTopoMapServerConnector
-from modules.connectors.connectorOerebWfs import OerebWfsConnector
-
-# Import Tavily connector for BZO document search
-from modules.aicore.aicorePluginTavily import AiTavily
-
-# Import helper functions from scraping route
-from modules.routes.routeRealEstateScraping import (
-    _get_language_from_kanton,
-    _get_bzo_search_query,
-)
-
-# Import attribute utilities for model schema
-from modules.shared.attributeUtils import getModelAttributeDefinitions
-from modules.shared.i18nRegistry import apiRouteContext
-routeApiMsg = apiRouteContext("routeRealEstate")
-
-# Configure logger
-logger = logging.getLogger(__name__)
-
-# Create router for real estate endpoints
-router = APIRouter(
-    prefix="/api/realestate",
-    tags=["Real Estate"],
-    responses={
-        404: {"description": "Not found"},
-        400: {"description": "Bad request"},
-        401: {"description": "Unauthorized"},
-        403: {"description": "Forbidden"},
-        500: {"description": "Internal server error"}
-    }
-)
-
-
-# ===== Helper Functions (instanceId-based routes, backend-driven like Trustee) =====
-
-def _parsePagination(pagination: Optional[str]) -> Optional[PaginationParams]:
-    """Parse pagination parameter from JSON string."""
-    if not pagination:
-        return None
-    try:
-        paginationDict = json.loads(pagination)
-        if paginationDict:
-            paginationDict = normalize_pagination_dict(paginationDict)
-            return PaginationParams(**paginationDict)
-    except (json.JSONDecodeError, ValueError) as e:
-        raise HTTPException(
-            status_code=400,
-            detail=f"Invalid pagination parameter: {str(e)}"
-        )
-    return None
-
-
-async def _validateInstanceAccess(instanceId: str, context: RequestContext) -> str:
-    """
-    Validate that the user has access to the feature instance.
-    Returns the mandateId for the instance.
-    """
-    rootInterface = getRootInterface()
-    featureInterface = getFeatureInterface(rootInterface.db)
-    instance = featureInterface.getFeatureInstance(instanceId)
-    if not instance:
-        raise HTTPException(
-            status_code=404,
-            detail=f"Feature instance '{instanceId}' not found"
-        )
-    if instance.featureCode != "realestate":
-        raise HTTPException(
-            status_code=400,
-            detail=f"Instance '{instanceId}' is not a realestate instance"
-        )
-    if not context.isPlatformAdmin:
-        featureAccesses = rootInterface.getFeatureAccessesForUser(str(context.user.id))
-        hasAccess = any(
-            str(fa.featureInstanceId) == instanceId and fa.enabled
-            for fa in featureAccesses
-        )
-        if not hasAccess:
-            raise HTTPException(
-                status_code=403,
-                detail=f"Access denied to feature instance '{instanceId}'"
-            )
-    return str(instance.mandateId)
-
-
-# Mapping of entity names to Pydantic model classes (for attributes endpoint)
-_REALESTATE_ENTITY_MODELS = {
-    "Projekt": Projekt,
-    "Parzelle": Parzelle,
-    "Dokument": Dokument,
-    "Gemeinde": Gemeinde,
-    "Kanton": Kanton,
-    "Land": Land,
-}
-
-
-# ============================================================================
-# INSTANCE-ID ROUTES (backend-driven, analog to Trustee)
-# ============================================================================
-
-@router.get("/{instanceId}/attributes/{entityType}", response_model=Dict[str, Any])
-@limiter.limit("30/minute")
-async def get_entity_attributes(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    entityType: str = Path(..., description="Entity type (e.g., Projekt, Parzelle)"),
-    context: RequestContext = Depends(getRequestContext)
-) -> Dict[str, Any]:
-    """Get attribute definitions for a Real Estate entity. Used by FormGeneratorTable."""
-    await _validateInstanceAccess(instanceId, context)
-    if entityType not in _REALESTATE_ENTITY_MODELS:
-        raise HTTPException(
-            status_code=404,
-            detail=f"Unknown entity type: {entityType}. Valid types: {list(_REALESTATE_ENTITY_MODELS.keys())}"
-        )
-    modelClass = _REALESTATE_ENTITY_MODELS[entityType]
-    try:
-        attrDefs = getModelAttributeDefinitions(modelClass)
-        visibleAttrs = [
-            attr for attr in attrDefs.get("attributes", [])
-            if isinstance(attr, dict) and attr.get("visible", True)
-        ]
-        return {"attributes": visibleAttrs}
-    except Exception as e:
-        logger.error(f"Error getting attributes for {entityType}: {e}")
-        raise HTTPException(
-            status_code=500,
-            detail=f"Error getting attributes for {entityType}: {str(e)}"
-        )
-
-
-@router.get("/{instanceId}/projects/options", response_model=List[Dict[str, Any]])
-@limiter.limit("60/minute")
-async def get_project_options(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    context: RequestContext = Depends(getRequestContext)
-) -> List[Dict[str, Any]]:
-    """Get project options for select dropdowns. Returns: [{ value, label }]"""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    items = interface.getProjekte(recordFilter={"featureInstanceId": instanceId})
-    return [{"value": p.id, "label": getattr(p, "label", None) or p.id} for p in items]
-
-
-@router.get("/{instanceId}/parcels/options", response_model=List[Dict[str, Any]])
-@limiter.limit("60/minute")
-async def get_parcel_options(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    context: RequestContext = Depends(getRequestContext)
-) -> List[Dict[str, Any]]:
-    """Get parcel options for select dropdowns. Returns: [{ value, label }]"""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    items = interface.getParzellen(recordFilter={"featureInstanceId": instanceId})
-    return [{"value": p.id, "label": getattr(p, "label", None) or p.id} for p in items]
-
-
-# ----- Projects CRUD -----
-
-@router.get("/{instanceId}/projects", response_model=PaginatedResponse[Projekt])
-@limiter.limit("30/minute")
-async def get_projects(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    pagination: Optional[str] = Query(None, description="JSON-encoded PaginationParams"),
-    context: RequestContext = Depends(getRequestContext)
-) -> PaginatedResponse[Projekt]:
-    """Get all projects for a feature instance with optional pagination."""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    recordFilter = {"featureInstanceId": instanceId}
-    paginationParams = _parsePagination(pagination)
-    if paginationParams:
-        result = interface.getProjekte(pagination=paginationParams, recordFilter=recordFilter)
-        if hasattr(result, 'items'):
-            return PaginatedResponse(
-                items=result.items,
-                pagination=PaginationMetadata(
-                    currentPage=paginationParams.page,
-                    pageSize=paginationParams.pageSize,
-                    totalItems=result.totalItems,
-                    totalPages=result.totalPages,
-                    sort=paginationParams.sort or [],
-                    filters=paginationParams.filters
-                )
-            )
-    items = interface.getProjekte(recordFilter=recordFilter)
-    return PaginatedResponse(items=items, pagination=None)
-
-
-@router.get("/{instanceId}/projects/{projectId}", response_model=Projekt)
-@limiter.limit("30/minute")
-async def get_project_by_id(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    projectId: str = Path(..., description="Project ID"),
-    context: RequestContext = Depends(getRequestContext)
-) -> Projekt:
-    """Get a single project by ID."""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    projekt = interface.getProjekt(projectId)
-    if not projekt or str(getattr(projekt, "featureInstanceId", None)) != instanceId:
-        raise HTTPException(status_code=404, detail=f"Project '{projectId}' not found")
-    return projekt
-
-
-@router.post("/{instanceId}/projects", response_model=Projekt)
-@limiter.limit("30/minute")
-async def create_project(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    data: Dict[str, Any] = Body(...),
-    context: RequestContext = Depends(getRequestContext)
-) -> Projekt:
-    """Create a new project."""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    if "mandateId" not in data:
-        data["mandateId"] = mandateId
-    if "featureInstanceId" not in data:
-        data["featureInstanceId"] = instanceId
-    try:
-        projekt = Projekt(**data)
-    except Exception as e:
-        raise HTTPException(status_code=400, detail=f"Invalid data: {str(e)}")
-    return interface.createProjekt(projekt)
-
-
-@router.put("/{instanceId}/projects/{projectId}", response_model=Projekt)
-@limiter.limit("30/minute")
-async def update_project(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    projectId: str = Path(..., description="Project ID"),
-    data: Dict[str, Any] = Body(...),
-    context: RequestContext = Depends(getRequestContext)
-) -> Projekt:
-    """Update a project."""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    projekt = interface.getProjekt(projectId)
-    if not projekt or str(getattr(projekt, "featureInstanceId", None)) != instanceId:
-        raise HTTPException(status_code=404, detail=f"Project '{projectId}' not found")
-    updated = interface.updateProjekt(projectId, data)
-    if not updated:
-        raise HTTPException(status_code=500, detail=routeApiMsg("Update failed"))
-    return updated
-
-
-@router.delete("/{instanceId}/projects/{projectId}", status_code=status.HTTP_204_NO_CONTENT)
-@limiter.limit("30/minute")
-async def delete_project(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    projectId: str = Path(..., description="Project ID"),
-    context: RequestContext = Depends(getRequestContext)
-) -> None:
-    """Delete a project."""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    projekt = interface.getProjekt(projectId)
-    if not projekt or str(getattr(projekt, "featureInstanceId", None)) != instanceId:
-        raise HTTPException(status_code=404, detail=f"Project '{projectId}' not found")
-    if not interface.deleteProjekt(projectId):
-        raise HTTPException(status_code=500, detail=routeApiMsg("Delete failed"))
-
-
-# ----- Parcels CRUD -----
-
-@router.get("/{instanceId}/parcels", response_model=PaginatedResponse[Parzelle])
-@limiter.limit("30/minute")
-async def get_parcels(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    pagination: Optional[str] = Query(None, description="JSON-encoded PaginationParams"),
-    context: RequestContext = Depends(getRequestContext)
-) -> PaginatedResponse[Parzelle]:
-    """Get all parcels for a feature instance with optional pagination."""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    recordFilter = {"featureInstanceId": instanceId}
-    paginationParams = _parsePagination(pagination)
-    if paginationParams:
-        result = interface.getParzellen(pagination=paginationParams, recordFilter=recordFilter)
-        if hasattr(result, 'items'):
-            return PaginatedResponse(
-                items=result.items,
-                pagination=PaginationMetadata(
-                    currentPage=paginationParams.page,
-                    pageSize=paginationParams.pageSize,
-                    totalItems=result.totalItems,
-                    totalPages=result.totalPages,
-                    sort=paginationParams.sort or [],
-                    filters=paginationParams.filters
-                )
-            )
-    items = interface.getParzellen(recordFilter=recordFilter)
-    return PaginatedResponse(items=items, pagination=None)
-
-
-@router.get("/{instanceId}/parcels/{parcelId}", response_model=Parzelle)
-@limiter.limit("30/minute")
-async def get_parcel_by_id(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    parcelId: str = Path(..., description="Parcel ID"),
-    context: RequestContext = Depends(getRequestContext)
-) -> Parzelle:
-    """Get a single parcel by ID."""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    parzelle = interface.getParzelle(parcelId)
-    if not parzelle or str(getattr(parzelle, "featureInstanceId", None)) != instanceId:
-        raise HTTPException(status_code=404, detail=f"Parcel '{parcelId}' not found")
-    return parzelle
-
-
-@router.post("/{instanceId}/parcels", response_model=Parzelle)
-@limiter.limit("30/minute")
-async def create_parcel(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    data: Dict[str, Any] = Body(...),
-    context: RequestContext = Depends(getRequestContext)
-) -> Parzelle:
-    """Create a new parcel."""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    if "mandateId" not in data:
-        data["mandateId"] = mandateId
-    if "featureInstanceId" not in data:
-        data["featureInstanceId"] = instanceId
-    try:
-        parzelle = Parzelle(**data)
-    except Exception as e:
-        raise HTTPException(status_code=400, detail=f"Invalid data: {str(e)}")
-    return interface.createParzelle(parzelle)
-
-
-@router.put("/{instanceId}/parcels/{parcelId}", response_model=Parzelle)
-@limiter.limit("30/minute")
-async def update_parcel(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    parcelId: str = Path(..., description="Parcel ID"),
-    data: Dict[str, Any] = Body(...),
-    context: RequestContext = Depends(getRequestContext)
-) -> Parzelle:
-    """Update a parcel."""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    parzelle = interface.getParzelle(parcelId)
-    if not parzelle or str(getattr(parzelle, "featureInstanceId", None)) != instanceId:
-        raise HTTPException(status_code=404, detail=f"Parcel '{parcelId}' not found")
-    updated = interface.updateParzelle(parcelId, data)
-    if not updated:
-        raise HTTPException(status_code=500, detail=routeApiMsg("Update failed"))
-    return updated
-
-
-@router.delete("/{instanceId}/parcels/{parcelId}", status_code=status.HTTP_204_NO_CONTENT)
-@limiter.limit("30/minute")
-async def delete_parcel(
-    request: Request,
-    instanceId: str = Path(..., description="Feature Instance ID"),
-    parcelId: str = Path(..., description="Parcel ID"),
-    context: RequestContext = Depends(getRequestContext)
-) -> None:
-    """Delete a parcel."""
-    mandateId = await _validateInstanceAccess(instanceId, context)
-    interface = getRealEstateInterface(
-        context.user, mandateId=mandateId, featureInstanceId=instanceId
-    )
-    parzelle = interface.getParzelle(parcelId)
-    if not parzelle or str(getattr(parzelle, "featureInstanceId", None)) != instanceId:
-        raise HTTPException(status_code=404, detail=f"Parcel '{parcelId}' not found")
-    if not interface.deleteParzelle(parcelId):
-        raise HTTPException(status_code=500, detail=routeApiMsg("Delete failed"))
-
-
-# ============================================================================
-# LEGACY / STATELESS ROUTES (unchanged)
-# ============================================================================
-
-@router.post("/command", response_model=Dict[str, Any])
-@limiter.limit("120/minute")
-async def process_command(
-    request: Request,
-    userInput: str = Body(..., embed=True, description="Natural language command"),
-    currentUser: User = Depends(getCurrentUser)
-) -> Dict[str, Any]:
-    """
-    Process natural language command and execute corresponding CRUD operation.
-    
-    Uses AI to analyze user intent and extract parameters, then executes the appropriate
-    CRUD operation. Works stateless without session management.
-    
-    Example user inputs:
-    - "Erstelle ein neues Projekt namens 'Hauptstrasse 42'"
-    - "Zeige mir alle Projekte in Zürich"
-    - "Aktualisiere Projekt XYZ mit Status 'Planung'"
-    - "Lösche Parzelle ABC"
-    - "SELECT * FROM Projekt WHERE plz = '8000'"
-    
-    Headers:
-    - X-CSRF-Token: CSRF token (required for security)
-    
-    Returns:
-    {
-        "success": true,
-        "intent": "CREATE|READ|UPDATE|DELETE|QUERY",
-        "entity": "Projekt|Parzelle|...|null",
-        "result": {...}
-    }
-    """
-    try:
-        # Validate CSRF token (middleware also checks, but explicit validation for better error messages)
-        csrf_token = request.headers.get("X-CSRF-Token") or request.headers.get("x-csrf-token")
-        if not csrf_token:
-            logger.warning(f"CSRF token missing for POST /api/realestate/command from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("CSRF token missing. Please include X-CSRF-Token header.")
-            )
-        
-        # Basic CSRF token format validation
-        if not isinstance(csrf_token, str) or len(csrf_token) < 16 or len(csrf_token) > 64:
-            logger.warning(f"Invalid CSRF token format for POST /api/realestate/command from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        # Validate token is hex string
-        try:
-            int(csrf_token, 16)
-        except ValueError:
-            logger.warning(f"CSRF token is not a valid hex string for POST /api/realestate/command from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        logger.info(f"Processing command request from user {currentUser.id} (mandate: {currentUser.mandateId})")
-        logger.debug(f"User input: {userInput}")
-        
-        # Process natural language command with AI
-        result = await processNaturalLanguageCommand(
-            currentUser=currentUser,
-            userInput=userInput
-        )
-        
-        return result
-        
-    except ValueError as e:
-        logger.error(f"Validation error in process_command: {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_400_BAD_REQUEST,
-            detail=f"Validation error: {str(e)}"
-        )
-    except HTTPException:
-        raise
-    except Exception as e:
-        logger.error(f"Error processing command: {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            detail=f"Error processing command: {str(e)}"
-        )
-
-@router.get("/tables", response_model=Dict[str, Any])
-@limiter.limit("120/minute")
-async def get_available_tables(
-    request: Request,
-    currentUser: User = Depends(getCurrentUser)
-) -> Dict[str, Any]:
-    """
-    Get all available real estate tables.
-    
-    Returns a list of available table names with their descriptions.
-    
-    Headers:
-    - X-CSRF-Token: CSRF token (required for security)
-    
-    Example:
-    - GET /api/realestate/tables
-    """
-    try:
-        # Validate CSRF token if provided
-        csrf_token = request.headers.get("X-CSRF-Token") or request.headers.get("x-csrf-token")
-        if not csrf_token:
-            logger.warning(f"CSRF token missing for GET /api/realestate/tables from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("CSRF token missing. Please include X-CSRF-Token header.")
-            )
-        
-        # Basic CSRF token format validation
-        if not isinstance(csrf_token, str) or len(csrf_token) < 16 or len(csrf_token) > 64:
-            logger.warning(f"Invalid CSRF token format for GET /api/realestate/tables from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        # Validate token is hex string
-        try:
-            int(csrf_token, 16)
-        except ValueError:
-            logger.warning(f"CSRF token is not a valid hex string for GET /api/realestate/tables from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        logger.info(f"Getting available tables for user {currentUser.id} (mandate: {currentUser.mandateId})")
-        
-        # Define available tables with descriptions
-        tables = [
-            {
-                "name": "Projekt",
-                "description": "Real estate projects",
-                "model": "Projekt"
-            },
-            {
-                "name": "Parzelle",
-                "description": "Plots/parcels",
-                "model": "Parzelle"
-            },
-            {
-                "name": "Dokument",
-                "description": "Documents",
-                "model": "Dokument"
-            },
-            {
-                "name": "Gemeinde",
-                "description": "Municipalities",
-                "model": "Gemeinde"
-            },
-            {
-                "name": "Kanton",
-                "description": "Cantons",
-                "model": "Kanton"
-            },
-            {
-                "name": "Land",
-                "description": "Countries",
-                "model": "Land"
-            },
-        ]
-        
-        return {
-            "tables": tables,
-            "count": len(tables)
-        }
-        
-    except HTTPException:
-        raise
-    except Exception as e:
-        logger.error(f"Error getting available tables: {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            detail=f"Error getting available tables: {str(e)}"
-        )
-
-
-@router.get("/table/{table}", response_model=PaginatedResponse[Any])
-@limiter.limit("120/minute")
-async def get_table_data(
-    request: Request,
-    table: str = Path(..., description="Table name (Projekt, Parzelle, Dokument, Gemeinde, Kanton, Land)"),
-    pagination: Optional[str] = Query(None, description="JSON-encoded PaginationParams object"),
-    currentUser: User = Depends(getCurrentUser)
-) -> PaginatedResponse[Dict[str, Any]]:
-    """
-    Get all data from a specific real estate table with optional pagination.
-    
-    Available tables:
-    - Projekt: Real estate projects
-    - Parzelle: Plots/parcels
-    - Dokument: Documents
-    - Gemeinde: Municipalities
-    - Kanton: Cantons
-    - Land: Countries
-    
-    Query Parameters:
-    - pagination: JSON-encoded PaginationParams object, or None for no pagination
-    
-    Headers:
-    - X-CSRF-Token: CSRF token (required for security)
-    
-    Examples:
-    - GET /api/realestate/table/Projekt (no pagination - returns all items)
-    - GET /api/realestate/table/Parzelle?pagination={"page":1,"pageSize":10,"sort":[]}
-    - GET /api/realestate/table/Gemeinde?pagination={"page":2,"pageSize":20,"sort":[{"field":"label","direction":"asc"}]}
-    """
-    try:
-        # Validate CSRF token if provided
-        csrf_token = request.headers.get("X-CSRF-Token") or request.headers.get("x-csrf-token")
-        if not csrf_token:
-            logger.warning(f"CSRF token missing for GET /api/realestate/table/{table} from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("CSRF token missing. Please include X-CSRF-Token header.")
-            )
-        
-        # Basic CSRF token format validation
-        if not isinstance(csrf_token, str) or len(csrf_token) < 16 or len(csrf_token) > 64:
-            logger.warning(f"Invalid CSRF token format for GET /api/realestate/table/{table} from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        # Validate token is hex string
-        try:
-            int(csrf_token, 16)
-        except ValueError:
-            logger.warning(f"CSRF token is not a valid hex string for GET /api/realestate/table/{table} from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        logger.info(f"Getting table data for '{table}' from user {currentUser.id} (mandate: {currentUser.mandateId})")
-        
-        # Map table names to model classes and getter methods
-        table_mapping = {
-            "Projekt": (Projekt, "getProjekte"),
-            "Parzelle": (Parzelle, "getParzellen"),
-            "Dokument": (Dokument, "getDokumente"),
-            "Gemeinde": (Gemeinde, "getGemeinden"),
-            "Kanton": (Kanton, "getKantone"),
-            "Land": (Land, "getLaender"),
-        }
-        
-        # Validate table name
-        if table not in table_mapping:
-            raise HTTPException(
-                status_code=status.HTTP_400_BAD_REQUEST,
-                detail=f"Invalid table name '{table}'. Available tables: {', '.join(table_mapping.keys())}"
-            )
-        
-        # Get interface and fetch data
-        realEstateInterface = getRealEstateInterface(currentUser)
-        model_class, method_name = table_mapping[table]
-        getter_method = getattr(realEstateInterface, method_name)
-        
-        # Fetch all records (no filter for now)
-        records = getter_method(recordFilter=None)
-        
-        # Keep records as model instances (like routeDataFiles does with FileItem)
-        # FastAPI will automatically serialize Pydantic models to JSON
-        items = records
-        
-        # Parse pagination parameter
-        paginationParams = None
-        if pagination:
-            try:
-                paginationDict = json.loads(pagination)
-                paginationParams = PaginationParams(**paginationDict) if paginationDict else None
-            except (json.JSONDecodeError, ValueError) as e:
-                raise HTTPException(
-                    status_code=status.HTTP_400_BAD_REQUEST,
-                    detail=f"Invalid pagination parameter: {str(e)}"
-                )
-        
-        # Apply pagination if requested
-        if paginationParams:
-            # Apply sorting if specified
-            if paginationParams.sort:
-                for sort_field in reversed(paginationParams.sort):  # Reverse to apply in priority order
-                    field_name = sort_field.field
-                    direction = sort_field.direction.lower()
-                    
-                    def sort_key(item):
-                        # Access attribute from model instance
-                        value = getattr(item, field_name, None)
-                        # Handle None values - put them at the end for asc, at the start for desc
-                        if value is None:
-                            return (1, None)  # Use tuple to ensure None values sort consistently
-                        return (0, value)
-                    
-                    items.sort(key=sort_key, reverse=(direction == "desc"))
-            
-            # Apply pagination
-            total_items = len(items)
-            total_pages = (total_items + paginationParams.pageSize - 1) // paginationParams.pageSize  # Ceiling division
-            start_idx = (paginationParams.page - 1) * paginationParams.pageSize
-            end_idx = start_idx + paginationParams.pageSize
-            paginated_items = items[start_idx:end_idx]
-            
-            return PaginatedResponse(
-                items=paginated_items,
-                pagination=PaginationMetadata(
-                    currentPage=paginationParams.page,
-                    pageSize=paginationParams.pageSize,
-                    totalItems=total_items,
-                    totalPages=total_pages,
-                    sort=paginationParams.sort,
-                    filters=paginationParams.filters
-                )
-            )
-        else:
-            # No pagination - return all items (as model instances, like routeDataFiles)
-            return PaginatedResponse(
-                items=items,
-                pagination=None
-            )
-        
-    except HTTPException:
-        raise
-    except Exception as e:
-        logger.error(f"Error getting table data for '{table}': {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            detail=f"Error getting table data: {str(e)}"
-        )
-
-
-@router.post("/table/{table}", response_model=Dict[str, Any])
-@limiter.limit("120/minute")
-async def create_table_record(
-    request: Request,
-    table: str = Path(..., description="Table name (Projekt, Parzelle, Dokument, Gemeinde, Kanton, Land)"),
-    data: Dict[str, Any] = Body(..., description="Record data to create"),
-    currentUser: User = Depends(getCurrentUser)
-) -> Dict[str, Any]:
-    """
-    Create a new record in a specific real estate table.
-    
-    Available tables:
-    - Projekt: Real estate projects (with parcel data support)
-    - Parzelle: Plots/parcels
-    - Dokument: Documents
-    - Gemeinde: Municipalities
-    - Kanton: Cantons
-    - Land: Countries
-    
-    Request Body:
-    For Projekt:
-    {
-        "label": "Projekt Bezeichnung",
-        "statusProzess": "Eingang",  // Optional
-        "parzelle": {
-            "id": "OE5913",
-            "egrid": "CH252699779137",
-            "perimeter": {...},
-            "geometry": {...},  // Used for baulinie
-            ...
-        }
-    }
-    
-    For other tables:
-    - JSON object with fields matching the table's data model
-    
-    Headers:
-    - X-CSRF-Token: CSRF token (required for security)
-    
-    Examples:
-    - POST /api/realestate/table/Projekt
-      Body: {"label": "Hauptstrasse 42", "parzelle": {...}}
-    - POST /api/realestate/table/Parzelle
-      Body: {"label": "Parzelle 1", "strasseNr": "Hauptstrasse 42", "plz": "8000", "bauzone": "W3"}
-    """
-    try:
-        # Validate CSRF token
-        csrf_token = request.headers.get("X-CSRF-Token") or request.headers.get("x-csrf-token")
-        if not csrf_token:
-            logger.warning(f"CSRF token missing for POST /api/realestate/table/{table} from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("CSRF token missing. Please include X-CSRF-Token header.")
-            )
-        
-        # Basic CSRF token format validation
-        if not isinstance(csrf_token, str) or len(csrf_token) < 16 or len(csrf_token) > 64:
-            logger.warning(f"Invalid CSRF token format for POST /api/realestate/table/{table} from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        # Validate token is hex string
-        try:
-            int(csrf_token, 16)
-        except ValueError:
-            logger.warning(f"CSRF token is not a valid hex string for POST /api/realestate/table/{table} from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        # Special handling for Projekt with parcel data
-        if table == "Projekt" and ("parzelle" in data or "parzellen" in data):
-            logger.info(f"Creating Projekt with parcel data for user {currentUser.id} (mandate: {currentUser.mandateId})")
-            
-            # Extract fields
-            label = data.get("label")
-            if not label:
-                raise HTTPException(
-                    status_code=status.HTTP_400_BAD_REQUEST,
-                    detail=routeApiMsg("label is required")
-                )
-            
-            status_prozess = data.get("statusProzess", "Eingang")
-            
-            # Support both single parzelle and multiple parzellen
-            parzellen_data = []
-            if "parzellen" in data:
-                # Multiple parcels
-                parzellen_data = data.get("parzellen", [])
-                if not isinstance(parzellen_data, list):
-                    raise HTTPException(
-                        status_code=status.HTTP_400_BAD_REQUEST,
-                        detail=routeApiMsg("parzellen must be an array")
-                    )
-            elif "parzelle" in data:
-                # Single parcel (backward compatibility)
-                parzelle_data = data.get("parzelle")
-                if parzelle_data:
-                    parzellen_data = [parzelle_data]
-            
-            if not parzellen_data:
-                raise HTTPException(
-                    status_code=status.HTTP_400_BAD_REQUEST,
-                    detail=routeApiMsg("parzelle or parzellen data is required")
-                )
-            
-            # Use helper function to create project with parcel data
-            try:
-                result = await create_project_with_parcel_data(
-                    currentUser=currentUser,
-                    projekt_label=label,
-                    parzellen_data=parzellen_data,
-                    status_prozess=status_prozess,
-                )
-                
-                # Return in format expected by frontend (single record, not nested)
-                return result.get("projekt", {})
-            except HTTPException:
-                # Re-raise HTTPExceptions directly
-                raise
-            except Exception as e:
-                logger.error(f"Error creating Projekt with parcel data: {str(e)}", exc_info=True)
-                raise HTTPException(
-                    status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-                    detail=f"Error creating Projekt: {str(e)}"
-                )
-        
-        # Standard handling for other tables or Projekt without parcel data
-        logger.info(f"Creating record in table '{table}' for user {currentUser.id} (mandate: {currentUser.mandateId})")
-        logger.debug(f"Record data: {data}")
-        
-        # Map table names to model classes and create methods
-        table_mapping = {
-            "Projekt": (Projekt, "createProjekt"),
-            "Parzelle": (Parzelle, "createParzelle"),
-            "Dokument": (Dokument, "createDokument"),
-            "Gemeinde": (Gemeinde, "createGemeinde"),
-            "Kanton": (Kanton, "createKanton"),
-            "Land": (Land, "createLand"),
-        }
-        
-        # Validate table name
-        if table not in table_mapping:
-            raise HTTPException(
-                status_code=status.HTTP_400_BAD_REQUEST,
-                detail=f"Invalid table name '{table}'. Available tables: {', '.join(table_mapping.keys())}"
-            )
-        
-        # Get interface
-        realEstateInterface = getRealEstateInterface(currentUser)
-        model_class, method_name = table_mapping[table]
-        create_method = getattr(realEstateInterface, method_name)
-        
-        # Ensure mandateId is set (will be set by interface if missing)
-        if "mandateId" not in data:
-            data["mandateId"] = currentUser.mandateId
-        
-        # Create model instance from data
-        try:
-            model_instance = model_class(**data)
-        except Exception as e:
-            logger.error(f"Error creating {table} model instance: {str(e)}", exc_info=True)
-            raise HTTPException(
-                status_code=status.HTTP_400_BAD_REQUEST,
-                detail=f"Invalid data for {table}: {str(e)}"
-            )
-        
-        # Create record
-        try:
-            created_record = create_method(model_instance)
-            
-            # Convert to dictionary for response
-            if hasattr(created_record, 'model_dump'):
-                return created_record.model_dump()
-            else:
-                return created_record
-                
-        except Exception as e:
-            logger.error(f"Error creating {table} record: {str(e)}", exc_info=True)
-            raise HTTPException(
-                status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-                detail=f"Error creating {table} record: {str(e)}"
-            )
-        
-    except HTTPException:
-        raise
-    except Exception as e:
-        logger.error(f"Error creating record in table '{table}': {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            detail=f"Error creating record: {str(e)}"
-        )
-
-
-@router.get("/parcel/search", response_model=Dict[str, Any])
-@limiter.limit("60/minute")
-async def search_parcel(
-    request: Request,
-    location: str = Query(..., description="Either coordinates as 'x,y' (LV95) or address string"),
-    include_adjacent: bool = Query(False, description="Include adjacent parcels information"),
-    fetch_documents: bool = Query(True, description="If true, fetch BZO documents for the Gemeinde (default: true)"),
-    currentUser: User = Depends(getCurrentUser)
-) -> Dict[str, Any]:
-    """
-    Search for parcel information by address or coordinates.
-    
-    Returns comprehensive parcel information including:
-    - Parcel identification (number, EGRID, etc.)
-    - Precise boundary geometry for map display
-    - Administrative context (canton, municipality)
-    - Link to official cadastral map
-    - Optional: Adjacent parcels
-    - Optional: Gemeinde information and BZO documents (if fetch_documents=true)
-    
-    Query Parameters:
-    - location: Either coordinates as "x,y" (LV95/EPSG:2056) or address string
-    - include_adjacent: If true, fetches information about adjacent parcels (slower)
-    - fetch_documents: If true, checks for and fetches Bauzonenverordnung (BZO) documents for the Gemeinde (default: true, slower)
-    
-    Headers:
-    - X-CSRF-Token: CSRF token (required for security)
-    
-    Examples:
-    - GET /api/realestate/parcel/search?location=2600000,1200000
-    - GET /api/realestate/parcel/search?location=Bundesplatz 3, 3003 Bern
-    - GET /api/realestate/parcel/search?location=Bundesplatz 3, 3003 Bern&include_adjacent=true
-    - GET /api/realestate/parcel/search?location=Bundesplatz 3, 3003 Bern&fetch_documents=true
-    
-    Returns:
-    {
-        "parcel": {
-            "id": "823",
-            "egrid": "CH294676423526",
-            "number": "823",
-            "name": "823",
-            "identnd": "BE0200000042",
-            "canton": "BE",
-            "municipality_code": 351,
-            "municipality_name": "Bern",
-            "address": "Bundesplatz 3 3011 Bern",
-            "plz": "3011",
-            "perimeter": {...},
-            "area_m2": 1234.56,
-            "centroid": {"x": 2600000, "y": 1200000},
-            "geoportal_url": "https://...",
-            "realestate_type": null,
-            "bauzone": "W3"
-        },
-        "map_view": {
-            "center": {"x": 2600000, "y": 1200000},
-            "zoom_bounds": {"min_x": ..., "max_x": ..., "min_y": ..., "max_y": ...},
-            "geometry_geojson": {...}
-        },
-        "adjacent_parcels": [...],  // Optional (only if include_adjacent=true)
-        "gemeinde": {  // Optional (only if fetch_documents=true)
-            "id": "...",
-            "label": "Bern",
-            "plz": "3011"
-        },
-        "documents": [  // Optional (only if fetch_documents=true and documents found/created)
-            {
-                "id": "...",
-                "label": "BZO Bern",
-                "dokumentTyp": "gemeindeBzoAktuell",
-                "dokumentReferenz": "...",
-                "quelle": "https://...",
-                "mimeType": "application/pdf"
-            }
-        ]
-    }
-    """
-    try:
-        # Validate CSRF token
-        csrf_token = request.headers.get("X-CSRF-Token") or request.headers.get("x-csrf-token")
-        if not csrf_token:
-            logger.warning(f"CSRF token missing for GET /api/realestate/parcel/search from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("CSRF token missing. Please include X-CSRF-Token header.")
-            )
-        
-        logger.info(f"Searching parcel for user {currentUser.id} (mandate: {currentUser.mandateId}) with location: {location}")
-        
-        # Initialize connector
-        connector = SwissTopoMapServerConnector()
-        
-        # Search for parcel
-        parcel_data = await connector.search_parcel(location)
-        
-        if not parcel_data:
-            raise HTTPException(
-                status_code=status.HTTP_404_NOT_FOUND,
-                detail=f"No parcel found for location: {location}"
-            )
-        
-        # Extract and normalize attributes
-        extracted_attributes = connector.extract_parcel_attributes(parcel_data)
-        attributes = parcel_data.get("attributes", {})
-        geometry = parcel_data.get("geometry", {})
-        
-        # Calculate parcel area from perimeter
-        area_m2 = None
-        centroid = None
-        if extracted_attributes.get("perimeter"):
-            perimeter = extracted_attributes["perimeter"]
-            points = perimeter.get("punkte", [])
-            
-            # Calculate area using shoelace formula
-            if len(points) >= 3:
-                area = 0
-                for i in range(len(points)):
-                    j = (i + 1) % len(points)
-                    area += points[i]["x"] * points[j]["y"]
-                    area -= points[j]["x"] * points[i]["y"]
-                area_m2 = abs(area / 2)
-                
-                # Calculate centroid
-                sum_x = sum(p["x"] for p in points)
-                sum_y = sum(p["y"] for p in points)
-                centroid = {
-                    "x": sum_x / len(points),
-                    "y": sum_y / len(points)
-                }
-        
-        # Extract municipality name and address from Swiss Topo data
-        municipality_name = None
-        full_address = None
-        plz = None
-        canton = attributes.get("ak")  # Extract canton early so it's always available
-        
-        # Debug: Log all available attributes to understand what we have
-        logger.debug(f"Parcel attributes keys: {list(attributes.keys())}")
-        logger.debug(f"Sample parcel attributes: {dict(list(attributes.items())[:10])}")  # First 10 items
-        
-        # First, check if municipality is directly in parcel attributes (ggdename or dplzname)
-        # These fields are often present in the parcel data itself from Swiss Topo
-        municipality_from_attrs = attributes.get("ggdename") or attributes.get("dplzname") or attributes.get("gemeinde") or attributes.get("gemeindename")
-        if municipality_from_attrs:
-            # Use connector's cleaning method to remove canton suffix
-            municipality_name = connector._clean_municipality_name(str(municipality_from_attrs))
-            logger.info(f"Found municipality '{municipality_name}' in parcel attributes (from {municipality_from_attrs})")
-        
-        # Also check extracted_attributes for municipality
-        if not municipality_name:
-            municipality_from_extracted = extracted_attributes.get("kontextGemeinde")
-            if municipality_from_extracted:
-                municipality_name = str(municipality_from_extracted)
-                logger.info(f"Found municipality '{municipality_name}' in extracted attributes")
-        
-        # Also check for PLZ in parcel attributes
-        if not plz:
-            plz_from_attrs = attributes.get("dplz4") or attributes.get("plz")
-            if plz_from_attrs:
-                plz = str(plz_from_attrs).strip()
-                logger.debug(f"Found PLZ '{plz}' in parcel attributes")
-        
-        # Try to use geocoded address info if available (more accurate than centroid query)
-        geocoded_address = parcel_data.get('geocoded_address')
-        if geocoded_address:
-            if not full_address:
-                full_address = geocoded_address.get('full_address')
-            if not plz:
-                plz = geocoded_address.get('plz')
-            if not municipality_name:
-                geocoded_municipality = geocoded_address.get('municipality')
-                if geocoded_municipality:
-                    municipality_name = connector._clean_municipality_name(geocoded_municipality)
-                    logger.debug(f"Found municipality '{municipality_name}' from geocoded address")
-            if full_address:
-                logger.debug(f"Using geocoded address: {full_address}")
-        
-        # If geocoded address not available, try to get address by querying the address layer
-        # Use query coordinates (where user clicked/geocoded) instead of parcel centroid
-        # This ensures we get the address at the exact location, not at the parcel center
-        query_coords = parcel_data.get('query_coordinates')
-        address_query_coords = query_coords if query_coords else centroid
-        
-        if not full_address and address_query_coords:
-            query_x = address_query_coords['x']
-            query_y = address_query_coords['y']
-            logger.debug(f"Querying address layer at query coordinates: ({query_x}, {query_y})")
-            
-            # Check if this was a coordinate search (not geocoded address)
-            is_coordinate_search = ',' in location and not any(c.isalpha() for c in location.split(',')[0])
-            
-            # Use connector's helper method to query building layer
-            # Use tolerance=1 (minimum) for coordinate searches to get exact building
-            building_tolerance = 1 if is_coordinate_search else 10
-            building_result = await connector._query_building_layer(query_x, query_y, tolerance=building_tolerance, buffer=25)
-            
-            if building_result:
-                addr_attrs = building_result.get("attributes", {})
-                logger.debug(f"Address layer attributes: {addr_attrs}")
-                
-                # Extract address using connector's helper method
-                address_info = connector._extract_address_from_building_attrs(addr_attrs)
-                if not full_address:
-                    full_address = address_info.get('full_address')
-                if not plz:
-                    plz = address_info.get('plz')
-                if not municipality_name:
-                    municipality_name = address_info.get('municipality')
-                    if municipality_name:
-                        logger.debug(f"Found municipality '{municipality_name}' from building layer")
-                
-                if full_address:
-                    logger.debug(f"Constructed address: {full_address}")
-        
-        # If address not found via building layer, try to construct from available data
-        if not full_address:
-            # Check if location was provided as an address string
-            if location and any(c.isalpha() for c in location) and "CH" not in location:
-                # Location looks like an address (not an EGRID)
-                full_address = location
-                logger.debug(f"Using location as address: {full_address}")
-        
-        # Try to extract municipality name from address string if not found yet
-        if not municipality_name and full_address:
-            # Parse address string to extract municipality name
-            # Format is usually: "Street Number, PLZ Municipality" or "Street Number PLZ Municipality"
-            # Examples: "Forchstrasse 6c, 8610 Uster" or "Bundesplatz 3 3011 Bern"
-            # Try to match PLZ followed by municipality name
-            # PLZ is typically 4 digits, municipality name follows
-            plz_municipality_match = re.search(r'\b(\d{4})\s+([A-ZÄÖÜ][a-zäöüß\s-]+)', full_address)
-            if plz_municipality_match:
-                extracted_plz = plz_municipality_match.group(1)
-                extracted_municipality = plz_municipality_match.group(2).strip()
-                # Remove trailing commas or other punctuation
-                extracted_municipality = re.sub(r'[,;\.]+$', '', extracted_municipality).strip()
-                if extracted_municipality:
-                    municipality_name = extracted_municipality
-                    if not plz:
-                        plz = extracted_plz
-                    logger.debug(f"Extracted municipality '{municipality_name}' and PLZ '{plz}' from address string")
-        
-        # Try to extract municipality name from BFSNR if still not found
-        if not municipality_name:
-            bfsnr = attributes.get("bfsnr")
-            
-            logger.info(f"Attempting to resolve municipality name for BFS number {bfsnr} in canton {canton}")
-            
-            # Try to query database for Gemeinde by BFS number
-            if bfsnr and canton:
-                try:
-                    realEstateInterface = getRealEstateInterface(currentUser)
-                    # Query Gemeinde by BFS number (stored in kontextInformationen)
-                    gemeinden = realEstateInterface.getGemeinden(
-                        recordFilter={"mandateId": currentUser.mandateId}
-                    )
-                    logger.debug(f"Found {len(gemeinden)} Gemeinden in database, searching for BFS {bfsnr}")
-                    for gemeinde in gemeinden:
-                        # Check kontextInformationen for BFS number
-                        for kontext in gemeinde.kontextInformationen:
-                            try:
-                                kontext_data = json.loads(kontext.inhalt) if isinstance(kontext.inhalt, str) else kontext.inhalt
-                                if isinstance(kontext_data, dict):
-                                    kontext_bfsnr = kontext_data.get("bfs_nummer") or kontext_data.get("bfsnr") or kontext_data.get("municipality_code")
-                                    if str(kontext_bfsnr) == str(bfsnr):
-                                        municipality_name = gemeinde.label
-                                        logger.info(f"Found Gemeinde '{municipality_name}' by BFS number {bfsnr} in database")
-                                        break
-                            except (json.JSONDecodeError, AttributeError) as e:
-                                logger.debug(f"Error parsing kontext: {e}")
-                                continue
-                        if municipality_name:
-                            break
-                except Exception as e:
-                    logger.warning(f"Error querying Gemeinde by BFS number: {e}", exc_info=True)
-            
-            # If still not found, try to use Swiss Topo geocoding API to get municipality name from coordinates
-            # This is more reliable than BFS number lookup since coordinates are exact
-            if not municipality_name and centroid:
-                try:
-                    # Use Swiss Topo geocoding to get municipality name from coordinates
-                    geocode_url = "https://api3.geo.admin.ch/rest/services/api/MapServer/identify"
-                    params = {
-                        "geometry": f"{centroid['x']},{centroid['y']}",
-                        "geometryType": "esriGeometryPoint",
-                        "layers": "all:ch.swisstopo.swissboundaries3d-gemeinde-flaeche.fill",
-                        "tolerance": "0",
-                        "returnGeometry": "false",
-                        "sr": "2056"
-                    }
-                    import aiohttp
-                    ssl_context = ssl.create_default_context()
-                    ssl_context.check_hostname = False
-                    ssl_context.verify_mode = ssl.CERT_NONE
-                    connector_aiohttp = aiohttp.TCPConnector(ssl=ssl_context)
-                    async with aiohttp.ClientSession(connector=connector_aiohttp) as session:
-                        async with session.get(geocode_url, params=params) as resp:
-                            if resp.status == 200:
-                                data = await resp.json()
-                                results = data.get("results", [])
-                                if results:
-                                    result_attrs = results[0].get("attributes", {})
-                                    geocoded_municipality = result_attrs.get("name") or result_attrs.get("gemeindename") or result_attrs.get("label")
-                                    if geocoded_municipality:
-                                        municipality_name = connector._clean_municipality_name(str(geocoded_municipality))
-                                        logger.info(f"Found municipality '{municipality_name}' via Swiss Topo geocoding API (from {geocoded_municipality})")
-                except Exception as e:
-                    logger.debug(f"Error querying Swiss Topo geocoding API: {e}", exc_info=True)
-            
-            # If still not found, try expanded Swiss municipalities lookup
-            if not municipality_name and bfsnr:
-                # Expanded Swiss municipalities lookup by BFS number
-                # Source: https://www.bfs.admin.ch/bfs/de/home/grundlagen/agvch.html
-                common_municipalities = {
-                    # Zürich (ZH)
-                    261: "Zürich",
-                    198: "Pfäffikon",  # ZH-198 is Pfäffikon
-                    191: "Uster",  # Uster is ZH-191
-                    3203: "Winterthur",
-                    # Bern (BE)
-                    351: "Bern",
-                    # Basel (BS)
-                    2701: "Basel",
-                    # Genève (GE)
-                    6621: "Genève",
-                    # Vaud (VD)
-                    5586: "Lausanne",
-                    # Luzern (LU)
-                    1061: "Luzern",
-                    # St. Gallen (SG)
-                    230: "St. Gallen",
-                    # Ticino (TI)
-                    5192: "Lugano",
-                    # Schwyz (SZ)
-                    1367: "Schwyz",
-                }
-                
-                if bfsnr in common_municipalities:
-                    municipality_name = common_municipalities[bfsnr]
-                    logger.info(f"Looked up municipality '{municipality_name}' from common list for BFS {bfsnr}")
-            
-            # If still not found, log warning
-            if not municipality_name:
-                logger.warning(f"Could not determine municipality name for BFS number {bfsnr} in canton {canton}. Municipality name will be None.")
-        
-        # Final validation: Don't use EGRID as address
-        if full_address and full_address.startswith("CH") and len(full_address) == 14 and full_address[2:].isdigit():
-            # This is an EGRID, not an address
-            full_address = None
-            logger.debug("Removed EGRID from address field")
-        
-        # Query zone information (wohnzone/bauzone) from ÖREB WFS
-        bauzone = None
-        # Check if geometry has actual data (either rings or coordinates)
-        has_geometry = geometry and (geometry.get("rings") or geometry.get("coordinates"))
-        if canton and has_geometry:
-            try:
-                logger.debug(f"Querying zone information for parcel {attributes.get('label')} in canton {canton}")
-                oereb_connector = OerebWfsConnector()
-                egrid = attributes.get("egris_egrid", "")
-                x = centroid["x"] if centroid else None
-                y = centroid["y"] if centroid else None
-                
-                # Query zone layer using parcel geometry
-                zone_results = await oereb_connector.query_zone_layer(
-                    egrid=egrid,
-                    x=x or 0.0,
-                    y=y or 0.0,
-                    canton=canton,
-                    geometry=geometry
-                )
-                
-                if zone_results and len(zone_results) > 0:
-                    zone_attrs = zone_results[0].get("attributes", {})
-                    typ_gde_abkuerzung = zone_attrs.get("typ_gde_abkuerzung")
-                    if typ_gde_abkuerzung:
-                        bauzone = typ_gde_abkuerzung
-                        logger.info(f"Found bauzone/wohnzone: {bauzone} for parcel {attributes.get('label')}")
-                    else:
-                        logger.debug(f"No typ_gde_abkuerzung found in zone results for parcel {attributes.get('label')}")
-                else:
-                    logger.debug(f"No zone results found for parcel {attributes.get('label')}")
-            except Exception as e:
-                logger.warning(f"Error querying zone information: {e}", exc_info=True)
-                # Continue without zone information if query fails
-        
-        # Build parcel info
-        parcel_info = {
-            "id": attributes.get("label") or attributes.get("number"),
-            "egrid": attributes.get("egris_egrid"),
-            "number": attributes.get("number"),
-            "name": attributes.get("name"),
-            "identnd": attributes.get("identnd"),
-            "canton": attributes.get("ak"),
-            "municipality_code": attributes.get("bfsnr"),
-            "municipality_name": municipality_name,
-            "address": full_address,
-            "plz": plz,
-            "perimeter": extracted_attributes.get("perimeter"),
-            "area_m2": area_m2,
-            "centroid": centroid,
-            "geoportal_url": attributes.get("geoportal_url"),
-            "realestate_type": attributes.get("realestate_type"),
-            "bauzone": bauzone
-        }
-        
-        # Build map view info
-        bbox = parcel_data.get("bbox", [])
-        map_view = {
-            "center": centroid,
-            "zoom_bounds": {
-                "min_x": bbox[0] if len(bbox) >= 4 else None,
-                "min_y": bbox[1] if len(bbox) >= 4 else None,
-                "max_x": bbox[2] if len(bbox) >= 4 else None,
-                "max_y": bbox[3] if len(bbox) >= 4 else None
-            },
-            "geometry_geojson": {
-                "type": "Feature",
-                "geometry": {
-                    "type": "Polygon",
-                    "coordinates": [
-                        [[p["x"], p["y"]] for p in extracted_attributes["perimeter"]["punkte"]]
-                    ] if extracted_attributes.get("perimeter") else []
-                },
-                "properties": {
-                    "id": parcel_info["id"],
-                    "egrid": parcel_info["egrid"],
-                    "number": parcel_info["number"]
-                }
-            }
-        }
-        
-        # Build response
-        response_data = {
-            "parcel": parcel_info,
-            "map_view": map_view
-        }
-        
-        # Fetch adjacent parcels if requested
-        if include_adjacent and parcel_data and parcel_data.get("geometry"):
-            try:
-                # Use the connector's method to find neighboring parcels by sampling along the boundary
-                # This ensures we find all parcels that actually touch the selected parcel
-                selected_parcel_id = parcel_info["id"]
-                adjacent_parcels_raw = await connector.find_neighboring_parcels(
-                    parcel_data=parcel_data,
-                    selected_parcel_id=selected_parcel_id,
-                    sample_distance=20.0,  # Sample every 20 meters (balanced for coverage and speed)
-                    max_sample_points=30,  # Allow up to 30 points to ensure all vertices are covered
-                    max_neighbors=15,  # Find up to 15 neighbors
-                    max_concurrent=50  # Process up to 50 queries concurrently (maximum parallelization)
-                )
-                
-                # Convert adjacent parcels to include GeoJSON geometry (optimized, minimal logging)
-                def convert_parcel_geometry(adj_parcel: Dict[str, Any]) -> Dict[str, Any]:
-                    """Convert a single adjacent parcel to include GeoJSON geometry."""
-                    adj_parcel_with_geo = {
-                        "id": adj_parcel["id"],
-                        "egrid": adj_parcel.get("egrid"),
-                        "number": adj_parcel.get("number"),
-                        "perimeter": adj_parcel.get("perimeter")
-                    }
-                    
-                    # Convert geometry to GeoJSON format if available
-                    adj_geometry = adj_parcel.get("geometry")
-                    adj_perimeter = adj_parcel.get("perimeter")
-                    
-                    if adj_geometry:
-                        # Handle ESRI format (rings)
-                        if "rings" in adj_geometry and adj_geometry["rings"]:
-                            ring = adj_geometry["rings"][0]  # Outer ring
-                            coordinates = [[[p[0], p[1]] for p in ring]]
-                            adj_parcel_with_geo["geometry_geojson"] = {
-                                "type": "Feature",
-                                "geometry": {
-                                    "type": "Polygon",
-                                    "coordinates": coordinates
-                                },
-                                "properties": {
-                                    "id": adj_parcel["id"],
-                                    "egrid": adj_parcel.get("egrid"),
-                                    "number": adj_parcel.get("number")
-                                }
-                            }
-                        # Handle GeoJSON format
-                        elif adj_geometry.get("type") == "Polygon":
-                            adj_parcel_with_geo["geometry_geojson"] = {
-                                "type": "Feature",
-                                "geometry": adj_geometry,
-                                "properties": {
-                                    "id": adj_parcel["id"],
-                                    "egrid": adj_parcel.get("egrid"),
-                                    "number": adj_parcel.get("number")
-                                }
-                            }
-                    
-                    # If no geometry_geojson was created but we have perimeter, create it from perimeter
-                    if "geometry_geojson" not in adj_parcel_with_geo and adj_perimeter and adj_perimeter.get("punkte"):
-                        punkte = adj_perimeter["punkte"]
-                        coordinates = [[[p["x"], p["y"]] for p in punkte]]
-                        adj_parcel_with_geo["geometry_geojson"] = {
-                            "type": "Feature",
-                            "geometry": {
-                                "type": "Polygon",
-                                "coordinates": coordinates
-                            },
-                            "properties": {
-                                "id": adj_parcel["id"],
-                                "egrid": adj_parcel.get("egrid"),
-                                "number": adj_parcel.get("number")
-                            }
-                        }
-                    
-                    return adj_parcel_with_geo
-                
-                # Convert all parcels in parallel (using list comprehension for speed)
-                adjacent_parcels = [convert_parcel_geometry(adj_parcel) for adj_parcel in adjacent_parcels_raw]
-                
-                response_data["adjacent_parcels"] = adjacent_parcels
-                logger.info(f"Found {len(adjacent_parcels)} neighboring parcels for parcel {selected_parcel_id}")
-                
-            except Exception as e:
-                logger.warning(f"Error fetching adjacent parcels: {e}", exc_info=True)
-                response_data["adjacent_parcels"] = []
-        
-        # Fetch BZO documents if requested
-        gemeinde_info = None
-        bzo_documents = []
-        
-        logger.debug(f"Document fetch check: fetch_documents={fetch_documents}, municipality_name={municipality_name}, canton={canton}")
-        
-        if fetch_documents and municipality_name and canton:
-            logger.info(f"Fetching BZO documents for Gemeinde '{municipality_name}' in canton '{canton}'")
-            try:
-                # Get interfaces
-                realEstateInterface = getRealEstateInterface(currentUser)
-                componentInterface = getComponentInterface(currentUser)
-                logger.debug(f"Interfaces initialized for document fetching")
-                
-                # Resolve or create Gemeinde
-                gemeinde = None
-                # First, ensure Land "Schweiz" exists
-                laender = realEstateInterface.getLaender(recordFilter={"label": "Schweiz"})
-                if not laender:
-                    land = Land(
-                        mandateId=currentUser.mandateId,
-                        label="Schweiz",
-                        abk="CH"
-                    )
-                    land = realEstateInterface.createLand(land)
-                    logger.debug(f"Created Land 'Schweiz' with ID: {land.id}")
-                else:
-                    land = laender[0]
-                
-                # Map canton abbreviations to full names
-                canton_names = {
-                    "ZH": "Zürich", "BE": "Bern", "LU": "Luzern", "UR": "Uri", "SZ": "Schwyz",
-                    "OW": "Obwalden", "NW": "Nidwalden", "GL": "Glarus", "ZG": "Zug", "FR": "Freiburg",
-                    "SO": "Solothurn", "BS": "Basel-Stadt", "BL": "Basel-Landschaft", "SH": "Schaffhausen",
-                    "AR": "Appenzell Ausserrhoden", "AI": "Appenzell Innerrhoden", "SG": "St. Gallen",
-                    "GR": "Graubünden", "AG": "Aargau", "TG": "Thurgau", "TI": "Tessin",
-                    "VD": "Waadt", "VS": "Wallis", "NE": "Neuenburg", "GE": "Genf", "JU": "Jura"
-                }
-                
-                # Get or create Kanton
-                kantone = realEstateInterface.getKantone(recordFilter={"abk": canton})
-                if not kantone:
-                    kanton_label = canton_names.get(canton, canton)
-                    kanton_obj = Kanton(
-                        mandateId=currentUser.mandateId,
-                        label=kanton_label,
-                        abk=canton,
-                        id_land=land.id
-                    )
-                    kanton_obj = realEstateInterface.createKanton(kanton_obj)
-                    logger.debug(f"Created Kanton '{kanton_label}' ({canton})")
-                else:
-                    kanton_obj = kantone[0]
-                
-                # Get or create Gemeinde
-                gemeinden = realEstateInterface.getGemeinden(
-                    recordFilter={"label": municipality_name, "id_kanton": kanton_obj.id}
-                )
-                if not gemeinden:
-                    gemeinde = Gemeinde(
-                        mandateId=currentUser.mandateId,
-                        label=municipality_name,
-                        id_kanton=kanton_obj.id,
-                        plz=plz
-                    )
-                    gemeinde = realEstateInterface.createGemeinde(gemeinde)
-                    logger.info(f"Created Gemeinde '{municipality_name}'")
-                else:
-                    gemeinde = gemeinden[0]
-                    logger.debug(f"Found existing Gemeinde '{municipality_name}'")
-                
-                gemeinde_info = {
-                    "id": gemeinde.id,
-                    "label": gemeinde.label,
-                    "plz": gemeinde.plz
-                }
-                
-                # Check if Gemeinde already has BZO documents
-                existing_bzo = False
-                logger.debug(f"Checking for existing BZO documents in Gemeinde '{gemeinde.label}' (has {len(gemeinde.dokumente) if gemeinde.dokumente else 0} documents)")
-                if gemeinde.dokumente:
-                    for doc in gemeinde.dokumente:
-                        if (doc.label and ("BZO" in doc.label.upper() or "BAU UND ZONENORDNUNG" in doc.label.upper() or 
-                            "PLAN D'AMÉNAGEMENT" in doc.label.upper() or "RÈGLEMENT DE CONSTRUCTION" in doc.label.upper() or
-                            "PIANO DI UTILIZZAZIONE" in doc.label.upper() or "REGOLAMENTO EDILIZIO" in doc.label.upper())) or \
-                           (doc.dokumentTyp and doc.dokumentTyp in [DokumentTyp.GEMEINDE_BZO_AKTUELL, DokumentTyp.GEMEINDE_BZO_REVISION]):
-                            existing_bzo = True
-                            logger.info(f"Found existing BZO document: {doc.label} (ID: {doc.id})")
-                            bzo_documents.append({
-                                "id": doc.id,
-                                "label": doc.label,
-                                "dokumentTyp": doc.dokumentTyp.value if doc.dokumentTyp else None,
-                                "dokumentReferenz": doc.dokumentReferenz,
-                                "quelle": doc.quelle,
-                                "mimeType": doc.mimeType
-                            })
-                
-                if existing_bzo:
-                    logger.info(f"Gemeinde '{municipality_name}' already has {len(bzo_documents)} BZO document(s), skipping search")
-                
-                # If no BZO documents found, search and download
-                if not existing_bzo:
-                    logger.info(f"No BZO documents found for {municipality_name}, searching with Tavily...")
-                    
-                    # Determine language
-                    language = _get_language_from_kanton(canton)
-                    
-                    # Generate search query
-                    search_query = _get_bzo_search_query(municipality_name, language)
-                    logger.debug(f"Tavily search query: {search_query}")
-                    
-                    # Initialize Tavily connector
-                    tavily = AiTavily()
-                    
-                    # Search with Tavily
-                    search_results = await tavily._search(
-                        query=search_query,
-                        maxResults=5,
-                        country="switzerland"
-                    )
-                    
-                    if search_results:
-                        # First, check for direct PDF URLs in search results
-                        pdf_urls = []
-                        html_urls = []
-                        
-                        for result in search_results:
-                            url = result.url.lower()
-                            # Check if it's a direct PDF link
-                            if url.endswith('.pdf') or '/pdf/' in url or url.endswith('/pdf'):
-                                if not any(skip in url for skip in ['.html', '.htm', '/page/', '/article/', '/news/']):
-                                    pdf_urls.append(result.url)
-                            else:
-                                # It's an HTML page - we'll crawl it to find PDF links
-                                html_urls.append(result.url)
-                        
-                        # If no direct PDFs found, scrape HTML pages directly to find PDF links
-                        if not pdf_urls and html_urls:
-                            logger.info(f"No direct PDF links found, scraping {len(html_urls)} HTML pages to find PDF documents...")
-                            
-                            # Helper function to scrape HTML and find PDF links
-                            async def scrape_html_for_pdfs(url: str) -> List[str]:
-                                """Scrape an HTML page to find PDF links."""
-                                found_pdfs = []
-                                try:
-                                    ssl_context = ssl.create_default_context()
-                                    ssl_context.check_hostname = False
-                                    ssl_context.verify_mode = ssl.CERT_NONE
-                                    connector_aiohttp = aiohttp.TCPConnector(ssl=ssl_context)
-                                    
-                                    timeout = aiohttp.ClientTimeout(total=15, connect=5)
-                                    headers = {
-                                        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36',
-                                        'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
-                                        'Accept-Language': 'de-DE,de;q=0.9,en;q=0.8'
-                                    }
-                                    
-                                    async with aiohttp.ClientSession(timeout=timeout, headers=headers, connector=connector_aiohttp) as session:
-                                        async with session.get(url, allow_redirects=True) as response:
-                                            if response.status == 200:
-                                                # Check Content-Type header first
-                                                content_type = response.headers.get('Content-Type', '').lower()
-                                                
-                                                # Read first few bytes to check if it's a PDF
-                                                raw_bytes = await response.read()
-                                                
-                                                # Check if it's actually a PDF by magic bytes
-                                                if raw_bytes.startswith(b'%PDF'):
-                                                    found_pdfs.append(url)
-                                                    logger.info(f"Found direct PDF link (detected by magic bytes): {url}")
-                                                    return found_pdfs
-                                                
-                                                # If Content-Type says it's a PDF, add it
-                                                if 'application/pdf' in content_type:
-                                                    found_pdfs.append(url)
-                                                    logger.info(f"Found direct PDF link (Content-Type): {url}")
-                                                    return found_pdfs
-                                                
-                                                # If URL ends with .pdf, it's likely a PDF
-                                                if url.lower().endswith('.pdf'):
-                                                    found_pdfs.append(url)
-                                                    logger.info(f"Found direct PDF link (URL extension): {url}")
-                                                    return found_pdfs
-                                                
-                                                # Try to decode as text for HTML parsing
-                                                try:
-                                                    # Try UTF-8 first
-                                                    html_content = raw_bytes.decode('utf-8')
-                                                except UnicodeDecodeError:
-                                                    try:
-                                                        # Try ISO-8859-1 (common for German sites)
-                                                        html_content = raw_bytes.decode('iso-8859-1')
-                                                    except UnicodeDecodeError:
-                                                        try:
-                                                            # Try Windows-1252
-                                                            html_content = raw_bytes.decode('windows-1252')
-                                                        except UnicodeDecodeError:
-                                                            # If all else fails, skip this URL
-                                                            logger.warning(f"Could not decode content from {url} (not UTF-8, ISO-8859-1, or Windows-1252), skipping HTML parsing")
-                                                            return found_pdfs
-                                                
-                                                # Look for PDF links in various formats
-                                                # Pattern 1: Direct PDF URLs
-                                                pdf_pattern = r'https?://[^\s<>"\'\)]+\.pdf(?:\?[^\s<>"\'\)]*)?'
-                                                found = re.findall(pdf_pattern, html_content, re.IGNORECASE)
-                                                
-                                                # Pattern 2: Relative PDF links (convert to absolute)
-                                                relative_pattern = r'href=["\']([^"\']+\.pdf[^"\']*)["\']'
-                                                relative_found = re.findall(relative_pattern, html_content, re.IGNORECASE)
-                                                
-                                                # Convert relative URLs to absolute
-                                                base_url = f"{urlparse(url).scheme}://{urlparse(url).netloc}"
-                                                
-                                                for rel_url in relative_found:
-                                                    # Remove query params and fragments for cleaner URLs
-                                                    clean_url = rel_url.split('?')[0].split('#')[0]
-                                                    if clean_url.endswith('.pdf'):
-                                                        abs_url = urljoin(base_url, clean_url)
-                                                        if abs_url not in found:
-                                                            found.append(abs_url)
-                                                
-                                                # Pattern 3: Look in data attributes and other places
-                                                data_pattern = r'data-[^=]*=["\']([^"\']+\.pdf[^"\']*)["\']'
-                                                data_found = re.findall(data_pattern, html_content, re.IGNORECASE)
-                                                for data_url in data_found:
-                                                    clean_url = data_url.split('?')[0].split('#')[0]
-                                                    if clean_url.endswith('.pdf'):
-                                                        abs_url = urljoin(base_url, clean_url) if not clean_url.startswith('http') else clean_url
-                                                        if abs_url not in found:
-                                                            found.append(abs_url)
-                                                
-                                                # Clean and deduplicate URLs
-                                                for pdf_link in found:
-                                                    pdf_link = pdf_link.rstrip('.,;:!?)').strip()
-                                                    # Remove common tracking parameters
-                                                    if '?' in pdf_link:
-                                                        base, params = pdf_link.split('?', 1)
-                                                        # Keep only important params, remove tracking
-                                                        important_params = []
-                                                        for param in params.split('&'):
-                                                            if param.split('=')[0].lower() not in ['utm_source', 'utm_medium', 'utm_campaign', 'ref', 'fbclid', 'gclid']:
-                                                                important_params.append(param)
-                                                        if important_params:
-                                                            pdf_link = f"{base}?{'&'.join(important_params)}"
-                                                        else:
-                                                            pdf_link = base
-                                                    
-                                                    if pdf_link not in found_pdfs and pdf_link.startswith('http'):
-                                                        found_pdfs.append(pdf_link)
-                                                        logger.debug(f"Found PDF link on {url}: {pdf_link}")
-                                                
-                                                logger.info(f"Found {len(found_pdfs)} PDF links on {url}")
-                                                
-                                except Exception as e:
-                                    logger.debug(f"Error scraping {url} for PDFs: {e}", exc_info=True)
-                                
-                                return found_pdfs
-                            
-                            # Scrape HTML pages to find PDF links
-                            for html_url in html_urls[:5]:  # Limit to first 5 URLs
-                                try:
-                                    logger.debug(f"Scraping {html_url} to find PDF links...")
-                                    found_pdfs = await scrape_html_for_pdfs(html_url)
-                                    pdf_urls.extend(found_pdfs)
-                                except Exception as e:
-                                    logger.warning(f"Error scraping {html_url} to find PDFs: {e}", exc_info=True)
-                                    continue
-                            
-                            # Also check rawContent from search results for PDF links
-                            for result in search_results:
-                                if result.rawContent:
-                                    pdf_pattern = r'https?://[^\s<>"\'\)]+\.pdf(?:\?[^\s<>"\'\)]*)?'
-                                    found_pdfs = re.findall(pdf_pattern, result.rawContent, re.IGNORECASE)
-                                    for pdf_link in found_pdfs:
-                                        pdf_link = pdf_link.rstrip('.,;:!?)').strip()
-                                        if pdf_link not in pdf_urls and pdf_link.startswith('http'):
-                                            pdf_urls.append(pdf_link)
-                                            logger.debug(f"Found PDF link in rawContent: {pdf_link}")
-                        
-                        if not pdf_urls:
-                            logger.warning(f"No PDF URLs found in Tavily results for {municipality_name}. Results were HTML pages, not direct PDF links.")
-                            logger.debug(f"Tavily returned URLs: {[r.url for r in search_results]}")
-                        
-                        logger.info(f"Found {len(pdf_urls)} potential PDF documents for {municipality_name}")
-                        
-                        # Helper function to download a single PDF
-                        async def download_pdf(pdf_url: str) -> Optional[bytes]:
-                                """Download a PDF from a URL with retry logic."""
-                                max_retries = 3
-                                retry_delay = 2
-                                
-                                for attempt in range(max_retries):
-                                    try:
-                                        if attempt > 0:
-                                            headers = {
-                                                'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36',
-                                                'Accept': '*/*'
-                                            }
-                                        else:
-                                            headers = {
-                                                'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36',
-                                                'Accept': 'application/pdf,application/octet-stream,*/*',
-                                                'Accept-Language': 'de-DE,de;q=0.9,en;q=0.8',
-                                                'Accept-Encoding': 'gzip, deflate, br',
-                                                'Connection': 'keep-alive',
-                                                'Upgrade-Insecure-Requests': '1'
-                                            }
-                                        
-                                        # Create SSL context that doesn't verify certificates (for development)
-                                        ssl_context = ssl.create_default_context()
-                                        ssl_context.check_hostname = False
-                                        ssl_context.verify_mode = ssl.CERT_NONE
-                                        
-                                        # Create connector with SSL context
-                                        connector = aiohttp.TCPConnector(ssl=ssl_context)
-                                        
-                                        timeout = aiohttp.ClientTimeout(total=30, connect=10)
-                                        async with aiohttp.ClientSession(timeout=timeout, headers=headers, connector=connector) as session:
-                                            async with session.get(pdf_url, allow_redirects=True) as response:
-                                                if response.status == 200:
-                                                    # Check content-type header first
-                                                    content_type = response.headers.get('Content-Type', '').lower()
-                                                    if 'text/html' in content_type or 'text/xml' in content_type:
-                                                        logger.warning(f"URL {pdf_url} returned HTML content (Content-Type: {content_type}), skipping")
-                                                        raise Exception("Server returned HTML content instead of PDF")
-                                                    
-                                                    pdf_content = await response.read()
-                                                    
-                                                    if not pdf_content or len(pdf_content) < 100:
-                                                        raise Exception("Downloaded file is too small or empty")
-                                                    
-                                                    # Verify it's actually a PDF
-                                                    if not pdf_content.startswith(b'%PDF'):
-                                                        if pdf_content.startswith(b'<') or pdf_content.startswith(b'<!DOCTYPE'):
-                                                            logger.warning(f"URL {pdf_url} returned HTML content (detected HTML markers), skipping")
-                                                            raise Exception("Server returned HTML instead of PDF")
-                                                        logger.warning(f"Downloaded file from {pdf_url} doesn't appear to be a PDF (no PDF magic bytes), skipping")
-                                                        raise Exception("File doesn't appear to be a valid PDF")
-                                                    
-                                                    return pdf_content
-                                                elif response.status == 406:
-                                                    logger.warning(f"HTTP 406 for {pdf_url}, will retry with minimal headers (attempt {attempt + 1}/{max_retries})")
-                                                    if attempt < max_retries - 1:
-                                                        await asyncio.sleep(retry_delay)
-                                                        continue
-                                                    else:
-                                                        raise Exception(f"HTTP {response.status} (Not Acceptable) - server rejected request after {max_retries} attempts")
-                                                else:
-                                                    raise Exception(f"HTTP {response.status} when downloading PDF")
-                                    except asyncio.TimeoutError:
-                                        logger.warning(f"Timeout downloading PDF from {pdf_url} (attempt {attempt + 1}/{max_retries})")
-                                        if attempt < max_retries - 1:
-                                            await asyncio.sleep(retry_delay)
-                                            continue
-                                        else:
-                                            raise Exception("Connection timeout after retries")
-                                    except aiohttp.ClientError as e:
-                                        logger.warning(f"Connection error downloading PDF from {pdf_url} (attempt {attempt + 1}/{max_retries}): {str(e)}")
-                                        if attempt < max_retries - 1:
-                                            await asyncio.sleep(retry_delay)
-                                            continue
-                                        else:
-                                            raise Exception(f"Connection error: {str(e)}")
-                                    except Exception as e:
-                                        raise
-                                
-                                return None
-                        
-                        # Process PDF URLs
-                        current_dokumente = list(gemeinde.dokumente) if gemeinde.dokumente else []
-                        
-                        # Sanitize Gemeinde name for filename
-                        safe_name = "".join(c for c in municipality_name if c.isalnum() or c in (' ', '-', '_')).strip()
-                        safe_name = safe_name.replace(' ', '_')
-                        if not safe_name:
-                            safe_name = "Gemeinde"
-                        
-                        # Determine base label based on language
-                        if language == 'fr':
-                            base_doc_label = f"Plan d'aménagement local {municipality_name}"
-                        elif language == 'it':
-                            base_doc_label = f"Piano di utilizzazione {municipality_name}"
-                        else:
-                            base_doc_label = f"BZO {municipality_name}"
-                        
-                        # Process each PDF URL
-                        for idx, pdf_url in enumerate(pdf_urls):
-                            try:
-                                logger.info(f"Downloading PDF {idx + 1}/{len(pdf_urls)} from {pdf_url} for {municipality_name}")
-                                pdf_content = await download_pdf(pdf_url)
-                                
-                                if not pdf_content or len(pdf_content) < 100:
-                                    logger.warning(f"Failed to download PDF from {pdf_url} for {municipality_name}")
-                                    continue
-                                
-                                # Create unique file name
-                                if len(pdf_urls) > 1:
-                                    file_name = f"BZO_{safe_name}_{idx + 1}.pdf"
-                                    doc_label = f"{base_doc_label} ({idx + 1})"
-                                else:
-                                    file_name = f"BZO_{safe_name}.pdf"
-                                    doc_label = base_doc_label
-                                
-                                # Store file using ComponentObjects
-                                try:
-                                    file_item = componentInterface.createFile(
-                                        name=file_name,
-                                        mimeType="application/pdf",
-                                        content=pdf_content
-                                    )
-                                    
-                                    componentInterface.createFileData(file_item.id, pdf_content)
-                                    logger.info(f"Stored file {file_name} with ID {file_item.id}")
-                                except Exception as e:
-                                    logger.error(f"Error storing file {file_name}: {str(e)}", exc_info=True)
-                                    continue
-                                
-                                # Create Dokument record
-                                dokument = Dokument(
-                                    mandateId=currentUser.mandateId,
-                                    label=doc_label,
-                                    versionsbezeichnung="Aktuell",
-                                    dokumentTyp=DokumentTyp.GEMEINDE_BZO_AKTUELL,
-                                    dokumentReferenz=file_item.id,
-                                    quelle=pdf_url,
-                                    mimeType="application/pdf",
-                                    kategorienTags=["BZO", "Bauordnung", municipality_name]
-                                )
-                                
-                                # Create Dokument record
-                                created_dokument = realEstateInterface.createDokument(dokument)
-                                logger.info(f"Created Dokument record with ID {created_dokument.id}")
-                                
-                                current_dokumente.append(created_dokument)
-                                
-                                # Add to response
-                                bzo_documents.append({
-                                    "id": created_dokument.id,
-                                    "label": created_dokument.label,
-                                    "dokumentTyp": created_dokument.dokumentTyp.value if created_dokument.dokumentTyp else None,
-                                    "dokumentReferenz": created_dokument.dokumentReferenz,
-                                    "quelle": created_dokument.quelle,
-                                    "mimeType": created_dokument.mimeType
-                                })
-                                
-                            except Exception as e:
-                                logger.error(f"Error processing PDF {pdf_url}: {str(e)}", exc_info=True)
-                                continue
-                        
-                        # Update Gemeinde with new dokumente
-                        if bzo_documents:
-                            updated_gemeinde = realEstateInterface.updateGemeinde(
-                                gemeinde.id,
-                                {"dokumente": current_dokumente}
-                            )
-                            if updated_gemeinde:
-                                logger.info(f"Successfully created {len(bzo_documents)} BZO document(s) for {municipality_name}")
-                    else:
-                        logger.warning(f"No search results found for {municipality_name}")
-                
-            except Exception as e:
-                logger.error(f"Error fetching BZO documents for {municipality_name}: {e}", exc_info=True)
-                # Continue without documents - don't fail the request
-        elif fetch_documents:
-            if not municipality_name:
-                logger.warning("fetch_documents=true but municipality_name is not available, skipping document fetch")
-            elif not canton:
-                logger.warning("fetch_documents=true but canton is not available, skipping document fetch")
-        
-        # Add Gemeinde and documents to response if available
-        logger.debug(f"Adding to response: gemeinde_info={gemeinde_info is not None}, bzo_documents count={len(bzo_documents)}")
-        if gemeinde_info:
-            response_data["gemeinde"] = gemeinde_info
-            logger.debug(f"Added gemeinde_info to response: {gemeinde_info}")
-        if bzo_documents:
-            response_data["documents"] = bzo_documents
-            logger.info(f"Added {len(bzo_documents)} BZO documents to response")
-        else:
-            logger.debug("No BZO documents to add to response")
-        
-        return response_data
-        
-    except HTTPException:
-        raise
-    except Exception as e:
-        logger.error(f"Error searching parcel: {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            detail=f"Error searching parcel: {str(e)}"
-        )
-
-
-@router.post("/projekt/{projekt_id}/add-parcel", response_model=Dict[str, Any])
-@limiter.limit("60/minute")
-async def add_parcel_to_project(
-    request: Request,
-    projekt_id: str = Path(..., description="Projekt ID"),
-    body: Dict[str, Any] = Body(...),
-    currentUser: User = Depends(getCurrentUser)
-) -> Dict[str, Any]:
-    """
-    Add a parcel to an existing project.
-    
-    This endpoint can either:
-    1. Link an existing Parzelle to the Projekt
-    2. Create a new Parzelle from location data and link it
-    
-    Request Body:
-    Option 1 - Link existing parcel:
-    {
-        "parcelId": "existing-parcel-id"
-    }
-    
-    Option 2 - Create new parcel from location:
-    {
-        "location": "Hauptstrasse 42, 8000 Zürich"
-    }
-    
-    Option 3 - Create new parcel with custom data:
-    {
-        "parcelData": {
-            "label": "Parzelle 123",
-            "strasseNr": "Hauptstrasse 42",
-            "plz": "8000",
-            "bauzone": "W3",
-            ...
-        }
-    }
-    
-    Headers:
-    - X-CSRF-Token: CSRF token (required for security)
-    
-    Returns:
-    {
-        "projekt": {...},  // Updated Projekt
-        "parzelle": {...}  // Parcel that was added
-    }
-    """
-    try:
-        # Validate CSRF token
-        csrf_token = request.headers.get("X-CSRF-Token") or request.headers.get("x-csrf-token")
-        if not csrf_token:
-            logger.warning(f"CSRF token missing for POST /api/realestate/projekt/{projekt_id}/add-parcel from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("CSRF token missing. Please include X-CSRF-Token header.")
-            )
-        
-        # Validate CSRF token format
-        if not isinstance(csrf_token, str) or len(csrf_token) < 16 or len(csrf_token) > 64:
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        try:
-            int(csrf_token, 16)
-        except ValueError:
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        logger.info(f"Adding parcel to project {projekt_id} for user {currentUser.id} (mandate: {currentUser.mandateId})")
-        
-        # Get interface
-        realEstateInterface = getRealEstateInterface(currentUser)
-        
-        # Fetch existing Projekt
-        projekte = realEstateInterface.getProjekte(
-            recordFilter={"id": projekt_id, "mandateId": currentUser.mandateId}
-        )
-        if not projekte:
-            raise HTTPException(
-                status_code=status.HTTP_404_NOT_FOUND,
-                detail=f"Projekt {projekt_id} not found"
-            )
-        projekt = projekte[0]
-        
-        # Determine which option was used
-        parcel_id = body.get("parcelId")
-        location = body.get("location")
-        parcel_data_dict = body.get("parcelData")
-        
-        parzelle = None
-        
-        # Option 1: Link existing parcel
-        if parcel_id:
-            logger.info(f"Linking existing parcel {parcel_id}")
-            parcels = realEstateInterface.getParzellen(
-                recordFilter={"id": parcel_id, "mandateId": currentUser.mandateId}
-            )
-            if not parcels:
-                raise HTTPException(
-                    status_code=status.HTTP_404_NOT_FOUND,
-                    detail=f"Parzelle {parcel_id} not found"
-                )
-            parzelle = parcels[0]
-        
-        # Option 2: Create from location
-        elif location:
-            logger.info(f"Creating parcel from location: {location}")
-            
-            # Initialize connector and search for parcel
-            connector = SwissTopoMapServerConnector()
-            parcel_data = await connector.search_parcel(location)
-            
-            if not parcel_data:
-                raise HTTPException(
-                    status_code=status.HTTP_404_NOT_FOUND,
-                    detail=f"No parcel found at location: {location}"
-                )
-            
-            # Extract attributes
-            extracted_attributes = connector.extract_parcel_attributes(parcel_data)
-            attributes = parcel_data.get("attributes", {})
-            
-            # Create Parzelle
-            parzelle_create_data = {
-                "mandateId": currentUser.mandateId,
-                "label": extracted_attributes.get("label") or attributes.get("number") or "Unknown",
-                "parzellenAliasTags": [attributes.get("egris_egrid")] if attributes.get("egris_egrid") else [],
-                "eigentuemerschaft": None,
-                "strasseNr": location if not location.replace(",", "").replace(".", "").replace(" ", "").isdigit() else None,
-                "plz": None,
-                "perimeter": extracted_attributes.get("perimeter"),
-                "baulinie": None,
-                "kontextGemeinde": None,
-                "bauzone": None,
-                "az": None,
-                "bz": None,
-                "vollgeschossZahl": None,
-                "anrechenbarDachgeschoss": None,
-                "anrechenbarUntergeschoss": None,
-                "gebaeudehoeheMax": None,
-                "regelnGrenzabstand": [],
-                "regelnMehrlaengenzuschlag": [],
-                "regelnMehrhoehenzuschlag": [],
-                "parzelleBebaut": None,
-                "parzelleErschlossen": None,
-                "parzelleHanglage": None,
-                "laermschutzzone": None,
-                "hochwasserschutzzone": None,
-                "grundwasserschutzzone": None,
-                "parzellenNachbarschaft": [],
-                "dokumente": [],
-                "kontextInformationen": [
-                    Kontext(
-                        thema="Swiss Topo Data",
-                        inhalt=json.dumps({
-                            "egrid": attributes.get("egris_egrid"),
-                            "identnd": attributes.get("identnd"),
-                            "canton": attributes.get("ak"),
-                            "municipality_code": attributes.get("bfsnr"),
-                            "geoportal_url": attributes.get("geoportal_url")
-                        }, ensure_ascii=False)
-                    )
-                ]
-            }
-            
-            parzelle_instance = Parzelle(**parzelle_create_data)
-            parzelle = realEstateInterface.createParzelle(parzelle_instance)
-        
-        # Option 3: Create from custom data
-        elif parcel_data_dict:
-            logger.info(f"Creating parcel from custom data")
-            parcel_data_dict["mandateId"] = currentUser.mandateId
-            parzelle_instance = Parzelle(**parcel_data_dict)
-            parzelle = realEstateInterface.createParzelle(parzelle_instance)
-        
-        else:
-            raise ValueError("One of 'parcelId', 'location', or 'parcelData' is required")
-        
-        # Add parcel to project
-        if parzelle not in projekt.parzellen:
-            projekt.parzellen.append(parzelle)
-        
-        # Update projekt perimeter if needed (use first parcel's perimeter)
-        if not projekt.perimeter and parzelle.perimeter:
-            projekt.perimeter = parzelle.perimeter
-        
-        # Update Projekt
-        updated_projekt = realEstateInterface.updateProjekt(projekt)
-        
-        logger.info(f"Added Parzelle {parzelle.id} to Projekt {projekt_id}")
-        
-        return {
-            "projekt": updated_projekt.model_dump(),
-            "parzelle": parzelle.model_dump()
-        }
-        
-    except ValueError as e:
-        logger.error(f"Validation error in add_parcel_to_project: {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_400_BAD_REQUEST,
-            detail=f"Validation error: {str(e)}"
-        )
-    except HTTPException:
-        raise
-    except Exception as e:
-        logger.error(f"Error adding parcel to project: {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            detail=f"Error adding parcel to project: {str(e)}"
-        )
-
-
-@router.get("/bzo-information", response_model=Dict[str, Any])
-@limiter.limit("30/minute")
-async def get_bzo_information(
-    request: Request,
-    gemeinde: str = Query(..., description="Gemeinde name or ID"),
-    bauzone: str = Query(..., description="Bauzone code (e.g., W3, W2/30)"),
-    total_area_m2: Optional[float] = Query(None, description="Total parcel area (m²) for Machbarkeitsstudie"),
-    currentUser: User = Depends(getCurrentUser)
-) -> Dict[str, Any]:
-    """
-    Extract BZO information from PDF documents for a specific Bauzone in a Gemeinde.
-    
-    Uses the BZO extraction pipeline to extract content from BZO PDF documents for the
-    specified Gemeinde, then uses AI to search for relevant information specific
-    to the specified Bauzone.
-    
-    The workflow:
-    1. Finds BZO documents for the Gemeinde (by name or ID)
-    2. Extracts content from PDFs using the BZO extraction pipeline
-    3. Filters rules, zones, and articles by Bauzone
-    4. Uses AI to generate a summary and find relevant information
-    
-    Query Parameters:
-    - gemeinde: Gemeinde name (e.g., "Zürich") or ID
-    - bauzone: Bauzone code (e.g., "W3", "W2/30", "Z3")
-    
-    Headers:
-    - X-CSRF-Token: CSRF token (required for security)
-    
-    Returns:
-    {
-        "bauzone": "W3",
-        "gemeinde": {
-            "id": "...",
-            "label": "...",
-            "plz": "..."
-        },
-        "extracted_content": {
-            "zones": [...],  // Zone information filtered by Bauzone
-            "rules": [...],  // Rules filtered by Bauzone
-            "articles": [...],  // Articles filtered by Bauzone
-            "total_zones": N,
-            "total_rules": N,
-            "total_articles": N
-        },
-        "ai_summary": "...",  // AI-generated summary
-        "relevant_rules": [...],  // Rules specifically for this Bauzone
-        "documents_processed": [  // List of document IDs processed
-            {
-                "id": "...",
-                "label": "...",
-                "dokumentTyp": "..."
-            }
-        ],
-        "errors": [...],
-        "warnings": [...]
-    }
-    
-    Examples:
-    - GET /api/realestate/bzo-information?gemeinde=Zürich&bauzone=W3
-    - GET /api/realestate/bzo-information?gemeinde=Uster&bauzone=W2/30
-    
-    Raises:
-    - 404: Gemeinde not found
-    - 404: No BZO documents found for Gemeinde
-    - 500: Error during extraction or processing
-    """
-    try:
-        # Validate CSRF token
-        csrf_token = request.headers.get("X-CSRF-Token") or request.headers.get("x-csrf-token")
-        if not csrf_token:
-            logger.warning(f"CSRF token missing for GET /api/realestate/bzo-information from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("CSRF token missing. Please include X-CSRF-Token header.")
-            )
-        
-        # Basic CSRF token format validation
-        if not isinstance(csrf_token, str) or len(csrf_token) < 16 or len(csrf_token) > 64:
-            logger.warning(f"Invalid CSRF token format for GET /api/realestate/bzo-information from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        # Validate token is hex string
-        try:
-            int(csrf_token, 16)
-        except ValueError:
-            logger.warning(f"CSRF token is not a valid hex string for GET /api/realestate/bzo-information from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        logger.info(f"Extracting BZO information for Gemeinde '{gemeinde}', Bauzone '{bauzone}' (user: {currentUser.id}, mandate: {currentUser.mandateId})")
-        
-        # Call the feature function
-        result = await extract_bzo_information(
-            currentUser=currentUser,
-            gemeinde=gemeinde,
-            bauzone=bauzone,
-            total_area_m2=total_area_m2,
-        )
-        
-        return result
-        
-    except HTTPException:
-        raise
-    except Exception as e:
-        logger.error(f"Error extracting BZO information for Gemeinde '{gemeinde}', Bauzone '{bauzone}': {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            detail=f"Error extracting BZO information: {str(e)}"
-        )
-
diff --git a/modules/routes/routeRealEstateScraping.py b/modules/routes/routeRealEstateScraping.py
deleted file mode 100644
index abb54299..00000000
--- a/modules/routes/routeRealEstateScraping.py
+++ /dev/null
@@ -1,881 +0,0 @@
-"""
-Real Estate scraping routes for the backend API.
-Implements endpoints for scraping real estate data from external sources.
-"""
-
-import logging
-import json
-import aiohttp
-import asyncio
-from typing import Optional, Dict, Any
-from fastapi import APIRouter, HTTPException, Depends, Body, Request, Query, status
-
-# Import auth modules
-from modules.auth import limiter, getCurrentUser
-
-# Import models
-from modules.datamodels.datamodelUam import User
-from modules.datamodels.datamodelRealEstate import (
-    Gemeinde,
-    Kanton,
-    Dokument,
-    Kontext,
-    DokumentTyp,
-)
-
-# Import interfaces
-from modules.interfaces.interfaceDbRealEstateObjects import getInterface as getRealEstateInterface
-from modules.interfaces.interfaceDbComponentObjects import getInterface as getComponentInterface
-
-# Import scraping script
-from modules.features.realEstate.scrapeSwissTopo import scrape_switzerland
-
-# Import Swiss Topo MapServer connector
-from modules.connectors.connectorSwissTopoMapServer import SwissTopoMapServerConnector
-from modules.connectors.connectorOerebWfs import OerebWfsConnector
-
-# Import Tavily connector for BZO document search
-from modules.aicore.aicorePluginTavily import AiTavily
-from modules.shared.i18nRegistry import apiRouteContext
-routeApiMsg = apiRouteContext("routeRealEstateScraping")
-
-# Configure logger
-logger = logging.getLogger(__name__)
-
-# Create router for real estate scraping endpoints
-router = APIRouter(
-    prefix="/api/realestate",
-    tags=["Real Estate Scraping"],
-    responses={
-        404: {"description": "Not found"},
-        400: {"description": "Bad request"},
-        401: {"description": "Unauthorized"},
-        403: {"description": "Forbidden"},
-        500: {"description": "Internal server error"}
-    }
-)
-
-
-@router.post("/scrape-switzerland", response_model=Dict[str, Any])
-@limiter.limit("5/hour")  # Limit to 5 requests per hour (scraping is resource-intensive)
-async def scrape_switzerland_route(
-    request: Request,
-    body: Dict[str, Any] = Body(..., description="Scraping parameters"),
-    currentUser: User = Depends(getCurrentUser)
-) -> Dict[str, Any]:
-    """
-    Scrape Kanton Zürich systematically using Swiss Topo connector and save parcel data to database.
-    
-    This endpoint divides Kanton Zürich into a grid and queries parcels at each grid point,
-    then deduplicates and saves unique parcels to the database. For each parcel, it also
-    queries the ÖREB WFS service to retrieve bauzone information.
-    
-    **WARNING**: This is a resource-intensive operation that may take a long time
-    and make many API requests. Use with caution.
-    
-    Request Body:
-    {
-        "grid_size": 500.0,  // Grid cell size in meters (default: 500m)
-        "max_concurrent": 50,  // Maximum concurrent API requests (default: 50)
-        "batch_size": 100  // Number of parcels to process before saving (default: 100)
-    }
-    
-    Headers:
-    - X-CSRF-Token: CSRF token (required for security)
-    
-    Returns:
-    {
-        "success": true,
-        "stats": {
-            "total_queries": 1234,
-            "successful_queries": 1200,
-            "failed_queries": 34,
-            "unique_parcels_found": 500,
-            "parcels_saved": 450,
-            "parcels_skipped": 50,
-            "error_count": 5,
-            "errors": [...]
-        }
-    }
-    
-    Example:
-    - POST /api/realestate/scrape-switzerland
-      Body: {"grid_size": 1000.0, "max_concurrent": 5, "batch_size": 50}
-    """
-    try:
-        # Validate CSRF token
-        csrf_token = request.headers.get("X-CSRF-Token") or request.headers.get("x-csrf-token")
-        if not csrf_token:
-            logger.warning(f"CSRF token missing for POST /api/realestate/scrape-switzerland from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("CSRF token missing. Please include X-CSRF-Token header.")
-            )
-        
-        # Basic CSRF token format validation
-        if not isinstance(csrf_token, str) or len(csrf_token) < 16 or len(csrf_token) > 64:
-            logger.warning(f"Invalid CSRF token format for POST /api/realestate/scrape-switzerland from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        # Validate token is hex string
-        try:
-            int(csrf_token, 16)
-        except ValueError:
-            logger.warning(f"CSRF token is not a valid hex string for POST /api/realestate/scrape-switzerland from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        # Extract parameters from body with defaults
-        grid_size = body.get("grid_size", 500.0)
-        max_concurrent = body.get("max_concurrent", 50)
-        batch_size = body.get("batch_size", 100)
-        
-        # Validate parameters
-        if grid_size <= 0 or grid_size > 10000:
-            raise HTTPException(
-                status_code=status.HTTP_400_BAD_REQUEST,
-                detail=routeApiMsg("grid_size must be between 0 and 10000 meters")
-            )
-        
-        if max_concurrent <= 0 or max_concurrent > 200:
-            raise HTTPException(
-                status_code=status.HTTP_400_BAD_REQUEST,
-                detail=routeApiMsg("max_concurrent must be between 1 and 200")
-            )
-        
-        if batch_size <= 0 or batch_size > 1000:
-            raise HTTPException(
-                status_code=status.HTTP_400_BAD_REQUEST,
-                detail=routeApiMsg("batch_size must be between 1 and 1000")
-            )
-        
-        logger.info(
-            f"Starting Switzerland scraping for user {currentUser.id} (mandate: {currentUser.mandateId}) "
-            f"with grid_size={grid_size}, max_concurrent={max_concurrent}, batch_size={batch_size}"
-        )
-        
-        # Run scraping operation
-        result = await scrape_switzerland(
-            current_user=currentUser,
-            grid_size=grid_size,
-            max_concurrent=max_concurrent,
-            batch_size=batch_size
-        )
-        
-        logger.info(
-            f"Scraping completed for user {currentUser.id}: "
-            f"{result['stats']['parcels_saved']} parcels saved"
-        )
-        
-        return result
-        
-    except HTTPException:
-        raise
-    except ValueError as e:
-        logger.error(f"Validation error in scrape_switzerland_route: {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_400_BAD_REQUEST,
-            detail=f"Validation error: {str(e)}"
-        )
-    except Exception as e:
-        logger.error(f"Error scraping Switzerland: {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            detail=f"Error scraping Switzerland: {str(e)}"
-        )
-
-
-@router.get("/gemeinden", response_model=Dict[str, Any])
-@limiter.limit("60/minute")
-async def get_all_gemeinden(
-    request: Request,
-    only_current: bool = Query(True, description="Only return current municipalities (exclude historical)"),
-    currentUser: User = Depends(getCurrentUser)
-) -> Dict[str, Any]:
-    """
-    Fetch all Gemeinden (municipalities) from the Swiss Topo MapServer connector
-    and save them to the database.
-    
-    This endpoint:
-    1. Fetches all Swiss municipalities from the Swiss Federal Office of Topography
-    2. Saves them to the database (skipping duplicates based on BFS number)
-    3. Creates Kantone (cantons) as needed
-    4. Returns statistics about the import operation
-    
-    Query Parameters:
-    - only_current: If True, only return current municipalities (default: True).
-                   If False, return all municipalities including historical ones.
-    
-    Headers:
-    - X-CSRF-Token: CSRF token (required for security)
-    
-    Returns:
-    {
-        "gemeinden": [
-            {
-                "id": "uuid",
-                "mandateId": "uuid",
-                "label": "Bern",
-                "id_kanton": "uuid",
-                "kontextInformationen": [...],
-                ...
-            },
-            ...
-        ],
-        "count": 2162,
-        "stats": {
-            "gemeinden_created": 2100,
-            "gemeinden_skipped": 62,
-            "kantone_created": 26,
-            "error_count": 0,
-            "errors": []
-        }
-    }
-    
-    Example:
-    - GET /api/realestate/gemeinden
-    - GET /api/realestate/gemeinden?only_current=false
-    """
-    try:
-        # Validate CSRF token
-        csrf_token = request.headers.get("X-CSRF-Token") or request.headers.get("x-csrf-token")
-        if not csrf_token:
-            logger.warning(f"CSRF token missing for GET /api/realestate/gemeinden from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("CSRF token missing. Please include X-CSRF-Token header.")
-            )
-        
-        # Basic CSRF token format validation
-        if not isinstance(csrf_token, str) or len(csrf_token) < 16 or len(csrf_token) > 64:
-            logger.warning(f"Invalid CSRF token format for GET /api/realestate/gemeinden from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        # Validate token is hex string
-        try:
-            int(csrf_token, 16)
-        except ValueError:
-            logger.warning(f"CSRF token is not a valid hex string for GET /api/realestate/gemeinden from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        logger.info(f"Fetching all Gemeinden for user {currentUser.id} (mandate: {currentUser.mandateId}), only_current={only_current}")
-        
-        # Initialize connectors and fetch all gemeinden
-        oereb_connector = OerebWfsConnector()
-        connector = SwissTopoMapServerConnector(oereb_connector=oereb_connector)
-        gemeinden_data = await connector.get_all_gemeinden(only_current=only_current)
-        
-        # Get interface for database operations
-        realEstateInterface = getRealEstateInterface(currentUser)
-        
-        # Statistics
-        gemeinden_created = 0
-        gemeinden_skipped = 0
-        kantone_created = 0
-        errors = []
-        
-        # Cache for Kanton UUIDs
-        kanton_cache: Dict[str, str] = {}
-        
-        # Helper function to find Gemeinde by BFS number
-        def find_gemeinde_by_bfs_nummer(bfs_nummer: str) -> Optional[Gemeinde]:
-            """Find existing Gemeinde by BFS number (stored in kontextInformationen)."""
-            try:
-                gemeinden = realEstateInterface.getGemeinden(
-                    recordFilter={"mandateId": currentUser.mandateId}
-                )
-                
-                for gemeinde in gemeinden:
-                    # Check kontextInformationen for bfs_nummer
-                    for kontext in gemeinde.kontextInformationen:
-                        try:
-                            kontext_data = json.loads(kontext.inhalt) if isinstance(kontext.inhalt, str) else kontext.inhalt
-                            if isinstance(kontext_data, dict):
-                                if str(kontext_data.get("bfs_nummer")) == str(bfs_nummer):
-                                    return gemeinde
-                        except (json.JSONDecodeError, AttributeError):
-                            continue
-                
-                return None
-            except Exception as e:
-                logger.error(f"Error finding Gemeinde by BFS number {bfs_nummer}: {e}", exc_info=True)
-                return None
-        
-        # Helper function to get or create Kanton
-        def get_or_create_kanton(kanton_abk: str) -> Optional[str]:
-            """Get or create a Kanton by abbreviation."""
-            nonlocal kantone_created, errors
-            
-            if not kanton_abk:
-                return None
-            
-            # Check cache first
-            if kanton_abk in kanton_cache:
-                return kanton_cache[kanton_abk]
-            
-            # Check if exists
-            kantone = realEstateInterface.getKantone(
-                recordFilter={
-                    "mandateId": currentUser.mandateId,
-                    "abk": kanton_abk
-                }
-            )
-            
-            if kantone:
-                kanton_cache[kanton_abk] = kantone[0].id
-                return kantone[0].id
-            
-            # Create new Kanton
-            try:
-                # Map common abbreviations to full names
-                kanton_names = {
-                    "AG": "Aargau", "AI": "Appenzell Innerrhoden", "AR": "Appenzell Ausserrhoden",
-                    "BE": "Bern", "BL": "Basel-Landschaft", "BS": "Basel-Stadt",
-                    "FR": "Freiburg", "GE": "Genf", "GL": "Glarus", "GR": "Graubünden",
-                    "JU": "Jura", "LU": "Luzern", "NE": "Neuenburg", "NW": "Nidwalden",
-                    "OW": "Obwalden", "SG": "St. Gallen", "SH": "Schaffhausen", "SO": "Solothurn",
-                    "SZ": "Schwyz", "TG": "Thurgau", "TI": "Tessin", "UR": "Uri",
-                    "VD": "Waadt", "VS": "Wallis", "ZG": "Zug", "ZH": "Zürich"
-                }
-                
-                kanton_label = kanton_names.get(kanton_abk, kanton_abk)
-                
-                kanton = Kanton(
-                    mandateId=currentUser.mandateId,
-                    label=kanton_label,
-                    abk=kanton_abk
-                )
-                
-                created_kanton = realEstateInterface.createKanton(kanton)
-                if created_kanton and created_kanton.id:
-                    kanton_cache[kanton_abk] = created_kanton.id
-                    kantone_created += 1
-                    logger.info(f"Created new Kanton: {kanton_label} ({kanton_abk})")
-                    return created_kanton.id
-            except Exception as e:
-                error_msg = f"Error creating Kanton {kanton_abk}: {e}"
-                logger.error(error_msg, exc_info=True)
-                errors.append(error_msg)
-            
-            return None
-        
-        # Process each gemeinde and save to database
-        saved_gemeinden = []
-        for gemeinde_data in gemeinden_data:
-            try:
-                gemeinde_name = gemeinde_data.get("name")
-                bfs_nummer = gemeinde_data.get("bfs_nummer")
-                kanton_abk = gemeinde_data.get("kanton")
-                
-                if not gemeinde_name or not bfs_nummer:
-                    logger.warning(f"Skipping Gemeinde with missing data: {gemeinde_data}")
-                    gemeinden_skipped += 1
-                    continue
-                
-                # Check if Gemeinde already exists
-                existing_gemeinde = find_gemeinde_by_bfs_nummer(str(bfs_nummer))
-                if existing_gemeinde:
-                    logger.debug(f"Gemeinde {gemeinde_name} (BFS: {bfs_nummer}) already exists, skipping")
-                    gemeinden_skipped += 1
-                    saved_gemeinden.append(existing_gemeinde.model_dump() if hasattr(existing_gemeinde, 'model_dump') else existing_gemeinde)
-                    continue
-                
-                # Get or create Kanton
-                kanton_id = get_or_create_kanton(kanton_abk) if kanton_abk else None
-                
-                # Create new Gemeinde
-                gemeinde = Gemeinde(
-                    mandateId=currentUser.mandateId,
-                    label=gemeinde_name,
-                    id_kanton=kanton_id,
-                    kontextInformationen=[
-                        Kontext(
-                            thema="BFS Nummer",
-                            inhalt=json.dumps({"bfs_nummer": bfs_nummer}, ensure_ascii=False)
-                        )
-                    ]
-                )
-                
-                created_gemeinde = realEstateInterface.createGemeinde(gemeinde)
-                if created_gemeinde and created_gemeinde.id:
-                    gemeinden_created += 1
-                    logger.info(f"Created new Gemeinde: {gemeinde_name} (BFS: {bfs_nummer})")
-                    saved_gemeinden.append(created_gemeinde.model_dump() if hasattr(created_gemeinde, 'model_dump') else created_gemeinde)
-                else:
-                    error_msg = f"Failed to create Gemeinde {gemeinde_name} (BFS: {bfs_nummer})"
-                    logger.error(error_msg)
-                    errors.append(error_msg)
-                    gemeinden_skipped += 1
-                    
-            except Exception as e:
-                error_msg = f"Error processing Gemeinde {gemeinde_data.get('name', 'Unknown')}: {str(e)}"
-                logger.error(error_msg, exc_info=True)
-                errors.append(error_msg)
-                gemeinden_skipped += 1
-        
-        logger.info(
-            f"Gemeinden import completed: {gemeinden_created} created, "
-            f"{gemeinden_skipped} skipped, {kantone_created} Kantone created"
-        )
-        
-        return {
-            "gemeinden": saved_gemeinden,
-            "count": len(saved_gemeinden),
-            "stats": {
-                "gemeinden_created": gemeinden_created,
-                "gemeinden_skipped": gemeinden_skipped,
-                "kantone_created": kantone_created,
-                "error_count": len(errors),
-                "errors": errors[:10]  # Return first 10 errors
-            }
-        }
-        
-    except HTTPException:
-        raise
-    except Exception as e:
-        logger.error(f"Error fetching all Gemeinden: {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            detail=f"Error fetching Gemeinden: {str(e)}"
-        )
-
-
-def _get_language_from_kanton(kanton_abk: Optional[str]) -> str:
-    """
-    Determine language (German/French/Italian) based on Kanton abbreviation.
-    
-    Args:
-        kanton_abk: Kanton abbreviation (e.g., 'ZH', 'VD', 'TI')
-    
-    Returns:
-        Language code: 'de' (German), 'fr' (French), or 'it' (Italian)
-    """
-    if not kanton_abk:
-        return 'de'  # Default to German
-    
-    # French-speaking cantons
-    french_cantons = {'VD', 'GE', 'NE', 'JU'}
-    # Italian-speaking canton
-    italian_cantons = {'TI'}
-    
-    kanton_upper = kanton_abk.upper()
-    if kanton_upper in french_cantons:
-        return 'fr'
-    elif kanton_upper in italian_cantons:
-        return 'it'
-    else:
-        return 'de'  # Default to German
-
-
-def _get_bzo_search_query(gemeinde_label: str, language: str) -> str:
-    """
-    Generate language-specific BZO search query for a Gemeinde.
-    
-    Args:
-        gemeinde_label: Name of the Gemeinde
-        language: Language code ('de', 'fr', 'it')
-    
-    Returns:
-        Search query string
-    """
-    if language == 'fr':
-        # French: Plan d'aménagement local or Règlement de construction
-        return f"Plan d'aménagement local {gemeinde_label} OR Règlement de construction {gemeinde_label}"
-    elif language == 'it':
-        # Italian: Piano di utilizzazione or Regolamento edilizio
-        return f"Piano di utilizzazione {gemeinde_label} OR Regolamento edilizio {gemeinde_label}"
-    else:
-        # German: Bau und Zonenordnung
-        return f"Bau und Zonenordnung {gemeinde_label}"
-
-
-@router.post("/gemeinden/fetch-bzo-documents", response_model=Dict[str, Any])
-@limiter.limit("10/hour")  # Resource-intensive operation
-async def fetch_bzo_documents(
-    request: Request,
-    currentUser: User = Depends(getCurrentUser)
-) -> Dict[str, Any]:
-    """
-    Search for and download Bau und Zonenordnung (BZO) documents for all Gemeinden.
-    
-    This endpoint:
-    1. Fetches all Gemeinden from the database
-    2. For each Gemeinde, determines language based on Kanton
-    3. Uses Tavily search to find BZO documents (up to 5 results)
-    4. Downloads all PDF files found and stores them with content
-    5. Creates Dokument records for each PDF and links them to Gemeinde's dokumente field
-    6. Skips Gemeinden that already have BZO documents
-    
-    Note: If Tavily returns multiple PDF results, all of them will be downloaded
-    and saved as separate Dokument records.
-    
-    Headers:
-    - X-CSRF-Token: CSRF token (required for security)
-    
-    Returns:
-    {
-        "success": true,
-        "stats": {
-            "gemeinden_processed": 100,
-            "documents_created": 85,
-            "documents_skipped": 15,
-            "errors": []
-        },
-        "results": [
-            {
-                "gemeinde_id": "...",
-                "gemeinde_label": "Zürich",
-                "status": "created|skipped|error",
-                "dokument_ids": ["...", "..."],  // List of created document IDs (can be multiple)
-                "error": null
-            }
-        ]
-    }
-    """
-    try:
-        # Validate CSRF token
-        csrf_token = request.headers.get("X-CSRF-Token") or request.headers.get("x-csrf-token")
-        if not csrf_token:
-            logger.warning(f"CSRF token missing for POST /api/realestate/gemeinden/fetch-bzo-documents from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("CSRF token missing. Please include X-CSRF-Token header.")
-            )
-        
-        # Basic CSRF token format validation
-        if not isinstance(csrf_token, str) or len(csrf_token) < 16 or len(csrf_token) > 64:
-            logger.warning(f"Invalid CSRF token format for POST /api/realestate/gemeinden/fetch-bzo-documents from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        # Validate token is hex string
-        try:
-            int(csrf_token, 16)
-        except ValueError:
-            logger.warning(f"CSRF token is not a valid hex string for POST /api/realestate/gemeinden/fetch-bzo-documents from user {currentUser.id}")
-            raise HTTPException(
-                status_code=status.HTTP_403_FORBIDDEN,
-                detail=routeApiMsg("Invalid CSRF token format")
-            )
-        
-        logger.info(f"Starting BZO document fetch for user {currentUser.id} (mandate: {currentUser.mandateId})")
-        
-        # Get interfaces
-        realEstateInterface = getRealEstateInterface(currentUser)
-        componentInterface = getComponentInterface(currentUser)
-        
-        # Initialize Tavily connector
-        tavily = AiTavily()
-        
-        # Get all Gemeinden
-        gemeinden = realEstateInterface.getGemeinden(
-            recordFilter={"mandateId": currentUser.mandateId}
-        )
-        
-        logger.info(f"Found {len(gemeinden)} Gemeinden to process")
-        
-        # Statistics
-        stats = {
-            "gemeinden_processed": 0,
-            "documents_created": 0,
-            "documents_skipped": 0,
-            "errors": []
-        }
-        results = []
-        
-        # Process each Gemeinde
-        for gemeinde in gemeinden:
-            gemeinde_result = {
-                "gemeinde_id": gemeinde.id,
-                "gemeinde_label": gemeinde.label,
-                "status": None,
-                "dokument_ids": [],  # Changed to list to support multiple documents
-                "error": None
-            }
-            
-            try:
-                stats["gemeinden_processed"] += 1
-                
-                # Check if Gemeinde already has a BZO document
-                existing_bzo = False
-                if gemeinde.dokumente:
-                    for doc in gemeinde.dokumente:
-                        # Check if it's a BZO document by label or dokumentTyp
-                        if (doc.label and ("BZO" in doc.label.upper() or "BAU UND ZONENORDNUNG" in doc.label.upper() or 
-                            "PLAN D'AMÉNAGEMENT" in doc.label.upper() or "RÈGLEMENT DE CONSTRUCTION" in doc.label.upper() or
-                            "PIANO DI UTILIZZAZIONE" in doc.label.upper() or "REGOLAMENTO EDILIZIO" in doc.label.upper())) or \
-                           (doc.dokumentTyp and doc.dokumentTyp in [DokumentTyp.GEMEINDE_BZO_AKTUELL, DokumentTyp.GEMEINDE_BZO_REVISION]):
-                            existing_bzo = True
-                            break
-                
-                if existing_bzo:
-                    logger.debug(f"Gemeinde {gemeinde.label} already has BZO document, skipping")
-                    gemeinde_result["status"] = "skipped"
-                    stats["documents_skipped"] += 1
-                    results.append(gemeinde_result)
-                    continue
-                
-                # Get Kanton to determine language
-                kanton_abk = None
-                if gemeinde.id_kanton:
-                    kanton = realEstateInterface.getKanton(gemeinde.id_kanton)
-                    if kanton:
-                        kanton_abk = kanton.abk
-                
-                # Determine language
-                language = _get_language_from_kanton(kanton_abk)
-                
-                # Generate search query
-                search_query = _get_bzo_search_query(gemeinde.label, language)
-                logger.info(f"Searching for BZO document for {gemeinde.label} (language: {language}) with query: {search_query}")
-                
-                # Search with Tavily using the private _search method
-                search_results = await tavily._search(
-                    query=search_query,
-                    maxResults=5,
-                    country="switzerland"
-                )
-                
-                if not search_results:
-                    logger.warning(f"No search results found for {gemeinde.label}")
-                    gemeinde_result["status"] = "error"
-                    gemeinde_result["error"] = "No search results found"
-                    stats["errors"].append(f"{gemeinde.label}: No search results found")
-                    results.append(gemeinde_result)
-                    continue
-                
-                # Find all PDF URLs from search results
-                pdf_urls = []
-                for result in search_results:
-                    url = result.url.lower()
-                    if url.endswith('.pdf') or 'pdf' in url:
-                        pdf_urls.append(result.url)
-                
-                # If no PDF URLs found, try to use all results (they might be PDFs even without .pdf extension)
-                if not pdf_urls:
-                    pdf_urls = [result.url for result in search_results]
-                    logger.info(f"No explicit PDF URLs found for {gemeinde.label}, trying all {len(pdf_urls)} results")
-                
-                logger.info(f"Found {len(pdf_urls)} potential PDF documents for {gemeinde.label}")
-                
-                # Helper function to download a single PDF
-                async def download_pdf(pdf_url: str) -> Optional[bytes]:
-                    """Download a PDF from a URL with retry logic."""
-                    max_retries = 3
-                    retry_delay = 2
-                    
-                    for attempt in range(max_retries):
-                        try:
-                            # Create headers - use minimal headers on retry after 406 error
-                            if attempt > 0:
-                                # Minimal headers for retry
-                                headers = {
-                                    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36',
-                                    'Accept': '*/*'
-                                }
-                            else:
-                                # Full headers for first attempt
-                                headers = {
-                                    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36',
-                                    'Accept': 'application/pdf,application/octet-stream,*/*',
-                                    'Accept-Language': 'de-DE,de;q=0.9,en;q=0.8',
-                                    'Accept-Encoding': 'gzip, deflate, br',
-                                    'Connection': 'keep-alive',
-                                    'Upgrade-Insecure-Requests': '1'
-                                }
-                            
-                            timeout = aiohttp.ClientTimeout(total=30, connect=10)
-                            async with aiohttp.ClientSession(timeout=timeout, headers=headers) as session:
-                                async with session.get(pdf_url, allow_redirects=True) as response:
-                                    if response.status == 200:
-                                        pdf_content = await response.read()
-                                        
-                                        if not pdf_content or len(pdf_content) < 100:  # Minimum size check
-                                            raise Exception("Downloaded file is too small or empty")
-                                        
-                                        # Verify it's actually a PDF (check PDF magic bytes)
-                                        if not pdf_content.startswith(b'%PDF'):
-                                            # Check if it's HTML (common error page)
-                                            if pdf_content.startswith(b'<') or pdf_content.startswith(b'<!DOCTYPE'):
-                                                raise Exception("Server returned HTML instead of PDF")
-                                            logger.warning(f"Downloaded file from {pdf_url} doesn't appear to be a PDF, but continuing anyway")
-                                        
-                                        # Success - return content
-                                        return pdf_content
-                                    elif response.status == 406:
-                                        # Not Acceptable - try with minimal headers on next attempt
-                                        logger.warning(f"HTTP 406 for {pdf_url}, will retry with minimal headers (attempt {attempt + 1}/{max_retries})")
-                                        if attempt < max_retries - 1:
-                                            await asyncio.sleep(retry_delay)
-                                            continue
-                                        else:
-                                            raise Exception(f"HTTP {response.status} (Not Acceptable) - server rejected request after {max_retries} attempts")
-                                    elif response.status in [301, 302, 303, 307, 308]:
-                                        # Redirect - should be handled by allow_redirects=True, but log it
-                                        logger.warning(f"Redirect {response.status} for {pdf_url}, following...")
-                                        pdf_content = await response.read()
-                                        return pdf_content
-                                    else:
-                                        raise Exception(f"HTTP {response.status} when downloading PDF")
-                        except asyncio.TimeoutError:
-                            logger.warning(f"Timeout downloading PDF from {pdf_url} (attempt {attempt + 1}/{max_retries})")
-                            if attempt < max_retries - 1:
-                                await asyncio.sleep(retry_delay)
-                                continue
-                            else:
-                                raise Exception("Connection timeout after retries")
-                        except aiohttp.ClientError as e:
-                            logger.warning(f"Connection error downloading PDF from {pdf_url} (attempt {attempt + 1}/{max_retries}): {str(e)}")
-                            if attempt < max_retries - 1:
-                                await asyncio.sleep(retry_delay)
-                                continue
-                            else:
-                                raise Exception(f"Connection error: {str(e)}")
-                        except Exception as e:
-                            # For other errors, don't retry
-                            raise
-                    
-                    return None
-                
-                # Process all PDF URLs
-                created_dokumente = []
-                current_dokumente = list(gemeinde.dokumente) if gemeinde.dokumente else []
-                
-                # Sanitize Gemeinde name for filename
-                safe_name = "".join(c for c in gemeinde.label if c.isalnum() or c in (' ', '-', '_')).strip()
-                safe_name = safe_name.replace(' ', '_')
-                if not safe_name:
-                    safe_name = "Gemeinde"
-                
-                # Determine base label based on language
-                if language == 'fr':
-                    base_doc_label = f"Plan d'aménagement local {gemeinde.label}"
-                elif language == 'it':
-                    base_doc_label = f"Piano di utilizzazione {gemeinde.label}"
-                else:
-                    base_doc_label = f"BZO {gemeinde.label}"
-                
-                # Process each PDF URL
-                for idx, pdf_url in enumerate(pdf_urls):
-                    try:
-                        logger.info(f"Downloading PDF {idx + 1}/{len(pdf_urls)} from {pdf_url} for {gemeinde.label}")
-                        pdf_content = await download_pdf(pdf_url)
-                        
-                        if not pdf_content:
-                            logger.warning(f"Failed to download PDF from {pdf_url} for {gemeinde.label}")
-                            continue
-                        
-                        # Additional validation
-                        if len(pdf_content) < 100:
-                            logger.warning(f"Downloaded file from {pdf_url} is too small for {gemeinde.label}")
-                            continue
-                        
-                        # Create unique file name (add index if multiple documents)
-                        if len(pdf_urls) > 1:
-                            file_name = f"BZO_{safe_name}_{idx + 1}.pdf"
-                            doc_label = f"{base_doc_label} ({idx + 1})"
-                        else:
-                            file_name = f"BZO_{safe_name}.pdf"
-                            doc_label = base_doc_label
-                        
-                        # Store file using ComponentObjects
-                        try:
-                            file_item = componentInterface.createFile(
-                                name=file_name,
-                                mimeType="application/pdf",
-                                content=pdf_content
-                            )
-                            
-                            # Store file data
-                            componentInterface.createFileData(file_item.id, pdf_content)
-                            
-                            logger.info(f"Stored file {file_name} with ID {file_item.id} for {gemeinde.label}")
-                        except Exception as e:
-                            logger.error(f"Error storing file {file_name} for {gemeinde.label}: {str(e)}", exc_info=True)
-                            stats["errors"].append(f"{gemeinde.label}: File storage failed for {pdf_url} - {str(e)}")
-                            continue
-                        
-                        # Create Dokument record
-                        dokument = Dokument(
-                            mandateId=currentUser.mandateId,
-                            label=doc_label,
-                            versionsbezeichnung="Aktuell",
-                            dokumentTyp=DokumentTyp.GEMEINDE_BZO_AKTUELL,
-                            dokumentReferenz=file_item.id,  # FileId from ComponentObjects
-                            quelle=pdf_url,  # Original URL
-                            mimeType="application/pdf",
-                            kategorienTags=["BZO", "Bauordnung", gemeinde.label]
-                        )
-                        
-                        # Create Dokument record in the Dokument table
-                        created_dokument = realEstateInterface.createDokument(dokument)
-                        logger.info(f"Created Dokument record with ID {created_dokument.id} for {gemeinde.label} (from {pdf_url})")
-                        
-                        created_dokumente.append(created_dokument)
-                        current_dokumente.append(created_dokument)
-                        gemeinde_result["dokument_ids"].append(created_dokument.id)
-                        
-                    except Exception as e:
-                        logger.error(f"Error processing PDF {pdf_url} for {gemeinde.label}: {str(e)}", exc_info=True)
-                        stats["errors"].append(f"{gemeinde.label}: Error processing PDF {pdf_url} - {str(e)}")
-                        continue
-                
-                # Update Gemeinde with all new dokumente
-                if created_dokumente:
-                    updated_gemeinde = realEstateInterface.updateGemeinde(
-                        gemeinde.id,
-                        {"dokumente": current_dokumente}
-                    )
-                    
-                    if updated_gemeinde:
-                        logger.info(f"Successfully created {len(created_dokumente)} BZO document(s) for {gemeinde.label}")
-                        gemeinde_result["status"] = "created"
-                        stats["documents_created"] += len(created_dokumente)
-                    else:
-                        raise Exception("Failed to update Gemeinde")
-                else:
-                    # No documents were successfully created
-                    gemeinde_result["status"] = "error"
-                    gemeinde_result["error"] = "No PDFs could be downloaded or processed"
-                    stats["errors"].append(f"{gemeinde.label}: No PDFs could be downloaded or processed")
-                
-            except Exception as e:
-                logger.error(f"Error processing Gemeinde {gemeinde.label}: {str(e)}", exc_info=True)
-                gemeinde_result["status"] = "error"
-                gemeinde_result["error"] = str(e)
-                stats["errors"].append(f"{gemeinde.label}: {str(e)}")
-            
-            results.append(gemeinde_result)
-        
-        logger.info(
-            f"BZO document fetch completed: {stats['documents_created']} created, "
-            f"{stats['documents_skipped']} skipped, {len(stats['errors'])} errors"
-        )
-        
-        return {
-            "success": True,
-            "stats": stats,
-            "results": results
-        }
-        
-    except HTTPException:
-        raise
-    except Exception as e:
-        logger.error(f"Error fetching BZO documents: {str(e)}", exc_info=True)
-        raise HTTPException(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            detail=f"Error fetching BZO documents: {str(e)}"
-        )
diff --git a/modules/serviceCenter/services/serviceAi/subDocumentIntents.py b/modules/serviceCenter/services/serviceAi/subDocumentIntents.py
index d4d7fae7..7d47c18f 100644
--- a/modules/serviceCenter/services/serviceAi/subDocumentIntents.py
+++ b/modules/serviceCenter/services/serviceAi/subDocumentIntents.py
@@ -13,7 +13,7 @@ import logging
 from typing import Dict, Any, List, Optional
 
 from modules.datamodels.datamodelChat import ChatDocument
-from modules.datamodels.datamodelExtraction import DocumentIntent
+from modules.datamodels.datamodelExtraction import DocumentIntent, ContentExtracted
 from modules.shared.workflowState import checkWorkflowStopped
 
 logger = logging.getLogger(__name__)
diff --git a/modules/serviceCenter/services/serviceAi/subJsonResponseHandling.py b/modules/serviceCenter/services/serviceAi/subJsonResponseHandling.py
index 3adb613c..1945c550 100644
--- a/modules/serviceCenter/services/serviceAi/subJsonResponseHandling.py
+++ b/modules/serviceCenter/services/serviceAi/subJsonResponseHandling.py
@@ -12,10 +12,18 @@ Handles merging of JSON responses from multiple AI iterations, including:
 """
 import json
 import logging
-import re
 from typing import Dict, Any, List, Optional, Tuple
 
-from modules.shared.jsonUtils import extractJsonString, repairBrokenJson, extractSectionsFromDocument
+from modules.shared.jsonUtils import (
+    extractJsonString,
+    repairBrokenJson,
+    extractSectionsFromDocument,
+    stripCodeFences,
+    normalizeJsonText,
+    closeJsonStructures,
+    tryParseJson,
+    extractFirstBalancedJson,
+)
 from modules.datamodels.datamodelAi import JsonAccumulationState
 
 logger = logging.getLogger(__name__)
diff --git a/modules/serviceCenter/services/serviceGeneration/renderers/rendererPptx.py b/modules/serviceCenter/services/serviceGeneration/renderers/rendererPptx.py
index 0b502e79..36d399d8 100644
--- a/modules/serviceCenter/services/serviceGeneration/renderers/rendererPptx.py
+++ b/modules/serviceCenter/services/serviceGeneration/renderers/rendererPptx.py
@@ -3,7 +3,6 @@
 import logging
 import base64
 import io
-import json
 import re
 from datetime import datetime, UTC
 from typing import Dict, Any, Optional, List
@@ -200,7 +199,6 @@ class RendererPptx(BaseRenderer):
                     logger.warning(f"Could not clear placeholders: {str(placeholder_error)}")
                 
                 # Add title as textbox
-                from pptx.util import Inches
                 titleBox = slide.shapes.add_textbox(Inches(0.5), Inches(0.2), prs.slide_width - Inches(1), Inches(0.6))
                 titleFrame = titleBox.text_frame
                 titleFrame.text = slide_data.get("title", "Slide")
@@ -299,8 +297,6 @@ class RendererPptx(BaseRenderer):
             
             # Convert to base64
             pptx_bytes = buffer.getvalue()
-            pptx_base64 = base64.b64encode(pptx_bytes).decode('utf-8')
-            
             logger.info(f"Successfully rendered PowerPoint presentation: {len(pptx_bytes)} bytes")
             
             # Determine filename from document or title
@@ -1247,6 +1243,7 @@ class RendererPptx(BaseRenderer):
         try:
             from pptx.util import Inches, Pt
             from pptx.enum.text import PP_ALIGN
+            from pptx.dml.color import RGBColor
             
             if not images:
                 logger.debug("No images to render in frame")
diff --git a/modules/workflowAutomation/engine/executors/actionNodeExecutor.py b/modules/workflowAutomation/engine/executors/actionNodeExecutor.py
index dc88c7ab..799d1606 100644
--- a/modules/workflowAutomation/engine/executors/actionNodeExecutor.py
+++ b/modules/workflowAutomation/engine/executors/actionNodeExecutor.py
@@ -18,7 +18,6 @@ from modules.nodeCatalog.portTypes import (
     normalizeToSchema,
 )
 from modules.datamodels.serviceExceptions import SubscriptionInactiveException as _SubscriptionInactiveException, BillingContextError as _BillingContextError
-from modules.workflowAutomation.engine.executors.inputExecutor import PauseForHumanTaskError
 from modules.workflows.methods.methodContext.actions.extractContent import (
     PRESENTATION_KIND,
     build_presentation_envelope_from_plain_text,
diff --git a/modules/workflowAutomation/engine/executors/flowExecutor.py b/modules/workflowAutomation/engine/executors/flowExecutor.py
index 7a296204..0f5f85d1 100644
--- a/modules/workflowAutomation/engine/executors/flowExecutor.py
+++ b/modules/workflowAutomation/engine/executors/flowExecutor.py
@@ -21,7 +21,6 @@ class FlowExecutor:
     ) -> Any:
         nodeType = node.get("type", "")
         nodeOutputs = context.get("nodeOutputs", {})
-        connectionMap = context.get("connectionMap", {})
         nodeId = node.get("id", "")
         inputSources = context.get("inputSources", {}).get(nodeId, {})
         logger.info(
@@ -151,6 +150,8 @@ class FlowExecutor:
             else:
                 nodes.append({"id": producer_id, "type": ""})
         return {"nodes": nodes, "targetNodeId": node.get("id")}
+
+    def _compare_dates(self, left: Any, right: Any, op) -> bool:
         """Compare left/right as dates; op(a,b) is the comparison."""
 
         def parse(v):
@@ -211,7 +212,6 @@ class FlowExecutor:
         from modules.workflowAutomation.engine.graphUtils import resolveParameterReferences
         from modules.workflowAutomation.editor.switchOutput import (
             build_switch_combined_output,
-            build_switch_default_payload,
         )
 
         value = resolveParameterReferences(valueExpr, nodeOutputs)