gateway/connectors/connector_aichat_anthropic.py

import logging
import httpx
from typing import Dict, Any, List, Optional, Union
from fastapi import HTTPException
from modules.utility import APP_CONFIG

# Logger konfigurieren
logger = logging.getLogger(__name__)

# Konfigurationsdaten laden
def load_config_data():
    return {
        "api_key": APP_CONFIG.get('Connector_AiAnthropic_API_SECRET'),
        "api_url": APP_CONFIG.get('Connector_AiAnthropic_API_URL'),
        "model_name": APP_CONFIG.get('Connector_AiAnthropic_MODEL_NAME'),
        "temperature": float(APP_CONFIG.get('Connector_AiAnthropic_TEMPERATURE')),
        "max_tokens": int(APP_CONFIG.get('Connector_AiAnthropic_MAX_TOKENS'))
    }

class ChatService:
    """
    Connector für die Kommunikation mit der Anthropic API.
    """

    def __init__(self):
        # Konfiguration laden
        self.config = load_config_data()
        self.api_key = self.config["api_key"]
        self.api_url = self.config["api_url"]
        self.model_name = self.config["model_name"]

        # HttpClient für API-Aufrufe
        self.http_client = httpx.AsyncClient(
            timeout=120.0,  # Längeres Timeout für komplexe Anfragen
            headers={
                "x-api-key": self.api_key,
                "anthropic-version": "2023-06-01",  # Anthropic API Version
                "Content-Type": "application/json"
            }
        )

        logger.info(f"Anthropic Connector initialisiert mit Modell: {self.model_name}")

    async def call_api(self, messages: List[Dict[str, Any]], temperature: float = None, max_tokens: int = None) -> Dict[str, Any]:
        """
        Ruft die Anthropic API mit den gegebenen Nachrichten auf.

        Args:
            messages: Liste von Nachrichten im OpenAI-Format (role, content)
            temperature: Temperatur für die Antwortgenerierung (0.0-1.0)
            max_tokens: Maximale Anzahl der Token in der Antwort

        Returns:
            Die Antwort umgewandelt ins OpenAI-Format

        Raises:
            HTTPException: Bei Fehlern in der API-Kommunikation
        """
        try:
            # OpenAI-Format in Anthropic-Format umwandeln
            formatted_messages = self._convert_to_anthropic_format(messages)

            # Verwende Parameter aus der Konfiguration, falls keine überschrieben wurden
            if temperature is None:
                temperature = self.config.get("temperature", 0.2)

            if max_tokens is None:
                max_tokens = self.config.get("max_tokens", 2000)

            # Anthropic API Payload erstellen
            payload = {
                "model": self.model_name,
                "messages": formatted_messages,
                "temperature": temperature,
                "max_tokens": max_tokens
            }

            response = await self.http_client.post(
                self.api_url,
                json=payload
            )

            if response.status_code != 200:
                logger.error(f"Anthropic API-Fehler: {response.status_code} - {response.text}")
                raise HTTPException(status_code=500, detail="Fehler bei der Kommunikation mit Anthropic API")

            # Antwort im Anthropic-Format in OpenAI-Format umwandeln
            anthropic_response = response.json()
            openai_formatted_response = self._convert_to_openai_format(anthropic_response)

            return openai_formatted_response

        except Exception as e:
            logger.error(f"Fehler beim Aufruf der Anthropic API: {str(e)}")
            raise HTTPException(status_code=500, detail=f"Fehler beim Aufruf der Anthropic API: {str(e)}")

    def _convert_to_anthropic_format(self, openai_messages: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
        """
        Konvertiert Nachrichten vom OpenAI-Format ins Anthropic-Format.

        OpenAI verwendet:
        [{"role": "system", "content": "..."},
         {"role": "user", "content": "..."},
         {"role": "assistant", "content": "..."}]

        Anthropic verwendet:
        [{"role": "user", "content": "..."},
         {"role": "assistant", "content": "..."}]

        Anmerkung: Anthropic hat kein direktes System-Message-Äquivalent,
        daher fügen wir System-Nachrichten in die erste User-Nachricht ein.
        """
        anthropic_messages = []
        system_content = ""

        # Extrahiere zuerst alle System-Nachrichten
        for msg in openai_messages:
            if msg.get("role") == "system":
                system_content += msg.get("content", "") + "\n\n"

        # Konvertiere die restlichen Nachrichten
        for i, msg in enumerate(openai_messages):
            role = msg.get("role")
            content = msg.get("content", "")

            # System-Nachrichten überspringen (bereits extrahiert)
            if role == "system":
                continue

            # Für die erste User-Nachricht: System-Inhalte voranstellen, falls vorhanden
            if role == "user" and system_content and not any(m.get("role") == "user" for m in anthropic_messages):
                if isinstance(content, str):
                    content = system_content + content
                elif isinstance(content, list):
                    # Wenn content ein Array ist (für Multimodal-Nachrichten)
                    text_parts = []
                    for part in content:
                        if part.get("type") == "text":
                            text_parts.append(part)

                    if text_parts:
                        text_parts[0]["text"] = system_content + text_parts[0].get("text", "")

            # Anthropic unterstützt nur "user" und "assistant" als Rollen
            if role not in ["user", "assistant"]:
                role = "user"

            anthropic_messages.append({"role": role, "content": content})

        return anthropic_messages

    def _convert_to_openai_format(self, anthropic_response: Dict[str, Any]) -> Dict[str, Any]:
        """
        Konvertiert eine Antwort vom Anthropic-Format ins OpenAI-Format.
        """
        # Extrahiere Inhalt aus Anthropic-Antwort
        content = ""
        if "content" in anthropic_response:
            if isinstance(anthropic_response["content"], list):
                # Inhalt ist eine Liste von Teilen (bei neueren API-Versionen)
                for part in anthropic_response["content"]:
                    if part.get("type") == "text":
                        content += part.get("text", "")
            else:
                # Direkter Inhalt als String (bei älteren API-Versionen)
                content = anthropic_response["content"]

        # Erstelle OpenAI-formatierte Antwort
        return {
            "id": anthropic_response.get("id", ""),
            "object": "chat.completion",
            "created": anthropic_response.get("created", 0),
            "model": anthropic_response.get("model", self.model_name),
            "choices": [
                {
                    "message": {
                        "role": "assistant",
                        "content": content
                    },
                    "index": 0,
                    "finish_reason": "stop"
                }
            ]
        }

    async def analyze_image(self, image_data: Union[str, bytes], mime_type: str = None, prompt: str = "Describe this image") -> str:
        """
        Analysiert ein Bild mit der OpenAI Vision API.

        Args:
            image_data: Entweder ein Dateipfad (str) oder Bilddaten (bytes)
            mime_type: Der MIME-Typ des Bildes (optional, nur für Binärdaten)
            prompt: Der Prompt für die Analyse

        Returns:
            Die Antwort der OpenAI Vision API als Text
        """
        try:
            # Unterscheide zwischen Dateipfad und Binärdaten
            if isinstance(image_data, str):
                # Es ist ein Dateipfad - importiere filehandling nur bei Bedarf
                from gateway.gwserver.modules import agentservice_filemanager as file_handler
                base64_data, auto_mime_type = file_handler.encode_file_to_base64(image_data)
                mime_type = mime_type or auto_mime_type
            else:
                # Es sind Binärdaten
                import base64
                base64_data = base64.b64encode(image_data).decode('utf-8')
                # MIME-Typ muss angegeben sein für Binärdaten
                if not mime_type:
                    # Fallback auf generischen Bildtyp
                    mime_type = "image/png"

            # Bereite den Payload für die Vision API vor
            messages = [
                {
                    "role": "user",
                    "content": [
                        {"type": "text", "text": prompt},
                        {
                            "type": "image_url",
                            "image_url": {
                                "url": f"data:{mime_type};base64,{base64_data}"
                            }
                        }
                    ]
                }
            ]

            # Verwende die bestehende call_api Funktion mit dem Vision-Modell
            response = await self.call_api(messages)

            # Inhalt extrahieren und zurückgeben
            return response["choices"][0]["message"]["content"]

        except Exception as e:
            logger.error(f"Fehler bei der Bildanalyse: {str(e)}", exc_info=True)
            return f"[Fehler bei der Bildanalyse: {str(e)}]"