# Copyright (c) 2025 Patrick Motsch
# All rights reserved.
|
import json
import logging
from typing import List

import httpx
from fastapi import HTTPException

from modules.shared.configuration import APP_CONFIG
from .aicoreBase import BaseConnectorAi
from modules.datamodels.datamodelAi import AiModel, PriorityEnum, ProcessingModeEnum, OperationTypeEnum, AiModelCall, AiModelResponse, createOperationTypeRatings, AiCallPromptWebSearch, AiCallPromptWebCrawl, AiCallOptions
from modules.datamodels.datamodelTools import CountryCodes
|
|
|
# Configure logger
|
|
logger = logging.getLogger(__name__)
|
|
|
|
def loadConfigData():
    """
    Collect the settings needed by the Perplexity connector.

    Returns:
        dict with a single key "apiKey", holding whatever APP_CONFIG returns
        for 'Connector_AiPerplexity_API_SECRET'.
    """
    apiSecret = APP_CONFIG.get('Connector_AiPerplexity_API_SECRET')
    return {"apiKey": apiSecret}
|
|
|
class AiPerplexity(BaseConnectorAi):
    """
    Connector for communication with the Perplexity API.

    Exposes the "sonar" and "sonar-pro" models and routes calls to a web
    search, a web crawl or a plain chat completion depending on the
    operation type carried in the call options.
    """

    def __init__(self):
        """Load the connector configuration and create the shared HTTP client."""
        super().__init__()

        # Load configuration
        self.config = loadConfigData()
        self.apiKey = self.config["apiKey"]
        if not self.apiKey:
            # Without a key the Authorization header below would read "Bearer None";
            # surface the misconfiguration early instead of only at the first request.
            logger.warning("Perplexity API key is not configured (Connector_AiPerplexity_API_SECRET)")

        # HttpClient for API calls
        self.httpClient = httpx.AsyncClient(
            timeout=600.0,  # 600 seconds (10 minutes) for complex requests that may take longer
            headers={
                "Authorization": f"Bearer {self.apiKey}",
                "Content-Type": "application/json",
                "Accept": "application/json"
            }
        )

        logger.info("Perplexity Connector initialized")

    def getConnectorType(self) -> str:
        """Get the connector type identifier."""
        return "perplexity"

    def _convertIsoCodeToCountryName(self, isoCode: str) -> str:
        """
        Convert ISO-2 country code to Perplexity country name.

        Delegates to the centralized CountryCodes.getForPerplexity mapping.
        """
        return CountryCodes.getForPerplexity(isoCode)

    def getModels(self) -> List[AiModel]:
        """
        Get all available Perplexity models.

        Returns:
            Two AiModel entries ("sonar" and "sonar-pro"); both use
            _routeWebOperation as their call function.
        """
        return [
            AiModel(
                name="sonar",
                displayName="Perplexity Sonar",
                connectorType="perplexity",
                apiUrl="https://api.perplexity.ai/chat/completions",
                temperature=0.2,
                maxTokens=24000,  # Increased for detailed web crawl responses (Perplexity supports up to 25k)
                contextLength=32000,
                costPer1kTokensInput=0.005,
                costPer1kTokensOutput=0.005,
                speedRating=8,
                qualityRating=8,
                # capabilities removed (not used in business logic)
                functionCall=self._routeWebOperation,
                priority=PriorityEnum.BALANCED,
                processingMode=ProcessingModeEnum.ADVANCED,
                operationTypes=createOperationTypeRatings(
                    (OperationTypeEnum.WEB_SEARCH_DATA, 9),
                    (OperationTypeEnum.WEB_CRAWL, 7)
                ),
                version="sonar",
                # Price estimate: bytes / 4 approximates the token count, billed per 1k tokens
                calculatePriceUsd=lambda processingTime, bytesSent, bytesReceived: (bytesSent / 4 / 1000) * 0.005 + (bytesReceived / 4 / 1000) * 0.005
            ),
            AiModel(
                name="sonar-pro",
                displayName="Perplexity Sonar Pro",
                connectorType="perplexity",
                apiUrl="https://api.perplexity.ai/chat/completions",
                temperature=0.2,
                maxTokens=24000,  # Increased for detailed web crawl responses (Perplexity supports up to 25k)
                contextLength=32000,
                costPer1kTokensInput=0.01,
                costPer1kTokensOutput=0.01,
                speedRating=6,  # Slower due to AI analysis
                qualityRating=9,  # Best AI analysis quality
                # capabilities removed (not used in business logic)
                functionCall=self._routeWebOperation,
                priority=PriorityEnum.QUALITY,
                processingMode=ProcessingModeEnum.DETAILED,
                operationTypes=createOperationTypeRatings(
                    (OperationTypeEnum.WEB_SEARCH_DATA, 9),
                    (OperationTypeEnum.WEB_CRAWL, 8)
                ),
                version="sonar-pro",
                # Price estimate: bytes / 4 approximates the token count, billed per 1k tokens
                calculatePriceUsd=lambda processingTime, bytesSent, bytesReceived: (bytesSent / 4 / 1000) * 0.01 + (bytesReceived / 4 / 1000) * 0.01
            )
        ]

    @staticmethod
    def _resolveTemperature(options, model):
        """Return the temperature from the call options, or the model default when unset.

        Compares against None explicitly so that an explicit temperature of 0 is honoured.
        """
        temperature = getattr(options, "temperature", None)
        return model.temperature if temperature is None else temperature

    @staticmethod
    def _extractPromptContent(messages) -> str:
        """Return the content of the first user message, else of the first message, else ""."""
        if not messages:
            return ""
        promptContent = next(
            (msg.get("content", "") for msg in messages if msg.get("role") == "user"),
            ""
        )
        # Fallback to first message if no user message found (or its content is empty)
        if not promptContent:
            promptContent = messages[0].get("content", "")
        return promptContent

    @staticmethod
    def _parseCompletionResponse(response, apiLabel: str) -> dict:
        """Validate a chat/completions HTTP response and return its decoded JSON body.

        Args:
            response: The HTTP response returned by the client.
            apiLabel: Operation name used in error messages ("Web Search" / "Web Crawl").

        Raises:
            HTTPException: On non-200 status, empty body, invalid JSON or missing 'choices'.
        """
        if response.status_code != 200:
            raise HTTPException(status_code=500, detail=f"Perplexity {apiLabel} API error: {response.text}")

        # Check if response body is empty or invalid
        responseText = response.text
        if not responseText or not responseText.strip():
            raise HTTPException(status_code=500, detail=f"Perplexity {apiLabel} API returned empty response")

        try:
            apiResponse = response.json()
        except ValueError as jsonError:
            logger.error(f"Failed to parse Perplexity response as JSON. Status: {response.status_code}, Response: {responseText[:500]}")
            raise HTTPException(status_code=500, detail=f"Perplexity {apiLabel} API returned invalid JSON: {str(jsonError)}") from jsonError

        if "choices" not in apiResponse or not apiResponse["choices"]:
            raise HTTPException(status_code=500, detail=f"Perplexity {apiLabel} API response missing 'choices' field")

        return apiResponse

    async def callAiBasic(self, modelCall: AiModelCall) -> AiModelResponse:
        """
        Calls the Perplexity API with the given messages using standardized pattern.

        Args:
            modelCall: AiModelCall with messages and options

        Returns:
            AiModelResponse with content and metadata

        Raises:
            HTTPException: For errors in API communication (always status 500; the
                detail carries a status-specific message for 400/401/429 responses)
        """
        try:
            model = modelCall.model
            payload = {
                "model": model.name,
                "messages": modelCall.messages,
                "temperature": self._resolveTemperature(modelCall.options, model),
                "max_tokens": model.maxTokens
            }

            response = await self.httpClient.post(model.apiUrl, json=payload)

            if response.status_code != 200:
                logger.error(f"Perplexity API error: {response.status_code} - {response.text}")

                # Provide more specific error messages based on status code
                if response.status_code == 429:
                    errorMessage = "Rate limit exceeded. Please wait before making another request."
                elif response.status_code == 401:
                    errorMessage = "Invalid API key. Please check your Perplexity API configuration."
                elif response.status_code == 400:
                    errorMessage = f"Invalid request to Perplexity API: {response.text}"
                else:
                    errorMessage = f"Perplexity API error ({response.status_code}): {response.text}"

                raise HTTPException(status_code=500, detail=errorMessage)

            apiResponse = response.json()
            content = apiResponse["choices"][0]["message"]["content"]

            return AiModelResponse(
                content=content,
                success=True,
                modelId=model.name,
                metadata={"response_id": apiResponse.get("id", "")}
            )

        except HTTPException:
            # Already carries a specific message (and was logged above); do not re-wrap it
            raise
        except Exception as e:
            logger.error(f"Error calling Perplexity API: {str(e)}")
            raise HTTPException(status_code=500, detail=f"Error calling Perplexity API: {str(e)}") from e

    async def _testConnection(self) -> bool:
        """
        Tests the connection to the Perplexity API.

        Sends a short prompt to the first model from getModels() via callAiBasic.

        Returns:
            True if connection is successful, False otherwise
        """
        try:
            # Try a simple test message
            testMessages = [
                {"role": "user", "content": "Hello, please respond with just 'OK' to confirm the connection works."}
            ]

            # Create a model call for testing
            model = self.getModels()[0]  # Get first model for testing
            testCall = AiModelCall(
                messages=testMessages,
                model=model,
                options=AiCallOptions()
            )

            response = await self.callAiBasic(testCall)
            return bool(response.success and response.content and response.content.strip())

        except Exception as e:
            # Any failure (including HTTPException from callAiBasic) means "not connected"
            logger.error(f"Perplexity connection test failed: {str(e)}")
            return False

    async def _routeWebOperation(self, modelCall: AiModelCall) -> AiModelResponse:
        """
        Route web operation based on operation type.

        Args:
            modelCall: AiModelCall with messages and options

        Returns:
            AiModelResponse based on operation type
        """
        operationType = modelCall.options.operationType

        if operationType == OperationTypeEnum.WEB_SEARCH_DATA:
            return await self.webSearch(modelCall)
        if operationType == OperationTypeEnum.WEB_CRAWL:
            return await self.webCrawl(modelCall)

        # Fallback to basic call
        return await self.callAiBasic(modelCall)

    def _getDepthInstructions(self, maxDepth: int) -> str:
        """
        Map maxDepth (numeric) to instructional text for LLM.

        Args:
            maxDepth: 1 (fast/overview), 2 (general/standard), 3 (deep/comprehensive)

        Returns:
            Instructional text for the LLM; unknown values fall back to the level-2 text
        """
        depthMap = {
            1: "Basic overview - extract main content from the main page only",
            2: "Standard crawl - extract content from main page and linked pages (2 levels deep)",
            3: "Deep crawl - comprehensively extract content from main page and all accessible linked pages (3+ levels deep)"
        }
        return depthMap.get(maxDepth, depthMap[2])

    def _getWidthInstructions(self, maxWidth: int) -> str:
        """
        Map maxWidth (numeric) to instructional text for LLM.

        Args:
            maxWidth: Number of pages to crawl at each level (default: 10)

        Returns:
            Instructional text for the LLM
        """
        if maxWidth <= 5:
            return f"Focused crawl - limit to {maxWidth} most relevant pages per level"
        if maxWidth <= 15:
            return f"Standard breadth - crawl up to {maxWidth} pages per level"
        if maxWidth <= 30:
            return f"Wide crawl - crawl up to {maxWidth} pages per level, prioritize quality"
        return f"Extensive crawl - crawl up to {maxWidth} pages per level, comprehensive coverage"

    async def webSearch(self, modelCall: AiModelCall) -> AiModelResponse:
        """
        WEB_SEARCH_DATA operation - returns list of URLs based on search query.

        Args:
            modelCall: AiModelCall with AiCallPromptWebSearch as prompt
                (JSON-encoded in the user message content)

        Returns:
            AiModelResponse whose content is the model's answer (requested to be a
            JSON list of URLs)

        Raises:
            HTTPException: Status 500 for API errors, invalid responses or an
                unparsable prompt
        """
        try:
            # Extract parameters
            model = modelCall.model
            temperature = self._resolveTemperature(modelCall.options, model)

            # Parse prompt JSON - taken from the user message (not system message)
            promptData = json.loads(self._extractPromptContent(modelCall.messages))

            # Create Pydantic model
            webSearchPrompt = AiCallPromptWebSearch(**promptData)

            # Convert ISO country code to country name
            countryName = webSearchPrompt.country
            if countryName:
                countryName = self._convertIsoCodeToCountryName(countryName)
            countryHint = f"Focus on results from {countryName}." if countryName else ""

            # Build search request for Perplexity
            # NOTE(review): the example lines carry no leading indentation, as seen in the reviewed source
            searchPrompt = "\n".join([
                f"Search the web for: {webSearchPrompt.instruction}",
                "",
                f"Return a JSON array of {webSearchPrompt.maxNumberPages} most relevant URLs.",
                countryHint,
                "",
                "Return ONLY a JSON array of URLs, no additional text:",
                "[",
                '"https://example1.com/page",',
                '"https://example2.com/article",',
                '"https://example3.com/resource"',
                "]",
            ])

            payload = {
                "model": model.name,
                "messages": [{"role": "user", "content": searchPrompt}],
                "temperature": temperature,
                "max_tokens": model.maxTokens
            }

            response = await self.httpClient.post(model.apiUrl, json=payload)
            apiResponse = self._parseCompletionResponse(response, "Web Search")

            content = apiResponse["choices"][0]["message"]["content"]

            return AiModelResponse(
                content=content,
                success=True,
                modelId=model.name,
                metadata={"response_id": apiResponse.get("id", ""), "operation": "WEB_SEARCH_DATA"}
            )

        except HTTPException:
            # Keep the specific API error instead of nesting it in a generic one
            raise
        except Exception as e:
            logger.error(f"Error in Perplexity web search: {str(e)}")
            raise HTTPException(status_code=500, detail=f"Error in Perplexity web search: {str(e)}") from e

    async def webCrawl(self, modelCall: AiModelCall) -> AiModelResponse:
        """
        WEB_CRAWL operation - crawls ONE URL and returns content.

        Perplexity API Parameters Used:
        - messages: The prompt containing URL and instruction
        - max_tokens: Maximum response length
        - max_results: Number of search results (1-20, default: 10)
        - temperature: Response randomness (not web search specific)

        Pagination: Perplexity does NOT return paginated responses.
        A single response contains all results within max_tokens limit.

        Args:
            modelCall: AiModelCall with AiCallPromptWebCrawl as prompt
                (JSON-encoded in the user message content)

        Returns:
            AiModelResponse with crawl results: a JSON object (content, citations,
            search_results) when citations or search results are present, otherwise
            the plain content string

        Raises:
            HTTPException: Status 500 for API errors, invalid responses or an
                unparsable prompt
        """
        try:
            # Extract parameters
            model = modelCall.model
            temperature = self._resolveTemperature(modelCall.options, model)
            maxTokens = model.maxTokens

            # Parse prompt JSON - taken from the user message (not system message)
            promptData = json.loads(self._extractPromptContent(modelCall.messages))

            # Create Pydantic model
            webCrawlPrompt = AiCallPromptWebCrawl(**promptData)

            # Build crawl request for Perplexity - ONE URL
            # Match playground prompt style: just URL + question
            # This allows Perplexity to return detailed multi-source results
            crawlPrompt = f"{webCrawlPrompt.url}: {webCrawlPrompt.instruction}"

            # Build payload with optional Perplexity parameters
            # Note: max_tokens_per_page may not be supported by chat/completions endpoint
            # The playground Python SDK might use a different internal API
            # Clamp to the documented 1-20 range; 0/None falls back to the default of 10
            maxResults = max(1, min(webCrawlPrompt.maxWidth or 10, 20))

            payload = {
                "model": model.name,
                "messages": [{"role": "user", "content": crawlPrompt}],
                "temperature": temperature,
                "max_tokens": maxTokens,  # Use model's configured maxTokens (24000)
                "max_results": maxResults,
                "return_citations": True  # Request citations explicitly
            }

            logger.info(f"Perplexity crawl payload: model={model.name}, prompt_length={len(crawlPrompt)}, max_tokens={maxTokens}, max_results={maxResults}")

            response = await self.httpClient.post(model.apiUrl, json=payload)
            apiResponse = self._parseCompletionResponse(response, "Web Crawl")

            # Extract the main content
            content = apiResponse["choices"][0]["message"]["content"]

            # Check for citations or search results in the response
            # ("or []" also covers a key that is present but null)
            citations = apiResponse.get("citations") or []
            searchResults = apiResponse.get("search_results") or []

            # Log what we found
            if citations:
                logger.info(f"Found {len(citations)} citations in response")
            if searchResults:
                logger.info(f"Found {len(searchResults)} search results in response")
            logger.debug(f"API response keys: {list(apiResponse.keys())}")

            # Build comprehensive response with citations if available
            if citations or searchResults:
                responseContent = json.dumps(
                    {
                        "content": content,
                        "citations": citations,
                        "search_results": searchResults
                    },
                    indent=2
                )
            else:
                responseContent = content

            # Return comprehensive response
            return AiModelResponse(
                content=responseContent,
                success=True,
                modelId=model.name,
                metadata={
                    "response_id": apiResponse.get("id", ""),
                    "operation": "WEB_CRAWL",
                    "url": webCrawlPrompt.url,
                    "actualPromptSent": crawlPrompt,
                    "has_citations": bool(citations),
                    "has_search_results": bool(searchResults)
                }
            )

        except HTTPException:
            # Keep the specific API error instead of nesting it in a generic one
            raise
        except Exception as e:
            logger.error(f"Error in Perplexity web crawl: {str(e)}")
            raise HTTPException(status_code=500, detail=f"Error in Perplexity web crawl: {str(e)}") from e