neues text model
This commit is contained in:
parent
a96da92704
commit
d322281cda
2 changed files with 10 additions and 10 deletions
10
app.py
10
app.py
|
|
@@ -187,11 +187,11 @@ rateLimiter = RateLimiter(
|
||||||
|
|
||||||
# Model mapping: external name -> internal Ollama model name
|
# Model mapping: external name -> internal Ollama model name
|
||||||
# Production models (optimized for 32GB RAM server):
|
# Production models (optimized for 32GB RAM server):
|
||||||
# - deepseek-ocr: 3.34B params, 8K context, ~6.7GB RAM
|
# - qwen2.5:7b: 7.6B params, 128K context, ~4.7GB RAM (Text)
|
||||||
# - qwen2.5vl:7b: 8.29B params, 125K context, ~6GB RAM
|
# - qwen2.5vl:7b: 8.29B params, 125K context, ~6GB RAM (Vision)
|
||||||
# - granite3.2-vision: 2B params, 16K context, ~2.4GB RAM
|
# - granite3.2-vision: 2B params, 16K context, ~2.4GB RAM (Vision)
|
||||||
MODEL_MAPPING = {
|
MODEL_MAPPING = {
|
||||||
"poweron-ocr-general": "deepseek-ocr",
|
"poweron-text-general": "qwen2.5:7b",
|
||||||
"poweron-vision-general": "qwen2.5vl:7b",
|
"poweron-vision-general": "qwen2.5vl:7b",
|
||||||
"poweron-vision-deep": "granite3.2-vision",
|
"poweron-vision-deep": "granite3.2-vision",
|
||||||
}
|
}
|
||||||
|
|
@@ -536,7 +536,7 @@ async def _analyzeDocument(
|
||||||
|
|
||||||
# Model-specific context lengths (actual model limits)
|
# Model-specific context lengths (actual model limits)
|
||||||
modelContextLengths = {
|
modelContextLengths = {
|
||||||
"deepseek-ocr": 8192, # 8K context
|
"qwen2.5:7b": 32768, # Use 32K (model supports 128K but RAM limited)
|
||||||
"qwen2.5vl:7b": 32768, # Use 32K (model supports 125K but RAM limited)
|
"qwen2.5vl:7b": 32768, # Use 32K (model supports 125K but RAM limited)
|
||||||
"granite3.2-vision": 16000, # 16K context
|
"granite3.2-vision": 16000, # 16K context
|
||||||
}
|
}
|
||||||
|
|
|
||||||
|
|
@@ -824,11 +824,11 @@ Falls ein Feld nicht erkennbar ist, setze den Wert auf null.</textarea>
|
||||||
ollamaModel: 'granite3.2-vision'
|
ollamaModel: 'granite3.2-vision'
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
name: 'poweron-ocr-general',
|
name: 'poweron-text-general',
|
||||||
displayName: 'PowerOn OCR General',
|
displayName: 'PowerOn Text General',
|
||||||
description: 'Text-Extraktion / OCR (deepseek-ocr)',
|
description: 'Text-Verarbeitung / Analyse (qwen2.5:7b)',
|
||||||
isVision: false, // Text model - no image required
|
isVision: false, // Text model - no image required
|
||||||
ollamaModel: 'deepseek-ocr'
|
ollamaModel: 'qwen2.5:7b'
|
||||||
}
|
}
|
||||||
];
|
];
|
||||||
|
|
||||||
|
|
@@ -1174,7 +1174,7 @@ Falls ein Feld nicht erkennbar ist, setze den Wert auf null.</textarea>
|
||||||
|
|
||||||
// Model-specific context lengths
|
// Model-specific context lengths
|
||||||
const modelContextLengths = {
|
const modelContextLengths = {
|
||||||
'deepseek-ocr': 8192,
|
'qwen2.5:7b': 32768,
|
||||||
'qwen2.5vl:7b': 32768,
|
'qwen2.5vl:7b': 32768,
|
||||||
'granite3.2-vision': 16000
|
'granite3.2-vision': 16000
|
||||||
};
|
};
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue