diff --git a/AppImage/config/verified_ai_models.json b/AppImage/config/verified_ai_models.json index e6d446cc..fb81221d 100644 --- a/AppImage/config/verified_ai_models.json +++ b/AppImage/config/verified_ai_models.json @@ -19,10 +19,11 @@ "models": [ "gemini-2.5-flash", "gemini-2.5-pro", - "gemini-2.0-flash-lite" + "gemini-1.5-flash" ], - "recommended": "gemini-2.5-flash", - "_deprecated": ["gemini-2.0-flash", "gemini-1.0-pro", "gemini-pro"] + "recommended": "gemini-1.5-flash", + "_note": "gemini-2.5-* may have availability issues. gemini-1.5-flash is more stable.", + "_deprecated": ["gemini-2.0-flash", "gemini-2.0-flash-lite", "gemini-1.0-pro", "gemini-pro"] }, "openai": { diff --git a/AppImage/scripts/notification_templates.py b/AppImage/scripts/notification_templates.py index 0e93fdc3..a78f0144 100644 --- a/AppImage/scripts/notification_templates.py +++ b/AppImage/scripts/notification_templates.py @@ -1270,10 +1270,11 @@ AI_LANGUAGES = { # Token limits for different detail levels # max_tokens is a LIMIT, not fixed consumption - you only pay for tokens actually generated +# Note: Some providers (especially Gemini) may have lower default limits, so we use generous values AI_DETAIL_TOKENS = { - 'brief': 300, # Short messages, 2-3 lines - 'standard': 1000, # Standard messages, sufficient for 15-20 VMs - 'detailed': 2000, # Complete technical reports with all details + 'brief': 500, # Short messages, 2-3 lines + 'standard': 1500, # Standard messages, sufficient for 15-20 VMs + 'detailed': 3000, # Complete technical reports with all details } # System prompt template - informative, no recommendations