diff --git a/src/llm_core.py b/src/llm_core.py index 1cbe6e7..eb23057 100644 --- a/src/llm_core.py +++ b/src/llm_core.py @@ -420,7 +420,7 @@ def _restricts_temperature(model: str) -> bool: return any(m.startswith(p) or f"/{p}" in m for p in _FIXED_TEMPERATURE_MODELS) # Models that support structured thinking — may output without opening tag -_THINKING_MODEL_PATTERNS = ("qwen3", "qwq", "deepseek-r1", "deepseek-reasoner", "minimax", "m2-reap") +_THINKING_MODEL_PATTERNS = ("qwen3", "qwq", "deepseek-r1", "deepseek-reasoner", "minimax", "m2-reap", "gemma-4", "gemma4") def _supports_thinking(model: str) -> bool: """Check if model supports structured thinking output.""" diff --git a/src/model_context.py b/src/model_context.py index c812041..6fdd23e 100644 --- a/src/model_context.py +++ b/src/model_context.py @@ -83,6 +83,7 @@ KNOWN_CONTEXT_WINDOWS = { 'gemini-2.0-flash': 1048576, 'gemini-1.5-pro': 1048576, 'gemini-1.5-flash': 1048576, + 'gemma-4': 262144, 'gemma-3': 128000, 'gemma-2': 8192,