Agent mode treated local /v1 endpoints, including Ollama on :11434, as native-tool-capable by host/model heuristics. On Ollama's OpenAI-compatible surface some models that advertise tool support stop after a single token when schemas are sent (issue #1567). Default local Ollama /v1 back to fenced tool blocks unless the endpoint explicitly has supports_tools=True. Also compare both the runtime chat URL and the normalized endpoint base when reading ModelEndpoint.supports_tools. That keeps a saved base URL such as http://localhost:11434/v1 effective when the active session URL is /v1/chat/completions. Tests: .venv/bin/python -m pytest tests/test_tool_support_heuristic.py
155 lines
5.8 KiB
Python
155 lines
5.8 KiB
Python
"""Regression tests for the tool-support heuristic in stream_agent_loop.
|
|
|
|
Verifies two critical cases:
|
|
1. local Ollama endpoints must NOT enable native tool schemas by default
|
|
(some models terminate after one token with schemas).
|
|
2. api.deepseek.com must still be treated as tool-capable via the host
|
|
allow-list (_API_HOSTS), so cloud deepseek users keep working.
|
|
"""
|
|
import pytest
|
|
from src.agent_loop import _API_HOSTS, _endpoint_lookup_keys, _is_ollama_openai_compat_url
|
|
from src.llm_core import _is_ollama_native_url
|
|
|
|
|
|
def _compute_is_api_model(model: str, endpoint_url: str, endpoint_supports=None) -> bool:
|
|
"""Replicate the heuristic from stream_agent_loop without side effects."""
|
|
model_lc = model.lower()
|
|
|
|
model_supports_tools = any(kw in model_lc for kw in (
|
|
"gpt-4", "gpt-5", "gpt-o", "claude", "gemini", "gemma",
|
|
"qwen3", "qwen2.5", "mixtral", "mistral", "llama-3.1", "llama-3.2",
|
|
"llama-3.3", "llama-4",
|
|
"minimax", "kimi", "yi-", "phi-3", "phi-4", "command-r",
|
|
"glm-4", "internlm", "hermes",
|
|
"deepseek-v", "deepseek-chat",
|
|
))
|
|
model_no_tools = any(kw in model_lc for kw in (
|
|
"deepseek-r1",
|
|
))
|
|
|
|
if endpoint_supports is True:
|
|
return True
|
|
if (
|
|
endpoint_supports is False
|
|
or model_no_tools
|
|
or _is_ollama_native_url(endpoint_url)
|
|
or _is_ollama_openai_compat_url(endpoint_url)
|
|
):
|
|
return False
|
|
return any(h in endpoint_url for h in _API_HOSTS) or model_supports_tools
|
|
|
|
|
|
class TestDeepSeekToolSupport:
|
|
# --- local Ollama cases (must NOT get native tool schemas by default) ---
|
|
|
|
def test_deepseek_r1_7b_local_ollama_no_tools(self):
|
|
result = _compute_is_api_model(
|
|
"deepseek-r1:7b", "http://localhost:11434/v1"
|
|
)
|
|
assert result is False, (
|
|
"deepseek-r1:7b on Ollama must not enable tool schemas "
|
|
"(Ollama returns HTTP 400 for this model)"
|
|
)
|
|
|
|
def test_deepseek_r1_14b_local_no_tools(self):
|
|
assert _compute_is_api_model("deepseek-r1:14b", "http://localhost:11434/v1") is False
|
|
|
|
def test_deepseek_r1_70b_local_no_tools(self):
|
|
assert _compute_is_api_model("deepseek-r1:70b", "http://127.0.0.1:11434/v1") is False
|
|
|
|
def test_deepseek_r1_via_docker_no_tools(self):
|
|
assert _compute_is_api_model(
|
|
"deepseek-r1:7b", "http://host.docker.internal:11434/v1"
|
|
) is False
|
|
|
|
def test_qwen_local_ollama_defaults_to_fenced_tools(self):
|
|
assert _compute_is_api_model(
|
|
"qwen3.5:4b", "http://localhost:11434/v1"
|
|
) is False
|
|
|
|
def test_gemma_local_ollama_defaults_to_fenced_tools(self):
|
|
assert _compute_is_api_model(
|
|
"gemma4:e4b", "http://host.docker.internal:11434/v1"
|
|
) is False
|
|
|
|
def test_qwen_native_ollama_defaults_to_fenced_tools(self):
|
|
assert _compute_is_api_model(
|
|
"qwen3.5:4b", "http://localhost:11434/api/chat"
|
|
) is False
|
|
|
|
# --- cloud API cases (must still get tool schemas) ---
|
|
|
|
def test_deepseek_cloud_api_gets_tools(self):
|
|
result = _compute_is_api_model(
|
|
"deepseek-chat", "https://api.deepseek.com/v1"
|
|
)
|
|
assert result is True, (
|
|
"api.deepseek.com must be treated as tool-capable via _API_HOSTS"
|
|
)
|
|
|
|
def test_deepseek_v3_cloud_gets_tools(self):
|
|
assert _compute_is_api_model("deepseek-v3", "https://api.deepseek.com/v1") is True
|
|
|
|
def test_deepseek_v2_cloud_gets_tools(self):
|
|
assert _compute_is_api_model("deepseek-v2.5", "https://api.deepseek.com/v1") is True
|
|
|
|
# --- endpoint_supports override takes priority ---
|
|
|
|
def test_endpoint_supports_true_overrides_blocklist(self):
|
|
"""A user who explicitly sets supports_tools=True on their endpoint
|
|
can force tool schemas even for deepseek-r1 (e.g. custom server)."""
|
|
result = _compute_is_api_model(
|
|
"deepseek-r1:7b", "http://localhost:11434/v1", endpoint_supports=True
|
|
)
|
|
assert result is True
|
|
|
|
def test_endpoint_supports_true_overrides_ollama_default(self):
|
|
"""A user can still explicitly opt a known-good Ollama endpoint into
|
|
native schemas."""
|
|
result = _compute_is_api_model(
|
|
"qwen3.5:4b", "http://localhost:11434/v1", endpoint_supports=True
|
|
)
|
|
assert result is True
|
|
|
|
def test_endpoint_supports_true_overrides_native_ollama_default(self):
|
|
result = _compute_is_api_model(
|
|
"qwen3.5:4b", "http://localhost:11434/api/chat", endpoint_supports=True
|
|
)
|
|
assert result is True
|
|
|
|
def test_endpoint_supports_false_overrides_cloud(self):
|
|
"""supports_tools=False on an endpoint gates even cloud APIs."""
|
|
result = _compute_is_api_model(
|
|
"deepseek-chat", "https://api.deepseek.com/v1", endpoint_supports=False
|
|
)
|
|
assert result is False
|
|
|
|
# --- other local models unaffected ---
|
|
|
|
def test_qwen_local_non_ollama_still_gets_tools(self):
|
|
assert _compute_is_api_model("qwen2.5:14b", "http://localhost:8000/v1") is True
|
|
|
|
def test_llama_local_non_ollama_gets_tools_via_host(self):
|
|
assert _compute_is_api_model("llama3.2:3b", "http://localhost:8000/v1") is True
|
|
|
|
|
|
class TestApiHostsContainsDeepSeek:
|
|
def test_api_deepseek_com_in_api_hosts(self):
|
|
assert "api.deepseek.com" in _API_HOSTS
|
|
|
|
def test_deepseek_com_in_api_hosts(self):
|
|
assert "deepseek.com" in _API_HOSTS
|
|
|
|
|
|
class TestEndpointLookupKeys:
|
|
def test_chat_completions_url_matches_endpoint_base(self):
|
|
keys = _endpoint_lookup_keys("http://localhost:11434/v1/chat/completions")
|
|
|
|
assert "http://localhost:11434/v1" in keys
|
|
assert "http://localhost:11434/v1/" in keys
|
|
|
|
def test_native_ollama_chat_url_matches_api_base(self):
|
|
keys = _endpoint_lookup_keys("http://host.docker.internal:11434/api/chat")
|
|
|
|
assert "http://host.docker.internal:11434/api" in keys
|