From fb8a744caebc92fdfbfa74f5ea9b4deef1960779 Mon Sep 17 00:00:00 2001
From: Afonso Coutinho <afonso@omelhorsite.pt>
Date: Wed, 3 Jun 2026 06:24:11 +0100
Subject: [PATCH] fix: skill retrieval boosts on tag substrings (e.g. 'ai' tag
 for any 'email' query) (#1406)

* fix: match skill tags as whole tokens, not substrings, in retrieval

* test: skill tag matching uses whole tokens, not substrings

* test: give skill fixtures status=published so they reach the scoring path
---
 services/memory/skills.py            |  5 +++-
 tests/test_skills_tag_token_match.py | 36 ++++++++++++++++++++++++++++
 2 files changed, 40 insertions(+), 1 deletion(-)
 create mode 100644 tests/test_skills_tag_token_match.py

diff --git a/services/memory/skills.py b/services/memory/skills.py
index ee0dd26..87f74d5 100644
--- a/services/memory/skills.py
+++ b/services/memory/skills.py
@@ -650,7 +650,10 @@ class SkillsManager:
             ])
             score = _jaccard(query_tokens, _tokenize(text))
             for tag in sk.get("tags", []) or []:
-                if tag and tag in query.lower():
+                # Match tags as whole tokens, not substrings: `tag in query`
+                # boosted e.g. a "ai" tag for any query containing "email".
+                tag_tokens = _tokenize(tag)
+                if tag_tokens and tag_tokens <= query_tokens:
                     score = max(score, 0.3) * 1.3
             if query.lower() in (sk.get("description") or "").lower():
                 score = max(score, 0.6)
diff --git a/tests/test_skills_tag_token_match.py b/tests/test_skills_tag_token_match.py
new file mode 100644
index 0000000..6da0e24
--- /dev/null
+++ b/tests/test_skills_tag_token_match.py
@@ -0,0 +1,36 @@
+"""Regression: skill retrieval must match tags as whole tokens, not substrings."""
+import sys
+from unittest.mock import MagicMock
+
+# Stub heavy deps so importing the skills manager doesn't pull DB / FastAPI.
+for _mod in ("sqlalchemy", "sqlalchemy.orm", "sqlalchemy.ext", "sqlalchemy.ext.declarative"):
+    if _mod not in sys.modules:
+        try:
+            __import__(_mod)
+        except ImportError:
+            sys.modules[_mod] = MagicMock()
+
+from services.memory.skills import SkillsManager  # noqa: E402
+
+
+def _skill(name, description, tags):
+    # status must be published/draft or get_relevant_skills filters the skill
+    # out before the tag-scoring path runs.
+    return {"name": name, "description": description, "when_to_use": "",
+            "tags": tags, "procedure": [], "status": "published"}
+
+
+def test_tag_substring_does_not_boost(tmp_path):
+    sm = SkillsManager(str(tmp_path))
+    skills = [_skill("ml-helper", "machine learning helper", ["ai"])]
+    # "ai" appears only as a substring of "email", not as a whole token, so it
+    # must not boost this unrelated skill into the results.
+    out = sm.get_relevant_skills("send me an email about lunch tomorrow", skills=skills)
+    assert out == []
+
+
+def test_tag_whole_token_still_boosts(tmp_path):
+    sm = SkillsManager(str(tmp_path))
+    skills = [_skill("git-helper", "version control stuff", ["git"])]
+    out = sm.get_relevant_skills("help me with git rebase", skills=skills)
+    assert any(s["name"] == "git-helper" for s in out)