fix: research source extraction crashes on a non-dict finding (#1714)

2026-06-03 05:34:40 +01:00
parent 29e19f326a
commit f6f86c4b34
2 changed files with 17 additions and 0 deletions
--- a/src/research_handler.py
+++ b/src/research_handler.py
@@ -461,6 +461,8 @@ class ResearchHandler:
        seen = set()
        sources = []
        for f in findings:
            if not isinstance(f, dict):
                continue
            url = f.get("url", "")
            title = f.get("title", "") or url
            summary = f.get("summary", "") or f.get("evidence", "")
--- a/tests/test_research_handler_sources_nondict.py
+++ b/tests/test_research_handler_sources_nondict.py
@@ -0,0 +1,15 @@
 from src.research_handler import ResearchHandler
 def test_extract_sources_skips_non_dict_findings():
    """Non-dict findings are ignored; the real sources around them survive in order."""
    # The findings list originates from the DeepResearcher result list or from
    # cached JSON, so a malformed row (None or a bare string) can show up. The
    # old loop called .get on such a row and crashed, which dropped every real
    # source in the same set.
    first_real = {"url": "https://a.com", "title": "A", "summary": "real analysis of the topic"}
    second_real = {"url": "https://b.com", "summary": "more genuine detail here"}
    mixed_rows = [first_real, "junk-row", None, second_real]

    extracted = ResearchHandler._extract_sources(mixed_rows)

    # Only the two dict rows may come back, in their original relative order.
    urls = [source["url"] for source in extracted]
    assert urls == ["https://a.com", "https://b.com"]