Spaces:

VibecoderMcSwaggins
/

DeepBoner

Paused

VibecoderMcSwaggins committed on 6 days ago

Commit

e6f0fda

1 Parent(s): c7f5590

fix: PubMed JSON parsing (SPEC-20)

Moves JSON parsing inside the try/except block so that non-JSON responses
(e.g. API maintenance pages) are handled gracefully. Adds JSONDecodeError handling.

- Add `import json` at top of file
- Move `search_resp.json()` inside try block (line 84)
- Add `except json.JSONDecodeError` handler with warning log
- Return empty list on invalid JSON (graceful degradation)
- Add unit test for maintenance page scenario

Fixes: production crash on PubMed maintenance pages

Files changed (2) hide show

src/tools/pubmed.py +9 -1
tests/unit/tools/test_pubmed.py +23 -0

src/tools/pubmed.py CHANGED Viewed

@@ -1,5 +1,6 @@
 """PubMed search tool using NCBI E-utilities."""
 from typing import Any
 import httpx
@@ -80,12 +81,19 @@ class PubMedTool:
                     params=search_params,
                 )
                 search_resp.raise_for_status()
             except httpx.HTTPStatusError as e:
                 if e.response.status_code == self.HTTP_TOO_MANY_REQUESTS:
                     raise RateLimitError("PubMed rate limit exceeded") from e
                 raise SearchError(f"PubMed search failed: {e}") from e
-            search_data = search_resp.json()
             pmids = search_data.get("esearchresult", {}).get("idlist", [])
             if not pmids:

 """PubMed search tool using NCBI E-utilities."""
+import json
 from typing import Any
 import httpx
                     params=search_params,
                 )
                 search_resp.raise_for_status()
+                search_data = search_resp.json()
             except httpx.HTTPStatusError as e:
                 if e.response.status_code == self.HTTP_TOO_MANY_REQUESTS:
                     raise RateLimitError("PubMed rate limit exceeded") from e
                 raise SearchError(f"PubMed search failed: {e}") from e
+            except json.JSONDecodeError as e:
+                logger.warning(
+                    "PubMed returned invalid JSON (possible maintenance page)",
+                    error=str(e),
+                    response_preview=search_resp.text[:200] if search_resp else "N/A",
+                )
+                return []
             pmids = search_data.get("esearchresult", {}).get("idlist", [])
             if not pmids:

tests/unit/tools/test_pubmed.py CHANGED Viewed

@@ -1,5 +1,6 @@
 """Unit tests for PubMed tool."""
 from unittest.mock import AsyncMock, MagicMock
 import pytest
@@ -150,3 +151,25 @@ class TestPubMedTool:
         assert "help" not in term.lower()
         # "low libido" should be expanded
         assert "HSDD" in term or "hypoactive" in term

 """Unit tests for PubMed tool."""
+import json
 from unittest.mock import AsyncMock, MagicMock
 import pytest
         assert "help" not in term.lower()
         # "low libido" should be expanded
         assert "HSDD" in term or "hypoactive" in term
+    @pytest.mark.asyncio
+    async def test_search_handles_maintenance_page(self, mocker):
+        """PubMedTool should gracefully handle non-JSON responses (maintenance pages)."""
+        # Mock response that returns HTML instead of JSON (maintenance page)
+        mock_response = MagicMock()
+        mock_response.status_code = 200
+        mock_response.text = "<html><body>Service Temporarily Unavailable</body></html>"
+        mock_response.json.side_effect = json.JSONDecodeError("Expecting value", "", 0)
+        mock_response.raise_for_status = MagicMock()
+        mock_client = AsyncMock()
+        mock_client.get = AsyncMock(return_value=mock_response)
+        mock_client.__aenter__ = AsyncMock(return_value=mock_client)
+        mock_client.__aexit__ = AsyncMock(return_value=None)
+        mocker.patch("httpx.AsyncClient", return_value=mock_client)
+        tool = PubMedTool()
+        # Should return empty list, not crash
+        results = await tool.search("test query")
+        assert results == []