fix(extraction-cache): resolve wpid via context at cross-run cache sites (SKY-8992) (#5604)

2026-04-28 03:30:10 +00:00 · 2026-04-22 15:45:43 -07:00 · 2026-04-22 15:45:43 -07:00 · 108ec030e6
commit 108ec030e6
parent b97a4f54c0
2 changed files with 126 additions and 6 deletions
--- a/tests/unit/test_extract_information_wpid_fallback.py
+++ b/tests/unit/test_extract_information_wpid_fallback.py
@ -0,0 +1,120 @@
+"""Regression test for SKY-8992 — cross-run cache wpid fallback.
+
+``task.workflow_permanent_id`` is ``None`` on almost every fetch path (the
+``tasks`` DB table has no such column; only ``get_tasks()`` populates it via
+an outer join). Without a fallback, every cross-run cache call received
+``workflow_permanent_id=None`` and the cloud override's guard short-circuited
+before writing to Redis. Assert the handler now falls back to
+``skyvern_context`` so the cache calls carry a non-None wpid.
+"""
+
+from __future__ import annotations
+
+import asyncio
+from unittest.mock import AsyncMock, MagicMock
+
+
+def _run_extract_information_and_capture_cache_calls(
+    monkeypatch,
+    *,
+    task_wpid: str | None,
+    context_wpid: str | None,
+) -> dict[str, object]:
+    from skyvern.webeye.actions import handler
+
+    captured: dict[str, object] = {}
+
+    def fake_load_prompt_with_elements_tracked(**kwargs):
+        return "rendered-prompt", {
+            "extracted_text": kwargs.get("extracted_text"),
+            "previous_extracted_information": kwargs.get("previous_extracted_information"),
+            "extracted_information_schema": kwargs.get("extracted_information_schema"),
+        }
+
+    async def fake_llm_handler(**_kwargs):
+        # Return a dict so ``isinstance(json_response, (dict, list, str))`` is True
+        # and the dual-write block is entered.
+        return {"result": "ok"}
+
+    lookup_mock = AsyncMock(return_value=None)
+    store_mock = AsyncMock(return_value=None)
+    agent_function_stub = MagicMock()
+    agent_function_stub.lookup_cross_run_extraction_cache = lookup_mock
+    agent_function_stub.store_cross_run_extraction_cache = store_mock
+
+    monkeypatch.setattr(handler, "load_prompt_with_elements_tracked", fake_load_prompt_with_elements_tracked)
+    monkeypatch.setattr(
+        handler,
+        "ensure_context",
+        lambda: MagicMock(tz_info=None, workflow_permanent_id=context_wpid),
+    )
+    monkeypatch.setattr(handler.service_utils, "is_cua_task", AsyncMock(return_value=False))
+    monkeypatch.setattr(
+        handler.LLMAPIHandlerFactory,
+        "get_override_llm_api_handler",
+        lambda llm_key, default: fake_llm_handler,
+    )
+    # Force a non-None cache_key so the lookup + store paths both execute.
+    monkeypatch.setattr(handler.extraction_cache, "compute_cache_key", lambda **_: "cachekey_test")
+    monkeypatch.setattr(handler.extraction_cache, "store", lambda *_args, **_kwargs: None)
+    monkeypatch.setattr(handler.app, "AGENT_FUNCTION", agent_function_stub)
+
+    refreshed = MagicMock()
+    refreshed.extracted_text = "TXT"
+    refreshed.url = "https://example.test"
+    refreshed.screenshots = []
+    refreshed.last_used_element_tree_html = "<a>link</a>"
+    refreshed.build_element_tree = MagicMock(return_value="<a>link</a>")
+    refreshed.support_economy_elements_tree = MagicMock(return_value=False)
+
+    scraped_page = MagicMock()
+    scraped_page.refresh = AsyncMock(return_value=refreshed)
+    scraped_page.screenshots = []
+
+    task = MagicMock()
+    task.navigation_goal = None
+    task.navigation_payload = None
+    task.extracted_information = None
+    task.extracted_information_schema = {"type": "object"}
+    task.data_extraction_goal = "Extract documents"
+    task.error_code_mapping = None
+    task.llm_key = None
+    task.workflow_run_id = "wr_test"
+    task.workflow_permanent_id = task_wpid
+    task.task_id = "tsk_test"
+    task.include_extracted_text = True
+
+    asyncio.run(
+        handler.extract_information_for_navigation_goal(
+            task=task, step=MagicMock(retry_index=0), scraped_page=scraped_page
+        )
+    )
+
+    captured["lookup_calls"] = lookup_mock.await_args_list
+    captured["store_calls"] = store_mock.await_args_list
+    return captured
+
+
+def test_cache_calls_use_context_wpid_when_task_wpid_is_none(monkeypatch) -> None:
+    captured = _run_extract_information_and_capture_cache_calls(
+        monkeypatch,
+        task_wpid=None,
+        context_wpid="wpid_from_context",
+    )
+    # Both lookup and store should receive the context wpid as the first positional arg.
+    assert captured["lookup_calls"], "lookup_cross_run_extraction_cache was not awaited"
+    assert captured["lookup_calls"][0].args[0] == "wpid_from_context"
+    assert captured["store_calls"], "store_cross_run_extraction_cache was not awaited"
+    assert captured["store_calls"][0].args[0] == "wpid_from_context"
+
+
+def test_cache_calls_prefer_task_wpid_when_both_are_set(monkeypatch) -> None:
+    # Belt-and-suspenders: if a caller ever does populate task.workflow_permanent_id,
+    # the task value wins (matches the ``a or b`` precedence).
+    captured = _run_extract_information_and_capture_cache_calls(
+        monkeypatch,
+        task_wpid="wpid_from_task",
+        context_wpid="wpid_from_context",
+    )
+    assert captured["lookup_calls"][0].args[0] == "wpid_from_task"
+    assert captured["store_calls"][0].args[0] == "wpid_from_task"