mirror of
https://github.com/MODSetter/SurfSense.git
synced 2026-05-11 13:10:54 +00:00
test(backend): teach fake chat LLM Gmail tool-call flow
This commit is contained in:
parent
2b7d713db6
commit
7864cbbeea
2 changed files with 85 additions and 5 deletions
|
|
@ -14,6 +14,8 @@ from langchain_core.outputs import ChatGeneration, ChatGenerationChunk, ChatResu
|
|||
|
||||
# Canary tokens embedded in the fake connector fixtures; FakeChatLLM echoes
# them back so the E2E smoke tests can detect that live tool content reached
# the model (see the read_gmail_email / drive branches below).
DRIVE_CANARY_TOKEN = "SURFSENSE_E2E_CANARY_TOKEN_DRIVE_001"
GMAIL_CANARY_TOKEN = "SURFSENSE_E2E_CANARY_TOKEN_GMAIL_001"
# Subject and message id of the fake Gmail canary message; used both to detect
# Gmail intent in the user prompt and to chain search_gmail -> read_gmail_email.
GMAIL_CANARY_SUBJECT = "E2E Canary Email"
GMAIL_CANARY_MESSAGE_ID = "fake-msg-canary-001"
# Fixed fallback answer when no canary evidence is present, and the magic
# query string that forces that "no relevant content" path in tests.
NO_RELEVANT_CONTENT_SENTINEL = "No relevant indexed content found."
NO_RELEVANT_CONTENT_QUERY = "E2E_NO_RELEVANT_CONTENT_SMOKE"
|
||||
|
||||
|
|
@ -42,6 +44,10 @@ def _contains_any(text: str, needles: tuple[str, ...]) -> bool:
|
|||
return any(needle.lower() in lowered for needle in needles)
|
||||
|
||||
|
||||
def _latest_tool_message(messages: list[BaseMessage]) -> BaseMessage | None:
    """Return the most recent message of type "tool", or None if there is none."""
    for message in reversed(messages):
        if message.type == "tool":
            return message
    return None
|
||||
|
||||
|
||||
class FakeChatLLM(BaseChatModel):
|
||||
@property
|
||||
def _llm_type(self) -> str:
|
||||
|
|
@ -63,17 +69,26 @@ class FakeChatLLM(BaseChatModel):
|
|||
return NO_RELEVANT_CONTENT_SENTINEL
|
||||
|
||||
prompt_text = _messages_to_text(messages)
|
||||
latest_tool = _latest_tool_message(messages)
|
||||
latest_tool_name = getattr(latest_tool, "name", None)
|
||||
latest_tool_text = _content_to_text(latest_tool.content) if latest_tool else ""
|
||||
|
||||
if latest_tool_name == "read_gmail_email" and GMAIL_CANARY_TOKEN in latest_tool_text:
|
||||
return f"Gmail live tool content found: {GMAIL_CANARY_TOKEN}"
|
||||
if latest_tool_name == "search_gmail" and GMAIL_CANARY_MESSAGE_ID in latest_tool_text:
|
||||
return "Reading the matching Gmail message next."
|
||||
|
||||
wants_gmail = _contains_any(
|
||||
latest_human,
|
||||
("gmail", "email", "message", "E2E Canary Email"),
|
||||
("gmail", "email", "message", GMAIL_CANARY_SUBJECT),
|
||||
)
|
||||
wants_drive = _contains_any(
|
||||
latest_human,
|
||||
("drive", "file", "e2e-canary.txt"),
|
||||
)
|
||||
has_gmail_evidence = (
|
||||
"E2E Canary Email" in prompt_text
|
||||
or "fake-msg-canary-001" in prompt_text
|
||||
GMAIL_CANARY_SUBJECT in prompt_text
|
||||
or GMAIL_CANARY_MESSAGE_ID in prompt_text
|
||||
or GMAIL_CANARY_TOKEN in prompt_text
|
||||
)
|
||||
has_drive_evidence = (
|
||||
|
|
@ -92,6 +107,51 @@ class FakeChatLLM(BaseChatModel):
|
|||
return f"Drive content found: {DRIVE_CANARY_TOKEN}"
|
||||
return NO_RELEVANT_CONTENT_SENTINEL
|
||||
|
||||
def _tool_call_message_for(self, messages: list[BaseMessage]) -> AIMessage | None:
    """Return a tool-calling AIMessage driving the fake Gmail flow, or None.

    Implements a two-step script: when the latest human message shows Gmail
    intent and no tool has run yet, emit a ``search_gmail`` call; once the
    search result contains the canary message id, emit a follow-up
    ``read_gmail_email`` call. Any other state yields None so the caller
    falls back to a plain text response.
    """
    human_text = ""
    for message in reversed(messages):
        if message.type == "human":
            human_text = _content_to_text(message.content)
            break

    tool_message = _latest_tool_message(messages)
    tool_name = getattr(tool_message, "name", None)
    tool_text = _content_to_text(tool_message.content) if tool_message else ""

    # Step 2: the search already surfaced the canary message — read it next.
    if tool_name == "search_gmail" and GMAIL_CANARY_MESSAGE_ID in tool_text:
        read_call = {
            "name": "read_gmail_email",
            "args": {"message_id": GMAIL_CANARY_MESSAGE_ID},
            "id": "call_e2e_read_gmail",
        }
        return AIMessage(content="", tool_calls=[read_call])

    # Step 1: no tool output yet and the user asked about email — search first.
    if tool_message is None and _contains_any(
        human_text,
        ("gmail", "email", "message", GMAIL_CANARY_SUBJECT),
    ):
        search_call = {
            "name": "search_gmail",
            "args": {
                "query": f"subject:{GMAIL_CANARY_SUBJECT}",
                "max_results": 5,
            },
            "id": "call_e2e_search_gmail",
        }
        return AIMessage(content="", tool_calls=[search_call])

    return None
|
||||
|
||||
def _generate(
|
||||
self,
|
||||
messages: list[BaseMessage],
|
||||
|
|
@ -100,7 +160,9 @@ class FakeChatLLM(BaseChatModel):
|
|||
**kwargs: Any,
|
||||
) -> ChatResult:
|
||||
del stop, run_manager, kwargs
|
||||
message = AIMessage(content=self._response_for(messages), tool_calls=[])
|
||||
message = self._tool_call_message_for(messages) or AIMessage(
|
||||
content=self._response_for(messages), tool_calls=[]
|
||||
)
|
||||
return ChatResult(generations=[ChatGeneration(message=message)])
|
||||
|
||||
async def _astream(
|
||||
|
|
@ -111,6 +173,24 @@ class FakeChatLLM(BaseChatModel):
|
|||
**kwargs: Any,
|
||||
) -> AsyncIterator[ChatGenerationChunk]:
|
||||
del stop, run_manager, kwargs
|
||||
tool_call_message = self._tool_call_message_for(messages)
|
||||
if tool_call_message:
|
||||
for tool_call in tool_call_message.tool_calls:
|
||||
yield ChatGenerationChunk(
|
||||
message=AIMessageChunk(
|
||||
content="",
|
||||
tool_call_chunks=[
|
||||
{
|
||||
"name": tool_call["name"],
|
||||
"args": json.dumps(tool_call["args"]),
|
||||
"id": tool_call["id"],
|
||||
"index": 0,
|
||||
}
|
||||
],
|
||||
)
|
||||
)
|
||||
return
|
||||
|
||||
yield ChatGenerationChunk(
|
||||
message=AIMessageChunk(content=self._response_for(messages))
|
||||
)
|
||||
|
|
|
|||
|
|
@ -19,7 +19,7 @@
|
|||
"from": "sender@surfsense.example",
|
||||
"to": "e2e-fake@surfsense.example",
|
||||
"date": "Mon, 10 Feb 2025 11:00:00 +0000",
|
||||
"messageText": "This Gmail message body proves the Composio Gmail indexer fetched message details. SURFSENSE_E2E_CANARY_TOKEN_GMAIL_001"
|
||||
"messageText": "This Gmail message body proves the Composio Gmail live tool fetched message details. SURFSENSE_E2E_CANARY_TOKEN_GMAIL_001"
|
||||
},
|
||||
"fake-msg-planning-001": {
|
||||
"id": "fake-msg-planning-001",
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue