From 7864cbbeea409aed41732113dd096af4aaeeec55 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 7 May 2026 03:16:02 +0530
Subject: [PATCH] test(backend): teach fake chat LLM Gmail tool-call flow

---
 surfsense_backend/tests/e2e/fakes/chat_llm.py | 88 ++++++++++++++++++-
 .../e2e/fakes/fixtures/gmail_messages.json    |  2 +-
 2 files changed, 85 insertions(+), 5 deletions(-)

diff --git a/surfsense_backend/tests/e2e/fakes/chat_llm.py b/surfsense_backend/tests/e2e/fakes/chat_llm.py
index 06948d769..7b66f3b21 100644
--- a/surfsense_backend/tests/e2e/fakes/chat_llm.py
+++ b/surfsense_backend/tests/e2e/fakes/chat_llm.py
@@ -14,6 +14,8 @@ from langchain_core.outputs import ChatGeneration, ChatGenerationChunk, ChatResu
 
 DRIVE_CANARY_TOKEN = "SURFSENSE_E2E_CANARY_TOKEN_DRIVE_001"
 GMAIL_CANARY_TOKEN = "SURFSENSE_E2E_CANARY_TOKEN_GMAIL_001"
+GMAIL_CANARY_SUBJECT = "E2E Canary Email"
+GMAIL_CANARY_MESSAGE_ID = "fake-msg-canary-001"
 NO_RELEVANT_CONTENT_SENTINEL = "No relevant indexed content found."
 NO_RELEVANT_CONTENT_QUERY = "E2E_NO_RELEVANT_CONTENT_SMOKE"
 
@@ -42,6 +44,10 @@ def _contains_any(text: str, needles: tuple[str, ...]) -> bool:
     return any(needle.lower() in lowered for needle in needles)
 
 
+def _latest_tool_message(messages: list[BaseMessage]) -> BaseMessage | None:
+    return next((message for message in reversed(messages) if message.type == "tool"), None)
+
+
 class FakeChatLLM(BaseChatModel):
     @property
     def _llm_type(self) -> str:
@@ -63,17 +69,26 @@ class FakeChatLLM(BaseChatModel):
             return NO_RELEVANT_CONTENT_SENTINEL
 
         prompt_text = _messages_to_text(messages)
+        latest_tool = _latest_tool_message(messages)
+        latest_tool_name = getattr(latest_tool, "name", None)
+        latest_tool_text = _content_to_text(latest_tool.content) if latest_tool else ""
+
+        if latest_tool_name == "read_gmail_email" and GMAIL_CANARY_TOKEN in latest_tool_text:
+            return f"Gmail live tool content found: {GMAIL_CANARY_TOKEN}"
+        if latest_tool_name == "search_gmail" and GMAIL_CANARY_MESSAGE_ID in latest_tool_text:
+            return "Reading the matching Gmail message next."
+
         wants_gmail = _contains_any(
             latest_human,
-            ("gmail", "email", "message", "E2E Canary Email"),
+            ("gmail", "email", "message", GMAIL_CANARY_SUBJECT),
         )
         wants_drive = _contains_any(
             latest_human,
             ("drive", "file", "e2e-canary.txt"),
         )
         has_gmail_evidence = (
-            "E2E Canary Email" in prompt_text
-            or "fake-msg-canary-001" in prompt_text
+            GMAIL_CANARY_SUBJECT in prompt_text
+            or GMAIL_CANARY_MESSAGE_ID in prompt_text
             or GMAIL_CANARY_TOKEN in prompt_text
         )
         has_drive_evidence = (
@@ -92,6 +107,51 @@ class FakeChatLLM(BaseChatModel):
             return f"Drive content found: {DRIVE_CANARY_TOKEN}"
         return NO_RELEVANT_CONTENT_SENTINEL
 
+    def _tool_call_message_for(self, messages: list[BaseMessage]) -> AIMessage | None:
+        latest_human = next(
+            (
+                _content_to_text(message.content)
+                for message in reversed(messages)
+                if message.type == "human"
+            ),
+            "",
+        )
+        latest_tool = _latest_tool_message(messages)
+        latest_tool_name = getattr(latest_tool, "name", None)
+        latest_tool_text = _content_to_text(latest_tool.content) if latest_tool else ""
+
+        if latest_tool_name == "search_gmail" and GMAIL_CANARY_MESSAGE_ID in latest_tool_text:
+            return AIMessage(
+                content="",
+                tool_calls=[
+                    {
+                        "name": "read_gmail_email",
+                        "args": {"message_id": GMAIL_CANARY_MESSAGE_ID},
+                        "id": "call_e2e_read_gmail",
+                    }
+                ],
+            )
+
+        if latest_tool is None and _contains_any(
+            latest_human,
+            ("gmail", "email", "message", GMAIL_CANARY_SUBJECT),
+        ):
+            return AIMessage(
+                content="",
+                tool_calls=[
+                    {
+                        "name": "search_gmail",
+                        "args": {
+                            "query": f"subject:{GMAIL_CANARY_SUBJECT}",
+                            "max_results": 5,
+                        },
+                        "id": "call_e2e_search_gmail",
+                    }
+                ],
+            )
+
+        return None
+
     def _generate(
         self,
         messages: list[BaseMessage],
@@ -100,7 +160,9 @@ class FakeChatLLM(BaseChatModel):
         **kwargs: Any,
     ) -> ChatResult:
         del stop, run_manager, kwargs
-        message = AIMessage(content=self._response_for(messages), tool_calls=[])
+        message = self._tool_call_message_for(messages) or AIMessage(
+            content=self._response_for(messages), tool_calls=[]
+        )
         return ChatResult(generations=[ChatGeneration(message=message)])
 
     async def _astream(
@@ -111,6 +173,24 @@ class FakeChatLLM(BaseChatModel):
         **kwargs: Any,
     ) -> AsyncIterator[ChatGenerationChunk]:
         del stop, run_manager, kwargs
+        tool_call_message = self._tool_call_message_for(messages)
+        if tool_call_message:
+            for tool_call in tool_call_message.tool_calls:
+                yield ChatGenerationChunk(
+                    message=AIMessageChunk(
+                        content="",
+                        tool_call_chunks=[
+                            {
+                                "name": tool_call["name"],
+                                "args": json.dumps(tool_call["args"]),
+                                "id": tool_call["id"],
+                                "index": 0,
+                            }
+                        ],
+                    )
+                )
+            return
+
         yield ChatGenerationChunk(
             message=AIMessageChunk(content=self._response_for(messages))
         )
diff --git a/surfsense_backend/tests/e2e/fakes/fixtures/gmail_messages.json b/surfsense_backend/tests/e2e/fakes/fixtures/gmail_messages.json
index c86dee404..74bbd9965 100644
--- a/surfsense_backend/tests/e2e/fakes/fixtures/gmail_messages.json
+++ b/surfsense_backend/tests/e2e/fakes/fixtures/gmail_messages.json
@@ -19,7 +19,7 @@
       "from": "sender@surfsense.example",
       "to": "e2e-fake@surfsense.example",
       "date": "Mon, 10 Feb 2025 11:00:00 +0000",
-      "messageText": "This Gmail message body proves the Composio Gmail indexer fetched message details. SURFSENSE_E2E_CANARY_TOKEN_GMAIL_001"
+      "messageText": "This Gmail message body proves the Composio Gmail live tool fetched message details. SURFSENSE_E2E_CANARY_TOKEN_GMAIL_001"
     },
     "fake-msg-planning-001": {
       "id": "fake-msg-planning-001",