fix(chat): stop 429 retry spiral and add get_weather coord fallback

- search_places: detect HTTP 429 and mark retryable=False to stop the retry loop immediately instead of spiraling until MAX_ITERATIONS
- get_weather: extract collection coordinates (lat/lng from the first location with coords) and retry when the LLM omits the required params; uses sync_to_async for the DB query in the async view
- AITravelChat: deduplicate context-only tools (get_trip_details, get_weather) in the render pipeline to prevent duplicate place cards from appearing when the retry loop causes multiple get_trip_details calls
- Tests: 5 new tests covering the 429 non-retryable path and the weather coord fallback; all 39 chat tests pass
2026-03-10 19:18:55 +00:00
parent de8625c17f
commit 635e0df0ab
4 changed files with 321 additions and 3 deletions
--- a/backend/server/chat/agent_tools.py
+++ b/backend/server/chat/agent_tools.py
@@ -196,6 +196,10 @@ def search_places(
            "category": category,
            "results": results,
        }
+    except requests.HTTPError as exc:
+        if exc.response is not None and exc.response.status_code == 429:
+            return {"error": f"Places API request failed: {exc}", "retryable": False}
+        return {"error": f"Places API request failed: {exc}"}
    except requests.RequestException as exc:
        return {"error": f"Places API request failed: {exc}"}
    except (TypeError, ValueError) as exc:
--- a/backend/server/chat/tests.py
+++ b/backend/server/chat/tests.py
@@ -1,6 +1,8 @@
 import json
 from unittest import mock
-from unittest.mock import patch
+from unittest.mock import MagicMock, patch
+
+import requests as _requests

 from django.contrib.auth import get_user_model
 from django.test import TestCase
@@ -11,6 +13,7 @@ from chat.agent_tools import (
    add_to_itinerary,
    execute_tool,
    get_trip_details,
+    search_places,
    web_search,
 )
 from chat.views import ChatViewSet
@@ -997,3 +1000,218 @@ class ChatViewSetToolExecutionFailureLoopTests(APITransactionTestCase):
                for payload in json_payloads
            )
        )
+
+
+class SearchPlaces429NonRetryableTests(TestCase):
+    """search_places must return retryable=False on HTTP 429."""
+
+    def test_429_response_marks_result_non_retryable(self):
+        mock_response = MagicMock()
+        mock_response.status_code = 429
+        http_error = _requests.HTTPError(response=mock_response)
+
+        with patch("chat.agent_tools.requests.get", side_effect=http_error):
+            result = search_places(
+                user=None,
+                location="Paris, France",
+            )
+
+        self.assertIn("error", result)
+        self.assertFalse(
+            result.get("retryable", True),
+            "429 error must set retryable=False to prevent retry spiral",
+        )
+
+    def test_non_429_http_error_is_retryable_by_default(self):
+        mock_response = MagicMock()
+        mock_response.status_code = 500
+        http_error = _requests.HTTPError(response=mock_response)
+
+        with patch("chat.agent_tools.requests.get", side_effect=http_error):
+            result = search_places(
+                user=None,
+                location="Paris, France",
+            )
+
+        self.assertIn("error", result)
+        self.assertTrue(
+            result.get("retryable", True),
+            "Non-429 HTTP errors should remain retryable (default=True)",
+        )
+
+    def test_generic_request_exception_is_retryable_by_default(self):
+        conn_error = _requests.ConnectionError("timeout")
+
+        with patch("chat.agent_tools.requests.get", side_effect=conn_error):
+            result = search_places(
+                user=None,
+                location="Paris, France",
+            )
+
+        self.assertIn("error", result)
+        self.assertTrue(
+            result.get("retryable", True),
+            "Generic RequestException should remain retryable",
+        )
+
+
+class GetWeatherCoordFallbackTests(APITransactionTestCase):
+    """get_weather lat/lng required param should be retried with collection location coords."""
+
+    @patch("chat.views.execute_tool")
+    @patch("chat.views.stream_chat_completion")
+    @patch("integrations.utils.auto_profile.update_auto_preference_profile")
+    def test_get_weather_retries_with_collection_coordinates(
+        self,
+        _mock_auto_profile,
+        mock_stream_chat_completion,
+        mock_execute_tool,
+    ):
+        user = User.objects.create_user(
+            username="weather-coord-user",
+            email="weather-coord-user@example.com",
+            password="password123",
+        )
+        self.client.force_authenticate(user=user)
+
+        collection = Collection.objects.create(
+            user_id=user.id,
+            name="Paris Trip",
+        )
+        paris_location = Location.objects.create(
+            user_id=user.id,
+            name="Paris",
+            latitude=48.8566,
+            longitude=2.3522,
+        )
+        collection.locations.add(paris_location)
+
+        conversation_response = self.client.post(
+            "/api/chat/conversations/",
+            {"title": "Weather Coord Fallback Test"},
+            format="json",
+        )
+        self.assertEqual(conversation_response.status_code, 201)
+        conversation_id = conversation_response.json()["id"]
+
+        async def weather_stream(*args, **kwargs):
+            # LLM calls get_weather without coordinates
+            yield 'data: {"tool_calls": [{"index": 0, "id": "call_w1", "type": "function", "function": {"name": "get_weather", "arguments": "{}"}}]}\n\n'
+            yield "data: [DONE]\n\n"
+
+        async def success_stream(*args, **kwargs):
+            yield 'data: {"content": "The weather in Paris is sunny."}\n\n'
+            yield "data: [DONE]\n\n"
+
+        mock_stream_chat_completion.side_effect = [weather_stream(), success_stream()]
+        mock_execute_tool.side_effect = [
+            # First call: no lat/lon
+            {"error": "latitude and longitude are required"},
+            # Retry call: with injected coords from collection — succeeds
+            {"temperature": 22, "condition": "sunny", "location": "Paris"},
+        ]
+
+        response = self.client.post(
+            f"/api/chat/conversations/{conversation_id}/send_message/",
+            {
+                "message": "What's the weather like?",
+                "collection_id": str(collection.id),
+            },
+            format="json",
+        )
+
+        self.assertEqual(response.status_code, 200)
+        chunks = [
+            chunk.decode("utf-8")
+            if isinstance(chunk, (bytes, bytearray))
+            else str(chunk)
+            for chunk in response.streaming_content
+        ]
+        payload_lines = [
+            chunk.strip()[len("data: ") :]
+            for chunk in chunks
+            if chunk.strip().startswith("data: ")
+        ]
+        json_payloads = [json.loads(p) for p in payload_lines if p != "[DONE]"]
+
+        # Verify the retry happened with coordinates (execute_tool called twice)
+        self.assertEqual(
+            mock_execute_tool.call_count,
+            2,
+            "Expected exactly 2 execute_tool calls: initial + coord retry",
+        )
+        # Verify no tool_execution_error surfaced to the user
+        self.assertFalse(
+            any(
+                payload.get("error_category") == "tool_execution_error"
+                for payload in json_payloads
+            ),
+            "Should not emit tool_execution_error when coord retry succeeds",
+        )
+
+        # Verify coordinates were passed in the retry call
+        retry_kwargs = mock_execute_tool.call_args_list[1][1]
+        self.assertAlmostEqual(retry_kwargs.get("latitude"), 48.8566, places=3)
+        self.assertAlmostEqual(retry_kwargs.get("longitude"), 2.3522, places=3)
+
+    @patch("chat.views.execute_tool")
+    @patch("chat.views.stream_chat_completion")
+    @patch("integrations.utils.auto_profile.update_auto_preference_profile")
+    def test_get_weather_missing_coords_no_collection_emits_error(
+        self,
+        _mock_auto_profile,
+        mock_stream_chat_completion,
+        mock_execute_tool,
+    ):
+        user = User.objects.create_user(
+            username="weather-no-collection-user",
+            email="weather-no-collection-user@example.com",
+            password="password123",
+        )
+        self.client.force_authenticate(user=user)
+
+        conversation_response = self.client.post(
+            "/api/chat/conversations/",
+            {"title": "Weather No Collection Test"},
+            format="json",
+        )
+        self.assertEqual(conversation_response.status_code, 201)
+        conversation_id = conversation_response.json()["id"]
+
+        async def weather_stream(*args, **kwargs):
+            yield 'data: {"tool_calls": [{"index": 0, "id": "call_w2", "type": "function", "function": {"name": "get_weather", "arguments": "{}"}}]}\n\n'
+            yield "data: [DONE]\n\n"
+
+        mock_stream_chat_completion.side_effect = weather_stream
+        mock_execute_tool.return_value = {
+            "error": "latitude and longitude are required"
+        }
+
+        response = self.client.post(
+            f"/api/chat/conversations/{conversation_id}/send_message/",
+            {"message": "What's the weather like?"},
+            format="json",
+        )
+
+        self.assertEqual(response.status_code, 200)
+        chunks = [
+            chunk.decode("utf-8")
+            if isinstance(chunk, (bytes, bytearray))
+            else str(chunk)
+            for chunk in response.streaming_content
+        ]
+        payload_lines = [
+            chunk.strip()[len("data: ") :]
+            for chunk in chunks
+            if chunk.strip().startswith("data: ")
+        ]
+        json_payloads = [json.loads(p) for p in payload_lines if p != "[DONE]"]
+
+        # No collection means no coord fallback — should emit tool_validation_error
+        self.assertTrue(
+            any(
+                payload.get("error_category") == "tool_validation_error"
+                for payload in json_payloads
+            ),
+            "Should emit tool_validation_error when no collection coords available",
+        )
--- a/backend/server/chat/views/__init__.py
+++ b/backend/server/chat/views/__init__.py
@@ -248,6 +248,34 @@ class ChatViewSet(viewsets.ModelViewSet):
            result,
        ) or cls._is_search_places_geocode_error(tool_name, result)

+    @classmethod
+    def _is_get_weather_missing_latlong_error(cls, tool_name, result):
+        """True when get_weather was called without latitude/longitude."""
+        if tool_name != "get_weather" or not cls._is_required_param_tool_error(result):
+            return False
+
+        error_text = (result or {}).get("error") if isinstance(result, dict) else ""
+        if not isinstance(error_text, str):
+            return False
+
+        normalized_error = error_text.strip().lower()
+        return "latitude" in normalized_error or "longitude" in normalized_error
+
+    @staticmethod
+    def _extract_collection_coordinates(collection):
+        """Return (lat, lon) from the first geocoded location in the collection, or None."""
+        if collection is None:
+            return None
+        for location in collection.locations.all():
+            lat = getattr(location, "latitude", None)
+            lon = getattr(location, "longitude", None)
+            if lat is not None and lon is not None:
+                try:
+                    return float(lat), float(lon)
+                except (TypeError, ValueError):
+                    continue
+        return None
+
    @staticmethod
    def _build_search_places_location_clarification_message():
        return (
@@ -703,6 +731,54 @@ class ChatViewSet(viewsets.ModelViewSet):
                                    "error": "Could not search places at the provided itinerary locations"
                                }

+                        attempted_weather_coord_retry = False
+                        if self._is_get_weather_missing_latlong_error(
+                            function_name, result
+                        ):
+                            coords = await sync_to_async(
+                                self._extract_collection_coordinates,
+                                thread_sensitive=True,
+                            )(collection)
+                            if coords is not None:
+                                retry_lat, retry_lon = coords
+                                retry_arguments = dict(prepared_arguments)
+                                retry_arguments["latitude"] = retry_lat
+                                retry_arguments["longitude"] = retry_lon
+                                attempted_weather_coord_retry = True
+                                retry_result = await sync_to_async(
+                                    execute_tool,
+                                    thread_sensitive=True,
+                                )(
+                                    function_name,
+                                    request.user,
+                                    **retry_arguments,
+                                )
+                                if not self._is_required_param_tool_error(
+                                    retry_result
+                                ) and not self._is_execution_failure_tool_error(
+                                    retry_result
+                                ):
+                                    result = retry_result
+                                    tool_call_for_history = {
+                                        **tool_call,
+                                        "function": {
+                                            **function_payload,
+                                            "name": function_name,
+                                            "arguments": json.dumps(retry_arguments),
+                                        },
+                                    }
+
+                            # If retry was attempted but still failed, convert to an
+                            # execution failure — never ask the user for coordinates
+                            # they implied via collection context.
+                            if (
+                                attempted_weather_coord_retry
+                                and self._is_required_param_tool_error(result)
+                            ):
+                                result = {
+                                    "error": "Could not fetch weather for the collection locations"
+                                }
+
                        if self._is_required_param_tool_error(result):
                            assistant_message_kwargs = {
                                "conversation": conversation,
--- a/frontend/src/lib/components/AITravelChat.svelte
+++ b/frontend/src/lib/components/AITravelChat.svelte
@@ -348,7 +348,9 @@
 		return [...next, toolResult];
 	}

-	function uniqueToolResultsByCallId(toolResults: ToolResultEntry[] | undefined): ToolResultEntry[] {
+	function uniqueToolResultsByCallId(
+		toolResults: ToolResultEntry[] | undefined
+	): ToolResultEntry[] {
 		if (!toolResults) {
 			return [];
 		}
@@ -368,6 +370,24 @@
 		return unique;
 	}

+	// Context-loading tools that should render at most once per message, even if
+	// the retry loop caused the LLM to call them multiple times.
+	const CONTEXT_ONLY_TOOLS = new Set(['get_trip_details', 'get_weather']);
+
+	function deduplicateContextTools(toolResults: ToolResultEntry[]): ToolResultEntry[] {
+		const seenContextTool = new Set<string>();
+		return toolResults.filter((result) => {
+			const name = result.name;
+			if (name && CONTEXT_ONLY_TOOLS.has(name)) {
+				if (seenContextTool.has(name)) {
+					return false;
+				}
+				seenContextTool.add(name);
+			}
+			return true;
+		});
+	}
+
 	function rebuildConversationMessages(rawMessages: ChatMessage[]): ChatMessage[] {
 		const rebuilt = rawMessages.map((msg) => ({
 			...msg,
@@ -936,7 +956,7 @@
 											<div class="whitespace-pre-wrap">{msg.content}</div>
 											{#if msg.role === 'assistant' && msg.tool_results}
 												<div class="mt-2 space-y-2">
-													{#each uniqueToolResultsByCallId(msg.tool_results) as result}
+													{#each deduplicateContextTools(uniqueToolResultsByCallId(msg.tool_results)) as result}
 														{#if hasPlaceResults(result)}
 															<div class="grid gap-2">
 																{#each getPlaceResults(result) as place}