Skip to content

Commit a23b520

Browse files
authored
Cherry-pick: fix: maximum observation length + error (codegen-sh#919)
2 parents b9fc09c + 3367e98 commit a23b520

File tree

3 files changed

+43
-9
lines changed

3 files changed

+43
-9
lines changed

docs/changelog/changelog.mdx

Lines changed: 5 additions & 0 deletions
Original file line number · Diff line number · Diff line change
@@ -4,6 +4,11 @@ icon: "clock"
44
iconType: "solid"
55
---
66

7+
<Update label="v0.52.12" description="March 19, 2025">
8+
### [Renames search functionality](https://github.com/codegen-sh/codegen-sdk/releases/tag/v0.52.12)
9+
- Renamed search functionality to ripgrep
10+
</Update>
11+
712
<Update label="v0.52.11" description="March 19, 2025">
813
### [Fixes error, updates docs, adds TypeScript feature.](https://github.com/codegen-sh/codegen-sdk/releases/tag/v0.52.11)
914
- Fix LLM truncation error

src/codegen/extensions/langchain/graph.py

Lines changed: 28 additions & 7 deletions
Original file line number · Diff line number · Diff line change
@@ -155,15 +155,27 @@ def format_header(header_type: str) -> str:
155155

156156
# Format messages with appropriate headers
157157
formatted_messages = []
158-
for msg in to_summarize: # No need for slice when iterating full list
158+
image_urls = [] # Track image URLs for the summary prompt
159+
160+
for msg in to_summarize:
159161
if isinstance(msg, HumanMessage):
160-
formatted_messages.append(format_header("human") + msg.content)
162+
# Now we know content is always a list
163+
for item in msg.content:
164+
if item.get("type") == "text":
165+
text_content = item.get("text", "")
166+
if text_content:
167+
formatted_messages.append(format_header("human") + text_content)
168+
elif item.get("type") == "image_url":
169+
image_url = item.get("image_url", {}).get("url")
170+
if image_url:
171+
# We are not including any string data in the summary for image. The image will be present itself!
172+
image_urls.append({"type": "image_url", "image_url": {"url": image_url}})
161173
elif isinstance(msg, AIMessage):
162174
# Check for summary message using additional_kwargs
163175
if msg.additional_kwargs.get("is_summary"):
164176
formatted_messages.append(format_header("summary") + msg.content)
165177
elif isinstance(msg.content, list) and len(msg.content) > 0 and isinstance(msg.content[0], dict):
166-
for item in msg.content: # No need for slice when iterating full list
178+
for item in msg.content:
167179
if item.get("type") == "text":
168180
formatted_messages.append(format_header("ai") + item["text"])
169181
elif item.get("type") == "tool_use":
@@ -173,16 +185,25 @@ def format_header(header_type: str) -> str:
173185
elif isinstance(msg, ToolMessage):
174186
formatted_messages.append(format_header("tool_response") + msg.content)
175187

176-
conversation = "\n".join(formatted_messages) # No need for slice when joining full list
188+
conversation = "\n".join(formatted_messages)
177189

178190
summary_llm = LLM(
179191
model_provider="anthropic",
180192
model_name="claude-3-5-sonnet-latest",
181193
temperature=0.3,
182194
)
183195

184-
chain = ChatPromptTemplate.from_template(SUMMARIZE_CONVERSATION_PROMPT) | summary_llm
185-
new_summary = chain.invoke({"conversation": conversation}).content
196+
# Choose template based on whether we have images
197+
summarizer_content = [{"type": "text", "text": SUMMARIZE_CONVERSATION_PROMPT}]
198+
for image_url in image_urls:
199+
summarizer_content.append(image_url)
200+
201+
chain = ChatPromptTemplate([("human", summarizer_content)]) | summary_llm
202+
new_summary = chain.invoke(
203+
{
204+
"conversation": conversation,
205+
}
206+
).content
186207

187208
return {"messages": {"type": "summarize", "summary": new_summary, "tail": tail, "head": head}}
188209

@@ -199,7 +220,7 @@ def should_continue(self, state: GraphState) -> Literal["tools", "summarize_conv
199220
return "summarize_conversation"
200221

201222
# Summarize if the last message exceeds the max input tokens of the model - 10000 tokens
202-
elif isinstance(last_message, AIMessage) and not just_summarized and curr_input_tokens > (max_input_tokens - 10000):
223+
elif isinstance(last_message, AIMessage) and not just_summarized and curr_input_tokens > (max_input_tokens - 30000):
203224
return "summarize_conversation"
204225

205226
elif hasattr(last_message, "tool_calls") and last_message.tool_calls:

src/codegen/extensions/tools/observation.py

Lines changed: 10 additions & 2 deletions
Original file line number · Diff line number · Diff line change
@@ -6,6 +6,10 @@
66
from langchain_core.messages import ToolMessage
77
from pydantic import BaseModel, Field
88

9+
from codegen.shared.logging.get_logger import get_logger
10+
11+
logger = get_logger(__name__)
12+
913

1014
class Observation(BaseModel):
1115
"""Base class for all tool observations.
@@ -44,14 +48,18 @@ def __repr__(self) -> str:
4448
"""Get detailed string representation of the observation."""
4549
return f"{self.__class__.__name__}({self.model_dump_json()})"
4650

47-
def render_as_string(self) -> str:
51+
def render_as_string(self, max_tokens: int = 8000) -> str:
4852
"""Render the observation as a string.
4953
5054
This is used for string representation and as the content field
5155
in the ToolMessage. Subclasses can override this to customize
5256
their string output format.
5357
"""
54-
return json.dumps(self.model_dump(), indent=2)
58+
rendered = json.dumps(self.model_dump(), indent=2)
59+
if 3 * len(rendered) > max_tokens:
60+
logger.error(f"Observation is too long to render: {len(rendered) * 3} tokens")
61+
return rendered[:max_tokens] + "\n\n...truncated...\n\n"
62+
return rendered
5563

5664
def render(self, tool_call_id: Optional[str] = None) -> ToolMessage | str:
5765
"""Render the observation as a ToolMessage or string.

0 commit comments

Comments (0)