Visual browsing in CodeAct using set-of-marks annotated webpage screenshots (#6464)

2026-03-22 13:47:19 +08:00 · 2025-02-01 15:56:11 -05:00
parent eb8d1600c3
commit a593d9bc6d
4 changed files with 50 additions and 5 deletions
--- a/openhands/core/message.py
+++ b/openhands/core/message.py
@@ -101,7 +101,11 @@ class Message(BaseModel):
            # See discussion here for details: https://github.com/BerriAI/litellm/issues/6422#issuecomment-2438765472
            if self.role == 'tool' and item.cache_prompt:
                role_tool_with_prompt_caching = True
-                d.pop('cache_control')
+                if isinstance(d, dict):
+                    d.pop('cache_control')
+                elif isinstance(d, list):
+                    for d_item in d:
+                        d_item.pop('cache_control')
            if isinstance(item, TextContent):
                content.append(d)
            elif isinstance(item, ImageContent) and self.vision_enabled: