Visual browsing in CodeAct using set-of-marks annotated webpage screenshots (#6464)

This commit is contained in:
Aditya Bharat Soni
2025-02-01 15:56:11 -05:00
committed by GitHub
parent eb8d1600c3
commit a593d9bc6d
4 changed files with 50 additions and 5 deletions

View File

@@ -101,7 +101,11 @@ class Message(BaseModel):
# See discussion here for details: https://github.com/BerriAI/litellm/issues/6422#issuecomment-2438765472
if self.role == 'tool' and item.cache_prompt:
role_tool_with_prompt_caching = True
-d.pop('cache_control')
+if isinstance(d, dict):
+d.pop('cache_control')
+elif isinstance(d, list):
+for d_item in d:
+d_item.pop('cache_control')
if isinstance(item, TextContent):
content.append(d)
elif isinstance(item, ImageContent) and self.vision_enabled: