refactor: use AgentSettings.create_agent() for V1 agent creation

Replace manual Agent construction with settings.create_agent() when
SDK AgentSettings are available. This makes settings the single
source of truth for LLM, tools, condenser, critic, and agent context.

Key changes:
- _get_default_critic() eliminated — replaced by _apply_critic_proxy()
  which sets critic_server_url/critic_model_name on the settings, then
  lets the SDK's build_critic() do the construction.
- _create_agent_with_context() settings path: populate tools +
  agent_context on settings, call create_agent(), apply runtime-only
  overrides (mcp_config, system_prompt) via model_copy.
- Legacy path (no agent_settings) kept for backward compat.
- Tests updated: agent_context now in Agent() constructor,
  mcp_config/system_prompt in model_copy.

Co-authored-by: openhands <openhands@all-hands.dev>
This commit is contained in:
openhands
2026-03-17 11:30:02 +00:00
parent bab9a45590
commit 9990870060
2 changed files with 133 additions and 105 deletions

View File

@@ -88,8 +88,6 @@ from openhands.app_server.utils.llm_metadata import (
from openhands.integrations.provider import ProviderType
from openhands.integrations.service_types import SuggestedTask
from openhands.sdk import Agent, AgentContext, LocalWorkspace
from openhands.sdk.critic import IterativeRefinementConfig
from openhands.sdk.critic.impl.api import APIBasedCritic
from openhands.sdk.hooks import HookConfig
from openhands.sdk.llm import LLM
from openhands.sdk.plugin import PluginSource
@@ -126,34 +124,41 @@ Your role ends when the plan is finalized. Implementation is handled by the code
</IMPORTANT_PLANNING_BOUNDARIES>"""
def _get_default_critic(
llm: LLM, settings: AgentSettings, _agent: Agent | None = None
) -> APIBasedCritic | None:
if not settings.critic.enabled:
return None
_CRITIC_PROXY_PATTERN = re.compile(
r'^https?://llm-proxy\.[^./]+\.all-hands\.dev'
)
def _apply_critic_proxy(settings: AgentSettings, llm: LLM) -> AgentSettings:
"""Route the critic through the LLM proxy when available.
If the LLM base URL matches the OpenHands proxy pattern, configure the
critic to use the proxy's ``/vllm`` endpoint. Otherwise disable the
critic (external users don't have access to the hosted service).
"""
if not settings.verification.critic_enabled:
return settings
base_url = llm.base_url
api_key = llm.api_key
if base_url is None or api_key is None:
return None
pattern = r'^https?://llm-proxy\.[^./]+\.all-hands\.dev'
if not re.match(pattern, base_url):
return None
iterative_refinement = None
if settings.critic.enable_iterative_refinement:
iterative_refinement = IterativeRefinementConfig(
success_threshold=settings.critic.threshold,
max_iterations=settings.critic.max_refinement_iterations,
if base_url and _CRITIC_PROXY_PATTERN.match(base_url):
return settings.model_copy(
update={
'verification': settings.verification.model_copy(
update={
'critic_server_url': f'{base_url.rstrip("/")}/vllm',
'critic_model_name': 'critic',
}
),
}
)
return APIBasedCritic(
server_url=f'{base_url.rstrip("/")}/vllm',
api_key=api_key,
model_name='critic',
mode=settings.critic.mode,
iterative_refinement=iterative_refinement,
# No proxy → disable critic
return settings.model_copy(
update={
'verification': settings.verification.model_copy(
update={'critic_enabled': False}
),
}
)
@@ -1172,6 +1177,12 @@ class LiveStatusAppConversationService(AppConversationServiceBase):
) -> Agent:
"""Create an agent with appropriate tools and context based on agent type.
When *agent_settings* is provided the agent is built via
``AgentSettings.create_agent()`` which wires LLM, condenser,
tools, agent_context and critic from the settings object.
Runtime-only overrides (MCP config, system-prompt tweaks) are
applied via ``model_copy`` afterwards.
Args:
llm: Configured LLM instance
agent_type: Type of agent to create (PLAN or DEFAULT)
@@ -1186,61 +1197,68 @@ class LiveStatusAppConversationService(AppConversationServiceBase):
Returns:
Configured Agent instance with context
"""
if agent_settings is None:
condenser = self._create_condenser(llm, agent_type, condenser_max_size)
critic = None
else:
condenser = (
self._create_condenser(
llm,
agent_type,
agent_settings.condenser.max_size,
)
if agent_settings.condenser.enabled
else None
)
critic = _get_default_critic(llm, agent_settings)
if agent_type == AgentType.PLAN:
plan_path = None
if working_dir:
plan_path = self._compute_plan_path(working_dir, git_provider)
agent = Agent(
llm=llm,
tools=get_planning_tools(plan_path=plan_path),
system_prompt_filename='system_prompt_planning.j2',
system_prompt_kwargs={'plan_structure': format_plan_structure()},
condenser=condenser,
critic=critic,
security_analyzer=None,
mcp_config=mcp_config,
)
else:
agent = Agent(
llm=llm,
tools=get_default_tools(enable_browser=True),
system_prompt_kwargs={'cli_mode': False},
condenser=condenser,
critic=critic,
mcp_config=mcp_config,
)
effective_system_message_suffix = system_message_suffix
if agent_type == AgentType.PLAN:
if system_message_suffix:
effective_system_message_suffix = (
f'{PLANNING_AGENT_INSTRUCTION}\n\n{system_message_suffix}'
)
else:
effective_system_message_suffix = PLANNING_AGENT_INSTRUCTION
agent_context = AgentContext(
system_message_suffix=effective_system_message_suffix, secrets=secrets
# -- Determine tools based on agent type --
plan_path = None
if agent_type == AgentType.PLAN and working_dir:
plan_path = self._compute_plan_path(working_dir, git_provider)
tools = (
get_planning_tools(plan_path=plan_path)
if agent_type == AgentType.PLAN
else get_default_tools(enable_browser=True)
)
agent = agent.model_copy(update={'agent_context': agent_context})
return agent
# -- Build system message suffix --
effective_suffix = system_message_suffix
if agent_type == AgentType.PLAN:
effective_suffix = (
f'{PLANNING_AGENT_INSTRUCTION}\n\n{system_message_suffix}'
if system_message_suffix
else PLANNING_AGENT_INSTRUCTION
)
# -- Build the agent from settings when available --
if agent_settings is not None:
# Route critic through the LLM proxy (or disable it).
agent_settings = _apply_critic_proxy(agent_settings, llm)
# Populate runtime-determined fields, then let
# create_agent() wire LLM, condenser, critic, etc.
agent_settings = agent_settings.model_copy(
update={
'llm': llm,
'tools': tools,
'agent_context': AgentContext(
system_message_suffix=effective_suffix,
secrets=secrets,
),
}
)
agent = agent_settings.create_agent()
else:
# Legacy path: no SDK settings — build agent manually.
condenser = self._create_condenser(llm, agent_type, condenser_max_size)
agent = Agent(
llm=llm,
tools=tools,
condenser=condenser,
agent_context=AgentContext(
system_message_suffix=effective_suffix,
secrets=secrets,
),
)
# -- Apply runtime-only overrides not captured by settings --
runtime_overrides: dict[str, Any] = {'mcp_config': mcp_config}
if agent_type == AgentType.PLAN:
runtime_overrides['system_prompt_filename'] = 'system_prompt_planning.j2'
runtime_overrides['system_prompt_kwargs'] = {
'plan_structure': format_plan_structure()
}
runtime_overrides['security_analyzer'] = None
else:
runtime_overrides['system_prompt_kwargs'] = {'cli_mode': False}
return agent.model_copy(update=runtime_overrides)
def _update_agent_with_llm_metadata(
self,

View File

@@ -884,25 +884,31 @@ class TestLiveStatusAppConversationService:
working_dir=working_dir,
)
# Assert
# Assert — Agent() receives llm, tools, condenser, agent_context
mock_get_tools.assert_called_once_with(
plan_path='/workspace/project/.agents_tmp/PLAN.md'
)
mock_agent_class.assert_called_once()
call_kwargs = mock_agent_class.call_args[1]
assert call_kwargs['llm'] == mock_llm
assert call_kwargs['system_prompt_filename'] == 'system_prompt_planning.j2'
assert (
call_kwargs['system_prompt_kwargs']['plan_structure']
== 'test_plan_structure'
)
assert call_kwargs['mcp_config'] == mcp_config
assert call_kwargs['security_analyzer'] is None
assert call_kwargs['condenser'] == mock_condenser
assert call_kwargs['agent_context'].system_message_suffix.startswith(
PLANNING_AGENT_INSTRUCTION
)
mock_create_condenser.assert_called_once_with(
mock_llm, AgentType.PLAN, self.mock_user.condenser_max_size
)
# Runtime overrides applied via model_copy
copy_kwargs = mock_agent_instance.model_copy.call_args[1]['update']
assert copy_kwargs['mcp_config'] == mcp_config
assert copy_kwargs['system_prompt_filename'] == 'system_prompt_planning.j2'
assert (
copy_kwargs['system_prompt_kwargs']['plan_structure']
== 'test_plan_structure'
)
assert copy_kwargs['security_analyzer'] is None
@patch(
'openhands.app_server.app_conversation.live_status_app_conversation_service.get_default_tools'
)
@@ -937,18 +943,21 @@ class TestLiveStatusAppConversationService:
self.mock_user.condenser_max_size,
)
# Assert
# Assert — Agent() receives core fields
mock_agent_class.assert_called_once()
call_kwargs = mock_agent_class.call_args[1]
assert call_kwargs['llm'] == mock_llm
assert call_kwargs['system_prompt_kwargs']['cli_mode'] is False
assert call_kwargs['mcp_config'] == mcp_config
assert call_kwargs['condenser'] == mock_condenser
mock_get_tools.assert_called_once_with(enable_browser=True)
mock_create_condenser.assert_called_once_with(
mock_llm, AgentType.DEFAULT, self.mock_user.condenser_max_size
)
# Runtime overrides applied via model_copy
copy_kwargs = mock_agent_instance.model_copy.call_args[1]['update']
assert copy_kwargs['system_prompt_kwargs']['cli_mode'] is False
assert copy_kwargs['mcp_config'] == mcp_config
@patch(
'openhands.app_server.app_conversation.live_status_app_conversation_service.get_default_tools',
return_value=[],
@@ -992,6 +1001,8 @@ class TestLiveStatusAppConversationService:
assert agent.condenser is None
assert isinstance(agent.critic, APIBasedCritic)
assert agent.critic.mode == 'all_actions'
assert agent.critic.server_url == 'https://llm-proxy.app.all-hands.dev/vllm'
assert agent.critic.model_name == 'critic'
assert agent.critic.iterative_refinement is not None
assert agent.critic.iterative_refinement.success_threshold == 0.75
assert agent.critic.iterative_refinement.max_iterations == 2
@@ -1034,10 +1045,12 @@ class TestLiveStatusAppConversationService:
self.mock_user.condenser_max_size,
)
# Assert - verify model_copy was called with agent_context containing planning instruction
model_copy_call = mock_agent_instance.model_copy.call_args
agent_context = model_copy_call[1]['update']['agent_context']
assert agent_context.system_message_suffix == PLANNING_AGENT_INSTRUCTION
# Assert — agent_context goes to Agent() constructor
call_kwargs = mock_agent_class.call_args[1]
assert (
call_kwargs['agent_context'].system_message_suffix
== PLANNING_AGENT_INSTRUCTION
)
@patch(
'openhands.app_server.app_conversation.live_status_app_conversation_service.get_planning_tools'
@@ -1078,13 +1091,11 @@ class TestLiveStatusAppConversationService:
self.mock_user.condenser_max_size,
)
# Assert - verify planning instruction is prepended to existing suffix
model_copy_call = mock_agent_instance.model_copy.call_args
agent_context = model_copy_call[1]['update']['agent_context']
assert agent_context.system_message_suffix.startswith(
PLANNING_AGENT_INSTRUCTION
)
assert existing_suffix in agent_context.system_message_suffix
# Assert — agent_context goes to Agent() constructor
call_kwargs = mock_agent_class.call_args[1]
suffix = call_kwargs['agent_context'].system_message_suffix
assert suffix.startswith(PLANNING_AGENT_INSTRUCTION)
assert existing_suffix in suffix
@patch(
'openhands.app_server.app_conversation.live_status_app_conversation_service.get_default_tools'
@@ -1120,10 +1131,9 @@ class TestLiveStatusAppConversationService:
self.mock_user.condenser_max_size,
)
# Assert - verify no planning instruction for default agent
model_copy_call = mock_agent_instance.model_copy.call_args
agent_context = model_copy_call[1]['update']['agent_context']
assert agent_context.system_message_suffix is None
# Assert — agent_context goes to Agent() constructor
call_kwargs = mock_agent_class.call_args[1]
assert call_kwargs['agent_context'].system_message_suffix is None
@pytest.mark.asyncio
async def test_finalize_conversation_request_with_skills(self):