[AgentBench evaluation] set run_as_devin to true (#2269)

Co-authored-by: Leo <ifuryst@gmail.com>
This commit is contained in:
Boxuan Li
2024-06-05 00:53:33 -07:00
committed by GitHub
parent 1b25a37ad4
commit 208b1461ca

View File

@@ -24,7 +24,8 @@ sandbox_timeout = 120
ssh_hostname = "localhost"
use_host_network = false
-run_as_devin = false
# AgentBench specific
+run_as_devin = true
enable_auto_lint = true
[eval_gpt35_turbo]