mirror of
https://github.com/OpenHands/OpenHands.git
synced 2026-03-22 05:37:20 +08:00
feat: Support Tau-Bench and BFCL evaluation benchmarks (#11953)
Co-authored-by: openhands <openhands@all-hands.dev>
This commit is contained in:
@@ -192,6 +192,9 @@ datasets = "*"
|
||||
joblib = "*"
|
||||
swebench = { git = "https://github.com/ryanhoangt/SWE-bench.git", rev = "fix-modal-patch-eval" }
|
||||
multi-swe-bench = "0.1.2"
|
||||
pandas = "*"
|
||||
# tau-bench = { git = "https://github.com/sierra-research/tau-bench.git" }
|
||||
# bfcl-eval = "*"  # TODO: verify the exact package name and install source before enabling this dependency
|
||||
|
||||
[tool.poetry.group.testgeneval.dependencies]
|
||||
fuzzywuzzy = "^0.18.0"
|
||||
|
||||
Reference in New Issue
Block a user