mirror of
https://github.com/trycua/computer.git
synced 2026-02-18 12:28:51 -06:00
Remove dataset size limit during HUD evaluation
This commit is contained in:
@@ -198,7 +198,7 @@
|
||||
" model=\"openai/computer-use-preview\", # Or any supported model string\n",
|
||||
" max_concurrent=20, # Tune to your infra\n",
|
||||
" max_steps=50, # Safety cap per task\n",
|
||||
" split=\"train[:3]\" # Limit to just 3 tasks\n",
|
||||
" #split=\"train[:5]\" # Limit to just 5 tasks\n",
|
||||
")\n",
|
||||
"\n",
|
||||
"# results is a list from hud.datasets.run_dataset; inspect/aggregate as needed\n",
|
||||
|
||||
Reference in New Issue
Block a user