Remove dataset size limit during HUD evaluation

This commit is contained in:
James Murdza
2025-09-12 12:55:43 -04:00
parent 68ecdcc99a
commit 4b3e2077fb

View File

@@ -198,7 +198,7 @@
" model=\"openai/computer-use-preview\", # Or any supported model string\n",
" max_concurrent=20, # Tune to your infra\n",
" max_steps=50, # Safety cap per task\n",
-" split=\"train[:3]\" # Limit to just 3 tasks\n",
+" #split=\"train[:5]\" # Limit to just 5 tasks\n",
")\n",
"\n",
"# results is a list from hud.datasets.run_dataset; inspect/aggregate as needed\n",