Files
sci-gui-agent-benchmark/run_operator.sh
yuanmengqi ea51f5264a fix chrome
2025-06-30 08:07:24 +00:00

9 lines
268 B
Bash

# Launch run_multienv_openaicua.py with a fixed set of command-line options.
#
# The script name and both path arguments are relative, so run this from the
# directory that contains run_multienv_openaicua.py and evaluation_examples/.
#
# NOTE(review): the flag semantics are defined by run_multienv_openaicua.py,
# which is not shown here. Reading off the flag names, this presumably runs
# headless, uses screenshots as observations, targets the
# "computer-use-preview" model, reads the task list from
# evaluation_examples/test_fix_chrome.json, writes results under
# ./results_chrome_operator, uses region us-east-1, allows up to 150 steps,
# and uses 10 environments -- confirm against that script.
#
# The exit status of this file is the exit status of the python process.
python run_multienv_openaicua.py \
    --headless \
    --observation_type screenshot \
    --model computer-use-preview \
    --result_dir ./results_chrome_operator \
    --test_all_meta_path evaluation_examples/test_fix_chrome.json \
    --region us-east-1 \
    --max_steps 150 \
    --num_envs 10