Files
sci-gui-agent-benchmark/run_operator_fix.sh
yuanmengqi cb070307ee merge code
2025-07-15 14:57:14 +00:00

9 lines
274 B
Bash

# Launch run_multienv_openaicua.py with the fixed settings listed below.
#
# Usage: bash run_operator_fix.sh [extra args...]
#
# Every path used here is relative (the Python script itself, the
# ./results_operator_full_test_0713_gdrive2 result directory and
# evaluation_examples/test.json), so invoke this from the directory that
# contains run_multienv_openaicua.py.
#
# Any arguments given to this script are appended after the fixed flags, so a
# one-off run can add options without editing this file. With no arguments,
# "$@" expands to nothing and the command is exactly the fixed set below.
# NOTE(review): whether a repeated flag overrides the earlier value depends on
# how run_multienv_openaicua.py parses its arguments -- confirm before relying
# on overrides.
python run_multienv_openaicua.py \
  --headless \
  --observation_type screenshot \
  --model computer-use-preview \
  --result_dir ./results_operator_full_test_0713_gdrive2 \
  --test_all_meta_path evaluation_examples/test.json \
  --max_steps 100 \
  --num_envs 10 \
  --provider_name aws \
  "$@"