feat: add client password argument to multiple agents and scripts

- Introduced `--client_password` argument in `run_multienv_aguvis.py`, `run_multienv_claude.py`, and `run_multienv_gta1.py` for enhanced security and flexibility.
- Updated agent classes (`PromptAgent`, `AguvisAgent`, `GTA1Agent`) to accept and utilize `client_password` for improved configuration.
- Modified evaluation guidelines to reflect the new client password requirement.
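- Existing logic is otherwise unchanged, except that in at least one runner script the environment's `provider_name` is now taken from a new `--provider_name` argument (default `aws`) instead of the previously hard-coded `docker`.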
This commit is contained in:
yuanmengqi
2025-07-27 16:11:23 +00:00
parent 122b16742b
commit 523d553e88
9 changed files with 627 additions and 28 deletions

View File

@@ -80,6 +80,12 @@ def config() -> argparse.Namespace:
default="screenshot",
help="Observation type",
)
+parser.add_argument(
+"--provider_name", type=str, default="aws", choices=["aws", "virtualbox", "vmware", "docker", "azure"], help="Provider name"
+)
+parser.add_argument(
+"--client_password", type=str, default="", help="Client password"
+)
parser.add_argument("--screen_width", type=int, default=1920)
parser.add_argument("--screen_height", type=int, default=1080)
parser.add_argument("--sleep_after_execution", type=float, default=2.0)
@@ -216,6 +222,7 @@ def test(args: argparse.Namespace, test_all_meta: dict) -> None:
temperature=args.temperature,
action_space=args.action_space,
observation_type=args.observation_type,
+client_password=args.client_password
)
agents.append(agent)
@@ -227,7 +234,8 @@ def test(args: argparse.Namespace, test_all_meta: dict) -> None:
os_type="Ubuntu",
require_a11y_tree=args.observation_type
in ["a11y_tree", "screenshot_a11y_tree", "som"],
-provider_name = "docker"
+provider_name = args.provider_name,
+client_password=args.client_password
)
envs.append(env)