feat: add client password argument to multiple agents and scripts

- Introduced `--client_password` argument in `run_multienv_aguvis.py`, `run_multienv_claude.py`, and `run_multienv_gta1.py` for enhanced security and flexibility.
- Updated agent classes (`PromptAgent`, `AguvisAgent`, `GTA1Agent`) to accept and utilize `client_password` for improved configuration.
- Modified evaluation guidelines to reflect the new client password requirement.
- Ensured existing logic remains intact while enhancing functionality for better user experience.
2025-07-27 16:11:23 +00:00
parent 122b16742b
commit 523d553e88
9 changed files with 627 additions and 28 deletions
--- a/run_multienv_claude.py
+++ b/run_multienv_claude.py
@@ -14,8 +14,7 @@ from tqdm import tqdm
 from multiprocessing import Process, Manager, current_process
 import lib_run_single
 from desktop_env.desktop_env import DesktopEnv
-from mm_agents.anthropic import AnthropicAgent as PromptAgent
-
+from mm_agents.anthropic import AnthropicAgent

 # .env
 from dotenv import load_dotenv
@@ -152,7 +151,7 @@ def run_env_tasks(task_queue, args, shared_scores):
            client_password=args.client_password
        )
        active_environments.append(env)
-        agent = PromptAgent(
+        agent = AnthropicAgent(
            env=env,
            model=args.model,
            max_tokens=args.max_tokens,
@@ -161,10 +160,9 @@ def run_env_tasks(task_queue, args, shared_scores):
            action_space=args.action_space,
            observation_type=args.observation_type,
            max_trajectory_length=args.max_trajectory_length,
-            client_password=args.client_password,
            provider_name=args.provider_name,
            screen_width=args.screen_width,
-            screen_height=args.screen_height
+            screen_height=args.screen_height,
        )
        logger.info(f"Process {current_process().name} started.")
        while True: