feat: add client password argument to multiple agents and scripts

- Introduced a `--client_password` command-line argument in `run_multienv_aguvis.py`, `run_multienv_claude.py`, and `run_multienv_gta1.py` for enhanced security and flexibility.
- Updated agent classes (`PromptAgent`, `AguvisAgent`, `GTA1Agent`) to accept and utilize `client_password` for improved configuration.
- Modified evaluation guidelines to reflect the new client password requirement.
- Kept existing logic intact; the changes only extend functionality.
This commit is contained in:
yuanmengqi
2025-07-27 16:11:23 +00:00
parent 122b16742b
commit 523d553e88
9 changed files with 627 additions and 28 deletions

View File

@@ -14,8 +14,7 @@ from tqdm import tqdm
from multiprocessing import Process, Manager, current_process
import lib_run_single
from desktop_env.desktop_env import DesktopEnv
from mm_agents.anthropic import AnthropicAgent as PromptAgent
from mm_agents.anthropic import AnthropicAgent
# .env
from dotenv import load_dotenv
@@ -152,7 +151,7 @@ def run_env_tasks(task_queue, args, shared_scores):
client_password=args.client_password
)
active_environments.append(env)
agent = PromptAgent(
agent = AnthropicAgent(
env=env,
model=args.model,
max_tokens=args.max_tokens,
@@ -161,10 +160,9 @@ def run_env_tasks(task_queue, args, shared_scores):
action_space=args.action_space,
observation_type=args.observation_type,
max_trajectory_length=args.max_trajectory_length,
client_password=args.client_password,
provider_name=args.provider_name,
screen_width=args.screen_width,
screen_height=args.screen_height
screen_height=args.screen_height,
)
logger.info(f"Process {current_process().name} started.")
while True: