Files
sci-gui-agent-benchmark/evaluation_examples/examples/multi_apps/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a.json
yuanmengqi e433f35c1f feat: standardize configuration fields across all evaluation examples
- Add `fixed_ip` field to all 369 JSON files in examples directory
  - Set to `true` for 8 files listed in google_chrome.json multi_apps
  - Set to `false` for remaining 361 files
- Add `possibility_of_env_change` field to 363 JSON files missing this field
  - Set to "low" for newly added fields
  - Preserve existing values (4 medium, 2 high) for 6 files that already had this field

This ensures consistent configuration schema across all evaluation examples
while maintaining backward compatibility with existing settings.
2025-07-16 13:45:34 +00:00

127 lines
3.1 KiB
JSON
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

{
"id": "6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a",
"snapshot": "multiapps",
"instruction": "I want to record the host cities of the three machine learning conferences for each year from 2013 to 2019 (inclusive). I have listed the names and years of the conferences in the Excel sheet. Please fill in the missing locations.",
"source": "author",
"config": [
{
"type": "download",
"parameters": {
"files": [
{
"url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a/Conference.xlsx",
"path": "/home/user/Desktop/ConferenceCity.xlsx"
}
]
}
},
{
"type": "open",
"parameters": {
"path": "/home/user/Desktop/ConferenceCity.xlsx"
}
}
],
"trajectory": "trajectories/",
"related_apps": [
"calc",
"chrome",
"os"
],
"evaluator": {
"postconfig": [
{
"type": "download",
"parameters": {
"files": [
{
"url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a/ConferenceCity%20Gold.xlsx",
"path": "/home/user/Desktop/ConferenceCity_Gold.xlsx"
}
]
}
},
{
"type": "activate_window",
"parameters": {
"window_name": "ConferenceCity.xlsx - LibreOffice Calc"
}
},
{
"type": "execute",
"parameters": {
"command": [
"python",
"-c",
"import pyautogui; import time; pyautogui.hotkey(\"ctrl\", \"s\"); time.sleep(0.5);"
]
}
}
],
"func": "compare_conference_city_in_order",
"expected": {
"type": "rule",
"rules": {
"expected": [
"Scottsdale",
"Atlanta",
[
"Lake Tahoe",
"Stateline"
],
[
"Banff",
"Alberta's Rockies",
"Albertas Rockies"
],
"Beijing",
[
"Montreal",
"Montréal"
],
"San Diego",
"Lille",
[
"Montreal",
"Montréal"
],
"San Juan",
[
"New York",
"New York City",
"NYC"
],
"Barcelona",
"Toulon",
"Sydney",
[
"Los Angeles",
"Long Beach",
"LA"
],
"Vancouver",
"Stockholm",
[
"Montreal",
"Montréal"
],
"New Orleans",
[
"Los Angeles",
"Long Beach",
"LA"
],
"Vancouver"
]
}
},
"result": {
"type": "vm_file",
"path": "/home/user/Desktop/ConferenceCity.xlsx",
"dest": "ConferenceCity.xlsx"
}
},
"proxy": false,
"fixed_ip": false,
"possibility_of_env_change": "low"
}