From f3151e622500d4bd49b9e1c8a210926e757db81c Mon Sep 17 00:00:00 2001 From: TeAka Network Date: Wed, 4 Jun 2025 20:32:42 +1200 Subject: [PATCH 1/7] Update README.md (#206) --- desktop_env/server/README.md | 4 ---- 1 file changed, 4 deletions(-) diff --git a/desktop_env/server/README.md b/desktop_env/server/README.md index 3b80401..edf79e7 100644 --- a/desktop_env/server/README.md +++ b/desktop_env/server/README.md @@ -653,9 +653,5 @@ You can use accerciser to check the accessibility tree on GNOME VM. sudo apt install accerciser ``` - -## [Windows](https://huggingface.co/datasets/xlangai/windows_osworld) -Coming soon... - ## [MacOS](https://huggingface.co/datasets/xlangai/macos_osworld) Coming soon... From 5959c0846e9e67773ee117841096f1c448e605da Mon Sep 17 00:00:00 2001 From: chenjix <211250101@smail.nju.edu.cn> Date: Sat, 7 Jun 2025 00:13:38 +0800 Subject: [PATCH 2/7] Fix libreoffice impress evaluation --- desktop_env/evaluators/metrics/slides.py | 19 +++++++++++++++++-- desktop_env/evaluators/metrics/vlc.py | 2 +- 2 files changed, 18 insertions(+), 3 deletions(-) diff --git a/desktop_env/evaluators/metrics/slides.py b/desktop_env/evaluators/metrics/slides.py index 90eea64..307752f 100644 --- a/desktop_env/evaluators/metrics/slides.py +++ b/desktop_env/evaluators/metrics/slides.py @@ -389,10 +389,22 @@ def evaluate_presentation_fill_to_rgb_distance(pptx_file, rules): except: original_rgb = None + def get_rgb_from_color(color): + try: + if hasattr(color, "rgb"): + return color.rgb + else: + return None + except: + return None + def slide_fill_distance_to_rgb(_slide, _rgb, _original_rgb): fill = _slide.background.fill if fill.type == 1: - r1, g1, b1 = fill.fore_color.rgb + color_rgb = get_rgb_from_color(fill.fore_color) + if color_rgb is None: + return 1 + r1, g1, b1 = color_rgb r2, g2, b2 = _rgb if _original_rgb is not None: @@ -404,7 +416,10 @@ def evaluate_presentation_fill_to_rgb_distance(pptx_file, rules): elif fill.type == 5: master_fill = _slide.slide_layout.slide_master.background.fill if master_fill.type == 1: - r1, g1, b1 = master_fill.fore_color.rgb + color_rgb = get_rgb_from_color(master_fill.fore_color) + if color_rgb is None: + return 1 + r1, g1, b1 = color_rgb else: return 1 r2, g2, b2 = _rgb diff --git a/desktop_env/evaluators/metrics/vlc.py b/desktop_env/evaluators/metrics/vlc.py index 94892bd..5af7b50 100644 --- a/desktop_env/evaluators/metrics/vlc.py +++ b/desktop_env/evaluators/metrics/vlc.py @@ -117,7 +117,7 @@ def compare_images(image1_path, image2_path, **options): similarity_index = ssim(image1_array, image2_array) epsilon = 0.01 - if base_score is None: + if base_score is not None: if similarity_index >= base_score + epsilon: return (similarity_index - base_score) / (1 - base_score) else: From 8471394cc1ee16bfedaff5c933995d886eae56cd Mon Sep 17 00:00:00 2001 From: yuanmengqi Date: Sat, 7 Jun 2025 15:57:18 +0000 Subject: [PATCH 3/7] add branch feat/aws-provider-support --- evaluation_examples/test_0607.json | 5 +++++ run_operator_vlc.sh | 9 +++++++++ 2 files changed, 14 insertions(+) create mode 100644 evaluation_examples/test_0607.json create mode 100644 run_operator_vlc.sh diff --git a/evaluation_examples/test_0607.json b/evaluation_examples/test_0607.json new file mode 100644 index 0000000..574901b --- /dev/null +++ b/evaluation_examples/test_0607.json @@ -0,0 +1,5 @@ +{ + "vlc": [ + "8d9fd4e2-6fdb-46b0-b9b9-02f06495c62f" + ] +} \ No newline at end of file diff --git a/run_operator_vlc.sh b/run_operator_vlc.sh new file mode 100644 index 0000000..b6c1e89 --- /dev/null +++ b/run_operator_vlc.sh @@ -0,0 +1,9 @@ +python run_multienv_openaicua.py \ + --headless \ + --observation_type screenshot \ + --model computer-use-preview \ + --result_dir ./results_vlc_retest \ + --test_all_meta_path evaluation_examples/test_0607.json \ + --region us-east-1 \ + --max_steps 3 \ + --num_envs 1 From 9fa768d24d48afc434e786bf629e337f9d9e54dc Mon Sep 17 00:00:00 2001 From: yuanmengqi Date: Sat, 7 Jun 2025 17:26:45 +0000 Subject: [PATCH 4/7] refactor: update URLs in multiple JSON files to ensure proper encoding of special characters --- .../7efeb4b1-3d19-4762-b163-63328d66303b.json | 4 ++-- .../21760ecb-8f62-40d2-8d85-0cee5725cb72.json | 2 +- .../0a0faba3-5580-44df-965d-f562a99b291c.json | 4 ++-- .../bb8ccc78-479f-4a2f-a71e-d565e439436b.json | 2 +- .../0c825995-5b70-4526-b663-113f4c999dd2.json | 6 +++--- .../185f29bd-5da0-40a6-b69c-ba7f4e0324ef.json | 16 ++++++++-------- .../1f18aa87-af6f-41ef-9853-cdb8f32ebdea.json | 10 +++++----- .../2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e.json | 18 +++++++++--------- .../337d318b-aa07-4f4f-b763-89d9a2dd013f.json | 8 ++++---- .../3a93cae4-ad3e-403e-8c12-65303b271818.json | 14 +++++++------- .../3f05f3b9-29ba-4b6b-95aa-2204697ffc06.json | 10 +++++----- .../42d25c08-fb87-4927-8b65-93631280a26f.json | 2 +- .../5bc63fb9-276a-4439-a7c1-9dc76401737f.json | 2 +- .../6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a.json | 2 +- .../716a6079-22da-47f1-ba73-c9d58f986a38.json | 2 +- .../7ff48d5b-2df2-49da-b500-a5150ffc7f18.json | 2 +- .../869de13e-bef9-4b91-ba51-f6708c40b096.json | 6 +++--- .../873cafdd-a581-47f6-8b33-b9696ddb7b05.json | 2 +- .../8e116af7-7db7-4e35-a68b-b0939c066c78.json | 2 +- .../9f3bb592-209d-43bc-bb47-d77d9df56504.json | 4 ++-- .../a0b9dc9c-fc07-4a88-8c5d-5e3ecad91bcb.json | 4 ++-- .../a74b607e-6bb5-4ea8-8a7c-5d97c7bbcd2a.json | 2 +- .../dd60633f-2c72-42ba-8547-6f2c8cb0fdb0.json | 2 +- .../deec51c9-3b1e-4b9e-993c-4776f20e8bb2.json | 4 ++-- .../f5c13cdd-205c-4719-a562-348ae5cd1d91.json | 2 +- .../d38192b0-17dc-4e1d-99c3-786d0117de77.json | 2 +- .../386dbd0e-0241-4a0a-b6a2-6704fba26b1c.json | 2 +- .../59f21cfb-0120-4326-b255-a5b827b38967.json | 2 +- .../8d9fd4e2-6fdb-46b0-b9b9-02f06495c62f.json | 2 +- .../8f080098-ddb1-424c-b438-4e96e5e4786e.json | 4 ++-- .../efcf0d81-0835-4880-b2fd-d866e8bc2294.json | 2 +- .../fba2c100-79e8-42df-ae74-b592418d54f4.json | 2 +- .../7efeb4b1-3d19-4762-b163-63328d66303b.json | 4 ++-- .../ecb0df7a-4e8d-4a03-b162-053391d3afaf.json | 2 +- .../185f29bd-5da0-40a6-b69c-ba7f4e0324ef.json | 16 ++++++++-------- .../1f18aa87-af6f-41ef-9853-cdb8f32ebdea.json | 10 +++++----- .../2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e.json | 18 +++++++++--------- .../3a93cae4-ad3e-403e-8c12-65303b271818.json | 14 +++++++------- .../6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a.json | 2 +- .../74d5859f-ed66-4d3e-aa0e-93d7a592ce41.json | 4 ++-- .../8e116af7-7db7-4e35-a68b-b0939c066c78.json | 2 +- .../deec51c9-3b1e-4b9e-993c-4776f20e8bb2.json | 4 ++-- .../e528b65e-1107-4b8c-8988-490e4fece599.json | 2 +- 43 files changed, 113 insertions(+), 113 deletions(-) diff --git a/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json b/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json index aa1e30a..a965e02 100644 --- a/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json +++ b/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b/Order_Sales_Serial#.xlsx", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b/Order_Sales_Serial%23.xlsx", "path": "/home/user/Order_Sales_Serial#.xlsx" } ] @@ -61,7 +61,7 @@ "func": "compare_table", "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b/Order_Sales_Serial#_gold.xlsx", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b/Order_Sales_Serial%23_gold.xlsx", "dest": "Order_Sales_Serial#_gold.xlsx" }, "result": { diff --git a/evaluation_examples/examples/libreoffice_impress/21760ecb-8f62-40d2-8d85-0cee5725cb72.json b/evaluation_examples/examples/libreoffice_impress/21760ecb-8f62-40d2-8d85-0cee5725cb72.json index 30cdf53..82a830b 100644 --- a/evaluation_examples/examples/libreoffice_impress/21760ecb-8f62-40d2-8d85-0cee5725cb72.json +++ b/evaluation_examples/examples/libreoffice_impress/21760ecb-8f62-40d2-8d85-0cee5725cb72.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_impress/21760ecb-8f62-40d2-8d85-0cee5725cb72/Ch4 Video Effect.pptx", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_impress/21760ecb-8f62-40d2-8d85-0cee5725cb72/Ch4%20Video%20Effect.pptx", "path": "/home/user/Desktop/Ch4 Video Effect.pptx" } ] diff --git a/evaluation_examples/examples/libreoffice_writer/0a0faba3-5580-44df-965d-f562a99b291c.json b/evaluation_examples/examples/libreoffice_writer/0a0faba3-5580-44df-965d-f562a99b291c.json index 0da08f7..4b9b405 100644 --- a/evaluation_examples/examples/libreoffice_writer/0a0faba3-5580-44df-965d-f562a99b291c.json +++ b/evaluation_examples/examples/libreoffice_writer/0a0faba3-5580-44df-965d-f562a99b291c.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_writer/0a0faba3-5580-44df-965d-f562a99b291c/04 CHIN9505 EBook Purchasing info 2021 Jan.docx", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_writer/0a0faba3-5580-44df-965d-f562a99b291c/04%20CHIN9505%20EBook%20Purchasing%20info%202021%20Jan.docx", "path": "/home/user/Desktop/04 CHIN9505 EBook Purchasing info 2021 Jan.docx" } ] @@ -55,7 +55,7 @@ "func": "check_tabstops", "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_writer/0a0faba3-5580-44df-965d-f562a99b291c/04 CHIN9505 EBook Purchasing info 2021 Jan_Gold.docx", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_writer/0a0faba3-5580-44df-965d-f562a99b291c/04%20CHIN9505%20EBook%20Purchasing%20info%202021%20Jan_Gold.docx", "dest": "04 CHIN9505 EBook Purchasing info 2021 Jan_Gold.docx" }, "result": { diff --git a/evaluation_examples/examples/libreoffice_writer/bb8ccc78-479f-4a2f-a71e-d565e439436b.json b/evaluation_examples/examples/libreoffice_writer/bb8ccc78-479f-4a2f-a71e-d565e439436b.json index 8d77f97..87ee2c0 100644 --- a/evaluation_examples/examples/libreoffice_writer/bb8ccc78-479f-4a2f-a71e-d565e439436b.json +++ b/evaluation_examples/examples/libreoffice_writer/bb8ccc78-479f-4a2f-a71e-d565e439436b.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_writer/bb8ccc78-479f-4a2f-a71e-d565e439436b/The Wonders of Our Solar System.docx", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_writer/bb8ccc78-479f-4a2f-a71e-d565e439436b/The%20Wonders%20of%20Our%20Solar%20System.docx", "path": "/home/user/Desktop/The Wonders of Our Solar System.docx" } ] diff --git a/evaluation_examples/examples/multi_apps/0c825995-5b70-4526-b663-113f4c999dd2.json b/evaluation_examples/examples/multi_apps/0c825995-5b70-4526-b663-113f4c999dd2.json index 743d51e..63fc18f 100644 --- a/evaluation_examples/examples/multi_apps/0c825995-5b70-4526-b663-113f4c999dd2.json +++ b/evaluation_examples/examples/multi_apps/0c825995-5b70-4526-b663-113f4c999dd2.json @@ -73,11 +73,11 @@ }, { "path": "/home/user/Desktop/GE Guidebook.pdf", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/0c825995-5b70-4526-b663-113f4c999dd2/GE Guidebook.pdf" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/0c825995-5b70-4526-b663-113f4c999dd2/GE%20Guidebook.pdf" }, { "path": "/home/user/Desktop/assessing_and_reporting_water_quality(q&a).pdf", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/0c825995-5b70-4526-b663-113f4c999dd2/assessing_and_reporting_water_quality(q&a).pdf" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/0c825995-5b70-4526-b663-113f4c999dd2/assessing_and_reporting_water_quality%28q%26a%29.pdf" } ] } @@ -102,7 +102,7 @@ }, "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/0c825995-5b70-4526-b663-113f4c999dd2/environment_policy_report (draft)_gold.docx", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/0c825995-5b70-4526-b663-113f4c999dd2/environment_policy_report%20%28draft%29_gold.docx", "dest": "environment_policy_report (draft)_gold.docx" }, "options": { diff --git a/evaluation_examples/examples/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef.json b/evaluation_examples/examples/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef.json index 97cc4c1..3d7b88c 100644 --- a/evaluation_examples/examples/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef.json +++ b/evaluation_examples/examples/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef.json @@ -10,7 +10,7 @@ "files": [ { "path": "/home/user/Desktop/Employee Performance Evaluation Summary.xlsx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Employee Performance Evaluation Summary.xlsx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Employee%20Performance%20Evaluation%20Summary.xlsx" }, { "path": "/home/user/Desktop/review_template.pdf", @@ -49,13 +49,13 @@ "result": { "type": "cloud_file", "path": [ - "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Alex Lee.pdf", - "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/David Wilson.pdf", - "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Emily Johnson.pdf", - "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/John Doe.pdf", - "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Linda Green.pdf", - "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Michael Brown.pdf", - "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Sophia Carter.pdf" + "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Alex%20Lee.pdf", + "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/David%20Wilson.pdf", + "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Emily%20Johnson.pdf", + "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/John%20Doe.pdf", + "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Linda%20Green.pdf", + "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Michael%20Brown.pdf", + "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Sophia%20Carter.pdf" ], "dest": [ "Alex Lee_Gold.pdf", diff --git a/evaluation_examples/examples/multi_apps/1f18aa87-af6f-41ef-9853-cdb8f32ebdea.json b/evaluation_examples/examples/multi_apps/1f18aa87-af6f-41ef-9853-cdb8f32ebdea.json index 5e29730..95889b9 100644 --- a/evaluation_examples/examples/multi_apps/1f18aa87-af6f-41ef-9853-cdb8f32ebdea.json +++ b/evaluation_examples/examples/multi_apps/1f18aa87-af6f-41ef-9853-cdb8f32ebdea.json @@ -24,15 +24,15 @@ "files": [ { "path": "/home/user/Desktop/Grammer test 1.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammer test 1.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammer%20test%201.docx" }, { "path": "/home/user/Desktop/Grammer test 2.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammar test 2.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammar%20test%202.docx" }, { "path": "/home/user/Desktop/Grammer test 3.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammer test 3.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammer%20test%203.docx" }, { "path": "/home/user/Desktop/Answer.docx", @@ -56,11 +56,11 @@ }, { "path": "/home/user/Desktop/Public Lecture Teaching Plan.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public Lecture Teaching Plan.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public%20Lecture%20Teaching%20Plan.docx" }, { "path": "/home/user/Desktop/Course Timetable.xlsx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Course Timetable.xlsx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Course%20Timetable.xlsx" } ] } diff --git a/evaluation_examples/examples/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e.json b/evaluation_examples/examples/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e.json index fd22983..e50d572 100644 --- a/evaluation_examples/examples/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e.json +++ b/evaluation_examples/examples/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e.json @@ -24,15 +24,15 @@ "files": [ { "path": "/home/user/Desktop/students work/Zheng He .docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Zheng He .docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Zheng%20He%20.docx" }, { "path": "/home/user/Desktop/students work/The literature reviews of weekly readings.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/The literature reviews of weekly readings.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/The%20literature%20reviews%20of%20weekly%20readings.docx" }, { "path": "/home/user/Desktop/students work/The British Justice System.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/The British Justice System.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/The%20British%20Justice%20System.docx" }, { "path": "/home/user/Desktop/students work/quiz2.docx", @@ -44,11 +44,11 @@ }, { "path": "/home/user/Desktop/students work/Q1&2&3.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Q1&2&3.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Q1%262%263.docx" }, { "path": "/home/user/Desktop/students work/Photo Ethics in Journalism.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Photo Ethics in Journalism.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Photo%20Ethics%20in%20Journalism.docx" }, { "path": "/home/user/Desktop/students work/cassie.docx", @@ -56,7 +56,7 @@ }, { "path": "/home/user/Desktop/students work/case study.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case study.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case%20study.docx" }, { "path": "/home/user/Desktop/Grammar rules PDF/irregularrules02.pdf", @@ -76,11 +76,11 @@ }, { "path": "/home/user/Desktop/Public Lecture Teaching Plan.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public Lecture Teaching Plan.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public%20Lecture%20Teaching%20Plan.docx" }, { "path": "/home/user/Desktop/Course Timetable.xlsx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Course Timetable.xlsx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Course%20Timetable.xlsx" } ] } @@ -117,7 +117,7 @@ "func": "compare_references", "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case study gold.docx", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case%20study%20gold.docx", "dest": "case study gold.docx" }, "result": { diff --git a/evaluation_examples/examples/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f.json b/evaluation_examples/examples/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f.json index f4c8918..e8abf4e 100644 --- a/evaluation_examples/examples/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f.json +++ b/evaluation_examples/examples/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f.json @@ -10,15 +10,15 @@ "files": [ { "path": "/home/user/Desktop/invoice TII-20220301-90.pdf", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f/invoice TII-20220301-90.pdf" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f/invoice%20TII-20220301-90.pdf" }, { "path": "/home/user/Desktop/Invoice # GES-20220215-82.pdf", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f/Invoice # GES-20220215-82.pdf" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f/Invoice%20%2523%20GES-20220215-82.pdf" }, { "path": "/home/user/Desktop/Invoice # 243729.pdf", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f/Invoice # 243729.pdf" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f/Invoice%20%2523%20243729.pdf" }, { "path": "/home/user/Desktop/Bank-Statement.pdf", @@ -42,7 +42,7 @@ }, "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f/Invoice # 243729.pdf", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/337d318b-aa07-4f4f-b763-89d9a2dd013f/Invoice%20%2523%20243729.pdf", "dest": "Invoice # 243729 Gold.pdf" } }, diff --git a/evaluation_examples/examples/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818.json b/evaluation_examples/examples/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818.json index 3bd61a6..0b66efa 100644 --- a/evaluation_examples/examples/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818.json +++ b/evaluation_examples/examples/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818.json @@ -24,7 +24,7 @@ "files": [ { "path": "/home/user/Desktop/students work/Zheng He .docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Zheng He .docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Zheng%20He%20.docx" }, { "path": "/home/user/Desktop/students work/cassie.docx", @@ -32,7 +32,7 @@ }, { "path": "/home/user/Desktop/students work/case study.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case study.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case%20study.docx" }, { "path": "/home/user/Desktop/Grammar rules PDF/irregularrules02.pdf", @@ -52,11 +52,11 @@ }, { "path": "/home/user/Desktop/Public Lecture Teaching Plan.docx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public Lecture Teaching Plan.docx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public%20Lecture%20Teaching%20Plan.docx" }, { "path": "/home/user/Desktop/Course Timetable.xlsx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818/Course Timetable.xlsx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818/Course%20Timetable.xlsx" } ] } @@ -118,17 +118,17 @@ "expected": [ { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818/Course Timetable Gold.xlsx", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818/Course%20Timetable%20Gold.xlsx", "dest": "Course Timetable gold.xlsx" }, { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818/Course Timetable Gold 2.xlsx", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818/Course%20Timetable%20Gold%202.xlsx", "dest": "Course Timetable gold 2.xlsx" }, { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818/Course Timetable Gold 3.xlsx", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3a93cae4-ad3e-403e-8c12-65303b271818/Course%20Timetable%20Gold%203.xlsx", "dest": "Course Timetable gold 3.xlsx" } ], diff --git a/evaluation_examples/examples/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06.json b/evaluation_examples/examples/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06.json index 66408c2..8c389c9 100644 --- a/evaluation_examples/examples/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06.json +++ b/evaluation_examples/examples/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06.json @@ -63,23 +63,23 @@ }, { "path": "/home/user/Music/Cheng Xiang - Missing You.mp3", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06/Cheng Xiang - Missing You.mp3" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06/Cheng%20Xiang%20-%20Missing%20You.mp3" }, { "path": "/home/user/Music/Han Baoyi - Tears of Dancing Girl.mp3", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06/Han Baoyi - Tears of Dancing Girl.mp3" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06/Han%20Baoyi%20-%20Tears%20of%20Dancing%20Girl.mp3" }, { "path": "/home/user/Music/Huang An - I Know Missing is Painful.mp3", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06/Huang An - I Know Missing is Painful.mp3" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06/Huang%20An%20-%20I%20Know%20Missing%20is%20Painful.mp3" }, { "path": "/home/user/Music/Chen Shaohua - Red Daughter.mp3", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06/Chen Shaohua - Red Daughter.mp3" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06/Chen%20Shaohua%20-%20Red%20Daughter.mp3" }, { "path": "/home/user/Music/Zhou Xuan - Nights in Shanghai.mp3", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06/Zhou Xuan - Nights in Shanghai.mp3" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/3f05f3b9-29ba-4b6b-95aa-2204697ffc06/Zhou%20Xuan%20-%20Nights%20in%20Shanghai.mp3" } ] } diff --git a/evaluation_examples/examples/multi_apps/42d25c08-fb87-4927-8b65-93631280a26f.json b/evaluation_examples/examples/multi_apps/42d25c08-fb87-4927-8b65-93631280a26f.json index b335a9e..710ac31 100644 --- a/evaluation_examples/examples/multi_apps/42d25c08-fb87-4927-8b65-93631280a26f.json +++ b/evaluation_examples/examples/multi_apps/42d25c08-fb87-4927-8b65-93631280a26f.json @@ -152,7 +152,7 @@ }, "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/42d25c08-fb87-4927-8b65-93631280a26f/Pass Through.epub", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/42d25c08-fb87-4927-8b65-93631280a26f/Pass%20Through.epub", "dest": "Pass Through Gold.epub" } }, diff --git a/evaluation_examples/examples/multi_apps/5bc63fb9-276a-4439-a7c1-9dc76401737f.json b/evaluation_examples/examples/multi_apps/5bc63fb9-276a-4439-a7c1-9dc76401737f.json index f84850f..8143f2f 100644 --- a/evaluation_examples/examples/multi_apps/5bc63fb9-276a-4439-a7c1-9dc76401737f.json +++ b/evaluation_examples/examples/multi_apps/5bc63fb9-276a-4439-a7c1-9dc76401737f.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/5bc63fb9-276a-4439-a7c1-9dc76401737f/LLM results.json", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/5bc63fb9-276a-4439-a7c1-9dc76401737f/LLM%20results.json", "path": "/home/user/Desktop/llm_answers.json" } ] diff --git a/evaluation_examples/examples/multi_apps/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a.json b/evaluation_examples/examples/multi_apps/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a.json index 0a595c6..2727d8b 100644 --- a/evaluation_examples/examples/multi_apps/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a.json +++ b/evaluation_examples/examples/multi_apps/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a.json @@ -35,7 +35,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a/ConferenceCity Gold.xlsx", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a/ConferenceCity%20Gold.xlsx", "path": "/home/user/Desktop/ConferenceCity_Gold.xlsx" } ] diff --git a/evaluation_examples/examples/multi_apps/716a6079-22da-47f1-ba73-c9d58f986a38.json b/evaluation_examples/examples/multi_apps/716a6079-22da-47f1-ba73-c9d58f986a38.json index ccea1bf..30738d3 100644 --- a/evaluation_examples/examples/multi_apps/716a6079-22da-47f1-ba73-c9d58f986a38.json +++ b/evaluation_examples/examples/multi_apps/716a6079-22da-47f1-ba73-c9d58f986a38.json @@ -16,7 +16,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/716a6079-22da-47f1-ba73-c9d58f986a38/Secret document.docx", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/716a6079-22da-47f1-ba73-c9d58f986a38/Secret%20document.docx", "path": "/home/user/Data3/List3/secret.docx" } ] diff --git a/evaluation_examples/examples/multi_apps/7ff48d5b-2df2-49da-b500-a5150ffc7f18.json b/evaluation_examples/examples/multi_apps/7ff48d5b-2df2-49da-b500-a5150ffc7f18.json index 21075c0..5e29695 100644 --- a/evaluation_examples/examples/multi_apps/7ff48d5b-2df2-49da-b500-a5150ffc7f18.json +++ b/evaluation_examples/examples/multi_apps/7ff48d5b-2df2-49da-b500-a5150ffc7f18.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/7ff48d5b-2df2-49da-b500-a5150ffc7f18/All Locations.docx", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/7ff48d5b-2df2-49da-b500-a5150ffc7f18/All%20Locations.docx", "path": "/home/user/Desktop/AllLocations.docx" } ] diff --git a/evaluation_examples/examples/multi_apps/869de13e-bef9-4b91-ba51-f6708c40b096.json b/evaluation_examples/examples/multi_apps/869de13e-bef9-4b91-ba51-f6708c40b096.json index 8082c52..fa18be8 100644 --- a/evaluation_examples/examples/multi_apps/869de13e-bef9-4b91-ba51-f6708c40b096.json +++ b/evaluation_examples/examples/multi_apps/869de13e-bef9-4b91-ba51-f6708c40b096.json @@ -43,7 +43,7 @@ "path": "/home/user/Desktop/2-if-for-array.zip" }, { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/869de13e-bef9-4b91-ba51-f6708c40b096/07-cluster-kMean (1).ppt", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/869de13e-bef9-4b91-ba51-f6708c40b096/07-cluster-kMean%20%281%29.ppt", "path": "/home/user/Desktop/07-cluster-kMean (1).ppt" }, { @@ -67,7 +67,7 @@ "path": "/home/user/Desktop/DOC_2480903712718068684.pdf" }, { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/869de13e-bef9-4b91-ba51-f6708c40b096/Family Status Equality-Eng (Aug 2021).pdf", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/869de13e-bef9-4b91-ba51-f6708c40b096/Family%20Status%20Equality-Eng%20%28Aug%202021%29.pdf", "path": "/home/user/Desktop/Family Status Equality-Eng (Aug 2021).pdf" }, { @@ -79,7 +79,7 @@ "path": "/home/user/Desktop/paper01.pdf" }, { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/869de13e-bef9-4b91-ba51-f6708c40b096/GLUE: A MULTI-TASK BENCHMARK AND ANALYSIS.pdf", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/869de13e-bef9-4b91-ba51-f6708c40b096/GLUE%3A%20A%20MULTI-TASK%20BENCHMARK%20AND%20ANALYSIS.pdf", "path": "/home/user/Desktop/GLUE: A MULTI-TASK BENCHMARK AND ANALYSIS.pdf" }, { diff --git a/evaluation_examples/examples/multi_apps/873cafdd-a581-47f6-8b33-b9696ddb7b05.json b/evaluation_examples/examples/multi_apps/873cafdd-a581-47f6-8b33-b9696ddb7b05.json index f6ed367..c10889e 100644 --- a/evaluation_examples/examples/multi_apps/873cafdd-a581-47f6-8b33-b9696ddb7b05.json +++ b/evaluation_examples/examples/multi_apps/873cafdd-a581-47f6-8b33-b9696ddb7b05.json @@ -28,7 +28,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/873cafdd-a581-47f6-8b33-b9696ddb7b05/Recommended plugin list.docx", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/873cafdd-a581-47f6-8b33-b9696ddb7b05/Recommended%20plugin%20list.docx", "path": "/home/user/Desktop/Recommended_plugin_list.docx" } ] diff --git a/evaluation_examples/examples/multi_apps/8e116af7-7db7-4e35-a68b-b0939c066c78.json b/evaluation_examples/examples/multi_apps/8e116af7-7db7-4e35-a68b-b0939c066c78.json index c4b02c2..5e00c93 100644 --- a/evaluation_examples/examples/multi_apps/8e116af7-7db7-4e35-a68b-b0939c066c78.json +++ b/evaluation_examples/examples/multi_apps/8e116af7-7db7-4e35-a68b-b0939c066c78.json @@ -89,7 +89,7 @@ }, "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/8e116af7-7db7-4e35-a68b-b0939c066c78/my_bookkeeping Gold.xlsx", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/8e116af7-7db7-4e35-a68b-b0939c066c78/my_bookkeeping%20Gold.xlsx", "dest": "my_bookkeeping_gold.xlsx" }, "options": { diff --git a/evaluation_examples/examples/multi_apps/9f3bb592-209d-43bc-bb47-d77d9df56504.json b/evaluation_examples/examples/multi_apps/9f3bb592-209d-43bc-bb47-d77d9df56504.json index b6b5fea..5e2dffa 100644 --- a/evaluation_examples/examples/multi_apps/9f3bb592-209d-43bc-bb47-d77d9df56504.json +++ b/evaluation_examples/examples/multi_apps/9f3bb592-209d-43bc-bb47-d77d9df56504.json @@ -41,7 +41,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/9f3bb592-209d-43bc-bb47-d77d9df56504/Gold subtitles.srt", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/9f3bb592-209d-43bc-bb47-d77d9df56504/Gold%20subtitles.srt", "path": "/home/user/subtitles_Gold.srt" } ] @@ -52,7 +52,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/9f3bb592-209d-43bc-bb47-d77d9df56504/Subtitles script.py", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/9f3bb592-209d-43bc-bb47-d77d9df56504/Subtitles%20script.py", "path": "/home/user/Desktop/subtitles_script.py" } ] diff --git a/evaluation_examples/examples/multi_apps/a0b9dc9c-fc07-4a88-8c5d-5e3ecad91bcb.json b/evaluation_examples/examples/multi_apps/a0b9dc9c-fc07-4a88-8c5d-5e3ecad91bcb.json index 47446b0..b887a6c 100644 --- a/evaluation_examples/examples/multi_apps/a0b9dc9c-fc07-4a88-8c5d-5e3ecad91bcb.json +++ b/evaluation_examples/examples/multi_apps/a0b9dc9c-fc07-4a88-8c5d-5e3ecad91bcb.json @@ -118,8 +118,8 @@ "type": "cloud_file", "multi": "true", "path": [ - "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/a0b9dc9c-fc07-4a88-8c5d-5e3ecad91bcb/Amazon Web Services Invoice Available [Account: 0123456789ab].eml", - "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/a0b9dc9c-fc07-4a88-8c5d-5e3ecad91bcb/Your receipt from X (formerly Twitter) #0123-4567.eml" + "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/a0b9dc9c-fc07-4a88-8c5d-5e3ecad91bcb/Amazon%20Web%20Services%20Invoice%20Available%20%5BAccount%3A%200123456789ab%5D.eml", + "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/a0b9dc9c-fc07-4a88-8c5d-5e3ecad91bcb/Your%20receipt%20from%20X%20%28formerly%20Twitter%29%20%25230123-4567.eml" ], "dest": [ "gold1.eml", diff --git a/evaluation_examples/examples/multi_apps/a74b607e-6bb5-4ea8-8a7c-5d97c7bbcd2a.json b/evaluation_examples/examples/multi_apps/a74b607e-6bb5-4ea8-8a7c-5d97c7bbcd2a.json index 1ea79a9..9536a92 100644 --- a/evaluation_examples/examples/multi_apps/a74b607e-6bb5-4ea8-8a7c-5d97c7bbcd2a.json +++ b/evaluation_examples/examples/multi_apps/a74b607e-6bb5-4ea8-8a7c-5d97c7bbcd2a.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/a74b607e-6bb5-4ea8-8a7c-5d97c7bbcd2a/Hello Extension.zip", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/a74b607e-6bb5-4ea8-8a7c-5d97c7bbcd2a/Hello%20Extension.zip", "path": "/home/user/Desktop/helloExtension.zip" } ] diff --git a/evaluation_examples/examples/multi_apps/dd60633f-2c72-42ba-8547-6f2c8cb0fdb0.json b/evaluation_examples/examples/multi_apps/dd60633f-2c72-42ba-8547-6f2c8cb0fdb0.json index d3143f0..9066531 100644 --- a/evaluation_examples/examples/multi_apps/dd60633f-2c72-42ba-8547-6f2c8cb0fdb0.json +++ b/evaluation_examples/examples/multi_apps/dd60633f-2c72-42ba-8547-6f2c8cb0fdb0.json @@ -47,7 +47,7 @@ }, "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/dd60633f-2c72-42ba-8547-6f2c8cb0fdb0/Colab Gold.py", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/dd60633f-2c72-42ba-8547-6f2c8cb0fdb0/Colab%20Gold.py", "dest": "colab_Gold.py" } }, diff --git a/evaluation_examples/examples/multi_apps/deec51c9-3b1e-4b9e-993c-4776f20e8bb2.json b/evaluation_examples/examples/multi_apps/deec51c9-3b1e-4b9e-993c-4776f20e8bb2.json index 8d353e8..14f3762 100644 --- a/evaluation_examples/examples/multi_apps/deec51c9-3b1e-4b9e-993c-4776f20e8bb2.json +++ b/evaluation_examples/examples/multi_apps/deec51c9-3b1e-4b9e-993c-4776f20e8bb2.json @@ -10,7 +10,7 @@ "files": [ { "path": "/home/user/Desktop/New Large Language Models.xlsx", - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/deec51c9-3b1e-4b9e-993c-4776f20e8bb2/New Large Language Models.xlsx" + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/deec51c9-3b1e-4b9e-993c-4776f20e8bb2/New%20Large%20Language%20Models.xlsx" } ] } @@ -68,7 +68,7 @@ }, "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/deec51c9-3b1e-4b9e-993c-4776f20e8bb2/New Large Language Models Gold.xlsx", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/deec51c9-3b1e-4b9e-993c-4776f20e8bb2/New%20Large%20Language%20Models%20Gold.xlsx", "dest": "New Large Language Models Gold.xlsx" }, "options": { diff --git a/evaluation_examples/examples/multi_apps/f5c13cdd-205c-4719-a562-348ae5cd1d91.json b/evaluation_examples/examples/multi_apps/f5c13cdd-205c-4719-a562-348ae5cd1d91.json index e877b92..58227d2 100644 --- a/evaluation_examples/examples/multi_apps/f5c13cdd-205c-4719-a562-348ae5cd1d91.json +++ b/evaluation_examples/examples/multi_apps/f5c13cdd-205c-4719-a562-348ae5cd1d91.json @@ -23,7 +23,7 @@ "path": "/home/user/thunderbird-profile.tar.gz" }, { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/f5c13cdd-205c-4719-a562-348ae5cd1d91/Payment Reminder.html", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/f5c13cdd-205c-4719-a562-348ae5cd1d91/Payment%20Reminder.html", "path": "/home/user/.payment-reminder-mail-body.html" }, { diff --git a/evaluation_examples/examples/thunderbird/d38192b0-17dc-4e1d-99c3-786d0117de77.json b/evaluation_examples/examples/thunderbird/d38192b0-17dc-4e1d-99c3-786d0117de77.json index 2720d81..e876d86 100644 --- a/evaluation_examples/examples/thunderbird/d38192b0-17dc-4e1d-99c3-786d0117de77.json +++ b/evaluation_examples/examples/thunderbird/d38192b0-17dc-4e1d-99c3-786d0117de77.json @@ -17,7 +17,7 @@ "path": "/home/user/thunderbird-profile.tar.gz" }, { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/thunderbird/d38192b0-17dc-4e1d-99c3-786d0117de77/New-month AWS Bill.html", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/thunderbird/d38192b0-17dc-4e1d-99c3-786d0117de77/New-month%20AWS%20Bill.html", "path": "/home/user/.aws-bill-mail-body.html" } ] diff --git a/evaluation_examples/examples/vlc/386dbd0e-0241-4a0a-b6a2-6704fba26b1c.json b/evaluation_examples/examples/vlc/386dbd0e-0241-4a0a-b6a2-6704fba26b1c.json index 4d0d595..261c16e 100644 --- a/evaluation_examples/examples/vlc/386dbd0e-0241-4a0a-b6a2-6704fba26b1c.json +++ b/evaluation_examples/examples/vlc/386dbd0e-0241-4a0a-b6a2-6704fba26b1c.json @@ -20,7 +20,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/386dbd0e-0241-4a0a-b6a2-6704fba26b1c/Colorful-Flowers(chosic.com).mp3", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/386dbd0e-0241-4a0a-b6a2-6704fba26b1c/Colorful-Flowers%28chosic.com%29.mp3", "path": "/home/user/Desktop/Colorful-Flowers.mp3" } ] diff --git a/evaluation_examples/examples/vlc/59f21cfb-0120-4326-b255-a5b827b38967.json b/evaluation_examples/examples/vlc/59f21cfb-0120-4326-b255-a5b827b38967.json index 5e6ccfd..af7d904 100644 --- a/evaluation_examples/examples/vlc/59f21cfb-0120-4326-b255-a5b827b38967.json +++ b/evaluation_examples/examples/vlc/59f21cfb-0120-4326-b255-a5b827b38967.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/59f21cfb-0120-4326-b255-a5b827b38967/Rick Astley - Never Gonna Give You Up (Official Music Video).mp4", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/59f21cfb-0120-4326-b255-a5b827b38967/Rick%20Astley%20-%20Never%20Gonna%20Give%20You%20Up%20%28Official%20Music%20Video%29.mp4", "path": "/home/user/Desktop/Rick Astley - Never Gonna Give You Up (Official Music Video).mp4" } ] diff --git a/evaluation_examples/examples/vlc/8d9fd4e2-6fdb-46b0-b9b9-02f06495c62f.json b/evaluation_examples/examples/vlc/8d9fd4e2-6fdb-46b0-b9b9-02f06495c62f.json index a3281f7..7cb2ffe 100644 --- a/evaluation_examples/examples/vlc/8d9fd4e2-6fdb-46b0-b9b9-02f06495c62f.json +++ b/evaluation_examples/examples/vlc/8d9fd4e2-6fdb-46b0-b9b9-02f06495c62f.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/8d9fd4e2-6fdb-46b0-b9b9-02f06495c62f/Optimus - Gen 2.mp4", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/8d9fd4e2-6fdb-46b0-b9b9-02f06495c62f/Optimus%20-%20Gen%202.mp4", "path": "/home/user/Desktop/Gen 2.mp4" } ] diff --git a/evaluation_examples/examples/vlc/8f080098-ddb1-424c-b438-4e96e5e4786e.json b/evaluation_examples/examples/vlc/8f080098-ddb1-424c-b438-4e96e5e4786e.json index c315ea5..81170ee 100644 --- a/evaluation_examples/examples/vlc/8f080098-ddb1-424c-b438-4e96e5e4786e.json +++ b/evaluation_examples/examples/vlc/8f080098-ddb1-424c-b438-4e96e5e4786e.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/8f080098-ddb1-424c-b438-4e96e5e4786e/Baby Justin Bieber.mp4", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/8f080098-ddb1-424c-b438-4e96e5e4786e/Baby%20Justin%20Bieber.mp4", "path": "/home/user/Desktop/Baby Justin Bieber.mp4" } ] @@ -41,7 +41,7 @@ "func": "compare_audios", "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/8f080098-ddb1-424c-b438-4e96e5e4786e/Baby Justin Bieber.mp3", + "path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/8f080098-ddb1-424c-b438-4e96e5e4786e/Baby%20Justin%20Bieber.mp3", "dest": "baby_gold.mp3" }, "result": { diff --git a/evaluation_examples/examples/vlc/efcf0d81-0835-4880-b2fd-d866e8bc2294.json b/evaluation_examples/examples/vlc/efcf0d81-0835-4880-b2fd-d866e8bc2294.json index 6bbe549..a5f6367 100644 --- a/evaluation_examples/examples/vlc/efcf0d81-0835-4880-b2fd-d866e8bc2294.json +++ b/evaluation_examples/examples/vlc/efcf0d81-0835-4880-b2fd-d866e8bc2294.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/efcf0d81-0835-4880-b2fd-d866e8bc2294/Interstellar Movie - Official Trailer.mp4", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/efcf0d81-0835-4880-b2fd-d866e8bc2294/Interstellar%20Movie%20-%20Official%20Trailer.mp4", "path": "/home/user/Desktop/Interstellar Movie - Official Trailer.mp4" } ] diff --git a/evaluation_examples/examples/vlc/fba2c100-79e8-42df-ae74-b592418d54f4.json b/evaluation_examples/examples/vlc/fba2c100-79e8-42df-ae74-b592418d54f4.json index 314b2c4..7f383fc 100644 --- a/evaluation_examples/examples/vlc/fba2c100-79e8-42df-ae74-b592418d54f4.json +++ b/evaluation_examples/examples/vlc/fba2c100-79e8-42df-ae74-b592418d54f4.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/fba2c100-79e8-42df-ae74-b592418d54f4/Interstellar Movie - Official Trailer.mp4", + "url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/vlc/fba2c100-79e8-42df-ae74-b592418d54f4/Interstellar%20Movie%20-%20Official%20Trailer.mp4", "path": "/home/user/Desktop/Interstellar Movie - Official Trailer.mp4" } ] diff --git a/evaluation_examples/examples_windows/excel/7efeb4b1-3d19-4762-b163-63328d66303b.json b/evaluation_examples/examples_windows/excel/7efeb4b1-3d19-4762-b163-63328d66303b.json index 7065c26..1a6fa55 100644 --- a/evaluation_examples/examples_windows/excel/7efeb4b1-3d19-4762-b163-63328d66303b.json +++ b/evaluation_examples/examples_windows/excel/7efeb4b1-3d19-4762-b163-63328d66303b.json @@ -9,7 +9,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/excel/7efeb4b1-3d19-4762-b163-63328d66303b/Order_Sales_Serial#.xlsx", + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/excel/7efeb4b1-3d19-4762-b163-63328d66303b/Order_Sales_Serial%23.xlsx", "path": "C:\\Users\\User\\Order_Sales_Serial#.xlsx" } ] @@ -61,7 +61,7 @@ "func": "compare_table", "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/excel/7efeb4b1-3d19-4762-b163-63328d66303b/Order_Sales_Serial#_gold.xlsx", + "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/excel/7efeb4b1-3d19-4762-b163-63328d66303b/Order_Sales_Serial%23_gold.xlsx", "dest": "Order_Sales_Serial#_gold.xlsx" }, "result": { diff --git a/evaluation_examples/examples_windows/excel/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json b/evaluation_examples/examples_windows/excel/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json index 5959afd..61a05b5 100644 --- a/evaluation_examples/examples_windows/excel/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json +++ b/evaluation_examples/examples_windows/excel/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json @@ -102,7 +102,7 @@ }, "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/excel/ecb0df7a-4e8d-4a03-b162-053391d3afaf/Order_Id_Mark_Pass_Fail (1).xlsx", + "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/excel/ecb0df7a-4e8d-4a03-b162-053391d3afaf/Order_Id_Mark_Pass_Fail%20%281%29.xlsx", "dest": "Order_Id_Mark_Pass_Fail_gold.xlsx" } } diff --git a/evaluation_examples/examples_windows/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef.json b/evaluation_examples/examples_windows/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef.json index d439cde..497d603 100644 --- a/evaluation_examples/examples_windows/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef.json +++ b/evaluation_examples/examples_windows/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef.json @@ -10,7 +10,7 @@ "files": [ { "path": "C:\\Users\\User\\Desktop\\Employee Performance Evaluation Summary.xlsx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Employee Performance Evaluation Summary.xlsx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Employee%20Performance%20Evaluation%20Summary.xlsx" }, { "path": "C:\\Users\\User\\Desktop\\review_template.pdf", @@ -49,13 +49,13 @@ "result": { "type": "cloud_file", "path": [ - "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Alex Lee.pdf", - "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/David Wilson.pdf", - "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Emily Johnson.pdf", - "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/John Doe.pdf", - "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Linda Green.pdf", - "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Michael Brown.pdf", - "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Sophia Carter.pdf" + "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Alex%20Lee.pdf", + "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/David%20Wilson.pdf", + "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Emily%20Johnson.pdf", + "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/John%20Doe.pdf", + "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Linda%20Green.pdf", + "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Michael%20Brown.pdf", + "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/185f29bd-5da0-40a6-b69c-ba7f4e0324ef/Sophia%20Carter.pdf" ], "dest": [ "Alex Lee_Gold.pdf", diff --git a/evaluation_examples/examples_windows/multi_app/1f18aa87-af6f-41ef-9853-cdb8f32ebdea.json b/evaluation_examples/examples_windows/multi_app/1f18aa87-af6f-41ef-9853-cdb8f32ebdea.json index c90e151..571c9bf 100644 --- a/evaluation_examples/examples_windows/multi_app/1f18aa87-af6f-41ef-9853-cdb8f32ebdea.json +++ b/evaluation_examples/examples_windows/multi_app/1f18aa87-af6f-41ef-9853-cdb8f32ebdea.json @@ -17,15 +17,15 @@ "files": [ { "path": "C:\\Users\\User\\Desktop\\Grammer test 1.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammer test 1.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammer%20test%201.docx" }, { "path": "C:\\Users\\User\\Desktop\\Grammer test 2.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammar test 2.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammar%20test%202.docx" }, { "path": "C:\\Users\\User\\Desktop\\Grammer test 3.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammer test 3.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/1f18aa87-af6f-41ef-9853-cdb8f32ebdea/Grammer%20test%203.docx" }, { "path": "C:\\Users\\User\\Desktop\\Answer.docx", @@ -49,11 +49,11 @@ }, { "path": "C:\\Users\\User\\Desktop\\Public Lecture Teaching Plan.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public Lecture Teaching Plan.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public%20Lecture%20Teaching%20Plan.docx" }, { "path": "C:\\Users\\User\\Desktop\\Course Timetable.xlsx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Course Timetable.xlsx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Course%20Timetable.xlsx" } ] } diff --git a/evaluation_examples/examples_windows/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e.json b/evaluation_examples/examples_windows/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e.json index c8e529e..bc9da10 100644 --- a/evaluation_examples/examples_windows/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e.json +++ b/evaluation_examples/examples_windows/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e.json @@ -17,15 +17,15 @@ "files": [ { "path": "C:\\Users\\User\\Desktop\\students work\\Zheng He .docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Zheng He .docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Zheng%20He%20.docx" }, { "path": "C:\\Users\\User\\Desktop\\students work\\The literature reviews of weekly readings.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/The literature reviews of weekly readings.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/The%20literature%20reviews%20of%20weekly%20readings.docx" }, { "path": "C:\\Users\\User\\Desktop\\students work\\The British Justice System.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/The British Justice System.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/The%20British%20Justice%20System.docx" }, { "path": "C:\\Users\\User\\Desktop\\students work\\quiz2.docx", @@ -37,11 +37,11 @@ }, { "path": "C:\\Users\\User\\Desktop\\students work\\Q1&2&3.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Q1&2&3.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Q1%262%263.docx" }, { "path": "C:\\Users\\User\\Desktop\\students work\\Photo Ethics in Journalism.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Photo Ethics in Journalism.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Photo%20Ethics%20in%20Journalism.docx" }, { "path": "C:\\Users\\User\\Desktop\\students work\\cassie.docx", @@ -49,7 +49,7 @@ }, { "path": "C:\\Users\\User\\Desktop\\students work\\case study.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case study.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case%20study.docx" }, { "path": "C:\\Users\\User\\Desktop\\Grammar rules PDF\\irregularrules02.pdf", @@ -69,11 +69,11 @@ }, { "path": "C:\\Users\\User\\Desktop\\Public Lecture Teaching Plan.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public Lecture Teaching Plan.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public%20Lecture%20Teaching%20Plan.docx" }, { "path": "C:\\Users\\User\\Desktop\\Course Timetable.xlsx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Course Timetable.xlsx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Course%20Timetable.xlsx" } ] } @@ -110,7 +110,7 @@ "func": "compare_references", "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case study gold.docx", + "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case%20study%20gold.docx", "dest": "case study gold.docx" }, "result": { diff --git a/evaluation_examples/examples_windows/multi_app/3a93cae4-ad3e-403e-8c12-65303b271818.json b/evaluation_examples/examples_windows/multi_app/3a93cae4-ad3e-403e-8c12-65303b271818.json index 139f81c..a1c6133 100644 --- a/evaluation_examples/examples_windows/multi_app/3a93cae4-ad3e-403e-8c12-65303b271818.json +++ b/evaluation_examples/examples_windows/multi_app/3a93cae4-ad3e-403e-8c12-65303b271818.json @@ -17,7 +17,7 @@ "files": [ { "path": "C:\\Users\\User\\Desktop\\students work\\Zheng He .docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Zheng He .docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Zheng%20He%20.docx" }, { "path": "C:\\Users\\User\\Desktop\\students work\\cassie.docx", @@ -25,7 +25,7 @@ }, { "path": "C:\\Users\\User\\Desktop\\students work\\case study.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case study.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/case%20study.docx" }, { "path": "C:\\Users\\User\\Desktop\\Grammar rules PDF\\irregularrules02.pdf", @@ -45,11 +45,11 @@ }, { "path": "C:\\Users\\User\\Desktop\\Public Lecture Teaching Plan.docx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public Lecture Teaching Plan.docx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Public%20Lecture%20Teaching%20Plan.docx" }, { "path": "C:\\Users\\User\\Desktop\\Course Timetable.xlsx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Course Timetable.xlsx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/2c1ebcd7-9c6d-4c9a-afad-900e381ecd5e/Course%20Timetable.xlsx" } ] } @@ -111,17 +111,17 @@ "expected": [ { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/3a93cae4-ad3e-403e-8c12-65303b271818/Course Timetable Gold.xlsx", + "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/3a93cae4-ad3e-403e-8c12-65303b271818/Course%20Timetable%20Gold.xlsx", "dest": "Course Timetable gold.xlsx" }, { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/3a93cae4-ad3e-403e-8c12-65303b271818/Course Timetable Gold 2.xlsx", + "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/3a93cae4-ad3e-403e-8c12-65303b271818/Course%20Timetable%20Gold%202.xlsx", "dest": "Course Timetable gold 2.xlsx" }, { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/3a93cae4-ad3e-403e-8c12-65303b271818/Course Timetable Gold 3.xlsx", + "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/3a93cae4-ad3e-403e-8c12-65303b271818/Course%20Timetable%20Gold%203.xlsx", "dest": "Course Timetable gold 3.xlsx" } ], diff --git a/evaluation_examples/examples_windows/multi_app/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a.json b/evaluation_examples/examples_windows/multi_app/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a.json index 9f8d7a3..f8722c8 100644 --- a/evaluation_examples/examples_windows/multi_app/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a.json +++ b/evaluation_examples/examples_windows/multi_app/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a.json @@ -35,7 +35,7 @@ "parameters": { "files": [ { - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a/ConferenceCity Gold.xlsx", + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/6f4073b8-d8ea-4ade-8a18-c5d1d5d5aa9a/ConferenceCity%20Gold.xlsx", "path": "C:\\Users\\User\\Desktop\\ConferenceCity_Gold.xlsx" } ] diff --git a/evaluation_examples/examples_windows/multi_app/74d5859f-ed66-4d3e-aa0e-93d7a592ce41.json b/evaluation_examples/examples_windows/multi_app/74d5859f-ed66-4d3e-aa0e-93d7a592ce41.json index 4fec431..ec58680 100644 --- a/evaluation_examples/examples_windows/multi_app/74d5859f-ed66-4d3e-aa0e-93d7a592ce41.json +++ b/evaluation_examples/examples_windows/multi_app/74d5859f-ed66-4d3e-aa0e-93d7a592ce41.json @@ -145,7 +145,7 @@ }, { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/74d5859f-ed66-4d3e-aa0e-93d7a592ce41/Google Drive - Virus scan warning.bin", + "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/74d5859f-ed66-4d3e-aa0e-93d7a592ce41/Google%20Drive%20-%20Virus%20scan%20warning.bin", "dest": "background_script.js" }, { @@ -160,7 +160,7 @@ }, { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/74d5859f-ed66-4d3e-aa0e-93d7a592ce41/Google Drive - Virus scan warning.bin", + "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/74d5859f-ed66-4d3e-aa0e-93d7a592ce41/Google%20Drive%20-%20Virus%20scan%20warning.bin", "dest": "script.js" } ] diff --git a/evaluation_examples/examples_windows/multi_app/8e116af7-7db7-4e35-a68b-b0939c066c78.json b/evaluation_examples/examples_windows/multi_app/8e116af7-7db7-4e35-a68b-b0939c066c78.json index ac4c220..bc8fba5 100644 --- a/evaluation_examples/examples_windows/multi_app/8e116af7-7db7-4e35-a68b-b0939c066c78.json +++ b/evaluation_examples/examples_windows/multi_app/8e116af7-7db7-4e35-a68b-b0939c066c78.json @@ -89,7 +89,7 @@ }, "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/8e116af7-7db7-4e35-a68b-b0939c066c78/my_bookkeeping Gold.xlsx", + "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/8e116af7-7db7-4e35-a68b-b0939c066c78/my_bookkeeping%20Gold.xlsx", "dest": "my_bookkeeping_gold.xlsx" }, "options": { diff --git a/evaluation_examples/examples_windows/multi_app/deec51c9-3b1e-4b9e-993c-4776f20e8bb2.json b/evaluation_examples/examples_windows/multi_app/deec51c9-3b1e-4b9e-993c-4776f20e8bb2.json index 9b170ad..ac7706a 100644 --- a/evaluation_examples/examples_windows/multi_app/deec51c9-3b1e-4b9e-993c-4776f20e8bb2.json +++ b/evaluation_examples/examples_windows/multi_app/deec51c9-3b1e-4b9e-993c-4776f20e8bb2.json @@ -10,7 +10,7 @@ "files": [ { "path": "C:\\Users\\User\\Desktop\\New Large Language Models.xlsx", - "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/deec51c9-3b1e-4b9e-993c-4776f20e8bb2/New Large Language Models.xlsx" + "url": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/deec51c9-3b1e-4b9e-993c-4776f20e8bb2/New%20Large%20Language%20Models.xlsx" } ] } @@ -68,7 +68,7 @@ }, "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/deec51c9-3b1e-4b9e-993c-4776f20e8bb2/New Large Language Models Gold.xlsx", + "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/multi_app/deec51c9-3b1e-4b9e-993c-4776f20e8bb2/New%20Large%20Language%20Models%20Gold.xlsx", "dest": "New Large Language Models Gold.xlsx" }, "options": { diff --git a/evaluation_examples/examples_windows/word/e528b65e-1107-4b8c-8988-490e4fece599.json b/evaluation_examples/examples_windows/word/e528b65e-1107-4b8c-8988-490e4fece599.json index d898c27..df4540d 100644 --- a/evaluation_examples/examples_windows/word/e528b65e-1107-4b8c-8988-490e4fece599.json +++ b/evaluation_examples/examples_windows/word/e528b65e-1107-4b8c-8988-490e4fece599.json @@ -55,7 +55,7 @@ "func": "compare_docx_files", "expected": { "type": "cloud_file", - "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/word/e528b65e-1107-4b8c-8988-490e4fece599/Geography_And_Magical_Realism (1).docx", + "path": "https://huggingface.co/datasets/xlangai/windows_osworld_file_cache/resolve/main/word/e528b65e-1107-4b8c-8988-490e4fece599/Geography_And_Magical_Realism%20%281%29.docx", "dest": "Geography_And_Magical_Realism_Gold.docx" }, "result": { From ca650221378131151ab7b1e718974582a418ec29 Mon Sep 17 00:00:00 2001 From: yuanmengqi Date: Sat, 7 Jun 2025 21:16:26 +0000 Subject: [PATCH 5/7] fix: update AMI ID for us-east-1 region in AWS manager configuration --- desktop_env/providers/aws/manager.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/desktop_env/providers/aws/manager.py b/desktop_env/providers/aws/manager.py index b3ce1f1..d2ad14f 100644 --- a/desktop_env/providers/aws/manager.py +++ b/desktop_env/providers/aws/manager.py @@ -33,7 +33,7 @@ DEFAULT_REGION = "us-east-1" # todo: public the AMI images # ami-05e7d7bd279ea4f14 IMAGE_ID_MAP = { - "us-east-1": "ami-00d1fe56632acbefd", + "us-east-1": "ami-00509b93f2216f419", "ap-east-1": "ami-0c092a5b8be4116f5", } From 88536712205b8843fb6efd069311181372e75429 Mon Sep 17 00:00:00 2001 From: yuanmengqi Date: Sat, 7 Jun 2025 21:17:00 +0000 Subject: [PATCH 6/7] fix: enhance instruction clarity and adjust timing in automation script for LibreOffice Impress example --- .../ef9d12bd-bcee-4ba0-a40e-918400f43ddf.json | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/evaluation_examples/examples/libreoffice_impress/ef9d12bd-bcee-4ba0-a40e-918400f43ddf.json b/evaluation_examples/examples/libreoffice_impress/ef9d12bd-bcee-4ba0-a40e-918400f43ddf.json index 7c2e0ed..9bd9603 100644 --- a/evaluation_examples/examples/libreoffice_impress/ef9d12bd-bcee-4ba0-a40e-918400f43ddf.json +++ b/evaluation_examples/examples/libreoffice_impress/ef9d12bd-bcee-4ba0-a40e-918400f43ddf.json @@ -1,7 +1,7 @@ { "id": "ef9d12bd-bcee-4ba0-a40e-918400f43ddf", "snapshot": "libreoffice_impress", - "instruction": "I closed the slide panel on the left and idk how to get it back please help", + "instruction": "I closed the slide panel on the left and idk how to get it back please help. Please restore the left slide panel so it becomes visible again.", "source": "https://www.reddit.com/r/libreoffice/comments/18elh3y/i_closed_the_slide_pannel_on_the_left_and_idk_how/", "config": [ { @@ -19,7 +19,7 @@ "command": [ "python", "-c", - "import pyautogui; import time; pyautogui.click(960, 540); time.sleep(5); pyautogui.press('esc'); time.sleep(0.3); pyautogui.press('f10'); time.sleep(0.3); pyautogui.press('right', presses=2, interval=0.1); time.sleep(0.3); pyautogui.press('down', presses=11, interval=0.1); pyautogui.press('enter')" + "import pyautogui; import time; time.sleep(5); pyautogui.click(960, 540); time.sleep(5); pyautogui.press('esc'); time.sleep(0.3); pyautogui.press('f10'); time.sleep(0.3); pyautogui.press('right', presses=2, interval=0.1); time.sleep(0.3); pyautogui.press('down', presses=11, interval=0.1); pyautogui.press('enter')" ] } } From eaf7b9e48fb7bc394d49990bc8fdc62bea055ebd Mon Sep 17 00:00:00 2001 From: yuanmengqi Date: Sat, 7 Jun 2025 21:17:18 +0000 Subject: [PATCH 7/7] refactor: replace hardcoded AMI ID with dynamic retrieval from IMAGE_ID_MAP in AWS DesktopEnv initialization --- run_multienv_openaicua.py | 6 ++++-- run_test_env.py | 6 ++++-- 2 files changed, 8 insertions(+), 4 deletions(-) diff --git a/run_multienv_openaicua.py b/run_multienv_openaicua.py index 65464d0..82af5c7 100644 --- a/run_multienv_openaicua.py +++ b/run_multienv_openaicua.py @@ -176,13 +176,15 @@ def run_env_tasks(env_idx: int, env_tasks: dict, args: argparse.Namespace, share signal.signal(signal.SIGTERM, lambda signum, frame: process_signal_handler(signum, frame, env_idx)) # ami-05e7d7bd279ea4f14 + from desktop_env.providers.aws.manager import IMAGE_ID_MAP + REGION = "us-east-1" env = DesktopEnv( path_to_vm=args.path_to_vm, action_space=args.action_space, provider_name="aws", - region="us-east-1", - snapshot_name="ami-02fea2e5b77c79c17", + region=REGION, + snapshot_name=IMAGE_ID_MAP[REGION], screen_size=(args.screen_width, args.screen_height), headless=args.headless, diff --git a/run_test_env.py b/run_test_env.py index feba441..b4b85f2 100644 --- a/run_test_env.py +++ b/run_test_env.py @@ -223,13 +223,15 @@ def test(args: argparse.Namespace, test_all_meta: dict) -> None: ) agents.append(agent) + from desktop_env.providers.aws.manager import IMAGE_ID_MAP + REGION = "us-east-1" env = DesktopEnv( path_to_vm=args.path_to_vm, action_space=agent.action_space, provider_name="aws", - region="us-east-1", - snapshot_name="ami-05e7d7bd279ea4f14", + region=REGION, + snapshot_name=IMAGE_ID_MAP[REGION], screen_size=(args.screen_width, args.screen_height), headless=args.headless,