From 4897211a46aafa241baad9c995c65bf753c2ab0b Mon Sep 17 00:00:00 2001 From: David Chang Date: Wed, 31 Jan 2024 22:55:47 +0800 Subject: [PATCH] ver Jan31stv6 finished calc human evaluation updated calc configs with an extra sleep to guarantee the integrity of downloaded xlsx file --- branch_flag | 2 +- desktop_env/evaluators/metrics/table.py | 16 ++--- ...269ae-2111-4a07-81fd-3fcd711993b0-win.json | 6 ++ .../01b269ae-2111-4a07-81fd-3fcd711993b0.json | 6 ++ .../0cecd4f3-74de-457b-ba94-29ad6b5dafb6.json | 6 ++ .../1334ca3e-f9e3-4db8-9ca7-b4c653be7d17.json | 6 ++ .../21df9241-f8d7-4509-b7f1-37e501a823f7.json | 6 ++ .../347ef137-7eeb-4c80-a3bb-0951f26a8aff.json | 6 ++ .../357ef137-7eeb-4c80-a3bb-0951f26a8aff.json | 6 ++ .../37608790-6147-45d0-9f20-1137bb35703d.json | 6 ++ .../4188d3a4-077d-46b7-9c86-23e1a036f6c1.json | 6 ++ .../4e6fcf72-daf3-439f-a232-c434ce416af6.json | 62 ++++++++++++++++++- .../4f07fbe9-70de-4927-a4d5-bb28bc12c52c.json | 6 ++ .../51b11269-2ca8-4b2a-9163-f21758420e78.json | 6 ++ .../6054afcb-5bab-4702-90a0-b259b5d3217c.json | 6 ++ .../6e99a1ad-07d2-4b66-a1ce-ece6d99c20a5.json | 6 ++ .../7a4e4bc8-922c-4c84-865c-25ba34136be1.json | 6 ++ .../7e429b8d-a3f0-4ed0-9b58-08957d00b127.json | 6 ++ .../7efeb4b1-3d19-4762-b163-63328d66303b.json | 6 ++ .../8b1ce5f2-59d2-4dcc-b0b0-666a714b9a14.json | 6 ++ .../a01fbce3-2793-461f-ab86-43680ccbae25.json | 8 ++- .../a9f325aa-8c05-4e4f-8341-9e4358565f4f.json | 6 ++ .../abed40dc-063f-4598-8ba5-9fe749c0615d.json | 6 ++ .../d681960f-7bc3-4286-9913-a8812ba3261a.json | 6 ++ .../eb03d19a-b88d-4de4-8a64-ca0ac66f426b.json | 6 ++ .../ecb0df7a-4e8d-4a03-b162-053391d3afaf.json | 6 ++ .../f9584479-3d0d-4c79-affa-9ad7afdd8850.json | 6 ++ main.py | 7 ++- 28 files changed, 216 insertions(+), 17 deletions(-) diff --git a/branch_flag b/branch_flag index 760637d..9daeafb 100644 --- a/branch_flag +++ b/branch_flag @@ -1 +1 @@ -exp_som +test diff --git a/desktop_env/evaluators/metrics/table.py b/desktop_env/evaluators/metrics/table.py index 4e8bac6..294e2e5 100644 --- a/desktop_env/evaluators/metrics/table.py +++ b/desktop_env/evaluators/metrics/table.py @@ -392,17 +392,13 @@ if __name__ == '__main__': logger.addHandler(stdout_handler) logger.addHandler(sdebug_handler) - path1 = "../../任务数据/LibreOffice Calc/Multiply_Time_Number.xlsx" - path2 = "../../任务数据/LibreOffice Calc/Multiply_Time_Number_gold.xlsx" - rules = [{"type": "check_cell" - , "sheet_idx": 0 - , "coordinate": "E3" - , "props": {"value": {"method": "approx:0.001" - , "ref": 191.6667 - } - } + path1 = "snapshots/test/cache/4e6fcf72-daf3-439f-a232-c434ce416af6/Employee_Age_By_Birthday.xlsx" + path2 = "snapshots/test/cache/4e6fcf72-daf3-439f-a232-c434ce416af6/Employee_Age_By_Birthday_gold.xlsx" + rules = [ { "type": "sheet_data" + , "sheet_idx0": 0 + , "sheet_idx1": "EI0" } - ] + ] print(compare_table(path1, path2 , rules=rules ) diff --git a/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0-win.json b/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0-win.json index dfa3dcb..355c776 100644 --- a/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0-win.json +++ b/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0-win.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0.json b/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0.json index 3ae596d..2dfd0d2 100644 --- a/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0.json +++ b/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/0cecd4f3-74de-457b-ba94-29ad6b5dafb6.json b/evaluation_examples/examples/libreoffice_calc/0cecd4f3-74de-457b-ba94-29ad6b5dafb6.json index e12377c..97ad2a1 100644 --- a/evaluation_examples/examples/libreoffice_calc/0cecd4f3-74de-457b-ba94-29ad6b5dafb6.json +++ b/evaluation_examples/examples/libreoffice_calc/0cecd4f3-74de-457b-ba94-29ad6b5dafb6.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/1334ca3e-f9e3-4db8-9ca7-b4c653be7d17.json b/evaluation_examples/examples/libreoffice_calc/1334ca3e-f9e3-4db8-9ca7-b4c653be7d17.json index 08b9f8f..1ee0683 100644 --- a/evaluation_examples/examples/libreoffice_calc/1334ca3e-f9e3-4db8-9ca7-b4c653be7d17.json +++ b/evaluation_examples/examples/libreoffice_calc/1334ca3e-f9e3-4db8-9ca7-b4c653be7d17.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/21df9241-f8d7-4509-b7f1-37e501a823f7.json b/evaluation_examples/examples/libreoffice_calc/21df9241-f8d7-4509-b7f1-37e501a823f7.json index 199bc74..e55f7cb 100644 --- a/evaluation_examples/examples/libreoffice_calc/21df9241-f8d7-4509-b7f1-37e501a823f7.json +++ b/evaluation_examples/examples/libreoffice_calc/21df9241-f8d7-4509-b7f1-37e501a823f7.json @@ -69,6 +69,12 @@ "/home/user/Represent_in_millions_billions.xlsx" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/347ef137-7eeb-4c80-a3bb-0951f26a8aff.json b/evaluation_examples/examples/libreoffice_calc/347ef137-7eeb-4c80-a3bb-0951f26a8aff.json index 9115022..11a1c4b 100644 --- a/evaluation_examples/examples/libreoffice_calc/347ef137-7eeb-4c80-a3bb-0951f26a8aff.json +++ b/evaluation_examples/examples/libreoffice_calc/347ef137-7eeb-4c80-a3bb-0951f26a8aff.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/357ef137-7eeb-4c80-a3bb-0951f26a8aff.json b/evaluation_examples/examples/libreoffice_calc/357ef137-7eeb-4c80-a3bb-0951f26a8aff.json index 544a464..58ec20a 100644 --- a/evaluation_examples/examples/libreoffice_calc/357ef137-7eeb-4c80-a3bb-0951f26a8aff.json +++ b/evaluation_examples/examples/libreoffice_calc/357ef137-7eeb-4c80-a3bb-0951f26a8aff.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/37608790-6147-45d0-9f20-1137bb35703d.json b/evaluation_examples/examples/libreoffice_calc/37608790-6147-45d0-9f20-1137bb35703d.json index 1e37657..ab6d275 100644 --- a/evaluation_examples/examples/libreoffice_calc/37608790-6147-45d0-9f20-1137bb35703d.json +++ b/evaluation_examples/examples/libreoffice_calc/37608790-6147-45d0-9f20-1137bb35703d.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/4188d3a4-077d-46b7-9c86-23e1a036f6c1.json b/evaluation_examples/examples/libreoffice_calc/4188d3a4-077d-46b7-9c86-23e1a036f6c1.json index 7b77db3..1e8d045 100644 --- a/evaluation_examples/examples/libreoffice_calc/4188d3a4-077d-46b7-9c86-23e1a036f6c1.json +++ b/evaluation_examples/examples/libreoffice_calc/4188d3a4-077d-46b7-9c86-23e1a036f6c1.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/4e6fcf72-daf3-439f-a232-c434ce416af6.json b/evaluation_examples/examples/libreoffice_calc/4e6fcf72-daf3-439f-a232-c434ce416af6.json index 65df118..a047e10 100644 --- a/evaluation_examples/examples/libreoffice_calc/4e6fcf72-daf3-439f-a232-c434ce416af6.json +++ b/evaluation_examples/examples/libreoffice_calc/4e6fcf72-daf3-439f-a232-c434ce416af6.json @@ -50,12 +50,70 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } + }, + { + "type": "download", + "parameters": { + "files": [ + { + "url": "https://drive.usercontent.google.com/download?id=1sRI72UGfHiVBRFuV4uwhr173u3Sf46Y6&export=download&authuser=0&confirm=t&uuid=90da5e2b-39c0-449d-b753-09dfed73b509&at=APZUnTVFInccKo2QB9JNnIidFfG3:1705909465173", + "path": "/home/user/Employee_Age_By_Birthday_gold.xlsx" + } + ] + } + }, + { + "type": "open", + "parameters": { + "path": "/home/user/Employee_Age_By_Birthday_gold.xlsx" + } + }, + { + "type": "sleep", + "parameters": { + "seconds": 2 + } + }, + { + "type": "activate_window", + "parameters": { + "window_name": "Employee_Age_By_Birthday_gold.xlsx - LibreOffice Calc", + "strict": true + } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } + }, + { + "type": "execute", + "parameters": { + "command": [ + "python", + "-c", + "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" + ] + } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", "expected": { - "type": "cloud_file", - "path": "https://drive.usercontent.google.com/download?id=1sRI72UGfHiVBRFuV4uwhr173u3Sf46Y6&export=download&authuser=0&confirm=t&uuid=90da5e2b-39c0-449d-b753-09dfed73b509&at=APZUnTVFInccKo2QB9JNnIidFfG3:1705909465173", + "type": "vm_file", + "path": "/home/user/Employee_Age_By_Birthday_gold.xlsx", "dest": "Employee_Age_By_Birthday_gold.xlsx" }, "result": { diff --git a/evaluation_examples/examples/libreoffice_calc/4f07fbe9-70de-4927-a4d5-bb28bc12c52c.json b/evaluation_examples/examples/libreoffice_calc/4f07fbe9-70de-4927-a4d5-bb28bc12c52c.json index 0e8b6d8..b910327 100644 --- a/evaluation_examples/examples/libreoffice_calc/4f07fbe9-70de-4927-a4d5-bb28bc12c52c.json +++ b/evaluation_examples/examples/libreoffice_calc/4f07fbe9-70de-4927-a4d5-bb28bc12c52c.json @@ -69,6 +69,12 @@ "/home/user/Padding_Decimals_In_Formular.xlsx" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/51b11269-2ca8-4b2a-9163-f21758420e78.json b/evaluation_examples/examples/libreoffice_calc/51b11269-2ca8-4b2a-9163-f21758420e78.json index b89606d..80b2167 100644 --- a/evaluation_examples/examples/libreoffice_calc/51b11269-2ca8-4b2a-9163-f21758420e78.json +++ b/evaluation_examples/examples/libreoffice_calc/51b11269-2ca8-4b2a-9163-f21758420e78.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/6054afcb-5bab-4702-90a0-b259b5d3217c.json b/evaluation_examples/examples/libreoffice_calc/6054afcb-5bab-4702-90a0-b259b5d3217c.json index 833a9cb..460b4ca 100644 --- a/evaluation_examples/examples/libreoffice_calc/6054afcb-5bab-4702-90a0-b259b5d3217c.json +++ b/evaluation_examples/examples/libreoffice_calc/6054afcb-5bab-4702-90a0-b259b5d3217c.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/6e99a1ad-07d2-4b66-a1ce-ece6d99c20a5.json b/evaluation_examples/examples/libreoffice_calc/6e99a1ad-07d2-4b66-a1ce-ece6d99c20a5.json index c985a2e..18b1da1 100644 --- a/evaluation_examples/examples/libreoffice_calc/6e99a1ad-07d2-4b66-a1ce-ece6d99c20a5.json +++ b/evaluation_examples/examples/libreoffice_calc/6e99a1ad-07d2-4b66-a1ce-ece6d99c20a5.json @@ -69,6 +69,12 @@ "/home/user/Keep_Two_decimal_points.xlsx" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/7a4e4bc8-922c-4c84-865c-25ba34136be1.json b/evaluation_examples/examples/libreoffice_calc/7a4e4bc8-922c-4c84-865c-25ba34136be1.json index 7bf9cef..99133d0 100644 --- a/evaluation_examples/examples/libreoffice_calc/7a4e4bc8-922c-4c84-865c-25ba34136be1.json +++ b/evaluation_examples/examples/libreoffice_calc/7a4e4bc8-922c-4c84-865c-25ba34136be1.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/7e429b8d-a3f0-4ed0-9b58-08957d00b127.json b/evaluation_examples/examples/libreoffice_calc/7e429b8d-a3f0-4ed0-9b58-08957d00b127.json index c06cde7..48998ef 100644 --- a/evaluation_examples/examples/libreoffice_calc/7e429b8d-a3f0-4ed0-9b58-08957d00b127.json +++ b/evaluation_examples/examples/libreoffice_calc/7e429b8d-a3f0-4ed0-9b58-08957d00b127.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json b/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json index 43fcb6b..fe89bcc 100644 --- a/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json +++ b/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/8b1ce5f2-59d2-4dcc-b0b0-666a714b9a14.json b/evaluation_examples/examples/libreoffice_calc/8b1ce5f2-59d2-4dcc-b0b0-666a714b9a14.json index 2c115d0..bb95f4c 100644 --- a/evaluation_examples/examples/libreoffice_calc/8b1ce5f2-59d2-4dcc-b0b0-666a714b9a14.json +++ b/evaluation_examples/examples/libreoffice_calc/8b1ce5f2-59d2-4dcc-b0b0-666a714b9a14.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/a01fbce3-2793-461f-ab86-43680ccbae25.json b/evaluation_examples/examples/libreoffice_calc/a01fbce3-2793-461f-ab86-43680ccbae25.json index ce5b308..3db1a03 100644 --- a/evaluation_examples/examples/libreoffice_calc/a01fbce3-2793-461f-ab86-43680ccbae25.json +++ b/evaluation_examples/examples/libreoffice_calc/a01fbce3-2793-461f-ab86-43680ccbae25.json @@ -1,7 +1,7 @@ { "id": "a01fbce3-2793-461f-ab86-43680ccbae25", "snapshot": "libreoffice_calc", - "instruction": "I need to set the decimal separator as a comma (,) for localized data representation and clarity in visualization. Can you assist with this?", + "instruction": "I need to set the decimal separator as a comma (,) for localized data representation and clarity in visualization. Can you help me to update all the numbers in the sheet? Also please keep the decimal numbers as-is.", "source": "https://superuser.com/questions/1250677/how-to-set-decimal-separator-in-libre-office-calc", "config": [ { @@ -69,6 +69,12 @@ "/home/user/Set_Decimal_Separator_Dot.xlsx" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/a9f325aa-8c05-4e4f-8341-9e4358565f4f.json b/evaluation_examples/examples/libreoffice_calc/a9f325aa-8c05-4e4f-8341-9e4358565f4f.json index 8b50b36..c0cc65d 100644 --- a/evaluation_examples/examples/libreoffice_calc/a9f325aa-8c05-4e4f-8341-9e4358565f4f.json +++ b/evaluation_examples/examples/libreoffice_calc/a9f325aa-8c05-4e4f-8341-9e4358565f4f.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/abed40dc-063f-4598-8ba5-9fe749c0615d.json b/evaluation_examples/examples/libreoffice_calc/abed40dc-063f-4598-8ba5-9fe749c0615d.json index e3d8cd1..b32cf0a 100644 --- a/evaluation_examples/examples/libreoffice_calc/abed40dc-063f-4598-8ba5-9fe749c0615d.json +++ b/evaluation_examples/examples/libreoffice_calc/abed40dc-063f-4598-8ba5-9fe749c0615d.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/d681960f-7bc3-4286-9913-a8812ba3261a.json b/evaluation_examples/examples/libreoffice_calc/d681960f-7bc3-4286-9913-a8812ba3261a.json index 111f16c..8fbecea 100644 --- a/evaluation_examples/examples/libreoffice_calc/d681960f-7bc3-4286-9913-a8812ba3261a.json +++ b/evaluation_examples/examples/libreoffice_calc/d681960f-7bc3-4286-9913-a8812ba3261a.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/eb03d19a-b88d-4de4-8a64-ca0ac66f426b.json b/evaluation_examples/examples/libreoffice_calc/eb03d19a-b88d-4de4-8a64-ca0ac66f426b.json index d2a30ab..215ee46 100644 --- a/evaluation_examples/examples/libreoffice_calc/eb03d19a-b88d-4de4-8a64-ca0ac66f426b.json +++ b/evaluation_examples/examples/libreoffice_calc/eb03d19a-b88d-4de4-8a64-ca0ac66f426b.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json b/evaluation_examples/examples/libreoffice_calc/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json index 3ba14cf..b0afdc6 100644 --- a/evaluation_examples/examples/libreoffice_calc/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json +++ b/evaluation_examples/examples/libreoffice_calc/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/evaluation_examples/examples/libreoffice_calc/f9584479-3d0d-4c79-affa-9ad7afdd8850.json b/evaluation_examples/examples/libreoffice_calc/f9584479-3d0d-4c79-affa-9ad7afdd8850.json index b522e4d..d9ff527 100644 --- a/evaluation_examples/examples/libreoffice_calc/f9584479-3d0d-4c79-affa-9ad7afdd8850.json +++ b/evaluation_examples/examples/libreoffice_calc/f9584479-3d0d-4c79-affa-9ad7afdd8850.json @@ -50,6 +50,12 @@ "import pyautogui; pyautogui.hotkey(\"ctrl\", \"s\");" ] } + }, + { + "type": "sleep", + "parameters": { + "seconds": 0.5 + } } ], "func": "compare_table", diff --git a/main.py b/main.py index c783c00..ce7ee30 100644 --- a/main.py +++ b/main.py @@ -47,11 +47,12 @@ def human_agent(): Runs the Gym environment with human input. """ - with open("evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0-win.json", "r") as f: + with open("evaluation_examples/examples/libreoffice_calc/4f07fbe9-70de-4927-a4d5-bb28bc12c52c.json", "r") as f: example = json.load(f) - example["snapshot"] = "Snapshot 1" + example["snapshot"] = "Snapshot 30" - env = DesktopEnv( path_to_vm="~/vmware/Windows 10 x64/Windows 10 x64.vmx" + #env = DesktopEnv( path_to_vm="~/vmware/Windows 10 x64/Windows 10 x64.vmx" + env = DesktopEnv( path_to_vm="/mnt/data1/david/os-images/Ubuntu-1218/Ubuntu.vmx" , action_space="computer_13" , task_config=example )