From 1ff9f5c38b3663739733e21dbf6f5b1baa7d7da4 Mon Sep 17 00:00:00 2001 From: David Chang Date: Mon, 26 Feb 2024 20:50:08 +0800 Subject: [PATCH 1/3] ver Feb26th statistics of action types of exp_som branch --- action_type_analysis.py | 22 ++++++++++++++++++++++ 1 file changed, 22 insertions(+) create mode 100644 action_type_analysis.py diff --git a/action_type_analysis.py b/action_type_analysis.py new file mode 100644 index 0000000..750ef9b --- /dev/null +++ b/action_type_analysis.py @@ -0,0 +1,22 @@ +import json +import glob + +from typing import Dict, Counter +from typing import Any + +import collections + +action_counter: Counter[str] = collections.Counter() +for trjctr in glob.glob("snapshots/exp_som/exp_trajectory/**/*.json", recursive=True): + with open(trjctr) as f: + for l in f: + step: Dict[str, Any] = json.loads(l) + #print(step) + for rsp in step.get("action", "").splitlines(): + if rsp.startswith("pyautogui."): + action_counter[rsp[10:rsp.find("(")]] += 1 + elif rsp in {"WAIT", "FAIL", "DONE"}: + action_counter[rsp] += 1 + +for k, nb in sorted(action_counter.items(), key=(lambda itm: itm[1]), reverse=True): + print(k, nb) From 1ed763591b6579ecd8c6025dbba4fbe37614ac73 Mon Sep 17 00:00:00 2001 From: David Chang Date: Mon, 26 Feb 2024 23:19:17 +0800 Subject: [PATCH 2/3] ver Feb26thv2 updated two new chrome tasks --- .../chrome/82bc8d6a-36eb-4d2d-8801-ef714fb1e55a.json | 7 +++---- .../chrome/da46d875-6b82-4681-9284-653b0c7ae241.json | 9 ++++----- 2 files changed, 7 insertions(+), 9 deletions(-) diff --git a/evaluation_examples/examples/chrome/82bc8d6a-36eb-4d2d-8801-ef714fb1e55a.json b/evaluation_examples/examples/chrome/82bc8d6a-36eb-4d2d-8801-ef714fb1e55a.json index f6c7a68..eaf66d7 100644 --- a/evaluation_examples/examples/chrome/82bc8d6a-36eb-4d2d-8801-ef714fb1e55a.json +++ b/evaluation_examples/examples/chrome/82bc8d6a-36eb-4d2d-8801-ef714fb1e55a.json @@ -1,7 +1,7 @@ { "id": "82bc8d6a-36eb-4d2d-8801-ef714fb1e55a", "snapshot": "chrome", - "instruction": 
"On April 21, look up a flight from Mumbai to Stockholm.", + "instruction": "On next Monday, look up a flight from Mumbai to Stockholm.", "source": "test_task_1", "config": [ { @@ -61,10 +61,9 @@ "expected": { "fromStation": "BOM", "toStation": "STO", - "time": "{Year}-{Month0D}-{DayD}" + "time": "{Year}-{Month0D}-{Day0D}" } } } } - } - \ No newline at end of file +} diff --git a/evaluation_examples/examples/chrome/da46d875-6b82-4681-9284-653b0c7ae241.json b/evaluation_examples/examples/chrome/da46d875-6b82-4681-9284-653b0c7ae241.json index a458935..0abaac7 100644 --- a/evaluation_examples/examples/chrome/da46d875-6b82-4681-9284-653b0c7ae241.json +++ b/evaluation_examples/examples/chrome/da46d875-6b82-4681-9284-653b0c7ae241.json @@ -1,7 +1,7 @@ { "id": "da46d875-6b82-4681-9284-653b0c7ae241", "snapshot": "chrome", - "instruction": "Schedule an appointment to apply for transportation access pass in the Charlie Card store on the first Monday four months later, 10:15 am, fill in my details (James Smith, james.smith@gmail.com), and book.", + "instruction": "Schedule an appointment to apply for transportation access pass in the Charlie Card store on the first Monday four months later, 10:15 am, fill in my details (James Smith, james.smith@gmail.com). And do not click \"book\" directly. 
Let me review it.", "source": "test_task_2", "config": [ { @@ -58,7 +58,7 @@ "1": "content", "2": "time" } - } + } }, { "type": "active_tab_html_parse", @@ -74,7 +74,7 @@ "type": "rule", "rules":{ "expected": ["CharlieCardStoreAppointments@mbta.com\/bookings\/"] - } + } }, { "type": "rule_relativeTime", @@ -99,5 +99,4 @@ } ] } - } - \ No newline at end of file +} From 88cb9363abc29dc3211dce97d4ec87dfc2ef523f Mon Sep 17 00:00:00 2001 From: BlankCheng <913501223@qq.com> Date: Tue, 27 Feb 2024 14:00:16 +0800 Subject: [PATCH 3/3] gimp update infeasible --- .../045bf3ff-9077-4b86-b483-a1040a949cff.json | 39 ++++++++++++++++ .../2e6f678f-472d-4c55-99cc-8e7c5c402a71.json | 46 +++++++++++++++++++ .../58d3eeeb-e9d0-499f-962e-fd0db2a744d8.json | 39 ++++++++++++++++ .../8ea73f6f-9689-42ad-8c60-195bbf06a7ba.json | 39 ++++++++++++++++ .../dbbf4b99-2253-4b10-9274-45f246af2466.json | 39 ++++++++++++++++ 5 files changed, 202 insertions(+) create mode 100644 evaluation_examples/examples/gimp/045bf3ff-9077-4b86-b483-a1040a949cff.json create mode 100644 evaluation_examples/examples/gimp/2e6f678f-472d-4c55-99cc-8e7c5c402a71.json create mode 100644 evaluation_examples/examples/gimp/58d3eeeb-e9d0-499f-962e-fd0db2a744d8.json create mode 100644 evaluation_examples/examples/gimp/8ea73f6f-9689-42ad-8c60-195bbf06a7ba.json create mode 100644 evaluation_examples/examples/gimp/dbbf4b99-2253-4b10-9274-45f246af2466.json diff --git a/evaluation_examples/examples/gimp/045bf3ff-9077-4b86-b483-a1040a949cff.json b/evaluation_examples/examples/gimp/045bf3ff-9077-4b86-b483-a1040a949cff.json new file mode 100644 index 0000000..54e5534 --- /dev/null +++ b/evaluation_examples/examples/gimp/045bf3ff-9077-4b86-b483-a1040a949cff.json @@ -0,0 +1,39 @@ +{ + "id": "045bf3ff-9077-4b86-b483-a1040a949cff", + "snapshot": "gimp", + "instruction": "Could you turn my image into CMYK mode?", + "source": "https://www.makeuseof.com/tag/can-photoshop-gimp-cant/", + "config": [ + { + "type": "download", + "parameters": { + 
"files": [ + { + "url": "https://drive.google.com/uc?export=download&id=1YnUq4q9rv7pr1MZPdaD2mVFZRrsgISmn", + "path": "/home/user/Desktop/gate.jpeg" + } + ] + } + }, + { + "type": "launch", + "parameters": { + "command": [ + "gimp", + "/home/user/Desktop/gate.jpeg" + ] + } + } + ], + "trajectory": "trajectories/", + "related_apps": [ + "gimp" + ], + "evaluator": { + "func": "infeasible", + "expected": { + }, + "result": { + } + } +} \ No newline at end of file diff --git a/evaluation_examples/examples/gimp/2e6f678f-472d-4c55-99cc-8e7c5c402a71.json b/evaluation_examples/examples/gimp/2e6f678f-472d-4c55-99cc-8e7c5c402a71.json new file mode 100644 index 0000000..6f7b55e --- /dev/null +++ b/evaluation_examples/examples/gimp/2e6f678f-472d-4c55-99cc-8e7c5c402a71.json @@ -0,0 +1,46 @@ +{ + "id": "2e6f678f-472d-4c55-99cc-8e7c5c402a71", + "snapshot": "gimp", + "instruction": "Please batch process the images on the desktop by lifting the brightness to 50.", + "source": "", + "config": [ + { + "type": "download", + "parameters": { + "files": [ + { + "url": "https://drive.google.com/uc?export=download&id=1uOZWtT9E8YW_IOu51meW5a0jAgwS1DoX", + "path": "/home/user/Desktop/squirrel.jpeg" + }, + { + "url": "https://drive.google.com/uc?export=download&id=1KCyoqh3bTsbY42r9YSqIvcGuUr6i95GU", + "path": "/home/user/Desktop/panda.jpeg" + }, + { + "url": "https://drive.google.com/uc?export=download&id=1xftsr0mRUvqKGPCHOnzUMm7tMnuqdhAA", + "path": "/home/user/Desktop/heron.jpeg" + } + ] + } + }, + { + "type": "launch", + "parameters": { + "command": [ + "gimp" + ] + } + } + ], + "trajectory": "trajectories/", + "related_apps": [ + "gimp" + ], + "evaluator": { + "func": "infeasible", + "expected": { + }, + "result": { + } + } +} \ No newline at end of file diff --git a/evaluation_examples/examples/gimp/58d3eeeb-e9d0-499f-962e-fd0db2a744d8.json b/evaluation_examples/examples/gimp/58d3eeeb-e9d0-499f-962e-fd0db2a744d8.json new file mode 100644 index 0000000..5fe5537 --- /dev/null +++ 
b/evaluation_examples/examples/gimp/58d3eeeb-e9d0-499f-962e-fd0db2a744d8.json @@ -0,0 +1,39 @@ +{ + "id": "58d3eeeb-e9d0-499f-962e-fd0db2a744d8", + "snapshot": "gimp", + "instruction": "Please describe what is happening in the image.", + "source": "", + "config": [ + { + "type": "download", + "parameters": { + "files": [ + { + "url": "https://drive.google.com/uc?export=download&id=1w9R8RYkbFl88n8_Vgk_zZeD5J4t4yrzC", + "path": "/home/user/Desktop/heron.jpeg" + } + ] + } + }, + { + "type": "launch", + "parameters": { + "command": [ + "gimp", + "/home/user/Desktop/heron.jpeg" + ] + } + } + ], + "trajectory": "trajectories/", + "related_apps": [ + "gimp" + ], + "evaluator": { + "func": "infeasible", + "expected": { + }, + "result": { + } + } +} \ No newline at end of file diff --git a/evaluation_examples/examples/gimp/8ea73f6f-9689-42ad-8c60-195bbf06a7ba.json b/evaluation_examples/examples/gimp/8ea73f6f-9689-42ad-8c60-195bbf06a7ba.json new file mode 100644 index 0000000..a19c2a5 --- /dev/null +++ b/evaluation_examples/examples/gimp/8ea73f6f-9689-42ad-8c60-195bbf06a7ba.json @@ -0,0 +1,39 @@ +{ + "id": "8ea73f6f-9689-42ad-8c60-195bbf06a7ba", + "snapshot": "gimp", + "instruction": "Can you enhance this low-resolution photo to high-resolution without increasing the file size?", + "source": "", + "config": [ + { + "type": "download", + "parameters": { + "files": [ + { + "url": "https://drive.google.com/uc?export=download&id=14r8Y0Cq8yTtQ5kfqhwWij5ow3LWApy2n", + "path": "/home/user/Desktop/low_resolution.jpeg" + } + ] + } + }, + { + "type": "launch", + "parameters": { + "command": [ + "gimp", + "/home/user/Desktop/low_resolution.jpeg" + ] + } + } + ], + "trajectory": "trajectories/", + "related_apps": [ + "gimp" + ], + "evaluator": { + "func": "infeasible", + "expected": { + }, + "result": { + } + } +} \ No newline at end of file diff --git a/evaluation_examples/examples/gimp/dbbf4b99-2253-4b10-9274-45f246af2466.json 
b/evaluation_examples/examples/gimp/dbbf4b99-2253-4b10-9274-45f246af2466.json new file mode 100644 index 0000000..f9087f3 --- /dev/null +++ b/evaluation_examples/examples/gimp/dbbf4b99-2253-4b10-9274-45f246af2466.json @@ -0,0 +1,39 @@ +{ + "id": "dbbf4b99-2253-4b10-9274-45f246af2466", + "snapshot": "gimp", + "instruction": "Convert my new raw image into jpeg.", + "source": "https://www.makeuseof.com/tag/can-photoshop-gimp-cant/", + "config": [ + { + "type": "download", + "parameters": { + "files": [ + { + "url": "https://drive.google.com/uc?export=download&id=1zcxzbQ5dp-mgpu0mom-LB8BKJH-V01Kr", + "path": "/home/user/Desktop/yicun.raw" + } + ] + } + }, + { + "type": "launch", + "parameters": { + "command": [ + "gimp", + "/home/user/Desktop/yicun.raw" + ] + } + } + ], + "trajectory": "trajectories/", + "related_apps": [ + "gimp" + ], + "evaluator": { + "func": "infeasible", + "expected": { + }, + "result": { + } + } +} \ No newline at end of file