From afd5952e4429f1f0ac8e639c130605ef6b1010f0 Mon Sep 17 00:00:00 2001 From: Danyang Zhang Date: Sat, 4 Oct 2025 00:13:29 +0800 Subject: [PATCH] ver Oct3rd (#349) updated a series of instructions to ask the agent not to do any unnecessary actions. --- .../01b269ae-2111-4a07-81fd-3fcd711993b0.json | 2 +- .../0bf05a7d-b28b-44d2-955a-50b41e24012a.json | 2 +- .../357ef137-7eeb-4c80-a3bb-0951f26a8aff.json | 4 ++-- .../37608790-6147-45d0-9f20-1137bb35703d.json | 4 ++-- .../4e6fcf72-daf3-439f-a232-c434ce416af6.json | 4 ++-- .../4f07fbe9-70de-4927-a4d5-bb28bc12c52c.json | 4 ++-- .../6054afcb-5bab-4702-90a0-b259b5d3217c.json | 4 ++-- .../7a4e4bc8-922c-4c84-865c-25ba34136be1.json | 4 ++-- .../7efeb4b1-3d19-4762-b163-63328d66303b.json | 4 ++-- .../8b1ce5f2-59d2-4dcc-b0b0-666a714b9a14.json | 4 ++-- .../a9f325aa-8c05-4e4f-8341-9e4358565f4f.json | 4 ++-- .../abed40dc-063f-4598-8ba5-9fe749c0615d.json | 2 +- .../d681960f-7bc3-4286-9913-a8812ba3261a.json | 4 ++-- .../ecb0df7a-4e8d-4a03-b162-053391d3afaf.json | 2 +- 14 files changed, 24 insertions(+), 24 deletions(-) diff --git a/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0.json b/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0.json index b68f9a6..ac7de50 100644 --- a/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0.json +++ b/evaluation_examples/examples/libreoffice_calc/01b269ae-2111-4a07-81fd-3fcd711993b0.json @@ -1,7 +1,7 @@ { "id": "01b269ae-2111-4a07-81fd-3fcd711993b0", "snapshot": "libreoffice_calc", - "instruction": "Fill all the blank cells in B1:E30 with the value in the cell above it.", + "instruction": "Fill all the blank cells in B1:E30 with the value in the cell above it. Finish the work and don't touch irrelevant regions, even if they are blank.", "source": "https://www.youtube.com/shorts/VrUzPTIwQ04", "config": [ { diff --git a/evaluation_examples/examples/libreoffice_calc/0bf05a7d-b28b-44d2-955a-50b41e24012a.json b/evaluation_examples/examples/libreoffice_calc/0bf05a7d-b28b-44d2-955a-50b41e24012a.json index 73e3b8f..31027ad 100644 --- a/evaluation_examples/examples/libreoffice_calc/0bf05a7d-b28b-44d2-955a-50b41e24012a.json +++ b/evaluation_examples/examples/libreoffice_calc/0bf05a7d-b28b-44d2-955a-50b41e24012a.json @@ -1,7 +1,7 @@ { "id": "0bf05a7d-b28b-44d2-955a-50b41e24012a", "snapshot": "libreoffice_calc", - "instruction": "I would like to copy all the numbers in the 'Old ID' column to the 'New 7 Digit Id' column, and pad them with zeros in front, to fill them up to seven digits.", + "instruction": "I would like to copy all the numbers in the 'Old ID' column to the 'New 7 Digit Id' column, and pad them with zeros in front, to fill them up to seven digits. Finish the work and don't touch irrelevant regions, even if they are blank.", "source": "https://www.youtube.com/shorts/FPAQaDTS8VY", "config": [ { diff --git a/evaluation_examples/examples/libreoffice_calc/357ef137-7eeb-4c80-a3bb-0951f26a8aff.json b/evaluation_examples/examples/libreoffice_calc/357ef137-7eeb-4c80-a3bb-0951f26a8aff.json index e731867..a9263a2 100644 --- a/evaluation_examples/examples/libreoffice_calc/357ef137-7eeb-4c80-a3bb-0951f26a8aff.json +++ b/evaluation_examples/examples/libreoffice_calc/357ef137-7eeb-4c80-a3bb-0951f26a8aff.json @@ -1,7 +1,7 @@ { "id": "357ef137-7eeb-4c80-a3bb-0951f26a8aff", "snapshot": "libreoffice_calc", - "instruction": "I have calculated the total work hours from the everday hours. And I have an hourly rate. Now I want to multiply the total hours with the hourly rate to get a total earned amount. However, I can't get a correct answer by directly multiply the two cells. Here the \"total hours\" is of time and \"hourly rate\" is just a number. How can I get the correct product of them?", + "instruction": "I have calculated the total work hours from the everday hours. And I have an hourly rate. Now I want to multiply the total hours with the hourly rate to get a total earned amount. However, I can't get a correct answer by directly multiply the two cells. Here the \"total hours\" is of time and \"hourly rate\" is just a number. How can I get the correct product of them? Help me fill in the cell the correct answer. Don't touch irrelevant blank regions.", "source": "https://www.reddit.com/r/excel/comments/17zny8u/calculating_total_amount_earned_from_total_hours/", "config": [ { @@ -83,4 +83,4 @@ "proxy": false, "fixed_ip": false, "possibility_of_env_change": "low" -} \ No newline at end of file +} diff --git a/evaluation_examples/examples/libreoffice_calc/37608790-6147-45d0-9f20-1137bb35703d.json b/evaluation_examples/examples/libreoffice_calc/37608790-6147-45d0-9f20-1137bb35703d.json index 784a098..326b1e4 100644 --- a/evaluation_examples/examples/libreoffice_calc/37608790-6147-45d0-9f20-1137bb35703d.json +++ b/evaluation_examples/examples/libreoffice_calc/37608790-6147-45d0-9f20-1137bb35703d.json @@ -1,7 +1,7 @@ { "id": "37608790-6147-45d0-9f20-1137bb35703d", "snapshot": "libreoffice_calc", - "instruction": "The information are mixed in one field. Help me split them and fill in the columns of First Name, Last Name and Rank", + "instruction": "The information are mixed in one field. Help me split them and fill in the columns of First Name, Last Name and Rank. Finish the work and don't touch the original data.", "source": "https://www.youtube.com/shorts/uzPo_CPCHH8", "config": [ { @@ -82,4 +82,4 @@ "proxy": false, "fixed_ip": false, "possibility_of_env_change": "low" -} \ No newline at end of file +} diff --git a/evaluation_examples/examples/libreoffice_calc/4e6fcf72-daf3-439f-a232-c434ce416af6.json b/evaluation_examples/examples/libreoffice_calc/4e6fcf72-daf3-439f-a232-c434ce416af6.json index 47c7fec..bc14383 100644 --- a/evaluation_examples/examples/libreoffice_calc/4e6fcf72-daf3-439f-a232-c434ce416af6.json +++ b/evaluation_examples/examples/libreoffice_calc/4e6fcf72-daf3-439f-a232-c434ce416af6.json @@ -1,7 +1,7 @@ { "id": "4e6fcf72-daf3-439f-a232-c434ce416af6", "snapshot": "libreoffice_calc", - "instruction": "Please calculate the ages of the employees according to their birthday.", + "instruction": "Please calculate the ages of the employees according to their birthday. Finish the work and don't touch irrelevant regions, even if they are blank.", "source": "https://www.youtube.com/shorts/0uxJccNCKcE", "config": [ { @@ -134,4 +134,4 @@ "proxy": false, "fixed_ip": false, "possibility_of_env_change": "low" -} \ No newline at end of file +} diff --git a/evaluation_examples/examples/libreoffice_calc/4f07fbe9-70de-4927-a4d5-bb28bc12c52c.json b/evaluation_examples/examples/libreoffice_calc/4f07fbe9-70de-4927-a4d5-bb28bc12c52c.json index 0e3305d..07f4fe9 100644 --- a/evaluation_examples/examples/libreoffice_calc/4f07fbe9-70de-4927-a4d5-bb28bc12c52c.json +++ b/evaluation_examples/examples/libreoffice_calc/4f07fbe9-70de-4927-a4d5-bb28bc12c52c.json @@ -1,7 +1,7 @@ { "id": "4f07fbe9-70de-4927-a4d5-bb28bc12c52c", "snapshot": "libreoffice_calc", - "instruction": "Here I want to use the numerical value from a cell in the text. I can set its number of decimal digits to 2 in the original value cell but don't know how to fix it in the text as well. Please help me to do this.", + "instruction": "Here I want to use the numerical value from a cell in the text. I can set its number of decimal digits to 2 in the original value cell but don't know how to fix it in the text as well. Please help me to do this. Finish the work and don't touch irrelevant regions, even if they are blank.", "source": "https://superuser.com/questions/1081048/libreoffice-calc-how-to-pad-number-to-fixed-decimals-when-used-within-formula", "config": [ { @@ -115,4 +115,4 @@ "proxy": false, "fixed_ip": false, "possibility_of_env_change": "low" -} \ No newline at end of file +} diff --git a/evaluation_examples/examples/libreoffice_calc/6054afcb-5bab-4702-90a0-b259b5d3217c.json b/evaluation_examples/examples/libreoffice_calc/6054afcb-5bab-4702-90a0-b259b5d3217c.json index a4523f1..e8212ce 100644 --- a/evaluation_examples/examples/libreoffice_calc/6054afcb-5bab-4702-90a0-b259b5d3217c.json +++ b/evaluation_examples/examples/libreoffice_calc/6054afcb-5bab-4702-90a0-b259b5d3217c.json @@ -1,7 +1,7 @@ { "id": "6054afcb-5bab-4702-90a0-b259b5d3217c", "snapshot": "libreoffice_calc", - "instruction": "Some data are missed by now and are filled by 'N/A' temporarily. Please hide them in the table for now. Do not delete them and filter is no needed.", + "instruction": "Some data are missed by now and are filled by 'N/A' temporarily. Please hide them in the table for now. Do not delete any cells and filter is not needed.", "source": "https://www.youtube.com/shorts/JTbZ8sRxkdU", "config": [ { @@ -90,4 +90,4 @@ "proxy": false, "fixed_ip": false, "possibility_of_env_change": "low" -} \ No newline at end of file +} diff --git a/evaluation_examples/examples/libreoffice_calc/7a4e4bc8-922c-4c84-865c-25ba34136be1.json b/evaluation_examples/examples/libreoffice_calc/7a4e4bc8-922c-4c84-865c-25ba34136be1.json index 9c5637b..bfed08f 100644 --- a/evaluation_examples/examples/libreoffice_calc/7a4e4bc8-922c-4c84-865c-25ba34136be1.json +++ b/evaluation_examples/examples/libreoffice_calc/7a4e4bc8-922c-4c84-865c-25ba34136be1.json @@ -1,7 +1,7 @@ { "id": "7a4e4bc8-922c-4c84-865c-25ba34136be1", "snapshot": "libreoffice_calc", - "instruction": "Reorder the columns to be \"Date\", \"First Name\", \"Last Name\", \"Order ID\", \"Sales\"", + "instruction": "Reorder the columns to be \"Date\", \"First Name\", \"Last Name\", \"Order ID\", \"Sales\". Finish the work and don't touch irrelevant regions, even if they are blank.", "source": "https://www.youtube.com/shorts/bvUhr1AHs44", "config": [ { @@ -82,4 +82,4 @@ "proxy": false, "fixed_ip": false, "possibility_of_env_change": "low" -} \ No newline at end of file +} diff --git a/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json b/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json index b7a2ecf..49d6559 100644 --- a/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json +++ b/evaluation_examples/examples/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b.json @@ -1,7 +1,7 @@ { "id": "7efeb4b1-3d19-4762-b163-63328d66303b", "snapshot": "libreoffice_calc", - "instruction": "Fill the Sequence Numbers as \"No. #\" in the \"Seq No.\" column", + "instruction": "Fill the Sequence Numbers as \"No. #\" in the \"Seq No.\" column. Finish the work and don't touch irrelevant regions, even if they are blank.", "source": "https://www.youtube.com/shorts/4jzXfZNhfmk", "config": [ { @@ -82,4 +82,4 @@ "proxy": false, "fixed_ip": false, "possibility_of_env_change": "low" -} \ No newline at end of file +} diff --git a/evaluation_examples/examples/libreoffice_calc/8b1ce5f2-59d2-4dcc-b0b0-666a714b9a14.json b/evaluation_examples/examples/libreoffice_calc/8b1ce5f2-59d2-4dcc-b0b0-666a714b9a14.json index 107d478..e0677b6 100644 --- a/evaluation_examples/examples/libreoffice_calc/8b1ce5f2-59d2-4dcc-b0b0-666a714b9a14.json +++ b/evaluation_examples/examples/libreoffice_calc/8b1ce5f2-59d2-4dcc-b0b0-666a714b9a14.json @@ -1,7 +1,7 @@ { "id": "8b1ce5f2-59d2-4dcc-b0b0-666a714b9a14", "snapshot": "libreoffice_calc", - "instruction": "Given a partial calendar, please highlight all the weekends (Satureday & Sunday) by setting the cell background as red (#ff0000).", + "instruction": "Given a partial calendar, please highlight all the weekends (Satureday & Sunday) by setting the cell background as red (#ff0000). Finish the work and don't touch irrelevant regions, even if they are blank.", "source": "https://www.youtube.com/shorts/Hbcwu6IQ1ns", "config": [ { @@ -90,4 +90,4 @@ "proxy": false, "fixed_ip": false, "possibility_of_env_change": "low" -} \ No newline at end of file +} diff --git a/evaluation_examples/examples/libreoffice_calc/a9f325aa-8c05-4e4f-8341-9e4358565f4f.json b/evaluation_examples/examples/libreoffice_calc/a9f325aa-8c05-4e4f-8341-9e4358565f4f.json index 93625fb..7bef426 100644 --- a/evaluation_examples/examples/libreoffice_calc/a9f325aa-8c05-4e4f-8341-9e4358565f4f.json +++ b/evaluation_examples/examples/libreoffice_calc/a9f325aa-8c05-4e4f-8341-9e4358565f4f.json @@ -1,7 +1,7 @@ { "id": "a9f325aa-8c05-4e4f-8341-9e4358565f4f", "snapshot": "libreoffice_calc", - "instruction": "I want to copy the movie titles in 'Garbage Movie Titles' column to the 'Clean Movie Titles' column. But please remove the adundant whitespaces and canonicalize the letter cases by capitalizing the first letter of each words and leave other letters as lower case.", + "instruction": "I want to copy the movie titles in 'Garbage Movie Titles' column to the 'Clean Movie Titles' column. But please remove the adundant whitespaces and canonicalize the letter cases by capitalizing the first letter of each words and leave other letters as lower case. Finish the work and don't touch irrelevant regions, even if they are blank.", "source": "https://www.youtube.com/shorts/A0gmEBRKXWs", "config": [ { @@ -82,4 +82,4 @@ "proxy": false, "fixed_ip": false, "possibility_of_env_change": "low" -} \ No newline at end of file +} diff --git a/evaluation_examples/examples/libreoffice_calc/abed40dc-063f-4598-8ba5-9fe749c0615d.json b/evaluation_examples/examples/libreoffice_calc/abed40dc-063f-4598-8ba5-9fe749c0615d.json index 58b1637..d75a527 100644 --- a/evaluation_examples/examples/libreoffice_calc/abed40dc-063f-4598-8ba5-9fe749c0615d.json +++ b/evaluation_examples/examples/libreoffice_calc/abed40dc-063f-4598-8ba5-9fe749c0615d.json @@ -1,7 +1,7 @@ { "id": "abed40dc-063f-4598-8ba5-9fe749c0615d", "snapshot": "libreoffice_calc", - "instruction": "Check the names in column \"Names with duplicates\" and put the unique ones in column \"Unique Names\". Keep the original order of the first occurrences.", + "instruction": "Check the names in column \"Names with duplicates\" and put the unique ones in column \"Unique Names\". Keep the original order of the first occurrences. Finish the work and don't touch irrelevant regions, even if they are blank.", "source": "https://help.libreoffice.org/7.6/ro/text/scalc/guide/remove_duplicates.html?&DbPAR=SHARED&System=UNIX", "config": [ { diff --git a/evaluation_examples/examples/libreoffice_calc/d681960f-7bc3-4286-9913-a8812ba3261a.json b/evaluation_examples/examples/libreoffice_calc/d681960f-7bc3-4286-9913-a8812ba3261a.json index b0e74cb..813bb82 100644 --- a/evaluation_examples/examples/libreoffice_calc/d681960f-7bc3-4286-9913-a8812ba3261a.json +++ b/evaluation_examples/examples/libreoffice_calc/d681960f-7bc3-4286-9913-a8812ba3261a.json @@ -1,7 +1,7 @@ { "id": "d681960f-7bc3-4286-9913-a8812ba3261a", "snapshot": "libreoffice_calc", - "instruction": "According to the scale table shown above, calculate and give each student a grade in the table below", + "instruction": "According to the scale table shown above, calculate and give each student a grade in the table below. Finish the work and don't touch irrelevant regions, even if they are blank.", "source": "https://www.youtube.com/shorts/d7U1S_IsTVM", "config": [ { @@ -82,4 +82,4 @@ "proxy": false, "fixed_ip": false, "possibility_of_env_change": "low" -} \ No newline at end of file +} diff --git a/evaluation_examples/examples/libreoffice_calc/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json b/evaluation_examples/examples/libreoffice_calc/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json index b254536..240f503 100644 --- a/evaluation_examples/examples/libreoffice_calc/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json +++ b/evaluation_examples/examples/libreoffice_calc/ecb0df7a-4e8d-4a03-b162-053391d3afaf.json @@ -1,7 +1,7 @@ { "id": "ecb0df7a-4e8d-4a03-b162-053391d3afaf", "snapshot": "libreoffice_calc", - "instruction": "In the column \"Pass/Fail/Held\", one from the texts \"Pass\", \"Fail\", and \"Held\" should be filled. For convinience, enable data validation for the cells in this column so that the texts to fill can be directly selected from a drop down list.", + "instruction": "In the column \"Pass/Fail/Held\", one from the texts \"Pass\", \"Fail\", and \"Held\" should be filled. For convinience, enable data validation for the cells in this column so that the texts to fill can be directly selected from a drop down list. Finish the work and don't touch irrelevant regions, even if they are blank.", "source": "https://www.youtube.com/shorts/tXOovKn0H68", "config": [ {