feat: Migrate OSWorld files to HuggingFace cache with comprehensive documentation
- Add detailed README for file cache repository - Implement migration script with retry logic and browser simulation - Support automatic file type detection and deduplication - Ensure reliable hosting for OSWorld evaluation files
This commit is contained in:
@@ -1,85 +1,85 @@
|
||||
{
|
||||
"id": "68a25bd4-59c7-4f4d-975e-da0c8509c848",
|
||||
"snapshot": "libreoffice_calc",
|
||||
"instruction": "I've compiled papers and books with links in this spreadsheet. Help me download the PDF of the first paper, save it as \"paper01.pdf\" in the /home/user directory. Additionally, I would like to know which paper in my list cites the initial one. Please determine and document the title saved as \"ans.docx\" in the same directory.",
|
||||
"source": "",
|
||||
"config": [
|
||||
{
|
||||
"type": "download",
|
||||
"parameters": {
|
||||
"files": [
|
||||
{
|
||||
"url": "https://drive.usercontent.google.com/download?id=1g2lhX7CtuT6kc2Bmss0WU5zT1eXnnbEU&export=download&authuser=0&confirm=t&uuid=37232f45-fedf-46c1-a292-f1080eb8c281&at=APZUnTV8C-zCWkPmRAc3BpiKz1uo:1709894768912",
|
||||
"path": "/home/user/Desktop/rsc-ebook-collection-2023.xlsx"
|
||||
}
|
||||
]
|
||||
}
|
||||
},
|
||||
{
|
||||
"type": "open",
|
||||
"parameters": {
|
||||
"path": "/home/user/Desktop/rsc-ebook-collection-2023.xlsx"
|
||||
}
|
||||
},
|
||||
{
|
||||
"type": "launch",
|
||||
"parameters": {
|
||||
"command": [
|
||||
"google-chrome",
|
||||
"--remote-debugging-port=1337"
|
||||
]
|
||||
}
|
||||
},
|
||||
{
|
||||
"type": "launch",
|
||||
"parameters": {
|
||||
"command": [
|
||||
"socat",
|
||||
"tcp-listen:9222,fork",
|
||||
"tcp:localhost:1337"
|
||||
]
|
||||
}
|
||||
},
|
||||
{
|
||||
"type": "activate_window",
|
||||
"parameters": {
|
||||
"window_name": "Google Chrome"
|
||||
}
|
||||
}
|
||||
],
|
||||
"trajectory": "trajectories/68a25bd4-59c7-4f4d-975e-da0c8509c848",
|
||||
"related_apps": [
|
||||
"libreoffice_calc",
|
||||
"chrome"
|
||||
],
|
||||
"evaluator": {
|
||||
"func": [
|
||||
"compare_pdfs",
|
||||
"compare_docx_files"
|
||||
],
|
||||
"expected": [
|
||||
{
|
||||
"type": "cloud_file",
|
||||
"path": "https://drive.usercontent.google.com/download?id=1kAp7ulAR_h4snny212yg1xyR1cMy3H2Q&export=download&authuser=0&confirm=t&uuid=3f6cb74c-63cc-4653-9083-00626ef2fc11&at=APZUnTWuXvVM2w1Q9h0hOsuX6thn:1709789680904",
|
||||
"dest": "paper01_Gold.pdf"
|
||||
},
|
||||
{
|
||||
"type": "cloud_file",
|
||||
"path": "https://drive.usercontent.google.com/download?id=1UMimItX51tzNXkIMGPpHOdPNF5Dx0Tpy&export=download&authuser=0&confirm=t&uuid=97b668a6-2d0d-4389-ac5e-234e931b4328&at=APZUnTVvuvbAE8r7jpK8AkzGUzyw:1709790384938",
|
||||
"dest": "ans_Gold.docx"
|
||||
}
|
||||
],
|
||||
"result": [
|
||||
{
|
||||
"type": "vm_file",
|
||||
"path": "/home/user/paper01.pdf",
|
||||
"dest": "paper01.pdf"
|
||||
},
|
||||
{
|
||||
"type": "vm_file",
|
||||
"path": "/home/user/ans.docx",
|
||||
"dest": "ans.docx"
|
||||
}
|
||||
"id": "68a25bd4-59c7-4f4d-975e-da0c8509c848",
|
||||
"snapshot": "libreoffice_calc",
|
||||
"instruction": "I've compiled papers and books with links in this spreadsheet. Help me download the PDF of the first paper, save it as \"paper01.pdf\" in the /home/user directory. Additionally, I would like to know which paper in my list cites the initial one. Please determine and document the title saved as \"ans.docx\" in the same directory.",
|
||||
"source": "",
|
||||
"config": [
|
||||
{
|
||||
"type": "download",
|
||||
"parameters": {
|
||||
"files": [
|
||||
{
|
||||
"url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/68a25bd4-59c7-4f4d-975e-da0c8509c848/rsc-ebook-collection-2023.xlsx",
|
||||
"path": "/home/user/Desktop/rsc-ebook-collection-2023.xlsx"
|
||||
}
|
||||
]
|
||||
}
|
||||
},
|
||||
{
|
||||
"type": "open",
|
||||
"parameters": {
|
||||
"path": "/home/user/Desktop/rsc-ebook-collection-2023.xlsx"
|
||||
}
|
||||
},
|
||||
{
|
||||
"type": "launch",
|
||||
"parameters": {
|
||||
"command": [
|
||||
"google-chrome",
|
||||
"--remote-debugging-port=1337"
|
||||
]
|
||||
}
|
||||
},
|
||||
{
|
||||
"type": "launch",
|
||||
"parameters": {
|
||||
"command": [
|
||||
"socat",
|
||||
"tcp-listen:9222,fork",
|
||||
"tcp:localhost:1337"
|
||||
]
|
||||
}
|
||||
},
|
||||
{
|
||||
"type": "activate_window",
|
||||
"parameters": {
|
||||
"window_name": "Google Chrome"
|
||||
}
|
||||
}
|
||||
],
|
||||
"trajectory": "trajectories/68a25bd4-59c7-4f4d-975e-da0c8509c848",
|
||||
"related_apps": [
|
||||
"libreoffice_calc",
|
||||
"chrome"
|
||||
],
|
||||
"evaluator": {
|
||||
"func": [
|
||||
"compare_pdfs",
|
||||
"compare_docx_files"
|
||||
],
|
||||
"expected": [
|
||||
{
|
||||
"type": "cloud_file",
|
||||
"path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/68a25bd4-59c7-4f4d-975e-da0c8509c848/paper01.pdf",
|
||||
"dest": "paper01_Gold.pdf"
|
||||
},
|
||||
{
|
||||
"type": "cloud_file",
|
||||
"path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/multi_apps/68a25bd4-59c7-4f4d-975e-da0c8509c848/ans.docx",
|
||||
"dest": "ans_Gold.docx"
|
||||
}
|
||||
],
|
||||
"result": [
|
||||
{
|
||||
"type": "vm_file",
|
||||
"path": "/home/user/paper01.pdf",
|
||||
"dest": "paper01.pdf"
|
||||
},
|
||||
{
|
||||
"type": "vm_file",
|
||||
"path": "/home/user/ans.docx",
|
||||
"dest": "ans.docx"
|
||||
}
|
||||
]
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user