feat: Migrate OSWorld files to HuggingFace cache with comprehensive documentation

- Add detailed README for file cache repository
- Implement migration script with retry logic and browser simulation
- Support automatic file type detection and deduplication
- Ensure reliable hosting for OSWorld evaluation files
This commit is contained in:
Timothyxxx
2025-05-28 04:29:37 +08:00
parent a845824f06
commit 34748567a5
317 changed files with 12630 additions and 12008 deletions

View File

@@ -9,7 +9,7 @@
"parameters": {
"files": [
{
"url": "https://drive.usercontent.google.com/download?id=1muvWVg44C6EtBpBQkZ6_ylg3M8r3jjOC&export=download&authuser=0&confirm=t&uuid=41354a7c-d199-4044-960e-0d146fe6f12a&at=APZUnTW3nj5RV3SBJt5tdeVxM4mM:1705553238027",
"url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b/Order_Sales_Serial#.xlsx",
"path": "/home/user/Order_Sales_Serial#.xlsx"
}
]
@@ -58,17 +58,17 @@
}
}
],
"func": "compare_table",
"expected": {
"type": "cloud_file",
"path": "https://drive.usercontent.google.com/download?id=1K37qrxab2cib1SkKPthYkb83fzaj9ETa&export=download&authuser=0&confirm=t&uuid=66b763e6-2fb1-46fc-9753-7f8533366b82&at=APZUnTU1nCKKXBwCbyI8aKpdhE5W:1705560437314",
"dest": "Order_Sales_Serial#_gold.xlsx"
},
"result": {
"type": "vm_file",
"path": "/home/user/Order_Sales_Serial#.xlsx",
"dest": "Order_Sales_Serial#.xlsx"
},
"func": "compare_table",
"expected": {
"type": "cloud_file",
"path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_calc/7efeb4b1-3d19-4762-b163-63328d66303b/Order_Sales_Serial#_gold.xlsx",
"dest": "Order_Sales_Serial#_gold.xlsx"
},
"result": {
"type": "vm_file",
"path": "/home/user/Order_Sales_Serial#.xlsx",
"dest": "Order_Sales_Serial#.xlsx"
},
"options": {
"rules": [
{
@@ -78,5 +78,5 @@
}
]
}
}
}
}
}