feat: Migrate OSWorld files to HuggingFace cache with comprehensive documentation

- Add detailed README for file cache repository
- Implement migration script with retry logic and browser simulation
- Support automatic file type detection and deduplication
- Ensure reliable hosting for OSWorld evaluation files
This commit is contained in:
Timothyxxx
2025-05-28 04:29:37 +08:00
parent a845824f06
commit 34748567a5
317 changed files with 12630 additions and 12008 deletions

View File

@@ -4,29 +4,29 @@
"instruction": "Remove the adundant whitespaces and canonicalize the letter cases by capitalizing the first letter of each words and leave other letters as lower case.",
"source": "https://www.youtube.com/shorts/A0gmEBRKXWs",
"config": [
{
"type": "download",
"parameters": {
"files": [
{
"url": "https://drive.usercontent.google.com/download?id=1PGJxDM5QglZFdLd7yLQnA2MASf2so14S&export=download&authuser=0&confirm=t&uuid=725f7d90-1e30-4579-b946-7c8932aac440&at=APZUnTUpha_2nl3sAOmM1AeCCir_:1705561280883",
"path": "/home/user/Movie_title_garbage_clean.xlsx"
}
]
}
},
{
"type": "open",
"parameters": {
"path": "/home/user/Movie_title_garbage_clean.xlsx"
}
}
],
{
"type": "download",
"parameters": {
"files": [
{
"url": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_calc/a9f325aa-8c05-4e4f-8341-9e4358565f4f/Movie_titles_garbage_clean.xlsx",
"path": "/home/user/Movie_title_garbage_clean.xlsx"
}
]
}
},
{
"type": "open",
"parameters": {
"path": "/home/user/Movie_title_garbage_clean.xlsx"
}
}
],
"trajectory": "trajectories/a9f325aa-8c05-4e4f-8341-9e4358565f4f",
"related_apps": [
"libreoffice calc"
],
"evaluator": {
"evaluator": {
"postconfig": [
{
"type": "activate_window",
@@ -58,17 +58,17 @@
}
}
],
"func": "compare_table",
"expected": {
"type": "cloud_file",
"path": "https://drive.usercontent.google.com/download?id=1hrmRQig53UW069MEN_V23xJXFrIooylm&export=download&authuser=0&confirm=t&uuid=82a01881-c72c-4463-b258-c8c66f8d72af&at=APZUnTVZVuQj91twmMdH1plMcABA:1705561377705",
"dest": "Movie_title_garbage_clean_gold.xlsx"
},
"result": {
"type": "vm_file",
"path": "/home/user/Movie_title_garbage_clean.xlsx",
"dest": "Movie_title_garbage_clean.xlsx"
},
"func": "compare_table",
"expected": {
"type": "cloud_file",
"path": "https://huggingface.co/datasets/xlangai/ubuntu_osworld_file_cache/resolve/main/libreoffice_calc/a9f325aa-8c05-4e4f-8341-9e4358565f4f/Movie_titles_garbage_clean_gold.xlsx",
"dest": "Movie_title_garbage_clean_gold.xlsx"
},
"result": {
"type": "vm_file",
"path": "/home/user/Movie_title_garbage_clean.xlsx",
"dest": "Movie_title_garbage_clean.xlsx"
},
"options": {
"rules": [
{
@@ -78,5 +78,5 @@
}
]
}
}
}
}
}