feat: 新增科研软件 benchmark 任务数据

- 新增 avogadro/imagej/jade/origin/ovito/pymol/vesta 等科研软件任务 JSON
- 修改 vllm_eval.py,修改图片文件名称为第x步
- desktop_env.py 添加额外数据参数 config 和 metadata
This commit is contained in:
2026-02-25 15:19:36 +08:00
parent 613f55f0da
commit 9899d4a0c7
85 changed files with 4703 additions and 71 deletions

View File

@@ -389,6 +389,314 @@
"971cbb5b-3cbf-4ff7-9e24-b5c84fcebfa6"
],
"jade": [
"MDIJade6.5使用手册_task1",
"MDIJade6.5使用手册_task10",
"MDIJade6.5使用手册_task2",
"MDIJade6.5使用手册_task3",
"MDIJade6.5使用手册_task4",
"MDIJade6.5使用手册_task5",
"MDIJade6.5使用手册_task6",
"MDIJade6.5使用手册_task7",
"MDIJade6.5使用手册_task8",
"MDIJade6.5使用手册_task9",
"jade_test"
],
"avogadro": [
"building-metal-complexes_task1",
"building-metal-complexes_task2",
"building-metal-complexes_task3",
"building-metal-complexes_task4",
"building-metal-complexes_task5",
"building-metal-complexes_task6",
"building-metal-complexes_task7",
"building-organic-molecules_task1",
"building-organic-molecules_task10",
"building-organic-molecules_task2",
"building-organic-molecules_task3",
"building-organic-molecules_task4",
"building-organic-molecules_task5",
"building-organic-molecules_task6",
"building-organic-molecules_task7",
"building-organic-molecules_task8",
"building-organic-molecules_task9",
"learning-avogadro_task1",
"learning-avogadro_task2",
"learning-avogadro_task3",
"learning-avogadro_task4",
"learning-avogadro_task5",
"learning-avogadro_task6",
"learning-avogadro_task7",
"learning-avogadro_task8",
"learning-avogadro_task9",
"naming-a-molecule_task1",
"naming-a-molecule_task2",
"using-qtaim-and-wfn_task1",
"using-qtaim-and-wfn_task2",
"using-qtaim-and-wfn_task3",
"viewing-electrostatic-potential_task1",
"viewing-electrostatic-potential_task2",
"viewing-molecular-orbitals_task1",
"viewing-molecular-orbitals_task2",
"viewing-molecular-orbitals_task3",
"viewing-vibrations_task1",
"viewing-vibrations_task2",
"viewing-vibrations_task3",
"viewing-vibrations_task4",
"viewing-vibrations_task5"
],
"imagej": [
"user-guide_task1",
"user-guide_task10",
"user-guide_task2",
"user-guide_task3",
"user-guide_task4",
"user-guide_task5",
"user-guide_task6",
"user-guide_task7",
"user-guide_task8",
"user-guide_task9"
],
"origin": [
"Origin_User_Guide_2025b_E_task1",
"Origin_User_Guide_2025b_E_task10",
"Origin_User_Guide_2025b_E_task11",
"Origin_User_Guide_2025b_E_task12",
"Origin_User_Guide_2025b_E_task2",
"Origin_User_Guide_2025b_E_task3",
"Origin_User_Guide_2025b_E_task4",
"Origin_User_Guide_2025b_E_task5",
"Origin_User_Guide_2025b_E_task6",
"Origin_User_Guide_2025b_E_task7",
"Origin_User_Guide_2025b_E_task8",
"Origin_User_Guide_2025b_E_task9"
],
"ovito": [
"animation_task1",
"animation_task10",
"animation_task2",
"animation_task3",
"animation_task4",
"animation_task5",
"animation_task6",
"animation_task7",
"animation_task8",
"animation_task9",
"aspherical_particles_task1",
"aspherical_particles_task10",
"aspherical_particles_task2",
"aspherical_particles_task3",
"aspherical_particles_task4",
"aspherical_particles_task5",
"aspherical_particles_task6",
"aspherical_particles_task7",
"aspherical_particles_task8",
"aspherical_particles_task9",
"clone_pipeline_task1",
"clone_pipeline_task2",
"clone_pipeline_task3",
"clone_pipeline_task4",
"clone_pipeline_task5",
"clone_pipeline_task6",
"clone_pipeline_task7",
"clone_pipeline_task8",
"code_generation_task1",
"code_generation_task2",
"code_generation_task3",
"code_generation_task4",
"code_generation_task5",
"code_generation_task6",
"code_generation_task7",
"code_generation_task8",
"customize_init_state_task1",
"customize_init_state_task2",
"customize_init_state_task3",
"customize_init_state_task4",
"customize_init_state_task5",
"data_model_task1",
"data_model_task10",
"data_model_task2",
"data_model_task3",
"data_model_task4",
"data_model_task5",
"data_model_task6",
"data_model_task7",
"data_model_task8",
"data_model_task9",
"export_task1",
"export_task2",
"export_task3",
"export_task4",
"export_task5",
"import_task1",
"import_task10",
"import_task2",
"import_task3",
"import_task4",
"import_task5",
"import_task6",
"import_task7",
"import_task8",
"import_task9",
"marker_particles_task1",
"marker_particles_task2",
"marker_particles_task3",
"marker_particles_task4",
"marker_particles_task5",
"marker_particles_task6",
"marker_particles_task7",
"marker_particles_task8",
"marker_particles_task9",
"miscellaneous_task1",
"miscellaneous_task10",
"miscellaneous_task2",
"miscellaneous_task3",
"miscellaneous_task4",
"miscellaneous_task5",
"miscellaneous_task6",
"miscellaneous_task7",
"miscellaneous_task8",
"miscellaneous_task9",
"pipeline_task1",
"pipeline_task2",
"pipeline_task3",
"pipeline_task4",
"pipeline_task5",
"pipeline_task6",
"pipeline_task7",
"pipeline_task8",
"pipeline_task9",
"python_extensions_task1",
"python_extensions_task10",
"python_extensions_task2",
"python_extensions_task3",
"python_extensions_task4",
"python_extensions_task5",
"python_extensions_task6",
"python_extensions_task7",
"python_extensions_task8",
"python_extensions_task9",
"remote_file_access_task1",
"remote_file_access_task10",
"remote_file_access_task2",
"remote_file_access_task3",
"remote_file_access_task4",
"remote_file_access_task5",
"remote_file_access_task6",
"remote_file_access_task7",
"remote_file_access_task8",
"remote_file_access_task9",
"remote_rendering_task1",
"remote_rendering_task2",
"remote_rendering_task3",
"remote_rendering_task4",
"remote_rendering_task5",
"remote_rendering_task6",
"remote_rendering_task7",
"remote_rendering_task8",
"remote_rendering_task9",
"rendering_task1",
"rendering_task2",
"rendering_task3",
"rendering_task4",
"rendering_task5",
"rendering_task6",
"rendering_task7",
"rendering_task8",
"rendering_task9",
"transparent_particles_task1",
"transparent_particles_task2",
"turntable_animation_task1",
"turntable_animation_task2",
"turntable_animation_task3",
"turntable_animation_task4",
"turntable_animation_task5",
"turntable_animation_task6",
"viewport_layouts_task1",
"viewport_layouts_task10",
"viewport_layouts_task2",
"viewport_layouts_task3",
"viewport_layouts_task4",
"viewport_layouts_task5",
"viewport_layouts_task6",
"viewport_layouts_task7",
"viewport_layouts_task8",
"viewport_layouts_task9",
"viewports_task1",
"viewports_task10",
"viewports_task11",
"viewports_task2",
"viewports_task3",
"viewports_task4",
"viewports_task5",
"viewports_task6",
"viewports_task7",
"viewports_task8",
"viewports_task9"
],
"pymol": [
"Biochemistry_student_intro_task1",
"Biochemistry_student_intro_task10",
"Biochemistry_student_intro_task2",
"Biochemistry_student_intro_task3",
"Biochemistry_student_intro_task4",
"Biochemistry_student_intro_task5",
"Biochemistry_student_intro_task6",
"Biochemistry_student_intro_task7",
"Biochemistry_student_intro_task8",
"Biochemistry_student_intro_task9",
"MovieSchool_1_task1",
"MovieSchool_1_task2",
"MovieSchool_1_task3",
"MovieSchool_1_task4",
"MovieSchool_1_task5",
"MovieSchool_1_task6",
"MovieSchool_1_task7",
"MovieSchool_3_task1",
"MovieSchool_3_task10",
"MovieSchool_3_task2",
"MovieSchool_3_task3",
"MovieSchool_3_task4",
"MovieSchool_3_task5",
"MovieSchool_3_task6",
"MovieSchool_3_task7",
"MovieSchool_3_task8",
"MovieSchool_3_task9",
"Mutagenesis_task1",
"Mutagenesis_task2",
"Mutagenesis_task3",
"Mutagenesis_task4",
"Mutagenesis_task5",
"Mutagenesis_task6",
"Mutagenesis_task7",
"Practical_Pymol_for_Beginners_task1",
"Practical_Pymol_for_Beginners_task10",
"Practical_Pymol_for_Beginners_task11",
"Practical_Pymol_for_Beginners_task12",
"Practical_Pymol_for_Beginners_task13",
"Practical_Pymol_for_Beginners_task2",
"Practical_Pymol_for_Beginners_task3",
"Practical_Pymol_for_Beginners_task4",
"Practical_Pymol_for_Beginners_task5",
"Practical_Pymol_for_Beginners_task6",
"Practical_Pymol_for_Beginners_task7",
"Practical_Pymol_for_Beginners_task8",
"Practical_Pymol_for_Beginners_task9",
"Visualizing_a_computed_structure_-_a_commented_example_task1",
"Visualizing_a_computed_structure_-_a_commented_example_task2",
"Visualizing_a_computed_structure_-_a_commented_example_task3",
"Visualizing_a_computed_structure_-_a_commented_example_task4"
],
"vesta": [
"VESTA_Manual_task1",
"VESTA_Manual_task10",
"VESTA_Manual_task11",
"VESTA_Manual_task2",
"VESTA_Manual_task3",
"VESTA_Manual_task4",
"VESTA_Manual_task5",
"VESTA_Manual_task6",
"VESTA_Manual_task7",
"VESTA_Manual_task8",
"VESTA_Manual_task9"
]
}