---
# Evaluation run configuration: API access, evaluation input, result output,
# and logging.
#
# NOTE(review): this file had been collapsed onto a single line starting with
# `#`, which YAML parses as one comment (i.e. an empty document). The nesting
# below was reconstructed from the section-header comments — confirm that
# `models` / `system_prompt` belong under `api` and `export_formats` under
# `output`, as the loader expects.

# API configuration
api:
  # NOTE(review): hard-coded credential. Rotate this key and load it from an
  # environment variable or secret store instead of committing it.
  key: "sk-oYh3Xrhg8oDY2gW02c966f31C84449Ad86F9Cd9dF6E64a8d"
  base_url: "https://vip.apiyi.com/v1"
  temperature: 0  # by default, use the model's temperature setting
  max_retries: 10

  # Multiple models are supported
  models:
    - "qwen-max-2025-01-25"
    - "gpt-4o"
    - "deepseek-chat"
    - "claude-sonnet-4-20250514"
  # Or use a single model (backward compatible)
  # model: "qwen-max-2025-01-25"

  # NOTE(review): a bare `None` is NOT null in YAML — it loads as the string
  # "None". Quoted here to make that explicit while keeping the loaded value
  # unchanged. If "no system prompt" is intended, switch to `null` after
  # checking how the consumer tests this field.
  system_prompt: "None"

# Evaluation configuration
evaluation:
  max_workers: 20
  # Alternative inputs (only one `input_file` may be active at a time):
  # input_file: "/home/ubuntu/50T/LYT/MatBench/layer1/ALL-merge/merged.json"
  # input_file: "/home/ubuntu/50T/LYT/MatBench/layer2/PGEE/code/stepz_final_choice_questions.json"
  input_file: "/home/ubuntu/50T/LYT/MatBench/layer2/PGEE/code/stepz_final_choice_questions_filtered.json"

# Output configuration
output:
  base_dir: "results"
  auto_timestamp: true
  filename_template: "{model}.json"
  summary_filename: "summary.json"

  # Output format options
  export_formats:
    - "json"  # detailed JSON results
    - "csv"  # CSV table
    - "excel"  # Excel spreadsheet (requires openpyxl)

# Logging configuration
logging:
  level: "INFO"
  format: "%(asctime)s - %(name)s - %(levelname)s - %(message)s"