Add consistent scores validation (#368)
* Add consistent scores validation
* Revert osworld_run_maestro.py changes
This commit is contained in:
2
run.py
2
run.py
@@ -218,7 +218,7 @@ def test(args: argparse.Namespace, test_all_meta: dict) -> None:
|
|||||||
f.write("\n")
|
f.write("\n")
|
||||||
|
|
||||||
env.close()
|
env.close()
|
||||||
logger.info(f"Average score: {sum(scores) / len(scores)}")
|
logger.info(f"Average score: {sum(scores) / len(scores) if scores else 0}")
|
||||||
|
|
||||||
|
|
||||||
def get_unfinished(
|
def get_unfinished(
|
||||||
|
|||||||
@@ -457,7 +457,7 @@ def test(args: argparse.Namespace, test_all_meta: dict) -> None:
|
|||||||
f.write("\n")
|
f.write("\n")
|
||||||
|
|
||||||
env.close()
|
env.close()
|
||||||
logger.info(f"Average score: {sum(scores) / len(scores)}")
|
logger.info(f"Average score: {sum(scores) / len(scores) if scores else 0}")
|
||||||
|
|
||||||
|
|
||||||
def get_unfinished(action_space, use_model, observation_type, result_dir, total_file_json):
|
def get_unfinished(action_space, use_model, observation_type, result_dir, total_file_json):
|
||||||
|
|||||||
@@ -485,7 +485,7 @@ def test(args: argparse.Namespace, test_all_meta: dict) -> None:
|
|||||||
f.write("\n")
|
f.write("\n")
|
||||||
|
|
||||||
env.close()
|
env.close()
|
||||||
logger.info(f"Average score: {sum(scores) / len(scores)}")
|
logger.info(f"Average score: {sum(scores) / len(scores) if scores else 0}")
|
||||||
|
|
||||||
|
|
||||||
def get_unfinished(action_space, use_model, observation_type, result_dir, total_file_json):
|
def get_unfinished(action_space, use_model, observation_type, result_dir, total_file_json):
|
||||||
|
|||||||
Reference in New Issue
Block a user