From 57f2257254924f56c2ef85789deba81778ffb69a Mon Sep 17 00:00:00 2001 From: David Chang Date: Fri, 15 Mar 2024 22:49:35 +0800 Subject: [PATCH] ver Mar15th fixed bugs about infeasible task evaluation --- mm_agents/accessibility_tree_wrap/heuristic_retrieve.py | 4 ++-- mm_agents/agent.py | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/mm_agents/accessibility_tree_wrap/heuristic_retrieve.py b/mm_agents/accessibility_tree_wrap/heuristic_retrieve.py index 191eaa7..e37f614 100644 --- a/mm_agents/accessibility_tree_wrap/heuristic_retrieve.py +++ b/mm_agents/accessibility_tree_wrap/heuristic_retrieve.py @@ -69,11 +69,11 @@ def judge_node(node: ET, platform="ubuntu", check_image=False) -> bool: keeps = keeps and coordinates[0]>0 and coordinates[1]>0 and sizes[0]>0 and sizes[1]>0 return keeps -def filter_nodes(root: ET, platform="ubuntu"): +def filter_nodes(root: ET, platform="ubuntu", check_image=False): filtered_nodes = [] for node in root.iter(): - if judge_node(node, platform): + if judge_node(node, platform, check_image): filtered_nodes.append(node) #print(ET.tostring(node, encoding="unicode")) diff --git a/mm_agents/agent.py b/mm_agents/agent.py index f8fc1c8..039eda8 100644 --- a/mm_agents/agent.py +++ b/mm_agents/agent.py @@ -65,7 +65,7 @@ def tag_screenshot(screenshot, accessibility_tree): os.makedirs("tmp/images", exist_ok=True) tagged_screenshot_file_path = os.path.join("tmp/images", uuid_str + ".png") # nodes = filter_nodes(find_leaf_nodes(accessibility_tree)) - nodes = filter_nodes(ET.fromstring(accessibility_tree)) + nodes = filter_nodes(ET.fromstring(accessibility_tree), check_image=True) # Make tag screenshot marks, drew_nodes = draw_bounding_boxes(nodes, screenshot, tagged_screenshot_file_path)