From 5b07ec17bfe507f06015319c653bf96f3737732c Mon Sep 17 00:00:00 2001
From: tsuky_chen <3107760494@qq.com>
Date: Sat, 9 Mar 2024 18:50:16 +0800
Subject: [PATCH] fix multi apps

---
 desktop_env/evaluators/metrics/docs.py | 11 +++++------
 1 file changed, 5 insertions(+), 6 deletions(-)

diff --git a/desktop_env/evaluators/metrics/docs.py b/desktop_env/evaluators/metrics/docs.py
index e588e74..0787926 100644
--- a/desktop_env/evaluators/metrics/docs.py
+++ b/desktop_env/evaluators/metrics/docs.py
@@ -200,14 +200,13 @@ def compare_docx_images(docx_file1, docx_file2):
     return 1
 
 
-import pytesseract
-
-
+import easyocr
 def compare_image_text(image_path, rule):
-    img = Image.open(image_path)
-    img_text = pytesseract.image_to_string(img)
+    reader = easyocr.Reader(['en'])
+    result = reader.readtext(image_path)
+    extracted_text = ' '.join([entry[1] for entry in result])
     if rule['type'] == 'text':
-        return 1 if rule['text'] in img_text else 0
+        return 1 if rule['text'] in extracted_text else 0
     else:
         raise ValueError("Unsupported rule type")
 