Fix one bug in Chrome getter; fix one error for corner case in doc

This commit is contained in:
Timothyxxx
2024-04-02 14:50:29 +08:00
parent af04a305a9
commit 2d8eeaad58
2 changed files with 49 additions and 32 deletions

View File

@@ -6,6 +6,7 @@ import zipfile
from io import BytesIO
from typing import List, Dict, Any
import easyocr
from PIL import Image
from docx import Document
from docx.enum.text import WD_PARAGRAPH_ALIGNMENT, WD_TAB_ALIGNMENT
@@ -247,8 +248,9 @@ def compare_docx_images(docx_file1, docx_file2):
return 1
import easyocr
def compare_image_text(image_path, rule):
if not image_path:
return 0
reader = easyocr.Reader(['en'])
result = reader.readtext(image_path)
extracted_text = ' '.join([entry[1] for entry in result])