Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -99,18 +99,18 @@ def _analyze_image(self, img: "Image") -> str:
"""
if not self.ocr:
try:
-from rapidocr_onnxruntime import RapidOCR
+from rapidocr import RapidOCR

self.ocr = RapidOCR()
except ImportError:
raise ImportError(
-"`rapidocr-onnxruntime` package not found, please install it with "
-"`pip install rapidocr-onnxruntime`"
+"`rapidocr` package not found, please install it with "
+"`pip install rapidocr`"
)
-ocr_result, _ = self.ocr(np.array(img)) # type: ignore[misc]
+ocr_result = self.ocr(np.array(img)) # type: ignore[misc]
content = ""
-if ocr_result:
-content = ("\n".join([text[1] for text in ocr_result])).strip()
+if ocr_result and ocr_result.txts:
+content = ("\n".join(ocr_result.txts)).strip()
return content


Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -73,22 +73,21 @@ def extract_from_images_with_rapidocr(
Text extracted from images.

Raises:
-ImportError: If `rapidocr-onnxruntime` package is not installed.
+ImportError: If `rapidocr` package is not installed.
"""
try:
-from rapidocr_onnxruntime import RapidOCR
+from rapidocr import RapidOCR
except ImportError:
raise ImportError(
-"`rapidocr-onnxruntime` package not found, please install it with "
-"`pip install rapidocr-onnxruntime`"
+"`rapidocr` package not found, please install it with "
+"`pip install rapidocr`"
)
ocr = RapidOCR()
text = ""
for img in images:
-result, _ = ocr(img)
-if result:
-result = [text[1] for text in result]
-text += "\n".join(result)
+result = ocr(img)
+if result and result.txts:
+text += "\n".join(result.txts)
return text


Expand Down