ASureevaA
committed on
Commit
·
b2f68cd
1
Parent(s):
ed03824
edit
Browse files
app.py
CHANGED
|
@@ -45,18 +45,13 @@ def run_ocr(image_object: Image.Image) -> str:
|
|
| 45 |
rgb_image_object: Image.Image = image_object.convert("RGB")
|
| 46 |
numpy_image = numpy_module.array(rgb_image_object)
|
| 47 |
|
| 48 |
-
# detail=1 -> (bbox, текст, confidence), paragraph=True -> склейка в абзацы
|
| 49 |
ocr_results = ocr_reader.readtext(
|
| 50 |
numpy_image,
|
| 51 |
-
detail=1,
|
| 52 |
paragraph=True,
|
| 53 |
)
|
| 54 |
|
| 55 |
-
text_parts = []
|
| 56 |
-
for bounding_box, text_value, confidence_value in ocr_results:
|
| 57 |
-
if not text_value:
|
| 58 |
-
continue
|
| 59 |
-
text_parts.append(text_value)
|
| 60 |
|
| 61 |
recognized_text: str = "\n".join(text_parts).strip()
|
| 62 |
return recognized_text
|
|
|
|
| 45 |
rgb_image_object: Image.Image = image_object.convert("RGB")
|
| 46 |
numpy_image = numpy_module.array(rgb_image_object)
|
| 47 |
|
|
|
|
| 48 |
ocr_results = ocr_reader.readtext(
|
| 49 |
numpy_image,
|
| 50 |
+
detail=0,
|
| 51 |
paragraph=True,
|
| 52 |
)
|
| 53 |
|
| 54 |
+
text_parts = [str(text_value) for text_value in ocr_results if text_value]
|
|
|
|
|
|
|
|
|
|
|
|
|
| 55 |
|
| 56 |
recognized_text: str = "\n".join(text_parts).strip()
|
| 57 |
return recognized_text
|