This commit is contained in:
AuroraWright
2025-10-23 00:50:39 +02:00
parent 5f52de4627
commit bc9d758908
2 changed files with 5 additions and 4 deletions

View File

@@ -579,6 +579,7 @@ class TextFiltering:
first = True first = True
changed_lines_count = 0 changed_lines_count = 0
len_recovered_lines = 0 if not recovered_lines else len(recovered_lines)
for i, current_text in enumerate(current_lines): for i, current_text in enumerate(current_lines):
changed_line = current_result[i] changed_line = current_result[i]
@@ -598,7 +599,7 @@ class TextFiltering:
if text_similar: if text_similar:
continue continue
i2 = i if not recovered_lines else i - len(recovered_lines) i2 = i - len_recovered_lines
if (recovered_lines == None or i2 < 0) and recovered_lines_count > 0: if (recovered_lines == None or i2 < 0) and recovered_lines_count > 0:
if any(line.startswith(current_text) for j, line in enumerate(current_lines) if i != j): if any(line.startswith(current_text) for j, line in enumerate(current_lines) if i != j):
@@ -611,7 +612,7 @@ class TextFiltering:
if current_lines_ocr: if current_lines_ocr:
if i2 >= 0: if i2 >= 0:
is_furigana = self._furigana_filter(current_lines, current_lines_ocr, current_text, i2) is_furigana = self._furigana_filter(current_lines[len_recovered_lines:], current_lines_ocr, current_text, i2)
if is_furigana: if is_furigana:
continue continue
@@ -643,8 +644,8 @@ class TextFiltering:
if not current_lines[j].replace('\n', ''): if not current_lines[j].replace('\n', ''):
continue continue
other_line_bbox = current_lines_ocr[j].bounding_box
other_line_text = current_lines[j] other_line_text = current_lines[j]
other_line_bbox = current_lines_ocr[j].bounding_box
if len(current_text) <= len(other_line_text): if len(current_text) <= len(other_line_text):
is_vertical = other_line_bbox.height > other_line_bbox.width is_vertical = other_line_bbox.height > other_line_bbox.width

View File

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
[project] [project]
name = "owocr" name = "owocr"
version = "1.19.2" version = "1.19.3"
description = "Japanese OCR" description = "Japanese OCR"
readme = "README.md" readme = "README.md"
requires-python = ">=3.11" requires-python = ">=3.11"