Commit 51b8c57d authored by pangguosheng
Browse files

fix: skip chars with invalid bounding boxes

parent b71993a9
...@@ -108,6 +108,10 @@ def fill_char_in_spans(spans, all_chars): ...@@ -108,6 +108,10 @@ def fill_char_in_spans(spans, all_chars):
spans = sorted(spans, key=lambda x: x['bbox'][1]) spans = sorted(spans, key=lambda x: x['bbox'][1])
for char in all_chars: for char in all_chars:
# 跳过非法bbox的char
x1, y1, x2, y2 = char['bbox']
if abs(x1 - x2) <= 0.01 or abs(y1 - y2) <= 0.01:
continue
for span in spans: for span in spans:
if calculate_char_in_span(char['bbox'], span['bbox'], char['c']): if calculate_char_in_span(char['bbox'], span['bbox'], char['c']):
span['chars'].append(char) span['chars'].append(char)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment