Skip to content

Commit

Permalink
Merge pull request #786 from myhloli/fix-imgs-block
Browse files Browse the repository at this point in the history
refactor(ocr): adjust OCR processing parameters
  • Loading branch information
myhloli authored Oct 25, 2024
2 parents 25a6d4b + 1807126 commit d3d627c
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 2 deletions.
2 changes: 1 addition & 1 deletion magic_pdf/model/pdf_extract_kit.py
Original file line number Diff line number Diff line change
Expand Up @@ -83,7 +83,7 @@ def doclayout_yolo_model_init(weight):
return model


-def ocr_model_init(show_log: bool = False, det_db_box_thresh=0.3, lang=None, use_dilation=True, det_db_unclip_ratio=2.4):
+def ocr_model_init(show_log: bool = False, det_db_box_thresh=0.3, lang=None, use_dilation=True, det_db_unclip_ratio=1.8):
if lang is not None:
model = ModifiedPaddleOCR(show_log=show_log, det_db_box_thresh=det_db_box_thresh, lang=lang, use_dilation=use_dilation, det_db_unclip_ratio=det_db_unclip_ratio)
else:
Expand Down
2 changes: 1 addition & 1 deletion magic_pdf/pre_proc/ocr_dict_merge.py
Original file line number Diff line number Diff line change
Expand Up @@ -49,7 +49,7 @@ def merge_spans_to_line(spans):
continue

# 如果当前的span与当前行的最后一个span在y轴上重叠,则添加到当前行
-if __is_overlaps_y_exceeds_threshold(span['bbox'], current_line[-1]['bbox'], 0.6):
+if __is_overlaps_y_exceeds_threshold(span['bbox'], current_line[-1]['bbox'], 0.5):
current_line.append(span)
else:
# 否则,开始新行
Expand Down

0 comments on commit d3d627c

Please sign in to comment.