Skip to content

Commit

Permalink
Merge pull request #62 from myhloli/master
Browse files (browse the repository at this point in the history)
update confidence score 0.95->0.05
  • Loading branch information
myhloli authored Apr 23, 2024
2 parents ec2cbdd + 1146206 commit fc23483
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 3 deletions.
2 changes: 1 addition & 1 deletion magic_pdf/model/magic_model.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -48,7 +48,7 @@ def __fix_by_confidence(self):
need_remove_list = []
layout_dets = model_page_info["layout_dets"]
for layout_det in layout_dets:
- if layout_det["score"] < 0.95:
+ if layout_det["score"] <= 0.05:
need_remove_list.append(layout_det)
else:
continue
Expand Down
4 changes: 2 additions & 2 deletions magic_pdf/pre_proc/ocr_dict_merge.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -120,14 +120,14 @@ def sort_blocks_by_layout(all_bboxes, layout_bboxes):
# 如果是footnote则跳过
if block[7] == BlockType.Footnote:
continue
- block_bbox = [block[0], block[1], block[2], block[3]]
+ block_bbox = block[:4]
if calculate_overlap_area_in_bbox1_area_ratio(block_bbox, layout_bbox) > 0.8:
layout_blocks.append(block)

# 如果layout_blocks不为空,则放入new_blocks中
if len(layout_blocks) > 0:
new_blocks.append(layout_blocks)
- # 从spans删除已经放入layout_sapns中的span
+ # 从all_bboxes删除已经放入layout_blocks中的block
for layout_block in layout_blocks:
all_bboxes.remove(layout_block)

Expand Down

0 comments on commit fc23483

Please sign in to comment.