Skip to content

Commit

Permalink
Merge pull request #116 from papayalove/master
Browse files Browse the repository at this point in the history
修复分段边界问题
  • Loading branch information
myhloli authored May 28, 2024
2 parents 78ed786 + 135adac commit 5de3722
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion magic_pdf/para/para_split_v2.py
Original file line number Diff line number Diff line change
@@ -534,7 +534,7 @@ def __connect_para_inter_layoutbox(blocks_group, new_layout_bbox):

pre_last_line_text = pre_last_line_text.strip()
next_first_line_text = next_first_line_text.strip()
- if pre_last_line['bbox'][2] == pre_x2_max and pre_last_line_text[-1] not in LINE_STOP_FLAG and \
+ if pre_last_line['bbox'][2] == pre_x2_max and pre_last_line_text and pre_last_line_text[-1] not in LINE_STOP_FLAG and \
next_first_line['bbox'][0] == next_x0_min: # 前面一行沾满了整个行,并且没有结尾符号.下一行没有空白开头。
"""连接段落条件成立,将前一个layout的段落和后一个layout的段落连接。"""
#connected_layout_paras[-1][-1].extend(layout_paras[i][0])
Expand Down

0 comments on commit 5de3722

Please sign in to comment.