Unverified commit 642eaee2, authored by myhloli, committed by GitHub

Merge pull request #75 from papayalove/master

更新了para_split
parents 1d81631b 2fc6e9a3
......@@ -414,7 +414,10 @@ def __connect_list_inter_page(pre_page_paras, next_page_paras, pre_page_layout_b
# 向layout_paras[i] 寻找开头具有相同缩进的连续的行
may_list_lines = []
for j in range(len(next_page_paras[0])):
lines = next_page_paras[0][j]["lines"]
next_page_block_j = next_page_paras[0][j]
if next_page_block_j["type"] != BlockType.Text:
break
lines = next_page_block_j["lines"]
if len(lines) == 1: # 只可能是一行,多行情况再需要分析了
if lines[0]['bbox'][0] > __find_layout_bbox_by_line(lines[0]['bbox'], next_page_layout_bbox)[0]:
may_list_lines.append(lines[0])
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment