Merge branch 'master' into v3.1

这个提交包含在:
505030475
2023-04-18 23:33:49 +08:00
当前提交 abd11e5dff
共有 3 个文件被更改,包括 9 次插入8 次删除

查看文件

@@ -448,6 +448,7 @@ def read_and_clean_pdf_text(fp):
pf = 998
for l in t['lines']:
txt_line = "".join([wtf['text'] for wtf in l['spans']])
if len(txt_line) == 0: continue
pf = primary_ffsize(l)
meta_line.append([txt_line, pf, l['bbox'], l])
for wtf in l['spans']: # for l in t['lines']:
@@ -558,8 +559,8 @@ def read_and_clean_pdf_text(fp):
meta_txt = meta_txt.replace('\n', '\n\n')
############################## <第 5 步,展示分割效果> ##################################
for f in finals:
print亮黄(f)
print亮绿('***************************')
# for f in finals:
# print亮黄(f)
# print亮绿('***************************')
return meta_txt, page_one_meta