From d35d7710c1bae82f252c570924ce8751ab154cc3 Mon Sep 17 00:00:00 2001 From: Your Name Date: Tue, 18 Apr 2023 16:14:30 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E5=A4=8Dpdf=E5=88=86=E8=A7=A3bug?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- crazy_functions/crazy_utils.py | 1 + 1 file changed, 1 insertion(+) diff --git a/crazy_functions/crazy_utils.py b/crazy_functions/crazy_utils.py index 189d948..356650d 100644 --- a/crazy_functions/crazy_utils.py +++ b/crazy_functions/crazy_utils.py @@ -444,6 +444,7 @@ def read_and_clean_pdf_text(fp): pf = 998 for l in t['lines']: txt_line = "".join([wtf['text'] for wtf in l['spans']]) + if len(txt_line) == 0: continue pf = primary_ffsize(l) meta_line.append([txt_line, pf, l['bbox'], l]) for wtf in l['spans']: # for l in t['lines']: