From 42533b86e2efc6787f184e3affd031a4ae67a2cf Mon Sep 17 00:00:00 2001 From: "majiahui@haimaqingfan.com" Date: Thu, 23 May 2024 16:37:08 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E6=94=B9bug=EF=BC=8C=E8=AF=86?= =?UTF-8?q?=E5=88=AB=E4=B8=89=E7=BA=A7=E6=A0=87=E9=A2=98?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- ppt_api.py | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/ppt_api.py b/ppt_api.py index bb4db89..9aadc7f 100644 --- a/ppt_api.py +++ b/ppt_api.py @@ -222,6 +222,11 @@ def catalogue_extract(structure): catalogue_list = [] for level, text in structure[:-1]: + text = str(text).strip(" ").strip("\n") + erji_p = re.findall(pantten_erjibiaoti, text) + yiji_p = re.findall(pantten_yijibiaoti, text) + if erji_p == [] and yiji_p == []: + continue catalogue_list.append(str(text).strip(" ").strip("\n")) catalogue_str = "\n".join(catalogue_list) return catalogue_list, catalogue_str