From b89f9a70e3093d5ccf677a69b6a570696d8ef0d4 Mon Sep 17 00:00:00 2001 From: ZouJiu <1069679911@qq.com> Date: Fri, 20 Oct 2023 20:51:29 +0800 Subject: [PATCH] div content crawler --- crawler.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/crawler.py b/crawler.py index f71ebc9..b70bb50 100644 --- a/crawler.py +++ b/crawler.py @@ -404,6 +404,8 @@ def parser_beautiful(innerHTML, article, number, dircrea, bk=False): if len(prenode) > 0: for i in prenode: article += "\n\n```\n" + i.text + "\n```\n\n" + else: + article, number = parser_beautiful(chi, article, number, dircrea, bk) if bk: article += "**" return article, number