From d7dec6136494fc54e95568798b3f469e11f85887 Mon Sep 17 00:00:00 2001 From: lifegpc Date: Tue, 7 Feb 2023 12:01:59 +0800 Subject: [PATCH] =?UTF-8?q?=E6=94=AF=E6=8C=81

=E6=8D=A2=E8=A1=8C?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- rssparser.py | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/rssparser.py b/rssparser.py index 52f924c..3d66e0a 100644 --- a/rssparser.py +++ b/rssparser.py @@ -139,6 +139,12 @@ class HTMLSimpleParser(HTMLParser): elif len(self.tagName) > 1: self.tagContent[-2].add( f"<{tag}{self.tagAttrs[-1]}>{self.tagContent[-1].export()}") + elif tag in ['p']: + tmp = '' if self.data == '' else '\n\n' + if len(self.tagName) == 1: + self.data += tmp + self.tagContent[-1].export() + else: + self.tagContent[-2].add(tmp + self.tagContent[-1].export()) elif tag not in ['img', 'video', 'br', 'ugoira']: if len(self.tagName) == 1: self.data = f"{self.data}{self.tagContent[-1].export()}"