From 4816affc38ba1ffff48942fab47dda195f5cbfa3 Mon Sep 17 00:00:00 2001 From: Feng4 Date: Sun, 27 Dec 2020 00:28:47 +0800 Subject: [PATCH] Update mgstage.py --- WebCrawler/mgstage.py | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/WebCrawler/mgstage.py b/WebCrawler/mgstage.py index 089bbf2..e98eb5a 100644 --- a/WebCrawler/mgstage.py +++ b/WebCrawler/mgstage.py @@ -95,6 +95,18 @@ def getSeries(a): result2 = str(html.xpath('//th[contains(text(),"シリーズ")]/../td/text()')).strip(" ['']").strip('\\n ').strip( '\\n') return str(result1 + result2).strip('+').replace("', '", '').replace('"', '') + +def getExtrafanart(htmlcode): # 获取剧照 + html_pather = re.compile(r'
\s*?\s*?
') + html = html_pather.search(htmlcode) + if html: + html = html.group() + extrafanart_pather = re.compile(r'