From c9407e2df772c4e8da59252acf7d8167a40ad3a0 Mon Sep 17 00:00:00 2001 From: SharpX2016 Date: Wed, 28 Apr 2021 13:41:12 +0800 Subject: [PATCH] =?UTF-8?q?=E6=9B=B4=E6=96=B0=20javbus.py?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 修复javbus类别标签抓取时多出的 “多選提交” --- WebCrawler/javbus.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/WebCrawler/javbus.py b/WebCrawler/javbus.py index f8633da..108c903 100644 --- a/WebCrawler/javbus.py +++ b/WebCrawler/javbus.py @@ -103,7 +103,7 @@ def getTag(htmlcode): # 获取标签 soup = BeautifulSoup(htmlcode, 'lxml') a = soup.find_all(attrs={'class': 'genre'}) for i in a: - if 'onmouseout' in str(i): + if 'onmouseout' in str(i) or '多選提交' in str(i): continue tag.append(translateTag_to_sc(i.get_text())) return tag