From 0fa1e482cd963a31074ba25e51ba5831d0624ef9 Mon Sep 17 00:00:00 2001 From: yoshiko2 Date: Sat, 29 May 2021 23:35:07 +0800 Subject: [PATCH] Fix javbus source --- WebCrawler/javbus.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/WebCrawler/javbus.py b/WebCrawler/javbus.py index 45c6ec3..50bef20 100644 --- a/WebCrawler/javbus.py +++ b/WebCrawler/javbus.py @@ -47,6 +47,8 @@ def getYear(htmlcode): #获取年份 def getCover(htmlcode): #获取封面链接 doc = pq(htmlcode) image = doc('a.bigImage') + if not "javbus.com" in image.attr('href'): + return "https://www.javbus.com" + image.attr('href') return image.attr('href') def getRelease(htmlcode): #获取出版日期 html = etree.fromstring(htmlcode, etree.HTMLParser())