From ac22fcdf057d5a90c2a10d69371f4f7067c31807 Mon Sep 17 00:00:00 2001 From: lededev Date: Sun, 6 Jun 2021 05:06:42 +0800 Subject: [PATCH] optimize code logic --- WebCrawler/javbus.py | 11 +++++------ 1 file changed, 5 insertions(+), 6 deletions(-) diff --git a/WebCrawler/javbus.py b/WebCrawler/javbus.py index de9d264..a8aa93c 100644 --- a/WebCrawler/javbus.py +++ b/WebCrawler/javbus.py @@ -48,12 +48,11 @@ def getCover(htmlcode): #获取封面链接 doc = pq(htmlcode) image = doc('a.bigImage') uri = image.attr('href') - if uri[0:4] != 'http': - if uri[0] == '/': - return "https://www.javbus.com" + uri - else: - return "https://www.javbus.com/" + uri - return uri + if uri[0:4] == 'http': + return uri + if uri[0] != '/': + uri = '/' + uri + return "https://www.javbus.com" + uri def getRelease(htmlcode): #获取出版日期 html = etree.fromstring(htmlcode, etree.HTMLParser()) result = str(html.xpath('/html/body/div[5]/div[1]/div[2]/p[2]/text()')).strip(" ['']")