From baf915508fe4240c3bee1f0278e75611d0bfc3a2 Mon Sep 17 00:00:00 2001 From: ChaseDream <1129chasedream@gmail.com> Date: Sun, 17 Jul 2022 20:07:50 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E5=A4=8Dgcolle=E6=97=A0=E6=B3=95?= =?UTF-8?q?=E5=88=AE=E5=89=8A=E7=9A=84=E9=97=AE=E9=A2=98?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit number前面缺了个self,请求URL会变成'https://gcolle.net/product_info.php/products_id/gcolle-xxxxx',导致无法刮削。 --- scrapinglib/gcolle.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scrapinglib/gcolle.py b/scrapinglib/gcolle.py index 40081f2..100e3ef 100644 --- a/scrapinglib/gcolle.py +++ b/scrapinglib/gcolle.py @@ -29,7 +29,7 @@ class Gcolle(Parser): self.number = number.upper().replace('GCOLLE-','') self.detailurl = 'https://gcolle.net/product_info.php/products_id/' + self.number session = get_html_session(cookies=self.cookies, proxies=self.proxies, verify=self.verify) - htmlcode = session.get('https://gcolle.net/product_info.php/products_id/' + number).text + htmlcode = session.get('https://gcolle.net/product_info.php/products_id/' + self.number).text htmltree = etree.HTML(htmlcode) r18url = self.getTreeElement(htmltree, self.expr_r18)