From 9c71e5976ad24eb7559948c7f7432f76000346aa Mon Sep 17 00:00:00 2001 From: mo_yy <54110819+moyy996@users.noreply.github.com> Date: Fri, 10 Jan 2020 14:09:35 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=A0=E9=99=A4=E6=A0=87=E9=A2=98=E4=B8=AD?= =?UTF-8?q?=E7=95=AA=E5=8F=B7=EF=BC=8C=E4=BD=BF=E7=94=A8=E5=B0=8F=E5=B0=81?= =?UTF-8?q?=E9=9D=A2=EF=BC=8C=E4=BF=AE=E5=A4=8D=E2=80=98=E6=BC=94=E5=91=98?= =?UTF-8?q?=E3=80=81=E7=89=87=E5=95=86=E2=80=99=E8=8E=B7=E5=8F=96?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- javdb.py | 11 +++++++---- 1 file changed, 7 insertions(+), 4 deletions(-) diff --git a/javdb.py b/javdb.py index 71bee4c..8b3e86b 100755 --- a/javdb.py +++ b/javdb.py @@ -75,7 +75,8 @@ def getTag(a): ',') -def getCover_small(html): +def getCover_small(a): + html = etree.fromstring(a, etree.HTMLParser()) # //table/tr[1]/td[1]/text() result = 'http:' + html.xpath( '//div[@id=\'videos\']/div[@class=\'grid columns\']/div[@class=\'grid-item column\'][1]/a[' '@class=\'box\']/div[@class=\'item-image fix-scale-cover\']/img/@src')[0] @@ -113,7 +114,7 @@ def main(number): 'actor': getActor(b), 'title': getTitle(b).replace("\\n", '').replace(' ', '').replace(getActor(a), '').replace(getNum(a), '').replace( - '无码', '').replace('有码', '').lstrip(' '), + '无码', '').replace('有码', '').lstrip(' ').replace(number, ''), 'studio': getStudio(b), 'outline': getOutline(b), 'runtime': getRuntime(b), @@ -121,7 +122,7 @@ def main(number): 'release': getRelease(b), 'number': getNum(b), 'cover': getCover(b), - 'cover_small': getCover_small(html), + 'cover_small': getCover_small(a), 'imagecut': 3, 'tag': getTag(b), 'label': getLabel(b), @@ -145,7 +146,7 @@ def main(number): 'title': getTitle(b).replace("\\n", '').replace(' ', '').replace(getActor(a), '').replace( getNum(b), '').replace( - '无码', '').replace('有码', '').lstrip(' '), + '无码', '').replace('有码', '').lstrip(' ').replace(number, ''), 'studio': getStudio(b), 'outline': getOutline(b), 'runtime': getRuntime(b), @@ -167,3 +168,5 @@ def main(number): dic['number'] = '' js = json.dumps(dic, ensure_ascii=False, sort_keys=True, indent=4, separators=(',', ':'), ) # .encode('UTF-8') return js + +# print(get_html('https://javdb1.com/v/WwZ0Q'))