弃用91mv,换用新网站javday
This commit is contained in:
43
scrapinglib/javday.py
Normal file
43
scrapinglib/javday.py
Normal file
@@ -0,0 +1,43 @@
|
||||
# -*- coding: utf-8 -*-
|
||||
|
||||
import re
|
||||
from lxml import etree
|
||||
from urllib.parse import urlparse, unquote
|
||||
from .parser import Parser
|
||||
|
||||
|
||||
class Javday(Parser):
    """Parser subclass that scrapes detail pages hosted on javday.tv.

    The class-level ``expr_*`` attributes are XPath expressions evaluated
    against the downloaded page; how each one is consumed is decided by the
    ``Parser`` base class (not visible here).
    """

    source = 'javday'

    # Page metadata taken from <meta> tags and <title> in the document head.
    expr_url = '/html/head/meta[@property="og:url"]/@content'
    expr_cover = '/html/head/meta[@property="og:image"]/@content'
    expr_tags = '/html/head/meta[@name="keywords"]/@content'
    expr_title = "/html/head/title/text()"
    # Fields taken from <span> elements in the page body.
    expr_actor = "//span[@class='vod_actor']/a/text()"
    expr_studio = '//span[@class="producer"]/a/text()'
    expr_number = '//span[@class="jpnum"]/text()'

    def extraInit(self):
        """Set the source-specific defaults for this scraper."""
        # NOTE(review): the meaning of imagecut mode 4 is defined by the
        # caller/base class -- confirm before changing.
        self.imagecut = 4
        self.uncensored = True

    def search(self, number):
        """Fetch and parse the detail page for ``number``.

        The number is stripped and upper-cased and stored on ``self.number``.
        When ``self.specifiedUrl`` is truthy it is used as the page URL;
        otherwise the URL is built from the number with hyphens removed.

        Returns ``404`` when ``getHtml`` reports ``404``; otherwise returns
        whatever ``dictformat`` produces for the parsed tree.
        """
        self.number = number.strip().upper()

        forced_url = self.specifiedUrl
        if not forced_url:
            slug = self.number.replace("-", "")
            forced_url = f"https://javday.tv/videos/{slug}/"
        self.detailurl = forced_url

        self.htmlcode = self.getHtml(self.detailurl)
        if self.htmlcode == 404:
            return 404

        tree = etree.fromstring(self.htmlcode, etree.HTMLParser())
        # Replace the requested URL with the one the page itself advertises.
        self.detailurl = self.getTreeElement(tree, self.expr_url)
        return self.dictformat(tree)

    def getTitle(self, htmltree):
        """Return the page title with the number and the site name removed."""
        cleaned = super().getTitle(htmltree)
        # Strip the ID number first, then the site-name suffix.
        for unwanted in (self.number, "- JAVDAY.TV"):
            cleaned = cleaned.replace(unwanted, "")
        return cleaned.strip()
|
||||
Reference in New Issue
Block a user