From 2096c0908c5b804de0865bd1e6e15e7df8955d06 Mon Sep 17 00:00:00 2001 From: yoshiko2 Date: Wed, 11 May 2022 22:51:10 +0800 Subject: [PATCH] Clean out of used modules --- WebCrawler/airav.py | 4 ---- WebCrawler/avsox.py | 3 --- WebCrawler/carib.py | 2 -- WebCrawler/dlsite.py | 14 -------------- WebCrawler/fanza.py | 7 ------- WebCrawler/fc2.py | 4 ---- WebCrawler/fc2club.py | 12 ------------ WebCrawler/gcolle.py | 2 -- WebCrawler/javbus.py | 3 --- WebCrawler/javdb.py | 18 ------------------ WebCrawler/madou.py | 3 --- WebCrawler/mgstage.py | 6 ------ WebCrawler/mv91.py | 5 ----- WebCrawler/storyline.py | 2 -- WebCrawler/xcity.py | 5 ----- 15 files changed, 90 deletions(-) diff --git a/WebCrawler/airav.py b/WebCrawler/airav.py index 030e8c7..eeea95f 100644 --- a/WebCrawler/airav.py +++ b/WebCrawler/airav.py @@ -1,10 +1,6 @@ import sys sys.path.append('../') -import re -from pyquery import PyQuery as pq#need install -from lxml import etree#need install from bs4 import BeautifulSoup#need install -import json from ADC_function import * from WebCrawler import javbus diff --git a/WebCrawler/avsox.py b/WebCrawler/avsox.py index 0c4a9d7..a18eab6 100644 --- a/WebCrawler/avsox.py +++ b/WebCrawler/avsox.py @@ -1,8 +1,5 @@ import sys sys.path.append('..') -import re -from lxml import etree -import json from ADC_function import * from WebCrawler.storyline import getStoryline from WebCrawler.crawler import * diff --git a/WebCrawler/carib.py b/WebCrawler/carib.py index 462dc61..50cbcc1 100755 --- a/WebCrawler/carib.py +++ b/WebCrawler/carib.py @@ -1,8 +1,6 @@ import sys sys.path.append('../') -import json from lxml import html -import re from ADC_function import * from WebCrawler.storyline import getStoryline diff --git a/WebCrawler/dlsite.py b/WebCrawler/dlsite.py index 19ab291..dc2c570 100644 --- a/WebCrawler/dlsite.py +++ b/WebCrawler/dlsite.py @@ -4,20 +4,6 @@ import json import sys sys.path.append('../') from ADC_function import * -# import sys -# import io -# sys.stdout = io.TextIOWrapper(sys.stdout.buffer, errors = 'replace', line_buffering = True) -#print(get_html('https://www.dlsite.com/maniax/work/=/product_id/VJ013152.html')) -#title /html/head/title/text() -#studio //th[contains(text(),"ブランド名")]/../td/span[1]/a/text() -#release //th[contains(text(),"販売日")]/../td/a/text() -#story //th[contains(text(),"シナリオ")]/../td/a/text() -#senyo //th[contains(text(),"声優")]/../td/a/text() -#tag //th[contains(text(),"ジャンル")]/../td/div/a/text() -#jianjie //*[@id="main_inner"]/div[3]/text() -#photo //*[@id="work_left"]/div/div/div[2]/div/div[1]/div[1]/ul/li/img/@src - -#https://www.dlsite.com/maniax/work/=/product_id/VJ013152.html def getTitle(html): result = str(html.xpath('/html/head/title/text()')[0]) diff --git a/WebCrawler/fanza.py b/WebCrawler/fanza.py index 622f837..735bf72 100644 --- a/WebCrawler/fanza.py +++ b/WebCrawler/fanza.py @@ -2,17 +2,10 @@ # -*- coding: utf-8 -*- import sys sys.path.append('../') -import json -import re from urllib.parse import urlencode -from lxml import etree - from ADC_function import * from WebCrawler.crawler import * -# import sys -# import io -# sys.stdout = io.TextIOWrapper(sys.stdout.buffer, errors = 'replace', line_buffering = True) class fanzaCrawler(Crawler): def getFanzaString(self,string): diff --git a/WebCrawler/fc2.py b/WebCrawler/fc2.py index a908269..7eae92b 100644 --- a/WebCrawler/fc2.py +++ b/WebCrawler/fc2.py @@ -1,14 +1,10 @@ import sys sys.path.append('../') import re -from lxml import etree#need install import json import config import ADC_function from WebCrawler.crawler import * -# import sys -# import io -# sys.stdout = io.TextIOWrapper(sys.stdout.buffer, errors = 'replace', line_buffering = True) def getExtrafanart(htmlcode): # 获取剧照 html_pather = re.compile(r'