From 94c5598fde7561a7e4cc5dc952801d000bae4e98 Mon Sep 17 00:00:00 2001 From: yoshiko2 Date: Mon, 3 May 2021 22:27:09 +0800 Subject: [PATCH] Fix all source Exception handling --- WebCrawler/avsox.py | 43 +++++++++++++++++++++++-------------------- WebCrawler/jav321.py | 4 ++-- WebCrawler/javlib.py | 2 +- 3 files changed, 26 insertions(+), 23 deletions(-) diff --git a/WebCrawler/avsox.py b/WebCrawler/avsox.py index 82c0b86..450c9a1 100644 --- a/WebCrawler/avsox.py +++ b/WebCrawler/avsox.py @@ -99,26 +99,29 @@ def main(number): web = get_html(result1) soup = BeautifulSoup(web, 'lxml') info = str(soup.find(attrs={'class': 'row movie'})) - dic = { - 'actor': getActor(web), - 'title': getTitle(web).strip(getNum(web)), - 'studio': getStudio(info), - 'outline': '',# - 'runtime': getRuntime(info), - 'director': '', # - 'release': getRelease(info), - 'number': getNum(info), - 'cover': getCover(web), - 'cover_small': getCover_small(a), - 'imagecut': 3, - 'tag': getTag(web), - 'label': getLabel(info), - 'year': getYear(getRelease(info)), # str(re.search('\d{4}',getRelease(a)).group()), - 'actor_photo': getActorPhoto(web), - 'website': result1, - 'source': 'avsox.py', - 'series': getSeries(info), - } + try: + dic = { + 'actor': getActor(web), + 'title': getTitle(web).strip(getNum(web)), + 'studio': getStudio(info), + 'outline': '', # + 'runtime': getRuntime(info), + 'director': '', # + 'release': getRelease(info), + 'number': getNum(info), + 'cover': getCover(web), + 'cover_small': getCover_small(a), + 'imagecut': 3, + 'tag': getTag(web), + 'label': getLabel(info), + 'year': getYear(getRelease(info)), # str(re.search('\d{4}',getRelease(a)).group()), + 'actor_photo': getActorPhoto(web), + 'website': result1, + 'source': 'avsox.py', + 'series': getSeries(info), + } + except: + dic = {"title": ""} js = json.dumps(dic, ensure_ascii=False, sort_keys=True, indent=4, separators=(',', ':'), ) # .encode('UTF-8') return js diff --git a/WebCrawler/jav321.py b/WebCrawler/jav321.py index 68b317c..f7c0fb4 100644 --- a/WebCrawler/jav321.py +++ b/WebCrawler/jav321.py @@ -31,7 +31,7 @@ def main(number: str) -> json: **data, } else: - dic = {} + dic = {"title": ""} return json.dumps(dic, ensure_ascii=False, sort_keys=True, indent=4, separators=(',', ':')) @@ -59,7 +59,7 @@ def parse_info(soup: BeautifulSoup) -> dict: "series": get_series(data_dic), } else: - return {} + return {"title": ""} def get_bold_text(h: str) -> str: diff --git a/WebCrawler/javlib.py b/WebCrawler/javlib.py index a13f2b2..7af0c14 100644 --- a/WebCrawler/javlib.py +++ b/WebCrawler/javlib.py @@ -94,7 +94,7 @@ def main(number: str): "series": '', } else: - dic = {} + dic = {"title": ""} return json.dumps(dic, ensure_ascii=False, sort_keys=True, indent=4, separators=(',', ':'))