Compare commits
3 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
b5f82f77a1 | ||
|
|
5f627d24e0 | ||
|
|
6817cd2093 |
27
core.py
27
core.py
@@ -12,13 +12,11 @@ import time
|
|||||||
#=====================爬虫核心部分==========================
|
#=====================爬虫核心部分==========================
|
||||||
def get_html(url):#网页请求核心
|
def get_html(url):#网页请求核心
|
||||||
headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.106 Safari/537.36'}
|
headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.106 Safari/537.36'}
|
||||||
getweb = requests.get(str(url),proxies={"http": "http://127.0.0.1:2334","https": "https://127.0.0.1:2334"},timeout=5,headers=headers).text
|
getweb = requests.get(str(url),timeout=5,headers=headers).text
|
||||||
try:
|
try:
|
||||||
return getweb
|
return getweb
|
||||||
except Exception as e:
|
except:
|
||||||
print(e)
|
print("[-]Connect Failed! Please check your Proxy.")
|
||||||
except IOError as e1:
|
|
||||||
print(e1)
|
|
||||||
|
|
||||||
def getTitle(htmlcode): #获取标题
|
def getTitle(htmlcode): #获取标题
|
||||||
doc = pq(htmlcode)
|
doc = pq(htmlcode)
|
||||||
@@ -85,7 +83,7 @@ def DownloadFileWithFilename(url,filename,path): #path = examle:photo , video.in
|
|||||||
print("[-]Download Failed2!")
|
print("[-]Download Failed2!")
|
||||||
time.sleep(3)
|
time.sleep(3)
|
||||||
os._exit(0)
|
os._exit(0)
|
||||||
def PrintFiles(html,html_outline,path):
|
def PrintFiles(html,path,number):
|
||||||
try:
|
try:
|
||||||
if not os.path.exists(path):
|
if not os.path.exists(path):
|
||||||
os.makedirs(path)
|
os.makedirs(path)
|
||||||
@@ -96,8 +94,8 @@ def PrintFiles(html,html_outline,path):
|
|||||||
print(" </set>", file=code)
|
print(" </set>", file=code)
|
||||||
print(" <studio>" + getStudio(html) + "+</studio>", file=code)
|
print(" <studio>" + getStudio(html) + "+</studio>", file=code)
|
||||||
print(" <year>" + getYear(html) + "</year>", file=code)
|
print(" <year>" + getYear(html) + "</year>", file=code)
|
||||||
print(" <outline>"+getOutline(html_outline)+"</outline>", file=code)
|
print(" <outline>"+getOutline(get_html_dww(number))+"</outline>", file=code)
|
||||||
print(" <plot>"+getOutline(html_outline)+"</plot>", file=code)
|
print(" <plot>"+getOutline(get_html_dww(number))+"</plot>", file=code)
|
||||||
print(" <runtime>"+str(getRuntime(html)).replace(" ","")+"</runtime>", file=code)
|
print(" <runtime>"+str(getRuntime(html)).replace(" ","")+"</runtime>", file=code)
|
||||||
print(" <director>" + getDirector(html) + "</director>", file=code)
|
print(" <director>" + getDirector(html) + "</director>", file=code)
|
||||||
print(" <poster>" + getNum(html) + ".png</poster>", file=code)
|
print(" <poster>" + getNum(html) + ".png</poster>", file=code)
|
||||||
@@ -122,8 +120,9 @@ def PrintFiles(html,html_outline,path):
|
|||||||
print(e1)
|
print(e1)
|
||||||
print("[-]Write Failed!")
|
print("[-]Write Failed!")
|
||||||
|
|
||||||
|
|
||||||
#=====================本地文件处理===========================
|
#=====================本地文件处理===========================
|
||||||
|
|
||||||
|
|
||||||
def argparse_get_file():
|
def argparse_get_file():
|
||||||
import argparse
|
import argparse
|
||||||
parser = argparse.ArgumentParser()
|
parser = argparse.ArgumentParser()
|
||||||
@@ -173,11 +172,14 @@ def imageDownload(htmlcode,filepath,number): #封面是否下载成功,否则
|
|||||||
shutil.move(filepath, 'failed/')
|
shutil.move(filepath, 'failed/')
|
||||||
os._exit(0)
|
os._exit(0)
|
||||||
DownloadFileWithFilename(getCover(htmlcode), number + '.jpg', path)
|
DownloadFileWithFilename(getCover(htmlcode), number + '.jpg', path)
|
||||||
print('[+]Downloaded!', path +'/'+number+'.jpg')
|
print('[+]Image Downloaded!', path +'/'+number+'.jpg')
|
||||||
def cutImage(number):
|
def cutImage(number):
|
||||||
try:
|
try:
|
||||||
img = Image.open(path + '/' + number + '.jpg')
|
img = Image.open(path + '/' + number + '.jpg')
|
||||||
img2 = img.crop((421, 0, 800, 538))
|
imgSize=img.size
|
||||||
|
w=img.width
|
||||||
|
h=img.height
|
||||||
|
img2 = img.crop((w/1.9, 0, w, h))
|
||||||
img2.save(path + '/' + number + '.png')
|
img2.save(path + '/' + number + '.png')
|
||||||
except:
|
except:
|
||||||
print('[-]Cover cut failed!')
|
print('[-]Cover cut failed!')
|
||||||
@@ -192,5 +194,6 @@ if __name__ == '__main__':
|
|||||||
htmlcode=get_html_javbus(number) #获取的HTML代码
|
htmlcode=get_html_javbus(number) #获取的HTML代码
|
||||||
creatFolder(htmlcode,number) #创建文件夹
|
creatFolder(htmlcode,number) #创建文件夹
|
||||||
imageDownload(htmlcode,filepath,number) #creatFoder会返回番号路径
|
imageDownload(htmlcode,filepath,number) #creatFoder会返回番号路径
|
||||||
cutImage(number) #裁剪图片
|
PrintFiles(htmlcode, path,number)#打印文件
|
||||||
|
cutImage(number) #裁剪图
|
||||||
pasteFileToFolder(filepath,number,path) #移动文件
|
pasteFileToFolder(filepath,number,path) #移动文件
|
||||||
|
|||||||
Reference in New Issue
Block a user