diff --git a/WebCrawler/avsox.py b/WebCrawler/avsox.py index f15b9b4..82c0b86 100644 --- a/WebCrawler/avsox.py +++ b/WebCrawler/avsox.py @@ -83,15 +83,17 @@ def getSeries(htmlcode): return '' def main(number): - a = get_html('https://avsox.host/cn/search/' + number) + html = get_html('https://tellme.pw/avsox') + site = etree.HTML(html).xpath('//div[@class="container"]/div/a/@href')[0] + a = get_html(site + '/cn/search/' + number) html = etree.fromstring(a, etree.HTMLParser()) # //table/tr[1]/td[1]/text() result1 = str(html.xpath('//*[@id="waterfall"]/div/a/@href')).strip(" ['']") if result1 == '' or result1 == 'null' or result1 == 'None': - a = get_html('https://avsox.host/cn/search/' + number.replace('-', '_')) + a = get_html(site + '/cn/search/' + number.replace('-', '_')) html = etree.fromstring(a, etree.HTMLParser()) # //table/tr[1]/td[1]/text() result1 = str(html.xpath('//*[@id="waterfall"]/div/a/@href')).strip(" ['']") if result1 == '' or result1 == 'null' or result1 == 'None': - a = get_html('https://avsox.host/cn/search/' + number.replace('_', '')) + a = get_html(site + '/cn/search/' + number.replace('_', '')) html = etree.fromstring(a, etree.HTMLParser()) # //table/tr[1]/td[1]/text() result1 = str(html.xpath('//*[@id="waterfall"]/div/a/@href')).strip(" ['']") web = get_html(result1) @@ -121,4 +123,4 @@ def main(number): return js if __name__ == "__main__": - print(main('012717_472')) \ No newline at end of file + print(main('012717_472'))