mirror of https://github.com/testerSunshine/12306
xicidaili不可用,增加了kuaidaili
parent
a495af8834
commit
8310a86c1d
|
@ -18,10 +18,15 @@ class proxy:
|
||||||
获取未加工代理列表
|
获取未加工代理列表
|
||||||
:return:
|
:return:
|
||||||
"""
|
"""
|
||||||
|
try:
|
||||||
|
self.get_proxy_from_xicidaili()
|
||||||
|
except Exception:
|
||||||
|
self.get_proxy_from_kuaidaili()
|
||||||
|
|
||||||
|
def get_proxy_from_xicidaili(self):
|
||||||
User_Agent = 'Mozilla/5.0 (Windows NT 6.3; WOW64; rv:43.0) Gecko/20100101 Firefox/43.0'
|
User_Agent = 'Mozilla/5.0 (Windows NT 6.3; WOW64; rv:43.0) Gecko/20100101 Firefox/43.0'
|
||||||
header = dict()
|
header = dict()
|
||||||
header['User-Agent'] = User_Agent
|
header['User-Agent'] = User_Agent
|
||||||
|
|
||||||
for i in range(1, 5):
|
for i in range(1, 5):
|
||||||
time.sleep(1)
|
time.sleep(1)
|
||||||
url = 'http://www.xicidaili.com/nn/' + str(i)
|
url = 'http://www.xicidaili.com/nn/' + str(i)
|
||||||
|
@ -37,6 +42,25 @@ class proxy:
|
||||||
print(ip_temp)
|
print(ip_temp)
|
||||||
self.proxy_list.append(ip_temp)
|
self.proxy_list.append(ip_temp)
|
||||||
|
|
||||||
|
def get_proxy_from_kuaidaili(self):
|
||||||
|
User_Agent = 'Mozilla/5.0 (Windows NT 6.3; WOW64; rv:43.0) Gecko/20100101 Firefox/43.0'
|
||||||
|
header = dict()
|
||||||
|
header['User-Agent'] = User_Agent
|
||||||
|
for i in range(1, 5):
|
||||||
|
time.sleep(1)
|
||||||
|
url = 'https://www.kuaidaili.com/free/inha/' + str(i)
|
||||||
|
res = requests.get(url=url, headers=header).content
|
||||||
|
|
||||||
|
soup = BeautifulSoup(res, "html.parser")
|
||||||
|
ips = soup.findAll('tr')
|
||||||
|
|
||||||
|
for x in range(1, len(ips)):
|
||||||
|
ip = ips[x]
|
||||||
|
tds = ip.findAll("td")
|
||||||
|
ip_temp = tds[0].contents[0] + ":" + tds[1].contents[0]
|
||||||
|
print(ip_temp)
|
||||||
|
self.proxy_list.append(ip_temp)
|
||||||
|
|
||||||
def filter_proxy(self):
|
def filter_proxy(self):
|
||||||
"""
|
"""
|
||||||
将不可用IP剔除
|
将不可用IP剔除
|
||||||
|
@ -104,4 +128,5 @@ class proxy:
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
a = proxy()
|
a = proxy()
|
||||||
|
a.get_proxy()
|
||||||
print(a.get_filter_proxy())
|
print(a.get_filter_proxy())
|
||||||
|
|
Loading…
Reference in New Issue