xicidaili不可用,增加了kuaidaili

pull/805/head
peng 2021-04-14 14:46:15 +08:00
parent a495af8834
commit 8310a86c1d
1 changed files with 26 additions and 1 deletions

View File

@ -18,10 +18,15 @@ class proxy:
获取未加工代理列表 获取未加工代理列表
:return: :return:
""" """
try:
self.get_proxy_from_xicidaili()
except Exception:
self.get_proxy_from_kuaidaili()
def get_proxy_from_xicidaili(self):
User_Agent = 'Mozilla/5.0 (Windows NT 6.3; WOW64; rv:43.0) Gecko/20100101 Firefox/43.0' User_Agent = 'Mozilla/5.0 (Windows NT 6.3; WOW64; rv:43.0) Gecko/20100101 Firefox/43.0'
header = dict() header = dict()
header['User-Agent'] = User_Agent header['User-Agent'] = User_Agent
for i in range(1, 5): for i in range(1, 5):
time.sleep(1) time.sleep(1)
url = 'http://www.xicidaili.com/nn/' + str(i) url = 'http://www.xicidaili.com/nn/' + str(i)
@ -37,6 +42,25 @@ class proxy:
print(ip_temp) print(ip_temp)
self.proxy_list.append(ip_temp) self.proxy_list.append(ip_temp)
def get_proxy_from_kuaidaili(self):
    """
    Scrape free proxies from kuaidaili.com into ``self.proxy_list``.

    Requests listing pages 1-4 under ``/free/inha/``, sleeping one second
    before each request. For every table row after the first, the text of
    the first two ``<td>`` cells is joined as ``"ip:port"``, printed, and
    appended to ``self.proxy_list``.

    Rows that do not carry two non-empty ``<td>`` cells are skipped, so a
    stray header, separator, or empty row cannot abort the whole scrape.

    :return: None
    :raises requests.RequestException: propagated from ``requests.get``
        (for example on a connection failure or when the timeout expires).
    """
    user_agent = 'Mozilla/5.0 (Windows NT 6.3; WOW64; rv:43.0) Gecko/20100101 Firefox/43.0'
    header = {'User-Agent': user_agent}
    for page in range(1, 5):
        time.sleep(1)
        url = 'https://www.kuaidaili.com/free/inha/' + str(page)
        # A timeout keeps a stalled connection from blocking forever.
        res = requests.get(url=url, headers=header, timeout=10).content
        soup = BeautifulSoup(res, "html.parser")
        rows = soup.findAll('tr')
        # The first row is skipped, as before (presumably the table header).
        for row in rows[1:]:
            tds = row.findAll("td")
            if len(tds) < 2:
                continue
            host = tds[0].get_text(strip=True)
            port = tds[1].get_text(strip=True)
            if not host or not port:
                continue
            ip_temp = host + ":" + port
            print(ip_temp)
            self.proxy_list.append(ip_temp)
def filter_proxy(self): def filter_proxy(self):
""" """
将不可用IP剔除 将不可用IP剔除
@ -104,4 +128,5 @@ class proxy:
if __name__ == "__main__":
    # Script entry point: collect the raw proxy list, then print the
    # filtered result.
    pool = proxy()
    pool.get_proxy()
    usable = pool.get_filter_proxy()
    print(usable)