from selenium import webdriver
import requests,time
from bs4 import BeautifulSoup
def url_open(url, a):
    """Print the HTTPS proxy entries found on the first ``a`` listing pages.

    Opens a Firefox session on ``url``, parses the table rows of each page and
    prints one line per matching row in the form ``<field0>:<field1> <field4>``,
    where the fields are the whitespace-separated tokens of the row text
    (presumably IP, port and protocol -- confirm against the site's layout).
    Only lines containing ``HTTPS`` are printed. Between pages the element with
    class ``next_page`` is clicked.

    Args:
        url: Address of the first listing page.
        a: Number of pages to scrape. Values below 1 scrape nothing.

    Returns:
        None. Results are written to standard output.
    """
    # Local imports keep this function self-contained; selenium is already a
    # dependency of this file.
    from selenium.common.exceptions import NoSuchElementException
    from selenium.webdriver.common.by import By

    if a < 1:
        # Nothing requested: do not even start a browser.
        return

    driver = webdriver.Firefox()
    try:
        driver.implicitly_wait(1)
        driver.get(url)
        for page in range(1, a + 1):
            soup = BeautifulSoup(driver.page_source, 'lxml')
            for row in soup.select('tr[class="odd"],tr[class=""]'):
                fields = row.text.split()
                if len(fields) < 5:
                    # Header or malformed row: not enough columns to format.
                    continue
                line = fields[0] + ':' + fields[1] + ' ' + fields[4]
                if 'HTTPS' in line:
                    print(line)

            if page == a:
                # Last requested page: no need to navigate any further.
                break
            try:
                # find_element(By...) works on Selenium 3 and 4; the
                # find_element_by_* helpers were removed in Selenium 4.3.
                driver.find_element(By.CLASS_NAME, 'next_page').click()
            except NoSuchElementException:
                # No "next" link means there are no more pages to read.
                break
            # Give the next page time to load before reading its source.
            time.sleep(2)
    finally:
        # Always close the browser, even if scraping fails part-way.
        driver.quit()
if __name__ == '__main__':
    # Ask how many listing pages to walk, then scrape starting from the
    # first page of the proxy list.
    page_count = int(input('请输入你要下载的页数:'))
    url_open('http://www.xicidaili.com/nn', page_count)
# 爬虫自动化-代理IP获取
# 最新推荐文章于 2020-04-24 18:31:04 发布