门槛:
1. 此网站只能用 IE8 或者 IE9 访问
2.有验证码
3. 数据通过 Ajax 传递
4. 当然也有很多 iframe 框架
上代码:
from selenium import webdriver
import time
from lxml import etree
class Xpspider(object):
def __init__(self):
    """Create the IE WebDriver, remember the target URL, and call ``run()``.

    Construction has side effects: it starts an Internet Explorer session
    through the IEDriverServer executable at the hard-coded path below and
    then immediately invokes ``self.run()``.
    """
    # Hard-coded location of the IEDriverServer binary on the local machine.
    driver_path = r'C:\Program Files\Internet Explorer\IEDriverServer.exe'
    self.driver = webdriver.Ie(executable_path=driver_path)
    self.url = r'https://service.sharp.cn/'
    # The whole workflow is triggered from the constructor.
    self.run()
def run(self):
    """Load ``self.url`` in the browser and hand its page source to ``login_page``."""
    browser = self.driver
    browser.get(self.url)
    # page_source is read after navigation and passed straight on.
    self.login_page(browser.page_source)
def login_page(self,source):
time.sleep(3)
textcode = input('请输入验证码!') #等待把相关录入
print('登录中,请等待...')
self.driver.find_element_by_id("orgcd").send_keys("要录入机构代码")
self.driver.find_elements_by_name('username')[0].send_keys('用户名')
self.driver.find_element_by_id("password").send_keys("密码")
self.driver.find_element_by_id(&