使用说明程序运行开始,需要输入出发地,目的地,出发时间,乘客信息,车次;乘客信息和车次可以输入多个
刚刚开始学习爬虫,selenium仅仅是解放了双手,运行效率不是很高;
程序运行时会打开chrome浏览器,因为使用的是chrome的浏览器驱动;
相关文档
https://selenium-python.readthedocs.io/installation.html#introduction
代码示例# encoding: utf-8from selenium import webdriverfrom selenium.webdriver.support.ui import WebDriverWaitfrom selenium.webdriver.support import expected_conditions as ECfrom selenium.webdriver.common.by import Byimport timeclass Qiangpiao(object):
def __init__(self):
driver_path = "E:\py_pachong\chromedriver.exe"
# 浏览器驱动
self.drive = webdriver.Chrome(executable_path=driver_path) # 登陆链接
self.login_url = "https://kyfw.12306.cn/otn/login/init"
# 登陆后的链接
self.initmy_url = "https://kyfw.12306.cn/otn/index/initMy12306"
# 查询页面
self.search_url = "https://kyfw.12306.cn/otn/leftTicket/init"
# 乘车人页面
self.passenger_url = "https://kyfw.12306.cn/otn/confirmPassenger/initDc"
def wait_input(self):
"""
主要用于页面审核;
当输入出发地,目的地,乘车时间后,会自动出发查询submit
:return:
"""
self.from_station = input("出发地:")
self.to_station = input("目的地:")
self.depart_time = input("出发时间:")
self.passengers = input("乘客姓名:").split(",")
self.trains = input("车次:").split(",") def _login(self):
"""
登陆验证,登陆成功后会跳转到 self.initmy_url
:return:
"""
self.drive.get(self.login_url)
WebDriverWait(self.drive, 1000).until(
EC.url_to_be(self.initmy_url)
)
print('登录成功') def _order_ticket(self):
"""
只实现了在无票的情况下去刷票
最关键的是等待验证 WebDriverWait
:return:
"""
self.drive.get(self.search_url)
WebDriverWait(self.drive, 1000).until(
EC.text_to_be_present_in_element_value((By.ID, "fromStationText"), self.from_station)
)
WebDriverWait(self.drive, 1000).until(
EC.text_to_be_present_in_element_value((By.ID, "toStationText"), self.to_station)
)
WebDriverWait(self.drive, 1000).until(
EC.text_to_be_present_in_element_value((By.ID, "train_date"), self.depart_time)
)
WebDriverWait(self.drive, 10000).until(
EC.element_to_be_clickable((By.ID, "query_ticket"))
)
searchBtn = self.drive.find_element_by_id("query_ticket")
searchBtn.click()
WebDriverWait(self.drive, 1000).until(
EC.presence_of_element_located((By.XPATH, ".//tbody[@id='queryLeftTable']/tr"))
) # find_elements_by_xpath 返回的是一个列表
# find_element_by_xpath 返回的是一个元素
tr_list = self.drive.find_elements_by_xpath(".//tbody[@id='queryLeftTable']/tr[not(@datatran)]") for tr in tr_list:
train_num = tr.find_element_by_class_name("number").text # print(train_num)
if train_num in self.trains:
left_ticket_td = tr.find_element_by_xpath(".//td[4]").text
num = 1
while left_ticket_td == "无":
print("暂时无票,正在刷新")
time.sleep(2)
searchBtn.click()
num += 1
print("抢票%s次" % num) if left_ticket_td != "无":
print(train_num + "有票")
oderBtn = tr.find_element_by_xpath(".//td[13]/a")
oderBtn.click()
WebDriverWait(self.drive, 1000).until(
EC.url_to_be(self.passenger_url)
)
WebDriverWait(self.drive, 1000).until(
EC.presence_of_element_located((By.XPATH, ".//ul[@id='normal_passenger_id']/li"))
)
passenger_labels = self.drive.find_elements_by_xpath( ".//ul[@id='normal_passenger_id']/li/label") for passenger_label in passenger_labels:
name = passenger_label.text if name in self.passengers:
passenger_label.click()
submitBtn = self.drive.find_element_by_id("submitOrder_id")
submitBtn.click()
WebDriverWait(self.drive, 1000).until(
EC.presence_of_element_located((By.CLASS_NAME, "dhtmlx_wins_body_outer"))
)
WebDriverWait(self.drive, 1000).until(
EC.presence_of_element_located((By.ID, "qr_submit_id"))
)
qr_submit = self.drive.find_element_by_id("qr_submit_id")
qr_submit.click() def run(self):
self.wait_input()
self._login()
self._order_ticket()if __name__ == '__main__':
spider = Qiangpiao()
spider.run()