一周之前我还没有接触过 Python,更不用说 Selenium 了,一把辛酸泪!先直接上代码,故事稍后再讲……
# -*- coding: utf-8 -*-
#sudo apt-get install python3-openpyxl
from openpyxl import workbook
from openpyxl import load_workbook
import time
from urllib.request import urlopen
from bs4 import BeautifulSoup
from selenium import webdriver
from selenium.common.exceptions import NoSuchElementException
def getAllData(url):
global book # 全局工作表对象
PCBH = [] # 普查編號
SuoSH = [] # 索書號
CunJuan = ['','','','','','','','','',''] # 存卷
TMZZ = [] # 題名著者
BanBen = [] # 版本
CeShu = [] # 册(件)数
DanWei = [] # 单位
page_number = 14910 # 页数初始为1
while page_number <= 65914:
# print("-----------打印第",page_number,"页")
try:
link = driver