# Python XPath locating for a MikeCRM form -- partial code only, can still be improved.
#coding=utf-8
import re
import io
import jieba
from selenium import webdriver
# Basic information.
# NOTE(review): the X... entries below appear to be placeholders left by the
# author; they are not defined anywhere in the visible code, so replace them
# with the real list contents before running.
list1=[ XXXXXXXXXXXXXXXXXXXXX]
list2=[XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX]
# Map each list1 item to the list2 item at the same position (zip stops at the
# shorter list). The author's note here says to fill in the details yourself.
guanlian = dict(zip(list1,list2))
# Open the browser and load the page whose URL is typed on stdin.
# The browser is deliberately left open here.
# NOTE(review): presumably later parts of the script keep using `bs` -- confirm.
bs = webdriver.Firefox()
print('Input your url:')
try:
    url = raw_input()  # Python 2
except NameError:
    url = input()  # Python 3 renamed raw_input to input
print(url)
bs.get(url)
html = bs.page_source

# Save the raw page source. The context manager closes (and flushes) the file
# even if the write raises, instead of leaking the handle.
with io.open('./source.txt', mode='w', encoding='utf-8') as f:
    f.write(html)

# Strip punctuation and whitespace from the page source with one character
# class. The pattern is a raw string so the backslash escapes reach the regex
# engine intact; '[', ']', '-' and '\' are escaped because they are special
# inside a class. '+' is listed because the posted pattern ended in '\s+'
# inside the class, where '+' is a literal character.
# NOTE(review): `str` shadows the builtin; the name is kept because the rest of
# the script (not visible here) may read it.
str = re.sub(r'[!,%\[\].:<>"\-=/?;_$#\\{}*()+\s]', '', html)

# Write the cleaned text to result.txt.
with io.open('./result.txt', mode='w', encoding='utf-8') as f:
    f.write(str)
#结果赋值给字符串
f = io.op