#!/usr/bin/env python
# -*- coding: utf-8 -*-
import urllib2
import urllib
import cookielib
import json
import httplib
import re
import requests
from lxml import etree
import StringIO
import time
# Fetch a page, save a local copy of its HTML, and print the href of every
# <a> element found in it.

# A session is used for the request; its default headers are printed first.
s = requests.session()
print(s.headers)

url = "http://x.x.26.8:8760/"
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; Win64; x64; rv:54.0) Gecko/20100101 Firefox/54.0'
}

# `r` ends up holding the UTF-8 encoded body (a byte string), which is what
# gets written to disk below.
response = s.get(url, timeout=10, headers=headers)
r = response.text.encode('utf8')
print(type(r))

# Keep a copy of the fetched page on disk; `with` guarantees the handle is
# closed even if the write fails.
with open('fh1.html', 'w') as f:
    f.write(r)

# Read the saved copy back; the original left this handle open.
with open('fh1.html', 'r') as fh1:
    fh2 = fh1.read()

htmlEmt = etree.HTML(fh2)

# Example of an anchor on the page (its link text is Chinese for "Credit System"):
# <a href="http://x.x.200.17:7003/loan-web/4ALogon.jsp?tgt=TGT-130672-O1fcAq4HGXFxYjmzfMfuIxAFlqgOfEzNVXja1fDMm5C7IXb7Ox-cas01.example.org" target="_blank">...</a>
# Select the href attribute value of every <a> element.
result = htmlEmt.xpath('//a/@href')

# The original ended with a bare `print`, which only emitted a blank line and
# never showed the extracted links.
print(result)
# Get the href attribute values
# (Source page footer: latest recommended article published 2023-08-02 15:59:29)