直接上代码
__author__ = 'Elvis'
#-*- coding: UTF-8 -*-
import urllib
import re
def getHtml(url):
    """Fetch ``url`` and return the raw body of the response.

    Args:
        url: Address to open, in any form the standard library's
            ``urlopen`` accepts.

    Returns:
        The value produced by ``read()`` on the opened response.

    Any error raised while opening or reading is not caught here and
    propagates to the caller.
    """
    # ``urlopen`` lives in ``urllib`` on Python 2 and in ``urllib.request``
    # on Python 3; resolve it locally so this function works on either.
    try:
        from urllib.request import urlopen
    except ImportError:
        from urllib import urlopen

    page = urlopen(url)
    try:
        return page.read()
    finally:
        # Release the underlying connection even when read() fails.
        page.close()
def getImage(html):
    """Download every ``.jpg`` named in a ``src="..."`` attribute of ``html``.

    Matches are saved relative to the current working directory as
    ``0.jpg``, ``1.jpg``, ... in the order they appear in ``html``.

    Args:
        html: Page markup to scan. A Python 3 ``bytes`` value is decoded
            as UTF-8 (undecodable bytes replaced) before matching.

    Returns:
        None. The downloaded files are the only result.

    Each matched value is handed to ``urlretrieve`` exactly as written in
    the markup. Download errors are not caught, so the first failure stops
    the remaining downloads and propagates to the caller.
    """
    # ``urlretrieve`` lives in ``urllib`` on Python 2 and in
    # ``urllib.request`` on Python 3; resolve it locally for either.
    try:
        from urllib.request import urlretrieve
    except ImportError:
        from urllib import urlretrieve

    # On Python 2 ``bytes`` is ``str`` and this branch never runs; on
    # Python 3 a str pattern cannot be applied to bytes, so decode first.
    if isinstance(html, bytes) and not isinstance(html, str):
        html = html.decode('utf-8', 'replace')

    # ``[^"\n]`` keeps a match inside one quoted attribute value. The
    # previous ``.+?`` could run past the closing quote of a non-jpg
    # ``src`` and swallow markup up to a later ``.jpg"``.
    imgre = re.compile(r'src="([^"\n]+?\.jpg)"')
    for x, image in enumerate(imgre.findall(html)):
        urlretrieve(image, '%s.jpg' % x)
# Script body: fetch the Tieba index page, then download the .jpg images it
# references. The value returned by getImage is printed as-is.
html = getHtml("http://tieba.baidu.com/index.html")
print(getImage(html))
页面代码
结果: