import re
import urllib
import sys
# Python 2-only setup: `reload` is a builtin there and `sys.setdefaultencoding`
# only becomes callable again after `sys` is reloaded (see the Python 2 `sys`
# docs). This switches the interpreter-wide default string encoding to UTF-8.
# NOTE(review): presumably added to avoid UnicodeDecodeError on implicit
# str/unicode conversions of the scraped pages -- confirm it is still needed.
reload(sys)
sys.setdefaultencoding('utf8')
def getHtml(url):
    """Fetch *url* and return the response body.

    Args:
        url: Address passed straight to ``urllib.urlopen``.

    Returns:
        The full content returned by ``read()`` on the opened resource.

    Any error raised while opening or reading propagates to the caller
    unchanged.
    """
    page = urllib.urlopen(url)
    try:
        return page.read()
    finally:
        # Always release the underlying connection, even when read() fails.
        page.close()
def getImg(html, x):
    """Download every matching ``.jpg`` image referenced in *html*.

    An image is picked up when it appears as ``src="..."`` with a value that
    starts with ``http://img`` and ends with ``.jpg``. Each match is saved
    as ``<x>.jpg`` (a relative path), and ``x`` is incremented after every
    download so successive files get consecutive numbers.

    Args:
        html: Page markup to scan for image URLs.
        x: Number used to name the first downloaded file.

    Returns:
        ``x`` advanced by the number of images downloaded, i.e. the number
        to use for the next file.
    """
    # Use the compiled pattern for the search instead of compiling it and
    # then searching with the raw pattern string.
    img_re = re.compile(r'src="(http://img.*?\.jpg)"')
    img_urls = img_re.findall(html)
    print(img_urls)
    for img_url in img_urls:
        # Single-argument print(...) behaves the same as the print statement.
        print(img_url)
        print(x)
        urllib.urlretrieve(img_url, '%s.jpg' % x)
        x += 1
    return x
# Running file number: the next image is saved as "<x>.jpg".
x = 1
# Common prefix of the thread's page URLs; the page number and "-1.html"
# are appended to it below.
url = "http://www.deyi.com/thread-10993290-"
# Walk thread pages 1 and 2, downloading the images found on each one.
for page_no in range(1, 3):
    page_url = url + str(page_no) + "-1.html"
    print(page_url)
    # getImg returns the next free file number, so numbering continues
    # across pages.
    x = getImg(getHtml(page_url), x)