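# Taobao image crawler
# 1. Open the search-result URL and work out its pattern: the number after
#    "s=" grows by 60 for each page (page 0 -> s=0, page 1 -> s=60, ...).
# 2. Inspect the address of one image, then search for it in the page source
#    to find where the image URLs are embedded.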
import urllib.request
import re
# Search keyword whose result pages are crawled.
keyname = "短裙"
# Percent-encode the keyword so it can be embedded in the query string.
key = urllib.request.quote(keyname)

# Captures the image address that follows `picUrl":"//` up to the next
# double quote (i.e. the address without its leading "//").
pat = r'picUrl":"//(.*?)"'
# Compiled once instead of on every loop iteration.
_PIC_URL_RE = re.compile(pat)

# The "s=" offset advances by this many items per result page.
_PAGE_SIZE = 60


def build_url(page, keyword=key):
    """Return the search-result URL for a zero-based page index.

    Args:
        page: Zero-based page number; the "s=" offset is ``page * 60``.
        keyword: Already percent-encoded search keyword. Defaults to the
            module-level ``key``.
    """
    return (
        "https://s.taobao.com/list?q=" + keyword
        + "&cat=16&style=grid&seller_type=taobao"
        + "&spm=a217f.8051907.1000187.1&bcoffset=0&s="
        + str(page * _PAGE_SIZE)
    )


def extract_image_urls(html):
    """Return every image address matched by ``pat`` in *html*, in order.

    Returns an empty list when nothing matches.
    """
    return _PIC_URL_RE.findall(html)


def fetch_page(url, timeout=10):
    """Download *url* and return its body decoded as UTF-8.

    Undecodable bytes are dropped ("ignore"), as in the original script.
    The response is closed deterministically, and *timeout* (seconds)
    prevents a stalled connection from blocking forever. Network errors
    raised by ``urlopen`` propagate to the caller.
    """
    with urllib.request.urlopen(url, timeout=timeout) as response:
        return response.read().decode("utf-8", "ignore")


def main():
    """Fetch the first three result pages and print each page's image list."""
    for i in range(0, 3):
        url = build_url(i)
        data = fetch_page(url)
        allimgurl = extract_image_urls(data)
        print(allimgurl)


if __name__ == "__main__":
    main()
# NOTE: this page can no longer be crawled this way.