# Scrape JD.com product names and prices with BeautifulSoup
#coding=utf-8
import cookielib
import sys
import urllib
import urllib2

from bs4 import BeautifulSoup
# Python 2-only workaround: sys.setdefaultencoding is removed from the module
# at interpreter start-up, so sys is reloaded to get it back. With UTF-8 as the
# default, the byte-string label printed below can be concatenated with the
# text returned by BeautifulSoup without an implicit ASCII decode failing.
reload(sys)
sys.setdefaultencoding("utf-8")  # handle encoding

# Search keyword sent to the JD.com search page.
product = "ThinkPad i5"

# Build the query string with urlencode instead of raw concatenation, so that
# reserved characters in the keyword ('&', '#', '+', ...) cannot alter the
# query; a space is sent as '+'.
query = urllib.urlencode([("keyword", product), ("enc", "utf-8")])
response = urllib.urlopen("http://search.jd.com/Search?" + query)
try:
    text = response.read()
finally:
    # Close the response explicitly rather than waiting for garbage collection.
    response.close()

# Name the parser explicitly: without it bs4 picks whichever parser happens to
# be installed, so results could differ between machines.
soup = BeautifulSoup(text, "html.parser")

# Each search result is expected in a <div class="lh-wrap"> wrapper whose
# <div class="p-name"> child holds the product link.
content = soup.find_all('div', attrs={'class': 'lh-wrap'})
for wrap in content:
    name_tags = wrap.find_all('div', attrs={'class': 'p-name'})
    for name in name_tags:
        link = name.find('a')
        if link is None:
            # A name container without a link has no title to print; skip it
            # instead of raising AttributeError on None.
            continue
        # Single parenthesised argument: prints the same as the original
        # Python 2 print statement.
        print('商品:' + link.get_text())