# A simple crawler script: searches Bing for a keyword and scrapes the titles and links from the first results page.
import re,urllib.parse,urllib.request,urllib.error
from bs4 import BeautifulSoup as BS
# Bing search endpoint; the encoded query string is appended directly to it.
baseUrl = 'http://cn.bing.com/search?'

# Space-separated search keywords, echoed before being encoded.
word = '鹿晗 吴亦凡 张艺兴'
print(word)

# Keep the keywords as UTF-8 bytes from here on; urlencode percent-encodes
# bytes values as-is (spaces become '+').
word = word.encode('utf-8', 'strict')

# Percent-encoded "q=..." query string.
data = urllib.parse.urlencode({'q': word})

# Full request URL: endpoint followed by the query string.
url = ''.join((baseUrl, data))
print(url)
try:
html = urllib.request.urlopen(url)
except</