import urllib.request as ur
import urllib.parse as up
from lxml import etree
import os
import json
import codecs
def openUrl(url):
    """Fetch ``url`` and return the raw response body.

    The request carries a desktop Firefox ``User-Agent`` header instead of
    urllib's default one.

    Args:
        url: Address to fetch; handed unchanged to ``urllib.request.Request``.

    Returns:
        The undecoded response body as ``bytes``.

    Raises:
        Any exception raised by ``urllib.request.urlopen`` (for example
        ``urllib.error.URLError``) propagates to the caller.
    """
    request = ur.Request(url)
    request.add_header(
        'User-Agent',
        'Mozilla/5.0 (Windows NT 6.1; WOW64; rv:35.0) Gecko/20100101 Firefox/35.0',
    )
    # Read inside a context manager so the underlying connection is closed
    # deterministically, even if read() raises, rather than leaking a socket
    # on every call.
    with ur.urlopen(request) as response:
        return response.read()
def getMeaning(words):
parse_json_list = {
}
print("\n正在爬取信息...")
for word in words:
parse_json = {
}
# 根据单词生成百度汉语url quote转码
url = 'https://hanyu.baidu.com/zici/s?wd=' + up.quote(word.replace(' ', '+')) + '&query=%E4%B8%80&srcid=28232&from=kg0'
Python 爬取百度汉字信息
最新推荐文章于 2024-05-30 18:00:43 发布