参考链接：
https://blog.csdn.net/u012424313/article/details/82222188
https://www.cnblogs.com/yumingle/p/6675487.html
https://blog.csdn.net/python36/article/details/83029661
从搜狗拼音词库站点下载原始的 scel 词库文件：
# coding=utf-8
import os
import sys
import requests
from urllib.request import urlretrieve
from bs4 import BeautifulSoup
class SouGSpider(object):
def __init__(self):
self.base_url = "http://pinyin.sogou.com"
self.homepage_url = "http://pinyin.sogou.com/dict/"
self.base_dir = "/Users/furuiyang/gitzip/JustSimpleSpider/soug/csv"
def callbackfunc(self, blocknum, blocksize, totalsize):
"""
回调函数
:param