import gensim
import nltk
from nltk.corpus import stopwords
tokenizer = nltk.data.load('C:/opt/data/nlp/nltk_data/tokenizers/punkt/english.pickle')
使用以上写法(向 nltk.data.load() 传入绝对路径)时,不知为何总是加载不成功。
换成以下代码:
import gensim
import nltk.data
from nltk.corpus import stopwords
tokenizer = nltk.data.load('tokenizers/punkt/english.pickle')
先导入 nltk.data,再通过 nltk.data.load() 以相对资源路径直接加载 tokenizers/punkt/english.pickle。