from gensim.models import word2vec
import gensim
import logging
# Train a word2vec model with gensim and persist the resulting word vectors.
# `train_file_name`, `save_model_file` and `save_model_name` are expected to
# be defined before this point (they are not set in this snippet).

# Emit timestamped INFO-level log records so training progress is visible.
logging.basicConfig(format='%(asctime)s : %(levelname)s : %(message)s', level=logging.INFO)

# Load the training corpus.
sentences = word2vec.Text8Corpus(train_file_name)

# Train 200-dimensional vectors; `window` is left at its default (5).
# NOTE(review): `sg` is not passed, so gensim's default (sg=0, CBOW) is used;
# pass sg=1 explicitly if a skip-gram model is actually wanted.
# NOTE(review): gensim >= 4.0 renamed `size` to `vector_size`; confirm the
# installed gensim version before changing the keyword.
model = gensim.models.Word2Vec(sentences, size=200)

# Save the full model in gensim's native format.
model.save(save_model_file)

# Also export just the word vectors in binary word2vec format for reuse.
model.wv.save_word2vec_format(save_model_name + ".bin", binary=True)
gensim 模型训练,生成词向量
最新推荐文章于 2024-08-03 19:27:22 发布