自然语言处理-斯坦福CS224第一讲python代码实现

# The GloVe .txt file (glove.6B.100d.txt) can be found by searching Google or Baidu
import matplotlib as matplotlib  # plotting library
import notebook as notebook  # Jupyter Notebook package
import numpy as np
# Get the interactive Tools for Matplotlib

import matplotlib.pyplot as plt
import warnings

warnings.filterwarnings('ignore')

plt.style.use('ggplot')

from sklearn.manifold import TSNE  # t-SNE dimensionality reduction
from sklearn.decomposition import PCA

from gensim.test.utils import datapath, get_tmpfile
from gensim.models import KeyedVectors
from gensim.scripts.glove2word2vec import glove2word2vec

# Convert the GloVe vectors to word2vec text format, then load them.
# The path is a raw string so the Windows backslashes are taken literally
# instead of being parsed as (invalid) escape sequences such as "\C" and "\g".
# NOTE(review): datapath() resolves names inside gensim's bundled test-data
# directory, and the path has no separator after "C:" -- confirm this is the
# intended location of the GloVe file.
glove_file = datapath(r'C:ai_work_space\Corpus\glove.6B.100d.txt')
# Temporary file that receives the word2vec-format copy of the vectors.
word2vec_glove_file = get_tmpfile("glove.6B.100d.word2vec.txt")
glove2word2vec(glove_file, word2vec_glove_file)

model = KeyedVectors.load_word2vec_format(word2vec_glove_file)

# Print the entries most similar to 'banana', one result per line.
word2List = model.most_similar('banana')
for wordProbability in word2List:
    print(wordProbability)

# Print the entries least similar to 'banana'. The key is wrapped in a list so
# the whole word is used as the negative example; a bare string may be
# iterated character by character by some gensim versions.
word2NegList = model.most_similar(negative=['banana'])
for word2NegProbability in word2NegList:
    print(word2NegProbability)

# Analogy check: 'woman' and 'king' as positive examples, 'man' as negative.
result = model.most_similar(negative=['man'], positive=['woman', 'king'])

# Show the first result as "word:score", with the score to four decimals.
print(f"{result[0][0]}:{result[0][1]:.4f}")


def analogy(x1, x2, y1):
    """Return the word that completes "x1 is to x2 as y1 is to ?".

    Queries the module-level ``model`` with ``y1`` and ``x2`` as positive
    examples and ``x1`` as the negative example, then returns the word of
    the first result.
    """
    candidates = model.most_similar(negative=[x1], positive=[y1, x2])
    top_word = candidates[0][0]
    return top_word


# Example query: 'japan' is to 'japanese' as 'china' is to ...?
print(analogy(x1='japan', x2='japanese', y1='china'))
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值