def main(we_file='glove_model_50.npz', w2i_file='glove_word2idx_50.json'):
words = ['japan', 'japanese', 'england', 'english', 'australia', 'australian', 'china', 'chinese', 'italy', 'italian', 'french', 'france', 'spain', 'spanish']
with open(w2i_file) as f:
word2idx = json.load(f)
npz = np.load(we_file)
W = npz['arr_0']
V = npz['arr_1']
We = (W + V.T) / 2
idx = [word2idx[w] for w in words]
# We = We[idx]
tsne = TSNE()
Z = tsne.fit_transform(We)
Z = Z[idx]
plt.scatter(Z[:,0], Z[:,1])
for i in xrange(len(words)):
plt.annotate(s=words[i], xy=(Z[i,0], Z[i,1]))
plt.show()
评论列表
文章目录