lab 2
!pip install gensim nltk transformers torch matplotlib scikit-learn
import gensim.downloader as api
import numpy as np
from sklearn.decomposition import PCA
import matplotlib.pyplot as plt
model = api.load("glove-wiki-gigaword-50")
words = ["computer","internet","software","hardware","data",
"robot","ai","network","cloud","algorithm"]
vecs = np.array([model[w] for w in words])
xy = PCA(2).fit_transform(vecs)
plt.scatter(xy[:,0], xy[:,1])
for (x, y), w in zip(xy, words):
plt.text(x+0.01, y+0.01, w)
plt.title("PCA – Technology words")
plt.xlabel("PC1"); plt.ylabel("PC2")
plt.show()
word = "computer"
print("Similar to", word, ":", model.most_similar(word, topn=5))
Comments
Post a Comment