import gensim.downloader as api
import stringdist as sdi
class AssociatedWords:
    """Hold a pre-trained embedding model and the filtered results of a lookup.

    Attributes:
        N_RESULTS: Result-count setting. It is not read by any code in this
            class.
        model: The object returned by ``api.load('glove-twitter-200')``.
        base_word: The word the current results relate to, or ``None`` when
            nothing has been looked up yet.
        gensim_result: Raw lookup result, or ``None``. Each entry is indexed
            as ``entry[0]`` (the candidate word) and ``entry[1]`` (its score).
            NOTE(review): presumably the ``(word, similarity)`` pairs returned
            by gensim's ``most_similar`` -- confirm against the caller.
        filtered_results: Entries of ``gensim_result`` whose word passes
            :meth:`passes_filter`.
        words: The words of ``filtered_results``, in the same order.
        scores: The scores of ``filtered_results``, in the same order.
    """

    def __init__(self):
        """Load the embedding model and start with empty result state."""
        self.N_RESULTS = 10
        print("\n Word2Vec model is loading.This can take a couple of minutes.")
        self.model = api.load('glove-twitter-200')
        print("\n Word2Vec model is ready. Enjoy!!!")
        self.base_word = None
        self.gensim_result = None
        # No lookup has happened yet, so this leaves the derived lists empty
        # instead of trying to iterate over None.
        self._refresh_results()

    def _refresh_results(self):
        """Rebuild ``filtered_results``, ``words`` and ``scores`` from ``gensim_result``."""
        raw_results = [] if self.gensim_result is None else self.gensim_result
        self.filtered_results = [
            result_tuple for result_tuple in raw_results
            if self.passes_filter(result_tuple[0])
        ]
        self.words = [result_tuple[0] for result_tuple in self.filtered_results]
        # Index 1 is the score; index 0 would just repeat the word.
        self.scores = [result_tuple[1] for result_tuple in self.filtered_results]

    def passes_filter(self, word):
        """Return whether ``word`` is acceptable as a result for ``base_word``.

        A word is rejected when any of the following holds:

        * it contains the substring ``'www'``;
        * it is a substring of ``self.base_word``;
        * ``sdi.rdlevenshtein_norm(word, self.base_word)`` is below 0.5,
          i.e. the two spellings are too close to each other.

        Args:
            word: Candidate word to check.

        Returns:
            ``False`` if the word is rejected, ``True`` otherwise.
        """
        if (
            'www' in word
            or word in self.base_word
            or sdi.rdlevenshtein_norm(word, self.base_word) < 0.5
        ):
            return False
        return True
