https://github.com/uhh-lt/path2vec
Raw File
Tip revision: 29984b2f392d3a8061b79ee37dda3499714a7244 authored by Andrey Kutuzov on 27 August 2019, 16:32:24 UTC
Hyperlinks to embeddings fixed
Tip revision: 29984b2
evaluation.py
#!/usr/bin/python3
# coding: utf-8

import gensim
import logging
import sys
from evaluate_lemmas import evaluate_synsets

# Evaluate a synset embedding model on three semantic similarity test sets
# (two given on the command line, one fixed SimLex file) and print the
# resulting scores as a single tab-separated row.
#
# Usage: evaluation.py MODELFILE WORDNET_SCORES STATIC_SCORES

logging.basicConfig(format='%(asctime)s : %(levelname)s : %(message)s', level=logging.INFO)
logger = logging.getLogger(__name__)

# Exactly three positional arguments are required. Checking up front gives the
# user a usage message instead of an opaque tuple-unpacking ValueError.
if len(sys.argv) != 4:
    sys.exit('Usage: {} MODELFILE WORDNET_SCORES STATIC_SCORES'.format(sys.argv[0]))

# Loading model and semantic similarity dataset
modelfile, wordnet_scores, static_scores = sys.argv[1:]

# The model file is read in the textual (non-binary) word2vec format.
model = gensim.models.KeyedVectors.load_word2vec_format(modelfile, binary=False)

# Pre-calculating vector norms
# NOTE(review): init_sims() is deprecated in gensim >= 4.0 -- confirm which
# gensim version this script is expected to run against.
model.init_sims(replace=True)

# dummy4unknown=True is passed to every evaluation call so that pairs with
# out-of-vocabulary entries are handled the same way across all three test sets.
wordnet_synset_score = model.evaluate_word_pairs(wordnet_scores, dummy4unknown=True)
static_synset_score = model.evaluate_word_pairs(static_scores, dummy4unknown=True)
# The dynamic evaluation always uses the SimLex file at this relative path, so
# the script has to be started from a directory that contains 'simlex/'.
dynamic_synset_score = evaluate_synsets(model, 'simlex/simlex_original.tsv', logger,
                                        dummy4unknown=True)

# Short model label for the report: the '_embeddings_' infix is collapsed and
# the last 7 characters are dropped (presumably a '.vec.gz' extension -- TODO
# confirm against the actual model file names).
name = modelfile.replace('_embeddings_', '_')[:-7]

# score[1][0] is the first element of the second item of each result; for
# gensim's evaluate_word_pairs() that is the Spearman correlation coefficient.
# evaluate_synsets() is assumed to return the same structure -- verify against
# evaluate_lemmas.py.
scores = (wordnet_synset_score, static_synset_score, dynamic_synset_score)

print('Model\tWordnet\tStatic\tDynamic')
print('\t'.join([name] + [str(round(score[1][0], 4)) for score in scores]))
back to top