Added mention intersection rule to resolving algorithms: antecedent/anaphor pairs whose mentions intersect are no longer scored by the neural model.

Bartłomiej Nitoń
1 parent a9a48a44
Showing 1 changed file with 13 additions and 9 deletions
corneferencer/resolvers/resolve.py
 import numpy
  
 from conf import NEURAL_MODEL, THRESHOLD
+from corneferencer.resolvers import features
 from corneferencer.resolvers.vectors import get_pair_vector
  
  
@@ -12,12 +13,13 @@ def incremental(text):
             best_prediction = 0.0
             best_ante = None
             for ante in text.mentions[:i]:
-                pair_vec = get_pair_vector(ante, ana)
-                sample = numpy.asarray([pair_vec], dtype=numpy.float32)
-                prediction = NEURAL_MODEL.predict(sample)[0]
-                if prediction > THRESHOLD and prediction >= best_prediction:
-                    best_prediction = prediction
-                    best_ante = ante
+                if not features.pair_intersect(ante, ana):
+                    pair_vec = get_pair_vector(ante, ana)
+                    sample = numpy.asarray([pair_vec], dtype=numpy.float32)
+                    prediction = NEURAL_MODEL.predict(sample)[0]
+                    if prediction > THRESHOLD and prediction >= best_prediction:
+                        best_prediction = prediction
+                        best_ante = ante
             if best_ante is not None:
                 # print ('wynik')
                 # print(best_ante.text, best_prediction, ana.text)
@@ -78,9 +80,11 @@ def get_best_set(sets, ana):
 def predict_set(mentions, ana):
     prediction_sum = 0.0
     for mnt in mentions:
-        pair_vec = get_pair_vector(mnt, ana)
-        sample = numpy.asarray([pair_vec], dtype=numpy.float32)
-        prediction = NEURAL_MODEL.predict(sample)[0]
+        prediction = 0.0
+        if not features.pair_intersect(mnt, ana):
+            pair_vec = get_pair_vector(mnt, ana)
+            sample = numpy.asarray([pair_vec], dtype=numpy.float32)
+            prediction = NEURAL_MODEL.predict(sample)[0]
         prediction_sum += prediction
         # print(mnt.text, prediction, ana.text)
     return prediction_sum / float(len(mentions))