# vectors.py 1.56 KB
from corneferencer.resolvers import features


def get_pair_vector(ante, ana):
    """Build the flat feature vector for the pair ``ante`` / ``ana``.

    The returned list is newly created and consists of three consecutive
    segments, in this order:

    1. the items of ``ante.features``,
    2. the items of ``ana.features``,
    3. the items returned by ``get_pair_features(ante, ana)``.

    NOTE(review): ``ante`` / ``ana`` presumably stand for antecedent and
    anaphor mentions whose ``features`` attribute was filled in beforehand;
    confirm against the caller.
    """
    # Copy first so the mention's own ``features`` sequence is never mutated.
    pair_vector = list(ante.features)
    pair_vector += ana.features
    pair_vector += get_pair_features(ante, ana)
    return pair_vector


def get_mention_features(mention):
    """Collect all single-mention features of ``mention`` into one flat list.

    Every extractor listed below is taken from the ``features`` module,
    called with ``mention`` as its only argument, and its result is added
    item by item to the output. The order of the extractors determines the
    layout of the returned list.
    """
    extractors = (
        features.head_vec,
        features.first_word_vec,
        features.last_word_vec,
        features.first_after_vec,
        features.second_after_vec,
        features.first_before_vec,
        features.second_before_vec,
        features.preceding_context_vec,
        features.following_context_vec,
        features.mention_vec,
        features.sentence_vec,
        # supplementary features
        features.mention_type,
    )

    collected = []
    for extract in extractors:
        collected.extend(extract(mention))
    return collected


def get_pair_features(ante, ana):
    """Collect the features describing the pair ``ante`` / ``ana``.

    All values come from helpers in the ``features`` module. Helpers whose
    result is unpacked with ``*`` contribute every item of their result;
    the remaining helpers contribute their return value as a single item.
    The entries are evaluated top to bottom, which fixes the layout of the
    returned list.
    """
    return [
        *features.distances_vec(ante, ana),
        features.head_match(ante, ana),
        features.exact_match(ante, ana),
        features.base_match(ante, ana),
        # supplementary features
        features.ante_contains_rarest_from_ana(ante, ana),
        *features.agreement(ante, ana, 'gender'),
        *features.agreement(ante, ana, 'number'),
        *features.agreement(ante, ana, 'person'),
        features.is_acronym(ante, ana),
        features.same_sentence(ante, ana),
        features.same_paragraph(ante, ana),
    ]