MorphInterpretation.cpp
2.32 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
/*
* File: MorphInterpretation.cpp
* Author: mlenart
*
* Created on November 14, 2013, 11:47 AM
*/
#include <string>
#include <sstream>
#include "morfeusz2.h"
#include "Environment.hpp"
#include "const.hpp"
using namespace std;
namespace morfeusz {
/**
 * Creates new instance with tag id 0, name id 0 and labels id 0
 * (presumably the "ign" tag, i.e. an unrecognized word, judging by the
 * function name -- confirm against the tagset definition).
 *
 * @param startNode value stored in the startNode field
 * @param endNode   value stored in the endNode field
 * @param orth      value stored in the orth field
 * @param lemma     value stored in the lemma field
 * @return the freshly built interpretation, by value
 */
MorphInterpretation MorphInterpretation::createIgn(
        int startNode, int endNode,
        const std::string& orth,
        const std::string& lemma) {
    MorphInterpretation ign;

    // Fixed identifiers.
    ign.tagId = 0;
    ign.nameId = 0;
    ign.labelsId = 0;

    // Caller-supplied text.
    ign.orth = orth;
    ign.lemma = lemma;

    // Caller-supplied graph position.
    ign.startNode = startNode;
    ign.endNode = endNode;

    return ign;
}
/**
 * Creates new instance with "sp" tag (meaning: "this is a sequence of whitespaces").
 *
 * The lemma is set to the same text as orth; the tag id is 1 and both the
 * name id and the labels id are 0.
 *
 * @param startNode value stored in the startNode field
 * @param endNode   value stored in the endNode field
 * @param orth      text stored in both the orth and the lemma fields
 * @return the freshly built interpretation, by value
 */
MorphInterpretation MorphInterpretation::createWhitespace(int startNode, int endNode, const std::string& orth) {
    MorphInterpretation whitespace;

    // Fixed identifiers.
    whitespace.tagId = 1;
    whitespace.nameId = 0;
    whitespace.labelsId = 0;

    // The lemma is a copy of the surface form.
    whitespace.orth = orth;
    whitespace.lemma = orth;

    // Caller-supplied graph position.
    whitespace.startNode = startNode;
    whitespace.endNode = endNode;

    return whitespace;
}
/**
 * Tells whether fullString terminates with ending.
 *
 * An empty ending matches every string; an ending longer than fullString
 * never matches.
 *
 * @param fullString the text whose tail is inspected
 * @param ending     the suffix to look for
 * @return true iff the last ending.length() characters of fullString equal ending
 */
static inline bool hasEnding(const std::string &fullString, const std::string &ending) {
    const std::string::size_type fullLen = fullString.length();
    const std::string::size_type endLen = ending.length();

    // Guard first so the unsigned subtraction below cannot wrap around.
    if (endLen > fullLen) {
        return false;
    }
    return fullString.compare(fullLen - endLen, endLen, ending) == 0;
}
/**
 * Checks whether the lemma ends with HOMONYM_SEPARATOR followed by homonymId.
 *
 * The separator must not be the first character of the lemma, i.e. at least
 * one character has to precede it.
 *
 * @param homonymId the homonym identifier expected at the very end of the lemma
 * @return true iff the lemma has the form <non-empty prefix><HOMONYM_SEPARATOR><homonymId>
 */
bool MorphInterpretation::hasHomonym(const string& homonymId) const {
    const size_t lemmaLen = this->lemma.length();
    const size_t idLen = homonymId.length();

    // The lemma needs room for: >= 1 leading character + separator + homonymId.
    // Checking this before subtracting matters: the lengths are unsigned, so
    // for a too-short lemma "lemmaLen - idLen - 1" would wrap around to a huge
    // value and the subsequent indexing would read out of bounds.
    if (lemmaLen < idLen + 2) {
        return false;
    }

    const size_t homonymSeparatorIdx = lemmaLen - idLen - 1;
    return this->lemma[homonymSeparatorIdx] == HOMONYM_SEPARATOR
            && hasEnding(this->lemma, homonymId);
}
/**
 * Renders this interpretation as comma-separated text.
 *
 * The result is "<orth>,<lemma>," (note the trailing comma), preceded by
 * "<startNode>,<endNode>," when includeNodeNumbers is true. Output of the
 * tag, name and qualifiers is currently disabled (see the commented-out
 * code below).
 *
 * @param includeNodeNumbers whether to prepend the start and end node numbers
 * @return the textual representation
 */
std::string MorphInterpretation::toString(bool includeNodeNumbers) const {
    std::ostringstream out;

    if (includeNodeNumbers) {
        out << startNode << ",";
        out << endNode << ",";
    }

    out << orth << "," << lemma << ",";

    // Disabled for now:
    //    out << getTag();
    //    if (!getName().empty()) {
    //        out << "," << getName();
    //    }
    //    if (!getQualifiers().empty()) {
    //        out << "," << getQualifiersStr(*this);
    //    }

    return out.str();
}
}