CasePatternHelper.hpp
1.58 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
/*
* File: CasePatternHelper.hpp
* Author: lennyn
*
* Created on April 4, 2014, 12:11 PM
*/
#ifndef CASEPATTERNHELPER_HPP
#define CASEPATTERNHELPER_HPP
#include <vector>
#include "InterpsGroup.hpp"
#include "CasePatternHelper.hpp"
#include "compressionByteUtils.hpp"
#include "Environment.hpp"
class Environment;
/**
 * Helper that decides whether the letter case of a word is compatible with
 * a "case pattern" (a vector of flags, one per codepoint position).
 *
 * Checking is off by default: until setCaseSensitive(true) is called,
 * checkCasePattern() accepts every input.
 */
class CasePatternHelper {
public:

    /** Creates a helper with case-sensitive checking switched off. */
    CasePatternHelper() : caseSensitive(false) {
    }

    /**
     * Switches case-sensitive checking on or off.
     *
     * @param caseSensitive true to make checkCasePattern() enforce patterns,
     *                      false to make it accept everything.
     */
    void setCaseSensitive(bool caseSensitive) {
        this->caseSensitive = caseSensitive;
    }

    /**
     * Checks a single case pattern against a word.
     *
     * For every position i flagged true in casePattern, the original
     * codepoint must differ from its lowercase counterpart; a position where
     * both are equal violates the pattern.
     *
     * @param lowercaseCodepoints codepoints of the word after lowercasing
     * @param originalCodepoints  codepoints of the word as it was written;
     *                            presumably position-aligned with
     *                            lowercaseCodepoints - verify against callers
     * @param casePattern         flags marking the positions to check
     * @return true when checking is switched off or every flagged position
     *         passes; false on the first flagged position that fails or that
     *         lies beyond the end of either codepoint vector.
     */
    bool checkCasePattern(
            const std::vector<uint32_t>& lowercaseCodepoints,
            const std::vector<uint32_t>& originalCodepoints,
            const std::vector<bool>& casePattern) const {
        if (!this->caseSensitive) {
            return true;
        }
        typedef std::vector<bool>::size_type Index;
        for (Index i = 0; i < casePattern.size(); ++i) {
            if (!casePattern[i]) {
                continue;
            }
            // A flagged position with no corresponding character cannot
            // satisfy the pattern; rejecting it also keeps the unchecked
            // operator[] accesses below within bounds.
            if (i >= lowercaseCodepoints.size() || i >= originalCodepoints.size()) {
                return false;
            }
            if (lowercaseCodepoints[i] == originalCodepoints[i]) {
                return false;
            }
        }
        return true;
    }

    /**
     * Declared here, defined out of line (definition not visible in this
     * header).
     * NOTE(review): judging by the name and parameters, this presumably checks
     * the text in [orthStart, orthEnd) against the case patterns stored in
     * ig - confirm against the definition.
     */
    bool checkInterpsGroupOrthCasePatterns(
            const Environment& env,
            const char* orthStart,
            const char* orthEnd,
            const InterpsGroup& ig) const;

    /**
     * Declared here, defined out of line (definition not visible in this
     * header).
     * NOTE(review): ptr is taken by reference, so the definition presumably
     * advances it past the bytes it consumes - confirm against the definition.
     */
    static std::vector<bool> deserializeOneCasePattern(const unsigned char*& ptr);

private:
    /** When false, checkCasePattern() accepts every input. */
    bool caseSensitive;

    // Declared mutable so that const member functions may modify them.
    // NOTE(review): presumably scratch buffers used by
    // checkInterpsGroupOrthCasePatterns() - confirm against the definition.
    mutable std::vector<uint32_t> orthCodepoints;
    mutable std::vector<uint32_t> normalizedCodepoints;

    // NOTE(review): presumably type tags for serialized case patterns read by
    // deserializeOneCasePattern() - they are not used inside this header.
    static const uint8_t LEMMA_ONLY_LOWER = 0;
    static const uint8_t LEMMA_UPPER_PREFIX = 1;
    static const uint8_t LEMMA_MIXED_CASE = 2;
};
#endif /* CASEPATTERNHELPER_HPP */