SegrulesFSA.hpp
2 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
/*
* File: SegrulesFSA.hpp
* Author: mlenart
*
* Created on 12 March 2014, 17:52
*/
#ifndef SEGRULESFSA_HPP
#define SEGRULESFSA_HPP
#include <set>
#include <iostream>
#include "../deserializationUtils.hpp"
/**
 * One state of the segmentation-rules automaton, as decoded by SegrulesFSA
 * from its serialized byte buffer.
 *
 * Kept as a plain aggregate: SegrulesFSA brace-initializes it, so the field
 * order below is part of the contract.
 */
struct SegrulesState {
// Position of this state's record, counted in bytes from the start of the
// automaton buffer (SegrulesFSA adds it to its base pointer).
uint16_t offset;
// Taken from bit 0x01 of the first byte of the state's record.
bool accepting;
// Taken from bit 0x02 of the first byte of the state's record.
bool weak;
// Copied from the second byte of the transition that led to this state
// (any nonzero value becomes true).
bool shiftOrthFromPrevious;
// True when the second byte of the state's record -- the byte that
// SegrulesFSA::proceedToNext reads as the transition count -- is zero,
// i.e. the state has no outgoing transitions.
bool sink;
};
/**
 * Strict ordering of segmentation-rule states, e.g. for use as keys in
 * ordered containers.
 *
 * Only the offset takes part in the comparison: two states with the same
 * offset are equivalent under this ordering even if their flags differ.
 *
 * @param s1 left-hand state
 * @param s2 right-hand state
 * @return true when s1 is located at a lower offset than s2
 */
inline bool operator<(const SegrulesState& s1, const SegrulesState& s2) {
    return s2.offset > s1.offset;
}
class SegrulesFSA {
public:
SegrulesFSA(const unsigned char* ptr) : initialState(), ptr(ptr) {
SegrulesState state = {0, false, false, false, false};
initialState = state;
}
std::vector<SegrulesState> proceedToNext(
const unsigned char segnum,
const SegrulesState& state,
bool atEndOfWord) const {
std::vector<SegrulesState> res;
const unsigned char* currPtr = ptr + state.offset + 1;
const unsigned char transitionsNum = *currPtr++;
for (int i = 0; i < transitionsNum; i++) {
if (*currPtr == segnum) {
SegrulesState newState = this->transition2State(currPtr);
if ((atEndOfWord && newState.accepting)
|| (!atEndOfWord && !newState.sink)) {
res.push_back(newState);
}
}
currPtr += 4;
}
return res;
}
virtual ~SegrulesFSA() {
}
SegrulesState initialState;
private:
const unsigned char* ptr;
SegrulesState transition2State(const unsigned char* transitionPtr) const {
unsigned char ACCEPTING_FLAG = 1;
unsigned char WEAK_FLAG = 2;
SegrulesState res;
transitionPtr++;
res.shiftOrthFromPrevious = *transitionPtr++;
res.offset = readInt16(transitionPtr);
res.accepting = *(ptr + res.offset) & ACCEPTING_FLAG;
res.weak = *(ptr + res.offset) & WEAK_FLAG;
res.sink = *(ptr + res.offset + 1) == 0;
return res;
}
};
#endif /* SEGRULESFSA_HPP */