Blame view

fsabuilder/morfeuszbuilder/segrules/rulesNFA.py 4.45 KB
Michał Lenart authored
1
2
3
4
5
6
'''
Created on 24 sty 2014

@author: mlenart
'''
Michał Lenart authored
7
from morfeuszbuilder.segrules.rulesFSA import RulesFSA, RulesState
Michał Lenart authored
8
9
10

class RulesNFAState(object):
Michał Lenart authored
11
12
    statesCounter = 0
Michał Lenart authored
13
    def __init__(self, rule, initial=False, final=False, weak=False, autogenerated=False):
Michał Lenart authored
14
        self.rule = rule
Michał Lenart authored
15
        self.transitionsMap = {}
Michał Lenart authored
16
#         self.transitionsDataMap = {}
Michał Lenart authored
17
18
        self.initial = initial
        self.final = final
Michał Lenart authored
19
        self.weak = weak
Michał Lenart authored
20
        self.autogenerated = autogenerated
Michał Lenart authored
21
22
23
24
        self.idx = RulesNFAState.statesCounter
        RulesNFAState.statesCounter += 1

    def addTransition(self, label, targetState):
Michał Lenart authored
25
        assert label is None or len(label) == 2
Michał Lenart authored
26
27
28
29
30
31
32
33
34
35
36
37
38
        self.transitionsMap.setdefault(label, set())
        self.transitionsMap[label].add(targetState)

    def getClosure(self, visited):
        if self in visited:
            return set()
        else:
            visited.add(self)
            res = set()
            res.add(self)
            for nextState in self.transitionsMap.get(None, []):
                res |= nextState.getClosure(visited)
            return res
Michał Lenart authored
39
Michał Lenart authored
40
41
42
43
    def dfs(self, visitedStates=set()):
        if not self in visitedStates:
            visitedStates.add(self)
            yield self
Marcin Woliński authored
44
            for _, nextStates in list(self.transitionsMap.items()):
Michał Lenart authored
45
                for state in nextStates:
Michał Lenart authored
46
                    for state1 in state.dfs(visitedStates):
Michał Lenart authored
47
48
49
                        yield state1

    def debug(self):
Marcin Woliński authored
50
51
52
53
        print('----------------')
        print(('STATE:', self.idx))
        for label, nextStates in list(self.transitionsMap.items()):
            print((label, '-->', [s.idx for s in sorted(nextStates, key=lambda s: s.idx)]))
Michał Lenart authored
54
55
56

class RulesNFA(object):
Michał Lenart authored
57
    def __init__(self):
Michał Lenart authored
58
        self.initialState = RulesNFAState(rule=None, initial=True)
Michał Lenart authored
59
Michał Lenart authored
60
61
62
    def _groupOutputByLabels(self, nfaStates):
        res = {}
        for nfaState in nfaStates:
Marcin Woliński authored
63
            for label, nextStates in list(nfaState.transitionsMap.items()):
Michał Lenart authored
64
                if label is not None:
Michał Lenart authored
65
66
67
#                     transitionData = nfaState.transitionsDataMap[label]
                    segnum, shiftOrth = label
                    res.setdefault((segnum, shiftOrth), set())
Michał Lenart authored
68
                    for nextNFAState in nextStates:
Michał Lenart authored
69
                        res[(segnum, shiftOrth)] |= nextNFAState.getClosure(set())
Michał Lenart authored
70
71
72
        return res

    def _doConvertState(self, dfaState, nfaStates, nfaSubset2DFAState):
Marcin Woliński authored
73
        weakHits = [state.weak for state in [state for state in nfaStates if state.final and not state.autogenerated]]
Michał Lenart authored
74
75
        if not all(weakHits) \
            and any(weakHits):
Marcin Woliński authored
76
77
            weakState = list([state for state in nfaStates if state.final and state.weak])[0]
            nonWeakState = list([state for state in nfaStates if state.final and not state.weak])[0]
Michał Lenart authored
78
            raise InconsistentStateWeaknessException(weakState, nonWeakState)
Marcin Woliński authored
79
80
        weak = any([state.weak and state.final for state in [state for state in nfaStates if not state.autogenerated]])
        final = any([state.final for state in nfaStates])
Michał Lenart authored
81
#         assert not weak or not final
Michał Lenart authored
82
83
84
        if final:
            # dfaState should be final
            # and contain info about weakness
Michał Lenart authored
85
86
            dfaState.setAsAccepting(weak=weak)
#             dfaState.encodedData = bytearray([1 if weak else 0])
Marcin Woliński authored
87
        for (segnum, shiftOrth), nextNFAStates in list(self._groupOutputByLabels(nfaStates).items()):
Michał Lenart authored
88
89
90
91
            key = frozenset(nextNFAStates)
            if key in nfaSubset2DFAState:
                nextDFAState = nfaSubset2DFAState[key]
            else:
Michał Lenart authored
92
                nextDFAState = RulesState()
Michał Lenart authored
93
94
                nfaSubset2DFAState[key] = nextDFAState
                self._doConvertState(nextDFAState, nextNFAStates, nfaSubset2DFAState)
Michał Lenart authored
95
96
            dfaState.setTransition((segnum, shiftOrth), nextDFAState)
#             dfaState.setTransitionData(label, transitionData)
Michał Lenart authored
97
98

    def convertToDFA(self):
Michał Lenart authored
99
        dfa = RulesFSA()
Michał Lenart authored
100
        startStates = self.initialState.getClosure(set())
Marcin Woliński authored
101
        assert not any([s for s in startStates if s.final])
Michał Lenart authored
102
        dfa.initialState = RulesState()
Michał Lenart authored
103
104
105
106
107
108
        self._doConvertState(dfa.initialState, startStates, {frozenset(startStates): dfa.initialState})
        return dfa

    def debug(self):
        for state in self.initialState.dfs():
            state.debug()
Michał Lenart authored
109
110
111
112
113
114

class InconsistentStateWeaknessException(Exception):

    def __init__(self, weakState, nonWeakState):
        self.weakState = weakState
        self.nonWeakState = nonWeakState