symbols.fst
2.93 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% File: symbols.fst
% Author: Helmut Schmid; IMS, Universitaet Stuttgart
% Content: definition of symbol classes
% Modified: Fri Mar 24 10:10:07 2006 (schmid)
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% All symbols used by the morphology should be defined here
%%% Single Character Symbols %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Letter classes, built bottom-up: consonants and vowels are listed
% separately for each case and then combined into larger classes.
% Only the unaccented letters a-z and A-Z occur here; digits,
% punctuation and accented characters belong to none of these classes.
% NOTE(review): 'y'/'Y' is listed as a consonant only -- confirm that
% no rule using the vowel classes needs it.
% lower case consonants (every lower case letter except a, e, i, o, u)
#cons# = bcdfghjklmnpqrstvwxyz
% upper case consonants (upper case counterpart of #cons#)
#CONS# = BCDFGHJKLMNPQRSTVWXYZ
% all consonants, both cases
#Cons# = #cons# #CONS#
% lower case vowels
#vowel# = aeiou
% upper case vowels (upper case counterpart of #vowel#)
#VOWEL# = AEIOU
% all vowels, both cases
#Vowel# = #vowel# #VOWEL#
% lower case letters (consonants + vowels)
#letter# = #cons# #vowel#
% upper case letters (consonants + vowels)
#LETTER# = #CONS# #VOWEL#
% all letters; contains the same symbols as #letter# plus #LETTER#
#Letter# = #Cons# #Vowel#
%%% Lexicon Entry Markers %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Multi-character symbols that mark the type of a lexicon entry.
% affix type features: one marker for prefixes, one for suffixes
#Affix# = <Prefix><Suffix>
% stem type features (internally used)
% NOTE(review): the names suggest base, derivation and compounding
% stems -- confirm against the lexicon documentation.
#BDKStem# = <BaseStem><DerivStem><CompStem>
% all entry type markers: the general stem feature <Stem> used in the
% lexicon, the internal stem types in #BDKStem#, and the affix types
% in #Affix#
#EntryType# = <Stem> #BDKStem# #Affix#
%%% Agreement Features %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Feature symbols grouped by category; the aggregate classes at the end
% of this section are unions of the individual categories.
% word class features
#WordClass# = <ADJ><ADV><CARD><N><V>
% stem type features
% NOTE(review): presumably the agreement-side counterparts of the entry
% markers <BaseStem>, <DerivStem>, <CompStem> -- confirm.
#StemType# = <base><deriv><comp>
% classic origin features
#classic# = <free><bound><short><long>
% all origin features: <native>, <foreign> and the members of #classic#
#Origin# = <native><foreign> #classic#
% origin features including the internally used feature <classic>
% which represents the disjunction stored in #classic#
#Origin-cl# = #Origin# <classic>
% complexity features
% NOTE(review): #Complex# is not referenced by any other definition
% visible in this file; in particular it is not part of #AgrFeat#,
% #AgrFeatInfl# or #Tag#. Confirm that this omission is intended.
#Complex# = <simplex><prefderiv><suffderiv>
% inflection class features
#InflClass# = <AdjReg><AdvReg><NounReg><NounSg><NounPl><VerbReg>
% all agreement features: word class, stem type and origin features
% (origin features include the internal <classic>)
#AgrFeat# = #WordClass# #StemType# #Origin-cl#
% all agreement features + inflection class features
#AgrFeatInfl# = #AgrFeat# #InflClass#
%%% Analysis Features %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Feature symbols grouped by category, followed by their union
% #MorphSyn#.
% number features
#Number# = <sg><pl>
% gender features
#Gender# = <masc><fem><neut>
% case features
#Case# = <nom><gen><dat><acc>
% person features
#Person# = <1><2><3>
% degree features
#Degree# = <positive><comparative><superlative>
% verbal features
#VerbFeat# = <pres><past><part>
% affix markers
#AFF# = <PREF><SUFF>
% all morphosyntactic features: the union of the seven classes above.
% The trailing backslash continues the definition on the next line, so
% no comment or blank line may be inserted between the two lines.
#MorphSyn# = #Number# #Gender# #Case# #Person#\
#Degree# #VerbFeat# #AFF#
%%% Trigger Features %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% capitalisation features: lower case, capitalized or fixed
% (the variable #Cap# and the symbol <Cap> are distinct: the former is
% the class of all three features, the latter is one of its members)
#Cap# = <LC><Cap><Fix>
% features used to mark the boundaries of morphemes and inflection
#Boundary# = <MB><IB>
% all triggers: capitalisation features, boundary markers and <NoDef>
% <NoDef> marks lexicon entries without default stems
#Trigger# = #Cap# #Boundary# <NoDef>
%%% General Symbol Classes %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% all tags: entry type markers, agreement and inflection class
% features, morphosyntactic features and triggers
% NOTE(review): the complexity features in #Complex# are not included
% here and are therefore also missing from #AllSym# -- confirm that
% this is intended.
#Tag# = #EntryType# #AgrFeatInfl# #MorphSyn# #Trigger#
% all symbols: every letter plus every tag
#AllSym# = #Letter# #Tag#