; kipi2skladnica.conv
; This is a 'naive' conversion from the KIPI tagset to the skladnica/NKJP tagset.
; The conversion does two things:
; * naively casts KIPI tags as NKJP tags,
; * adds an additional 'supertag' attribute to each class (skladnica-specific).
; Main conversion section: names the source and target tagsets and lists
; symbol overrides of the form old:new applied during the cast.
; NOTE: 'override' is intentionally repeated, one mapping per line; do not
; merge these lines or assume last-wins semantics.
[convert]
; source tagset
tagset_from=kipi
; target tagset
tagset_to=skladnica
; NOTE(review): presumably disables validation of the converted tags at this
; stage -- confirm against the converter's documentation
check=ignore
; cast the TaKIPI tokeniser classes as ign
override=twf:ign
override=tnum:ign
override=tsym:ign
override=tdate:ign
override=ttime:ign
override=turi:ign
override=tmail:ign
; cast xxs as subst
override=xxs:subst
; rename comp to com (a value of the deg attribute)
override=comp:com
; NOTE(review): presumably postpones tag validation until after the [tag]
; rules below have run -- confirm against the converter's documentation
late-check=true
; Supertag rules, group VERB: one [tag] section per rule.
; Each rule pairs a class given in 'pre' with the value VERB given in 'post';
; per the file header this adds the skladnica-specific 'supertag' attribute.
; NOTE(review): exact pre/post matching semantics are defined by the
; converter -- confirm before editing. The repeated [tag] headers are
; intentional and must not be merged.
[tag]
pre=bedzie
post=VERB
[tag]
pre=fin
post=VERB
[tag]
pre=imps
post=VERB
[tag]
pre=impt
post=VERB
[tag]
pre=inf
post=VERB
[tag]
pre=praet
post=VERB
[tag]
pre=pred
post=VERB
[tag]
pre=winien
post=VERB
; Supertag rules, group SUBST: one [tag] section per rule.
; Each rule pairs a class given in 'pre' with the value SUBST given in 'post';
; per the file header this adds the skladnica-specific 'supertag' attribute.
; The repeated [tag] headers are intentional and must not be merged.
[tag]
pre=subst
post=SUBST
[tag]
pre=depr
post=SUBST
[tag]
pre=ger
post=SUBST
[tag]
pre=ppron12
post=SUBST
[tag]
pre=ppron3
post=SUBST
[tag]
pre=siebie
post=SUBST
; Supertag rules, group ADJ: one [tag] section per rule.
; Each rule pairs a class given in 'pre' with the value ADJ given in 'post';
; per the file header this adds the skladnica-specific 'supertag' attribute.
; The repeated [tag] headers are intentional and must not be merged.
[tag]
pre=adj
post=ADJ
[tag]
pre=adja
post=ADJ
[tag]
pre=adjc
post=ADJ
[tag]
pre=adjp
post=ADJ
[tag]
pre=pact
post=ADJ
[tag]
pre=ppas
post=ADJ
; Supertag rules, group ADV: one [tag] section per rule.
; Each rule pairs a class given in 'pre' with the value ADV given in 'post';
; per the file header this adds the skladnica-specific 'supertag' attribute.
; The repeated [tag] headers are intentional and must not be merged.
[tag]
pre=adv
post=ADV
[tag]
pre=pant
post=ADV
[tag]
pre=pcon
post=ADV
; Supertag rules for the remaining classes: one [tag] section per rule.
; In every rule below the 'post' value is simply the upper-cased 'pre' class,
; i.e. each of these classes gets a supertag of its own.
; The repeated [tag] headers are intentional and must not be merged.
[tag]
pre=aglt
post=AGLT
[tag]
pre=brev
post=BREV
[tag]
pre=burk
post=BURK
; NOTE(review): 'comp' also appears in the [convert] override comp:com
; (commented there as a value of deg); confirm that this rule matches the
; intended 'comp' symbol.
[tag]
pre=comp
post=COMP
[tag]
pre=conj
post=CONJ
[tag]
pre=ign
post=IGN
[tag]
pre=interj
post=INTERJ
[tag]
pre=interp
post=INTERP
[tag]
pre=num
post=NUM
[tag]
pre=numcol
post=NUMCOL
[tag]
pre=prep
post=PREP
[tag]
pre=qub
post=QUB
[tag]
pre=xxx
post=XXX