; ikipi2kipi.conv
; Tagset conversion rules: ikipi -> kipi. Rules are listed in the order
; they are meant to be applied.
; Split fin:prt forms ending in -łem / -łeś into two tokens
; (e.g. robiłem -> robił + em). The regexp is case-insensitive and its two
; capture groups delimit the two token texts.
; The second token is tagged aglt ... wok (ending e[mś]) with lemma "być".
; NOTE(review): copy_attrs_to_t2 presumably overwrites nmb and per of the
; t2_tag template with the source token's values, and t1_post presumably
; retags the first token as praet and clears per, vcl, tns -- confirm.
[split]
tagset=ikipi
pre=fin:prt
regexp=(?i:(.+ł)(e[mś]))
copy_attrs_to_t2=nmb:per
t2_tag=aglt:sg:pri:imperf:wok
t2_lemma=być
t1_post=praet:per:vcl:tns
; Split fin:prt forms ending in -łam / -łaś / -łom / -łoś into two tokens
; (e.g. robiłam -> robiła + m). Case-insensitive; group 1 keeps the vowel,
; group 2 is the bare m/ś ending.
; The second token is tagged aglt ... nwok with lemma "być".
; NOTE(review): nmb and per are presumably copied from the source token
; over the sg:pri placeholders in t2_tag -- confirm.
[split]
pre=fin:prt
regexp=(?i:(.+ł[ao])([mś]))
copy_attrs_to_t2=nmb:per
t2_tag=aglt:sg:pri:imperf:nwok
t2_lemma=być
t1_post=praet:per:vcl:tns
; Split fin:prt forms ending in -śmy / -ście into two tokens
; (e.g. robiliśmy -> robili + śmy). Only the ending is matched
; case-insensitively; group 1 accepts any non-empty prefix.
; The second token is tagged aglt ... nwok with lemma "być".
; NOTE(review): t2_tag says sg:pri although these endings are plural;
; presumably copy_attrs_to_t2=nmb:per replaces both values -- confirm.
[split]
pre=fin:prt
regexp=(.+)(?i:(śmy|ście))
copy_attrs_to_t2=nmb:per
t2_tag=aglt:sg:pri:imperf:nwok
t2_lemma=być
t1_post=praet:per:vcl:tns
; Split conjt:ter forms ending in -by into two tokens
; (e.g. robiłby -> robił + by). The second token is tagged qub with
; lemma "by"; no attributes are copied to it.
; NOTE(review): "ter" presumably selects third-person forms, which carry no
; personal ending after "by" -- confirm against the ikipi tagset.
[split]
pre=conjt:ter
regexp=(.+)(?i:(by))
t2_tag=qub
t2_lemma=by
t1_post=praet:per:vcl:tns
; Split conjt forms ending in -by + m/ś/śmy/ście into three tokens
; (e.g. robiłbym -> robił + by + m). The regexp has three capture groups:
; stem, "by", and the personal ending.
; Token 2 is tagged qub with lemma "by"; token 3 is tagged aglt ... nwok
; with lemma "być".
; NOTE(review): nmb and per are presumably copied from the source token
; into the t3 tag, replacing the sg:pri placeholders -- confirm.
[3split]
pre=conjt
regexp=(.+)(?i:(by)(m|ś|śmy|ście))
copy_attrs_to_t3=nmb:per
t2_tag=qub
t2_lemma=by
t3_tag=aglt:sg:pri:imperf:nwok
t3_lemma=być
t1_post=praet:per:vcl:tns
; powinienem, winieneś: wok
; Split winien forms ending in -nem / -neś into two tokens
; (e.g. powinienem -> powinien + em). Case-insensitive.
; The second token is tagged aglt ... wok with lemma "być".
; NOTE(review): t1_post=winien:per presumably keeps the winien class on the
; first token and clears per -- confirm.
[split]
pre=winien
regexp=(?i:(.+n)(e[mś]))
copy_attrs_to_t2=nmb:per
t2_tag=aglt:sg:pri:imperf:wok
t2_lemma=być
t1_post=winien:per
; winn[iy]śmy: nwok
; Split winien forms ending in -śmy / -ście into two tokens
; (e.g. powinniśmy -> powinni + śmy). Only the ending is matched
; case-insensitively.
; The second token is tagged aglt ... nwok with lemma "być".
; NOTE(review): the sg:pri placeholders in t2_tag are presumably replaced
; by the nmb and per values copied from the source token -- confirm.
[split]
pre=winien
regexp=(.+)(?i:(śmy|ście))
copy_attrs_to_t2=nmb:per
t2_tag=aglt:sg:pri:imperf:nwok
t2_lemma=być
t1_post=winien:per
; powinn[ao][mś]: nwok
; Split winien forms ending in -am / -aś / -om / -oś into two tokens
; (e.g. powinnam -> powinna + m). Case-insensitive; the vowel stays with
; the first token.
; The second token is tagged aglt ... nwok with lemma "być".
; NOTE(review): the regexp does not require "n" before [ao], unlike the
; -nem/-neś rule; it relies on pre=winien to restrict matches -- confirm
; this is intended.
[split]
pre=winien
regexp=(?i:(.+[ao])([mś]))
copy_attrs_to_t2=nmb:per
t2_tag=aglt:sg:pri:imperf:nwok
t2_lemma=być
t1_post=winien:per
; erase tenses
; Applies to tokens matching conjt at this point in the rule list.
; NOTE(review): post=praet:tns presumably retags them as praet and clears
; the tns attribute -- confirm.
[tag]
pre=conjt
post=praet:tns
; Erase the tense attribute on bedzie tokens.
; NOTE(review): post=tns presumably clears tns and leaves the class
; unchanged -- confirm.
[tag]
pre=bedzie
post=tns
; Erase the tense attribute on fin tokens.
; NOTE(review): post=tns presumably clears tns and leaves the class
; unchanged -- confirm.
[tag]
pre=fin
post=tns
; convert finally
; Switch tags from the ikipi tagset to the kipi tagset once the rules
; listed before this section have been applied.
; NOTE(review): check=ignore and late-check=true presumably control how and
; when converted tags are validated -- confirm against the converter docs.
[convert]
tagset_from=ikipi
tagset_to=kipi
check=ignore
late-check=true
; revert aglt
; Mark praet tokens as nagl when they match ...ó[dgkstz]ł or ...sechł,
; case-insensitively (e.g. niósł).
; NOTE(review): the regexp is presumably matched against the token's
; orthographic form -- confirm.
[re_tag]
pre=praet
regexp=.*(?i:ó[dgkstz]ł|sechł)
post=nagl
; revert aglt
; Mark praet tokens as agl when they match ...o[dgkstz]ł or ...schł,
; case-insensitively (e.g. niosł, as left over from niosłem).
; NOTE(review): the regexp is presumably matched against the token's
; orthographic form -- confirm.
[re_tag]
pre=praet
regexp=.*(?i:o[dgkstz]ł|schł)
post=agl