morfeusz-nkjp-guesser.ini 1.21 KB
; MorfeuszSGJP outputting in NKJP but with fallback on Guesser from libcorpus1, naively converted to NKJP.
; NOTE: this config assumes Morfeusz SGJP with tweaked soname is installed.
; This version is used internally by MACA authors to have both Morfeusz SIaT and SGJP
; coexist peacefully (which is normally impossible).
; If you want to use the official SGJP version (and not to use SIaT), please use
; morfeusz-nkjp-official-guesser config.

[general]
	tagset=nkjp
	; dot and hyphen sequences as separate tokens
	toki-config=nkjp

[ma:unknown]
	class=const
	tagset=nkjp
	tag=ign

[ma:interp]
	class=const
	tagset=nkjp
	tag=interp

[ma:url]
	class=const
	tagset=nkjp
	tag=subst:sg:nom:m3

; use guesser module from corpuslib
[ma:guess]
	class=wrap_convert
	wrapped_class=guesser
	wrapped_converter=naive-kipi2nkjp.conv
	wrapped_tagset=kipi
	tagset=nkjp

[ma:morfeusz]
	class=morfeusz
	tagset=nkjp
	converter=sgjp2nkjp.conv
	library=libmorfSGJP.so.0
; comment out the above line if Morfeusz SGJP is installed normally and not alongside Morfeusz SIAT in a binary-modified version with the soname changed
	require_version=Morfeusz SGJP
[rule]
	toki_type=p
	ma=interp

[rule]
	toki_type=tu
	ma=url

[default]
	ma=morfeusz
	ma=guess
	ma=unknown