guesser.h 1.84 KB
/*
    Copyright (C) 2010 Tomasz Śniatowski, Adam Radziszewski
    Part of the libmaca project

    This program is free software; you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3 of the License, or (at your option)
any later version.

    This program is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE. 

    See the LICENSE.MACA, LICENSE.GUESSER, COPYING.LESSER and COPYING files for more details.
*/
#ifndef LIBMACA_MORPH_GUESSER_H
#define LIBMACA_MORPH_GUESSER_H

#include <libmaca/morph/morphanalyser.h>
#include <libmaca/typedefs.h>
#include <boost/thread/mutex.hpp>

namespace Maca {

/**
 * Corpuslib guesser analyser interface.
 *
 * WARNING: Guesser might call morfeusz and end up with ambiguous segmentation,
 *          this is not handled and will result in damaged output. The Morfeusz
 *          analyser should be always used before teh Guesser analyser.
 * WARNING: There is no thread safety currently
 */
class GuesserAnalyser : public MorphAnalyser
{
public:
	/**
	 * Constructor for a Guesser analyser with the given tagset
	 */
	GuesserAnalyser(const Corpus2::Tagset* tagset);

	/**
	 * Config node constructor. No new recognized keys.
	 */
	GuesserAnalyser(const Config::Node& cfg);

	/// Cloning
	GuesserAnalyser* clone() const;

	/// Destructor
	~GuesserAnalyser();

	/// MorphAnalyser override
	bool process_functional(const Toki::Token& t,
			boost::function<void (Corpus2::Token*)> sink);

	/// Class identifier
	static const char* identifier;

	/// Registered flag
	static bool registered;
private:
	/// Set libcorpus1 flags necessary for guesser usage.
	void setup_corpus1();
};

} /* end ns Maca */

#endif // LIBMACA_MORPH_GUESSER_H