constanalyser.h
1.91 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
/*
Copyright (C) 2010 Tomasz Śniatowski, Adam Radziszewski
Part of the libmaca project
This program is free software; you can redistribute it and/or modify it
under the terms of the GNU Lesser General Public License as published by the Free
Software Foundation; either version 3 of the License, or (at your option)
any later version.
This program is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.
See the LICENSE.MACA, LICENSE.SFST, LICENSE.GUESSER, COPYING.LESSER and COPYING files for more details.
*/
#ifndef LIBMACA_CONSTANALYSER_H
#define LIBMACA_CONSTANALYSER_H
#include <libmaca/morph/morphanalyser.h>
namespace Maca {
/**
* A simple analyser that always returns the same interpretation for any
* token. The tag is pre-set, and the lemma is the token's orth
* (optionally lowercased, see the \c lower_lemma configuration key).
*
* Configuration class key: \b const
*/
class ConstAnalyser : public MorphAnalyser
{
public:
/**
* Constructor for a ConstAnalyser with a tagset and a tag string.
* @param tagset the tagset to use
* @param tag the tag, given in string form
* NOTE(review): the string is presumably parsed against \p tagset --
* confirm in the implementation file.
*/
ConstAnalyser(const Corpus2::Tagset* tagset, const std::string& tag);
/**
* Constructor for a ConstAnalyser with a tagset and a tag object.
* @param tagset the tagset to use
* @param tag the tag, given as a Corpus2::Tag
*/
ConstAnalyser(const Corpus2::Tagset* tagset, const Corpus2::Tag& tag);
/**
* Config node constructor. Recognized keys are:
* - tag - the tag to use as the analysis for all tokens
* - lower_lemma - if true, lowercase the lemma (false by default)
*
* @param cfg the configuration node to read the keys from
*/
explicit ConstAnalyser(const Config::Node& cfg);
/**
* Cloning.
* @return pointer to a ConstAnalyser
* NOTE(review): presumably a newly allocated copy owned by the caller --
* confirm against the MorphAnalyser contract.
*/
ConstAnalyser* clone() const;
/**
* MorphAnalyser override (MorphAnalyser is the base class of this
* analyser).
* @param t the input token to analyse
* @param sink callback that takes pointers to Corpus2::Token objects
* @return NOTE(review): the meaning of the returned flag is defined by
* the base class and is not visible in this header.
*/
bool process_functional(const Toki::Token &t
, boost::function<void (Corpus2::Token*)> sink);
/// Class identifier
/// NOTE(review): presumably holds the configuration class key ("const");
/// the value is defined outside this header.
static const char* identifier;
/// Registered flag
static bool registered;
private:
/// The tag used as the analysis for all tokens
Corpus2::Tag tag_;
/// Flag to lowercase the lemma (the lower_lemma configuration key)
bool lower_lemma_;
};
} /* end ns Maca */
#endif // LIBMACA_CONSTANALYSER_H