/*
 * File:   test_result_equals.cpp
 * Author: lennyn
 *
 * Created on December 6, 2013, 12:45 PM
 */
#include <cstdlib>
#include <cassert>
#include <string>
#include <sstream>
#include <fstream>
|
|
13
|
#include <iostream>
|
|
14
15
16
17
18
|
#include "Morfeusz.hpp"
#include "utils.hpp"
using namespace std;
|
|
19
20
21
22
23
|
/**
 * Translates an encoding name given on the command line into the matching
 * MorfeuszCharset value.
 *
 * Accepted names (exact, case-sensitive comparison):
 * "UTF8", "ISO8859_2", "CP1250", "CP852".
 *
 * @param encodingStr encoding name to translate
 * @return the charset value corresponding to encodingStr
 * @throws const char* ("Invalid encoding") if the name is not one of the
 *         accepted ones; a diagnostic listing the accepted names is written
 *         to stderr before throwing
 */
static MorfeuszCharset getEncoding(const string& encodingStr) {
    if (encodingStr == "UTF8")
        return UTF8;
    else if (encodingStr == "ISO8859_2")
        return ISO8859_2;
    else if (encodingStr == "CP1250")
        return CP1250;
    else if (encodingStr == "CP852")
        return CP852;
    else {
        // The list below must mirror the names tested above, otherwise the
        // user is told to pass a value that this function then rejects.
        cerr << "Invalid encoding: " << encodingStr << " must be one of: UTF8, ISO8859_2, CP1250, CP852" << endl;
        throw "Invalid encoding";
    }
}
|
|
33
34
|
int main(int argc, char** argv) {
|
|
35
|
validate(argc == 3 || argc == 4, "Must provide exactly 2 or 3 arguments - input filename, required output filename, (optional) encoding.");
|
|
36
|
string inputFilename = argv[1];
|
|
37
38
39
|
ifstream in;
// in.exceptions(std::ifstream::failbit | std::ifstream::badbit);
cerr << "OPEN " << inputFilename << endl;
|
|
40
|
in.open(inputFilename.c_str());
|
|
41
|
string requiredOutputFilename = argv[2];
|
|
42
43
44
|
ifstream requiredIn;
// requiredIn.exceptions(std::ifstream::failbit | std::ifstream::badbit);
cerr << "OPEN " << requiredOutputFilename << endl;
|
|
45
|
requiredIn.open(requiredOutputFilename.c_str());
|
|
46
47
48
|
// string requiredOutput = readFile<char>(requiredOutputFilename);
cerr << "TEST START" << endl;
Morfeusz morfeusz;
|
|
49
50
|
if (argc == 4) {
MorfeuszCharset encoding = getEncoding(argv[3]);
|
|
51
|
morfeusz.setCharset(encoding);
|
|
52
|
}
|
|
53
54
55
56
57
58
59
60
61
62
63
64
65
66
|
string line;
while (getline(in, line)) {
cerr << "TEST " << line << endl;
vector<MorphInterpretation> res;
morfeusz.analyze(line, res);
stringstream out;
appendMorfeuszResults(res, out);
string gotOutputLine;
string requiredOutputLine;
while (getline(out, gotOutputLine)) {
getline(requiredIn, requiredOutputLine);
cerr << "REQUIRED LINE " << requiredOutputLine << endl;
cerr << "GOT LINE " << gotOutputLine << endl;
cerr << (requiredOutputLine == gotOutputLine) << endl;
|
|
67
|
validate(gotOutputLine == requiredOutputLine, "lines do not match");
|
|
68
69
70
71
72
|
}
}
return 0;
}
|