|
1
2
3
4
5
6
7
8
9
10
|
/*
* File: EncodingConverter.hpp
* Author: mlenart
*
* Created on 14 November 2013, 17:28
*/
#ifndef ENCODINGCONVERTER_HPP
#define ENCODINGCONVERTER_HPP
|
|
11
|
#include <inttypes.h>
|
|
12
|
#include <string>
|
|
13
14
|
#include <vector>
#include <map>
|
|
15
|
|
|
16
17
|
/*
 * Abstract base class for charset converters that work on 32-bit code points.
 *
 * next() and append() are pure virtual and must be supplied by subclasses;
 * fromUTF8() is virtual and may be overridden; peek() and toString() are
 * non-virtual. Every member function is only declared here -- the
 * definitions live outside this header.
 *
 * NOTE(review): the behavioral notes on the members below are inferred from
 * names and signatures only; confirm them against the implementation file.
 */
class CharsetConverter {
public:
    /*
     * Takes `it` by value, so the caller's pointer is not modified.
     * Presumably returns the code point found at `it`, with `end` marking
     * the end of the input buffer -- TODO confirm.
     */
    uint32_t peek(const char* it, const char* end) const;

    /*
     * Pure virtual. Takes `it` by reference, so an implementation is able to
     * move the caller's pointer; presumably it reads one code point and
     * advances `it` past it, never going beyond `end` -- TODO confirm.
     */
    virtual uint32_t next(const char*& it, const char* end) const = 0;

    /*
     * Pure virtual. Receives a code point `cp` and a mutable string `result`;
     * presumably appends the encoded form of `cp` to `result` -- TODO confirm.
     */
    virtual void append(uint32_t cp, std::string& result) const = 0;

    /*
     * Virtual, with a base-class implementation defined elsewhere.
     * Presumably converts UTF-8 `input` into this converter's charset and
     * returns the converted text -- TODO confirm.
     */
    virtual std::string fromUTF8(const std::string& input) const;

    /*
     * Non-virtual. Presumably encodes the given sequence of code points into
     * a string in this converter's charset -- TODO confirm.
     */
    std::string toString(const std::vector<uint32_t>& codepoints) const;

    /* Virtual destructor, so subclasses can be destroyed through a base pointer. */
    virtual ~CharsetConverter();
};
|
|
29
|
/*
 * CharsetConverter subclass for UTF-8 (going by its name).
 *
 * Declares next() and append(), which are pure virtual in CharsetConverter,
 * and additionally redeclares fromUTF8(). All three have the same signatures
 * as the base-class virtuals, so they override them. Definitions live
 * outside this header.
 */
class UTF8CharsetConverter : public CharsetConverter {
public:
    /* Overrides CharsetConverter::next. */
    uint32_t next(const char*& it, const char* end) const;

    /* Overrides CharsetConverter::append. */
    void append(uint32_t cp, std::string& result) const;

    /*
     * Overrides CharsetConverter::fromUTF8.
     * NOTE(review): presumably a pass-through, since the input is already
     * UTF-8 -- confirm against the implementation.
     */
    std::string fromUTF8(const std::string& input) const;
};
|
|
37
38
39
|
/*
* Converter that uses a simple conversion table
*/
|
|
40
|
class OneByteCharsetConverter : public CharsetConverter {
|
|
41
|
public:
|
|
42
|
explicit OneByteCharsetConverter(const uint32_t* array);
|
|
43
|
uint32_t next(const char*& it, const char* end) const;
|
|
44
|
void append(uint32_t cp, std::string& result) const;
|
|
45
|
private:
|
|
46
47
48
49
|
const uint32_t* array;
const std::vector<char> codepoint2Char;
};
|
|
50
|
/*
 * OneByteCharsetConverter subclass named for the ISO 8859-2 charset.
 *
 * Adds nothing but a default constructor. OneByteCharsetConverter only
 * offers a constructor taking a `const uint32_t*` table, so this constructor
 * (defined outside this header) has to pass one to the base.
 * NOTE(review): presumably that is the ISO 8859-2 table -- confirm.
 */
class ISO8859_2_CharsetConverter : public OneByteCharsetConverter {
public:
    ISO8859_2_CharsetConverter();
};
|
|
56
|
/*
 * OneByteCharsetConverter subclass named for the Windows-1250 code page.
 *
 * Adds nothing but a default constructor. OneByteCharsetConverter only
 * offers a constructor taking a `const uint32_t*` table, so this constructor
 * (defined outside this header) has to pass one to the base.
 * NOTE(review): presumably that is the Windows-1250 table -- confirm.
 */
class Windows_1250_CharsetConverter : public OneByteCharsetConverter {
public:
    Windows_1250_CharsetConverter();
};
|
|
62
63
64
65
66
67
|
/*
 * OneByteCharsetConverter subclass named for the CP852 code page.
 *
 * Adds nothing but a default constructor. OneByteCharsetConverter only
 * offers a constructor taking a `const uint32_t*` table, so this constructor
 * (defined outside this header) has to pass one to the base.
 * NOTE(review): presumably that is the CP852 table -- confirm.
 */
class CP852_CharsetConverter : public OneByteCharsetConverter {
public:
    CP852_CharsetConverter();
};
|
|
68
69
|
#endif /* ENCODINGCONVERTER_HPP */
|