// CharsetConverter.hpp
/*
 * File: CharsetConverter.hpp
 * Author: mlenart
 *
 * Created on 14 November 2013, 17:28
 */
#ifndef ENCODINGCONVERTER_HPP
#define ENCODINGCONVERTER_HPP
#include <inttypes.h>
#include <string>
#include <vector>
#include <map>
/**
 * Abstract interface for converting between a byte encoding and Unicode
 * code points (represented as uint32_t).
 *
 * Concrete encodings implement peek(), next() and append(); fromUTF8() and
 * toString() are declared here and defined outside this header.
 */
class CharsetConverter {
public:
    /*
     * Virtual destructor: this class is a polymorphic base, so destroying a
     * derived converter through a CharsetConverter pointer must dispatch to
     * the derived destructor (otherwise the behaviour is undefined).
     */
    virtual ~CharsetConverter() {}

    /*
     * Reads a code point from the byte range [it, end).
     * NOTE(review): presumably returns the code point at `it` without
     * consuming it; `it` is nevertheless taken by non-const reference -
     * confirm against the implementations.
     */
    virtual uint32_t peek(const char*& it, const char* end) const = 0;

    /*
     * Reads a code point from the byte range [it, end).
     * NOTE(review): presumably advances `it` past the bytes it decoded -
     * confirm against the implementations.
     */
    virtual uint32_t next(const char*& it, const char* end) const = 0;

    /*
     * Encodes code point `cp` into `result` (taken by mutable reference).
     * NOTE(review): presumably appends the encoded bytes to the end of
     * `result` - confirm against the implementations.
     */
    virtual void append(uint32_t cp, std::string& result) const = 0;

    /*
     * Converts `input` and returns the converted string.
     * NOTE(review): judging by the name, `input` is UTF-8 and the result is
     * in this converter's encoding - the definition is not in this header.
     */
    virtual std::string fromUTF8(const std::string& input) const;

    /*
     * Builds a string from a sequence of code points.
     * NOTE(review): presumably encodes each element via append() - the
     * definition is not in this header.
     */
    std::string toString(const std::vector<uint32_t>& codepoints) const;
};
/**
 * CharsetConverter implementation for UTF-8 (per the class name).
 *
 * Overrides the three pure virtual functions of CharsetConverter; the
 * definitions live outside this header.
 */
class UTF8CharsetConverter : public CharsetConverter {
public:
    // Overrides of the CharsetConverter interface.
    virtual uint32_t peek(const char*& it, const char* end) const;
    virtual uint32_t next(const char*& it, const char* end) const;
    virtual void append(uint32_t cp, std::string& result) const;

    // The fromUTF8() override is commented out, so the base-class
    // version is inherited unchanged.
    // std::string fromUTF8(const std::string& input) const;
};
//class UTF16CharsetConverter : public CharsetConverter {
//public:
// enum Endianness { LE, BE };
// explicit UTF16CharsetConverter(UTF16CharsetConverter::Endianness endianness);
// uint32_t peek(const char*& it, const char* end) const;
// uint32_t next(const char*& it, const char* end) const;
// void append(uint32_t cp, std::string& result) const;
//private:
// uint16_t convertEndianness(uint16_t cp) const;
// UTF16CharsetConverter::Endianness endianness;
//};
//
//class UTF32CharsetConverter : public CharsetConverter {
//public:
// uint32_t peek(const char*& it, const char* end) const;
// uint32_t next(const char*& it, const char* end) const;
// void append(uint32_t cp, std::string& result) const;
//private:
//};
/**
 * Converter that uses a simple conversion table.
 *
 * The table is supplied to the constructor as a pointer to uint32_t values.
 * NOTE(review): presumably the table is indexed by byte value and yields the
 * matching code point, and the caller must keep it alive for the lifetime of
 * the converter (only the pointer is stored) - confirm in the implementation.
 */
class OneByteCharsetConverter : public CharsetConverter {
public:
    // Builds a converter around the given conversion table.
    explicit OneByteCharsetConverter(const uint32_t* array);

    // Overrides of the CharsetConverter interface.
    virtual uint32_t peek(const char*& it, const char* end) const;
    virtual uint32_t next(const char*& it, const char* end) const;
    virtual void append(uint32_t cp, std::string& result) const;

private:
    // Conversion table passed to the constructor (pointer only, not a copy).
    const uint32_t* array;

    // NOTE(review): by its name, a reverse lookup from code point to the
    // one-byte character; how it is filled is not visible in this header.
    const std::vector<char> codepoint2Char;
};
/**
 * OneByteCharsetConverter specialisation for ISO 8859-2 (per the class name).
 *
 * Adds only a default constructor.
 * NOTE(review): presumably it passes the ISO 8859-2 conversion table to the
 * base class - the definition is not in this header.
 */
class ISO8859_2_CharsetConverter : public OneByteCharsetConverter {
public:
    ISO8859_2_CharsetConverter();
};
/**
 * OneByteCharsetConverter specialisation for Windows-1250 (per the class
 * name).
 *
 * Adds only a default constructor.
 * NOTE(review): presumably it passes the Windows-1250 conversion table to the
 * base class - the definition is not in this header.
 */
class Windows_1250_CharsetConverter : public OneByteCharsetConverter {
public:
    Windows_1250_CharsetConverter();
};
#endif /* ENCODINGCONVERTER_HPP */