1 | #ifndef ENCODING_H |
1 | #ifndef ENCODING_H |
2 | #define ENCODING_H |
2 | #define ENCODING_H |
3 | |
3 | |
4 | #include <stdint.h> |
4 | #include <inttypes.h> |
|
|
5 | |
|
|
6 | typedef uint32_t unicode_t; |
5 | |
7 | |
6 | // order must match the table in encoding.C(!) |
8 | // order must match the table in encoding.C(!) |
7 | enum codeset { |
9 | enum codeset { |
8 | CS_UNKNOWN = 0, |
10 | CS_UNKNOWN = 0, |
9 | CS_US_ASCII, |
11 | CS_US_ASCII, |
… | |
… | |
25 | CS_ISO8859_16, |
27 | CS_ISO8859_16, |
26 | |
28 | |
27 | CS_KOI8_R, |
29 | CS_KOI8_R, |
28 | CS_KOI8_U, |
30 | CS_KOI8_U, |
29 | CS_JIS0201_1976_0, |
31 | CS_JIS0201_1976_0, |
30 | CS_JIS0208_1983_0, |
32 | CS_JIS0208_1990_0, |
31 | CS_JIS0212_1990_0, |
33 | CS_JIS0212_1990_0, |
32 | |
|
|
33 | CS_JIS0213_1, |
34 | CS_JIS0213_1, |
34 | CS_JIS0213_2, |
35 | CS_JIS0213_2, |
35 | |
36 | |
36 | CS_KSC5601_1987_0, |
37 | CS_KSC5601_1987_0, |
37 | |
38 | |
38 | CS_GB2312_1980_0, |
39 | CS_GB2312_1980_0, |
|
|
40 | CS_GBK_0, |
39 | |
41 | |
40 | CS_CNS11643_1992_1, |
42 | CS_CNS11643_1992_1, |
41 | CS_CNS11643_1992_2, |
43 | CS_CNS11643_1992_2, |
42 | CS_CNS11643_1992_3, |
44 | CS_CNS11643_1992_3, |
43 | CS_CNS11643_1992_4, |
45 | CS_CNS11643_1992_4, |
… | |
… | |
59 | }; |
61 | }; |
60 | |
62 | |
61 | codeset codeset_from_name (const char *name); |
63 | codeset codeset_from_name (const char *name); |
62 | |
64 | |
63 | enum { |
65 | enum { |
64 | ZERO_WIDTH_CHAR = 0x200b, |
66 | ZERO_WIDTH_CHAR = 0x200b, |
65 | REPLACEMENT_CHAR = 0xfffd, |
67 | REPLACEMENT_CHAR = 0xfffd, |
66 | NOCHAR = 65535, // must be invalid in ANY codeset (!) |
68 | NOCHAR = 0xffff, // must be invalid in ANY codeset (!) |
67 | }; |
69 | }; |
68 | |
70 | |
69 | struct rxvt_codeset_conv { |
71 | struct rxvt_codeset_conv |
70 | virtual uint32_t from_unicode (uint32_t unicode) const { return unicode; } |
72 | { |
71 | virtual uint32_t to_unicode (uint32_t enc) const { return enc; } |
73 | uint32_t (*from_unicode) (unicode_t unicode); |
|
|
74 | #if ENCODING_TO_UNICODE |
|
|
75 | unicode_t (*to_unicode) (uint32_t enc); |
|
|
76 | #endif |
72 | }; |
77 | }; |
73 | |
78 | |
74 | extern const rxvt_codeset_conv *rxvt_codeset[NUM_CODESETS]; |
79 | extern const rxvt_codeset_conv rxvt_codeset[NUM_CODESETS]; |
75 | |
80 | |
76 | extern uint32_t rxvt_compose (uint32_t c1, uint32_t c2); |
81 | extern unicode_t rxvt_compose (unicode_t c1, unicode_t c2); |
77 | |
82 | |
78 | #define FROM_UNICODE(cs,code) rxvt_codeset[cs]->from_unicode (code) |
83 | #define FROM_UNICODE(cs,code) rxvt_codeset[cs].from_unicode (code) |
79 | #define TO_UNICODE(cs,code) rxvt_codeset[cs]->to_unicode (code) |
84 | #define TO_UNICODE(cs,code) rxvt_codeset[cs].to_unicode (code) |
|
|
85 | |
|
|
86 | struct unicode // namespace für arme |
|
|
87 | { |
|
|
88 | static bool is_space (unicode_t c); |
|
|
89 | }; |
80 | |
90 | |
81 | #endif |
91 | #endif |
82 | |
92 | |