1 | #!/opt/bin/perl |
1 | #!/opt/bin/perl |
2 | |
2 | |
3 | # the generated tables mostly have NOT been checked so far! |
3 | # the generated tables mostly have NOT been checked so far! |
|
|
4 | |
|
|
5 | # apt install libencode-hanextra-perl libencode-jis2k-perl |
4 | |
6 | |
5 | use v5.8.2; |
7 | use v5.8.2; |
6 | use utf8; |
8 | use utf8; |
7 | use Encode; |
9 | use Encode; |
|
|
10 | use Encode::JP; |
|
|
11 | use Encode::CN; |
|
|
12 | use Encode::KR; |
|
|
13 | use Encode::HanExtra; |
|
|
14 | use Encode::JIS2K; |
8 | |
15 | |
9 | my $gen; |
16 | my $gen; |
10 | |
17 | |
11 | $TO_UNICODE = 0; # also generate to_unicode tables |
18 | $TO_UNICODE = 0; # also generate to_unicode tables |
12 | |
19 | |
… | |
… | |
88 | $fun .= sprintf "if (· == 0x%04x) return 0x%04x;\n", $b + $_, $enc->[$b + $_]; |
95 | $fun .= sprintf "if (· == 0x%04x) return 0x%04x;\n", $b + $_, $enc->[$b + $_]; |
89 | } |
96 | } |
90 | } elsif (linear $enc, $b + $l, $b + $h, $enc->[$b + $l]) { |
97 | } elsif (linear $enc, $b + $l, $b + $h, $enc->[$b + $l]) { |
91 | my $dif = $enc->[$b + $l] - ($b + $l); |
98 | my $dif = $enc->[$b + $l] - ($b + $l); |
92 | $dif = $dif < 0 ? sprintf "- 0x%04x", -$dif : sprintf "+ 0x%04x", $dif; |
99 | $dif = $dif < 0 ? sprintf "- 0x%04x", -$dif : sprintf "+ 0x%04x", $dif; |
93 | $fun .= sprintf "if (· <= 0x%04x && 0x%04x <= ·) return · %s;\n", $b + $l, $b + $h, $dif; |
100 | $fun .= sprintf "if (· >= 0x%04x && 0x%04x >= ·) return · %s;\n", $b + $l, $b + $h, $dif; |
94 | } elsif ($map2[$p] <= 5) { # defunct |
101 | } elsif ($map2[$p] <= 5) { # defunct |
95 | $fun .= "switch (·)\n {\n"; |
102 | $fun .= "switch (·)\n {\n"; |
96 | for ($l .. $h) { |
103 | for ($l .. $h) { |
97 | next unless defined $enc->[$b + $_]; |
104 | next unless defined $enc->[$b + $_]; |
98 | $fun .= sprintf " case 0x%04x: return 0x%04x;\n", $b + $_, $enc->[$b + $_]; |
105 | $fun .= sprintf " case 0x%04x: return 0x%04x;\n", $b + $_, $enc->[$b + $_]; |
… | |
… | |
264 | |
271 | |
265 | __DATA__ |
272 | __DATA__ |
266 | VN viscii viscii |
273 | VN viscii viscii |
267 | KR ksc5601_1987_0 ksc5601-raw |
274 | KR ksc5601_1987_0 ksc5601-raw |
268 | ZH gb2312_1980_0 gb2312-raw |
275 | ZH gb2312_1980_0 gb2312-raw |
|
|
276 | ZH gbk_0 gbk |
269 | ZH_EXT cns11643_1992_1 cns11643-1 |
277 | ZH_EXT cns11643_1992_1 cns11643-1 |
270 | ZH_EXT cns11643_1992_2 cns11643-2 |
278 | ZH_EXT cns11643_1992_2 cns11643-2 |
271 | ZH_EXT cns11643_1992_3 cns11643-3 |
279 | ZH_EXT cns11643_1992_3 cns11643-3 |
272 | ZH_EXT cns11643_1992_4 cns11643-4 |
280 | ZH_EXT cns11643_1992_4 cns11643-4 |
273 | ZH_EXT cns11643_1992_5 cns11643-5 |
281 | ZH_EXT cns11643_1992_5 cns11643-5 |
… | |
… | |
289 | EU iso8859_8 iso-8859-8 |
297 | EU iso8859_8 iso-8859-8 |
290 | EU iso8859_9 iso-8859-9 |
298 | EU iso8859_9 iso-8859-9 |
291 | EU iso8859_10 iso-8859-10 |
299 | EU iso8859_10 iso-8859-10 |
292 | EU iso8859_11 iso-8859-11 |
300 | EU iso8859_11 iso-8859-11 |
293 | EU iso8859_13 iso-8859-13 |
301 | EU iso8859_13 iso-8859-13 |
294 | EU iso8859_14 iso-8859-14 |
302 | EU iso8859_14 iso-8859-14 |
295 | DEFAULT iso8859_15 iso-8859-15 |
303 | DEFAULT iso8859_15 iso-8859-15 |
296 | EU iso8859_16 iso-8859-16 |
304 | EU iso8859_16 iso-8859-16 |
297 | JP jis0201_1976_0 jis0201-raw |
305 | JP jis0201_1976_0 jis0201-raw |
298 | JP jis0208_1990_0 jis0208-raw |
306 | JP jis0208_1990_0 jis0208-raw |
299 | JP jis0212_1990_0 jis0212-raw |
307 | JP jis0212_1990_0 jis0212-raw |