| 67 |
$CHARSET{G96n}->{ $_.$F }->{chars} = 96; |
$CHARSET{G96n}->{ $_.$F }->{chars} = 96; |
| 68 |
$CHARSET{G96n}->{ $_.$F }->{ucs} = |
$CHARSET{G96n}->{ $_.$F }->{ucs} = |
| 69 |
({'' => 0xF4C000}->{ $_ }||0) + 96*96 * ($f-0x30); |
({'' => 0xF4C000}->{ $_ }||0) + 96*96 * ($f-0x30); |
| 70 |
## BUG: 94^n DRCSes with I byte have no mapping area |
## BUG: 96^n DRCSes with I byte have no mapping area |
| 71 |
} |
} |
| 72 |
} |
} |
| 73 |
|
$CHARSET{G94n}->{"\x20\x40"}->{ucs} = 0x70460000; ## DRCS 94^2 04/00 |
| 74 |
|
$CHARSET{G94n}->{P4_0} = $CHARSET{G94n}->{"\x20\x40"}; |
| 75 |
|
|
| 76 |
for (0x60..0x6F) { |
for (0x60..0x6F) { |
| 77 |
my $F = pack 'C', $_; |
my $F = pack 'C', $_; |
| 78 |
## BUG: 9x^3 sets have no mapping area |
## BUG: 9x^3 sets have no mapping area |
| 109 |
$CHARSET{G94n}->{'B@'}->{dimension} = 2; ## JIS X 0208-1990 |
$CHARSET{G94n}->{'B@'}->{dimension} = 2; ## JIS X 0208-1990 |
| 110 |
$CHARSET{G94n}->{'B@'}->{chars} = 94; |
$CHARSET{G94n}->{'B@'}->{chars} = 94; |
| 111 |
$CHARSET{G94n}->{'B@'}->{ucs} = 0xE9F6C0 + 94*94*79; |
$CHARSET{G94n}->{'B@'}->{ucs} = 0xE9F6C0 + 94*94*79; |
| 112 |
|
|
| 113 |
|
## SJIS G3 mapping (JIS X 0213:2000 plane 2) |
| 114 |
|
$CHARSET{G94n}->{"\x50"}->{Csjis_kuE} = { # ku - 1 |
| 115 |
|
0xF0 => 7, 0xF1 => 3, 0xF2 => 11, 0xF3 => 13, 0xF4 => 77, |
| 116 |
|
0xF5 => 79, 0xF6 => 81, 0xF7 => 83, 0xF8 => 85, 0xF9 => 87, |
| 117 |
|
0xFA => 89, 0xFB => 91, 0xFC => 93, |
| 118 |
|
}; |
| 119 |
|
$CHARSET{G94n}->{"\x50"}->{Csjis_kuO} = { # ku - 1 |
| 120 |
|
0xF0 => 0, 0xF1 => 2, 0xF2 => 4, 0xF3 => 12, 0xF4 => 14, |
| 121 |
|
0xF5 => 78, 0xF6 => 80, 0xF7 => 82, 0xF8 => 84, 0xF9 => 86, |
| 122 |
|
0xFA => 88, 0xFB => 90, 0xFC => 92, |
| 123 |
|
}; |
| 124 |
|
$CHARSET{G94n}->{"\x50"}->{Csjis_first} = { reverse ( |
| 125 |
|
%{ $CHARSET{G94n}->{"\x50"}->{Csjis_kuE} }, |
| 126 |
|
%{ $CHARSET{G94n}->{"\x50"}->{Csjis_kuO} }, |
| 127 |
|
)}; |
| 128 |
|
|
| 129 |
## -- Control character sets |
## -- Control character sets |
| 130 |
$CHARSET{C0}->{'@'}->{ucs} = 0x00; ## ISO/IEC 6429 C0 |
$CHARSET{C0}->{'@'}->{ucs} = 0x00; ## ISO/IEC 6429 C0 |
| 131 |
for ("\x40", "\x43", "\x44", "\x45", "\x46", "\x49", "\x4A", "\x4B", "\x4C") { |
for ("\x40", "\x43", "\x44", "\x45", "\x46", "\x49", "\x4A", "\x4B", "\x4C") { |
| 203 |
sub new_object { |
sub new_object { |
| 204 |
my %C; |
my %C; |
| 205 |
$C{bit} = 8; |
$C{bit} = 8; |
| 206 |
|
$C{coding_system} = $CODING_SYSTEM{"\x40"}; ## ISO/IEC 2022 |
| 207 |
$C{CL} = 'C0'; $C{CR} = 'C1'; $C{ESC_Fe} = 'C1'; |
$C{CL} = 'C0'; $C{CR} = 'C1'; $C{ESC_Fe} = 'C1'; |
| 208 |
$C{C0} = $CHARSET{C0}->{"\x40"}; ## ISO/IEC 6429:1991 C0 |
$C{C0} = $CHARSET{C0}->{"\x40"}; ## ISO/IEC 6429:1991 C0 |
| 209 |
$C{C1} = $CHARSET{C1}->{'64291991C1'}; ## ISO/IEC 6429:1991 C1 |
$C{C1} = $CHARSET{C1}->{'64291991C1'}; ## ISO/IEC 6429:1991 C1 |
| 213 |
$C{G1} = $CHARSET{G94}->{"\x7E"}; ## empty set |
$C{G1} = $CHARSET{G94}->{"\x7E"}; ## empty set |
| 214 |
$C{G2} = $CHARSET{G94}->{"\x7E"}; ## empty set |
$C{G2} = $CHARSET{G94}->{"\x7E"}; ## empty set |
| 215 |
$C{G3} = $CHARSET{G94}->{"\x7E"}; ## empty set |
$C{G3} = $CHARSET{G94}->{"\x7E"}; ## empty set |
|
$C{coding_system} = $CODING_SYSTEM{"\x40"}; ## ISO/IEC 2022 |
|
| 216 |
$C{option} = { |
$C{option} = { |
| 217 |
C1invoke_to_right => 0, ## C1 invoked to: (0: ESC Fe, 1: CR) |
C1invoke_to_right => 0, ## C1 invoked to: (0: ESC Fe, 1: CR) |
| 218 |
G94n_designate_long => 0, ## (1: ESC 02/04 02/08 04/00..02) |
G94n_designate_long => 0, ## (1: ESC 02/04 02/08 04/00..02) |
| 219 |
designate_to => { ## Designated G buffer (-1: not be outputed) |
designate_to => { ## Designated G buffer (-1: not to be outputed) |
| 220 |
C0 => { |
C0 => { |
| 221 |
default => 0, |
default => 0, |
| 222 |
}, |
}, |
| 240 |
default => -1, |
default => -1, |
| 241 |
}, |
}, |
| 242 |
}, |
}, |
| 243 |
|
fallback_from_ucs => 'replacement', |
| 244 |
|
## 'replacement' / 'perl' / 'sgml' / 'sgml-hex' / 'x-u-escaped' / 'code' |
| 245 |
|
## / 'quiet' / 'quiet+back' / 'quiet+warn' / 'quiet+back+warn' / 'croak' |
| 246 |
|
## / code |
| 247 |
|
final_to_set => { |
| 248 |
|
C0 => {}, C1 => {}, G94 => {}, G94n => {}, |
| 249 |
|
G96 => {}, G96n => {}, coding_system => {}, |
| 250 |
|
}, |
| 251 |
Ginvoke_by_single_shift => [0,0,0,0], ## Invoked by SS |
Ginvoke_by_single_shift => [0,0,0,0], ## Invoked by SS |
| 252 |
Ginvoke_to_left => [1,1,1,1], ## Which invoked to? (1: L, 0: R) |
Ginvoke_to_left => [1,1,1,1], ## Which invoked to? (1: L, 0: R) |
| 253 |
private_set => { ## Private set vs Final byte |
private_set => { ## Private set vs Final byte |
| 254 |
C0 => [], |
C0 => [], |
| 255 |
C1 => [], |
C1 => [], |
| 256 |
G94 => [], |
G94 => [], |
| 257 |
G94n => [[],[],[],[],[]], |
G94n => [[],[],[],[],["\x20\x40"]], |
| 258 |
G96 => [], |
G96 => [], |
| 259 |
#G96n => [], ## (not implemented) |
#G96n => [], ## (not implemented) |
| 260 |
U96n => [], ## mule-unicode sets |
U96n => [], ## mule-unicode sets |
| 272 |
\%C; |
\%C; |
| 273 |
} |
} |
| 274 |
|
|
| 275 |
1; |
sub new_object_sjis { |
| 276 |
__END__ |
my $C = &new_object; |
| 277 |
|
$C->{coding_system} = $CODING_SYSTEM{Csjis}; |
| 278 |
|
$C->{CR} = undef; |
| 279 |
|
$C->{GR} = 'G2'; ## 0xA1-0xDF |
| 280 |
|
$C->{G0} = $CHARSET{G94}->{J}; ## JIS X 0201:1997 Latin |
| 281 |
|
$C->{G1} = $CHARSET{G94n}->{"\x4F"}; ## JIS X 0213:2000 |
| 282 |
|
$C->{G2} = $CHARSET{G94}->{I}; ## JIS X 0201:1997 Katakana |
| 283 |
|
$C->{G3} = $CHARSET{G94n}->{"\x50"}; ## JIS X 0213:2000 plane 2 |
| 284 |
|
## Special code area (0xFD-0xFF) |
| 285 |
|
$C->{Gsmap} = {"\xA0" => "\x{F8F0}", "\xFD" => "\x{F8F1}", "\xFE" => "\x{F8F2}", "\xFF" => "\x{F8F3}"}; |
| 286 |
|
$C->{GsmapR} = {}; ## Reversed table |
| 287 |
|
$C->{option}->{undef_char_sjis} = "\x81\xAC"; |
| 288 |
|
$C; |
| 289 |
|
} |
| 290 |
|
|
| 291 |
|
our %FallbackFromUCS = ( |
| 292 |
|
perl => sub { my $c = $_[1]; sprintf '\x{%04X}', ord $c }, |
| 293 |
|
sgml => sub { my $c = $_[1]; sprintf '&#%d;', ord $c }, |
| 294 |
|
'sgml-hex' => sub { my $c = $_[1]; sprintf '&#x%04X;', ord $c }, |
| 295 |
|
'x-u-escaped' => sub { my $c = $_[1]; my $C = ord $c; sprintf $C > 0xFFFF ? '\U%08X' : '\u%04X', $C }, |
| 296 |
|
); |
| 297 |
|
|
| 298 |
|
sub fallback_escape ($$;%) { |
| 299 |
|
my ($C, $c, %option) = @_; |
| 300 |
|
my $f = ref ($C->{option}->{fallback_from_ucs}) eq 'CODE' ? $C->{option}->{fallback_from_ucs} : |
| 301 |
|
$FallbackFromUCS{$C->{option}->{fallback_from_ucs}}; |
| 302 |
|
if (ref $f) { |
| 303 |
|
Encode::_utf8_on ($c); |
| 304 |
|
return &$f ($C, $c, %option); |
| 305 |
|
} |
| 306 |
|
undef; |
| 307 |
|
} |
| 308 |
|
|
| 309 |
=head1 AUTHORS |
=head1 AUTHORS |
| 310 |
|
|
| 311 |
Nanashi-san |
Nanashi-san <nanashi-san@nanashi.invalid> |
| 312 |
|
|
| 313 |
Wakaba <w@suika.fam.cx> |
Wakaba <w@suika.fam.cx> |
| 314 |
|
|
| 315 |
=head1 LICENSE |
=head1 LICENSE |
| 316 |
|
|
| 317 |
Copyright 2002 AUTHORS |
Copyright 2002 AUTHORS, all rights reserved. |
| 318 |
|
|
| 319 |
This library is free software; you can redistribute it |
This library is free software; you can redistribute it |
| 320 |
and/or modify it under the same terms as Perl itself. |
and/or modify it under the same terms as Perl itself. |
| 321 |
|
|
| 322 |
=cut |
=cut |
| 323 |
|
|
| 324 |
# $Date$ |
1; # $Date$ |
|
### Charset.pm ends here |
|