/[suikacvs]/perl/charclass/lib/Char/Class/UCS.pm
Suika

Contents of /perl/charclass/lib/Char/Class/UCS.pm

Parent Directory | Revision Log


Revision 1.2 - (show annotations) (download)
Mon Nov 24 04:25:10 2008 UTC (16 years ago) by wakaba
Branch: MAIN
CVS Tags: HEAD
Changes since 1.1: +3 -3 lines
++ ChangeLog	24 Nov 2008 04:24:23 -0000
2008-11-24  Wakaba  <wakaba@suika.fam.cx>

	* mkcommitfeed.pl: New script (copied from Harusame).

	* cvscommit.sh: New script (copied from Harusame).

	* Makefile.PL: Version changed to 2.0.

++ charclass/lib/Char/ChangeLog	24 Nov 2008 01:52:26 -0000
2008-11-24  Wakaba  <wakaba@suika.fam.cx>

	* Normalize/: New directory.

++ charclass/lib/Char/Normalize/ChangeLog	24 Nov 2008 04:20:30 -0000
2008-11-24  Wakaba  <wakaba@suika.fam.cx>

	* FullwidthHalfwidth.pod: New documentation.

	* FullwidthHalfwidth.pm: New module (content from SuikaWiki4
	sw.cgi).

	* ChangeLog: New file.

1 ## This file is auto-generated (at 2008-11-24T04:21:28Z).
2 ## Do not edit by hand!
3 use strict;
4
5 package Char::Class::UCS;
6 our $VERSION = '1.03';
7
8 use Exporter;
9 use vars qw(@EXPORT_OK @ISA $VERSION);
10 @ISA = qw(Exporter);
11
12 =head1 NAME
13
14 Char::Class::UCS - Regular Expression Character Classes - C<UCS>
15
16
17 =cut
18
# Export the requested character-class subs.
#
# Invoked as a class method (normally implicitly through
# "use Char::Class::UCS qw(...)").  Each requested name that is a defined
# sub of this package is aliased into the "main" package (presumably so
# that an unqualified \p{InUCS...} can be resolved there -- TODO confirm),
# and the complete request list is then passed to Exporter, which installs
# the symbols into the caller's package and croaks on names that are not
# exportable.
#
# Differences from the previous implementation:
#   * tags, negations and misspelled names no longer create stray globs in
#     "main"; they are left for Exporter to report;
#   * $Exporter::ExportLevel is set with "local", so its previous value is
#     restored even when Exporter croaks;
#   * the prototype was dropped, since prototypes are ignored on method calls.
sub import {
    my ($class, @requested) = @_;

    for my $name (@requested) {
        no strict 'refs';
        my $qualified = __PACKAGE__ . '::' . $name;
        next unless defined &{$qualified};
        *{ 'main::' . $name } = \&{$qualified};
    }

    # Level 1 makes Exporter target the package that called this import.
    local $Exporter::ExportLevel = 1;
    $class->SUPER::import(@requested);
    return;
}
29
30 @EXPORT_OK = qw(InUCSAeganNumbers InUCSAlphabeticPresentationForms InUCSAlternateFormatCharactersExtended InUCSArabicExtended InUCSArabicPresentationFormsA InUCSArabicPresentationFormsB InUCSArmenian InUCSArrows InUCSBasicArabic InUCSBasicGeorgian InUCSBasicGreek InUCSBasicHangul InUCSBasicHebrew InUCSBasicLatin InUCSBasicMyanmar InUCSBasicTibetan InUCSBengali InUCSBiDirectionalFormatEmbeddings InUCSBiDirectionalFormatMarks InUCSBlockElements InUCSBopomofo InUCSBoxDrawing InUCSBraillePatterns InUCSBuhid InUCSByzantineMusicalSymbols InUCSCharacterShapingSelectors InUCSCherokee InUCSCombiningDiacriticalMarks InUCSCombiningDiacriticalMarksForSymbols InUCSCombiningHalfMarks InUCSControlPictures InUCSCurrencySymbols InUCSCypriotSyllabary InUCSCyrillic InUCSCyrillicSupplementary InUCSDeseret InUCSDevanagari InUCSDingbats InUCSEnclosedAlphanumerics InUCSEnclosedCJKLettersAndMonths InUCSEthiopic InUCSEtruscan InUCSExtendedMyanmar InUCSFormatSeparators InUCSGeneralFormatCharacters InUCSGeneralPunctuation InUCSGeometricShapes InUCSGeorgianExtended InUCSGothic InUCSGreekExtended InUCSGreekSymbolsAndCoptic InUCSGujarati InUCSGurmukhi InUCSHalfwidthAndFullwidthForms InUCSHangulCompatibilityJamo InUCSHangulFillCharacters InUCSHangulJamo InUCSHangulSyllables InUCSHanunoo InUCSHebrewExtended InUCSHiragana InUCSIPAExtensions InUCSIdeographicDescriptionCharacters InUCSKangxiRadicals InUCSKannada InUCSKatakana InUCSKatakanaPhoneticExtensions InUCSKhmer InUCSLao InUCSLatin1Supplement InUCSLatinExtendedA InUCSLatinExtendedAdditional InUCSLatinExtendedB InUCSLetterlikeSymbols InUCSLimbu InUCSLinearBIdeograms InUCSLinearBSyllabary InUCSMalayalam InUCSMathematicalOperators InUCSMiscellaneousSymbols InUCSMiscellaneousTechnical InUCSMiscllaneousMathmaticalSymbols InUCSMongolian InUCSNumberForms InUCSNumericShapeSelectors InUCSOgham InUCSOpticalCharacterRecognition InUCSOriya InUCSOsmanya InUCSPart2 InUCSPrivateUseArea InUCSPrivateUseGroups InUCSPrivateUsePlanes InUCSRunic 
InUCSScriptSpecificFormatCharacters InUCSShavian InUCSSinhala InUCSSip InUCSSmallFormVariants InUCSSmp InUCSSpacingModifierLetters InUCSSpecials InUCSSpp InUCSSuperscriptsAndSubscripts InUCSSupplementalArrows InUCSSupplementalArrowsC InUCSSupplementalCJKCompatibility InUCSSupplementalHangulA InUCSSupplementalHangulB InUCSSupplementalMathmaticalOperators InUCSSyriac InUCSTagalog InUCSTagbanwa InUCSTags InUCSTaiLe InUCSTamil InUCSTelugu InUCSThaana InUCSThai InUCSTibetan InUCSUgaritic InUCSUnicode InUCSUnifiedCanadianAboriginalSyllabics InUCSVariationSelectors InUCSVariationSelectorsSupplement InUCSWesternMusicalSymbols InUCSYiRadicals InUCSYiSyllables InUCSYijingHexagramSymbols InUCSZeroWidthBoundaryIndicators InUCS_BMP InUCS_BMPFirstEdition InUCS_BMPSecondEdition InUCS_BMP_AMD7 InUCS_CJKCompatibility InUCS_CJKCompatibilityForms InUCS_CJKCompatibilityIdeographs InUCS_CJKCompatibilityIdeographsSupplement InUCS_CJKMiscellaneous InUCS_CJKRadicalsSupplement InUCS_CJKSymbolsAndPunctuation InUCS_CJKUnifiedIdeographs InUCS_CJKUnifiedIdeographsAll InUCS_CJKUnifiedIdeographsExtensionA InUCS_CJKUnifiedIdeographsExtensionB InUCS_MES1 InUCS_MES2 InUCS_MES3A InUCS_MES3B InUCS1 InUCS10 InUCS100 InUCS1000 InUCS1001 InUCS1002 InUCS1003 InUCS1004 InUCS1005 InUCS1007 InUCS1008 InUCS1009 InUCS101 InUCS1010 InUCS1011 InUCS1012 InUCS1013 InUCS104 InUCS105 InUCS106 InUCS10646 InUCS107 InUCS108 InUCS11 InUCS12 InUCS13 InUCS14 InUCS15 InUCS16 InUCS17 InUCS18 InUCS180 InUCS19 InUCS2 InUCS20 InUCS200 InUCS2000 InUCS2001 InUCS2002 InUCS201 InUCS202 InUCS203 InUCS204 InUCS205 InUCS206 InUCS207 InUCS21 InUCS22 InUCS23 InUCS24 InUCS25 InUCS250 InUCS251 InUCS26 InUCS27 InUCS28 InUCS281 InUCS282 InUCS283 InUCS284 InUCS29 InUCS299 InUCS3 InUCS30 InUCS300 InUCS3000 InUCS3001 InUCS3002 InUCS301 InUCS302 InUCS31 InUCS32 InUCS33 InUCS34 InUCS35 InUCS36 InUCS37 InUCS38 InUCS39 InUCS4 InUCS40 InUCS4000 InUCS41 InUCS42 InUCS43 InUCS44 InUCS45 InUCS46 InUCS47 InUCS48 InUCS49 InUCS5 InUCS50 InUCS500 InUCS51 
InUCS52 InUCS53 InUCS54 InUCS55 InUCS56 InUCS57 InUCS58 InUCS6 InUCS60 InUCS61 InUCS62 InUCS63 InUCS64 InUCS65 InUCS66 InUCS67 InUCS68 InUCS69 InUCS7 InUCS70 InUCS71 InUCS72 InUCS73 InUCS74 InUCS75 InUCS76 InUCS77 InUCS78 InUCS79 InUCS8 InUCS80 InUCS81 InUCS82 InUCS83 InUCS84 InUCS85 InUCS86 InUCS87 InUCS88 InUCS89 InUCS9 InUCS90 InUCS91 InUCS92 InUCS93 InUCS94 InUCS95 InUCS96 InUCS97 InUCS98 InUCS99);
31
# InUCSAeganNumbers: hex code point range list, one entry per line.
sub InUCSAeganNumbers {
    return "10100 1013F\n";
}
37
# InUCSAlphabeticPresentationForms: hex code point range list, one entry per line.
sub InUCSAlphabeticPresentationForms {
    return "FB00 FB4F\n";
}
43
# InUCSAlternateFormatCharactersExtended: hex code point range list, one entry per line.
sub InUCSAlternateFormatCharactersExtended {
    return "0E0000 0E0FFF\n";
}
49
# InUCSArabicExtended: hex code point range list, one entry per line.
sub InUCSArabicExtended {
    return "0660 06FF\n";
}
55
# InUCSArabicPresentationFormsA: hex code point range list, one entry per line.
sub InUCSArabicPresentationFormsA {
    return "FB50 FDFF\n";
}
61
# InUCSArabicPresentationFormsB: hex code point range list, one entry per line.
sub InUCSArabicPresentationFormsB {
    return "FE70 FEFE\n";
}
67
# InUCSArmenian: hex code point range list, one entry per line.
sub InUCSArmenian {
    return "0530 058F\n";
}
73
# InUCSArrows: hex code point range list, one entry per line.
sub InUCSArrows {
    return "2190 21FF\n";
}
79
# InUCSBasicArabic: hex code point range list, one entry per line.
sub InUCSBasicArabic {
    return "0600 065F\n";
}
85
# InUCSBasicGeorgian: hex code point range list, one entry per line.
sub InUCSBasicGeorgian {
    return "10D0 10FF\n";
}
91
# InUCSBasicGreek: hex code point range list, one entry per line.
sub InUCSBasicGreek {
    return "0370 03CF\n";
}
97
# InUCSBasicHangul: hex code point range list, one entry per line.
sub InUCSBasicHangul {
    return "3400 3D3D\n";
}
103
# InUCSBasicHebrew: hex code point range list, one entry per line.
sub InUCSBasicHebrew {
    return "05D0 05EA\n";
}
109
# InUCSBasicLatin: hex code point range list, one entry per line.
sub InUCSBasicLatin {
    return "0020 007E\n";
}
115
# InUCSBasicMyanmar: hex code points / ranges, one entry per line.
sub InUCSBasicMyanmar {
    return join "\n", '1000 104F', '200C', '200D', '';
}
123
# InUCSBasicTibetan: hex code point range list, one entry per line.
sub InUCSBasicTibetan {
    return "0F00 0FBF\n";
}
129
# InUCSBengali: hex code points / ranges, one entry per line.
sub InUCSBengali {
    return join "\n", '0980 09FF', '200C', '200D', '';
}
137
# InUCSBiDirectionalFormatEmbeddings: hex code point range list, one entry per line.
sub InUCSBiDirectionalFormatEmbeddings {
    return "202A 202E\n";
}
143
# InUCSBiDirectionalFormatMarks: hex code point range list, one entry per line.
sub InUCSBiDirectionalFormatMarks {
    return "200E 200F\n";
}
149
# InUCSBlockElements: hex code point range list, one entry per line.
sub InUCSBlockElements {
    return "2580 259F\n";
}
155
# InUCSBopomofo: hex code point ranges, one entry per line.
sub InUCSBopomofo {
    return join "\n", '3100 312F', '31A0 31BF', '';
}
162
# InUCSBoxDrawing: hex code point range list, one entry per line.
sub InUCSBoxDrawing {
    return "2500 257F\n";
}
168
# InUCSBraillePatterns: hex code point range list, one entry per line.
sub InUCSBraillePatterns {
    return "2800 28FF\n";
}
174
# InUCSBuhid: hex code point range list, one entry per line.
sub InUCSBuhid {
    return "1740 175F\n";
}
180
# InUCSByzantineMusicalSymbols: hex code point range list, one entry per line.
sub InUCSByzantineMusicalSymbols {
    return "01D000 01D0FF\n";
}
186
# InUCSCharacterShapingSelectors: hex code point range list, one entry per line.
sub InUCSCharacterShapingSelectors {
    return "206A 206D\n";
}
192
# InUCSCherokee: hex code point range list, one entry per line.
sub InUCSCherokee {
    return "13A0 13FF\n";
}
198
# InUCSCombiningDiacriticalMarks: hex code point range list, one entry per line.
sub InUCSCombiningDiacriticalMarks {
    return "0300 036F\n";
}
204
# InUCSCombiningDiacriticalMarksForSymbols: hex code point range list, one entry per line.
sub InUCSCombiningDiacriticalMarksForSymbols {
    return "20D0 20FF\n";
}
210
# InUCSCombiningHalfMarks: hex code point range list, one entry per line.
sub InUCSCombiningHalfMarks {
    return "FE20 FE2F\n";
}
216
# InUCSControlPictures: hex code point range list, one entry per line.
sub InUCSControlPictures {
    return "2400 243F\n";
}
222
# InUCSCurrencySymbols: hex code point range list, one entry per line.
sub InUCSCurrencySymbols {
    return "20A0 20CF\n";
}
228
# InUCSCypriotSyllabary: hex code point range list, one entry per line.
sub InUCSCypriotSyllabary {
    return "10800 1083F\n";
}
234
# InUCSCyrillic: hex code point range list, one entry per line.
sub InUCSCyrillic {
    return "0400 04FF\n";
}
240
# InUCSCyrillicSupplementary: hex code point range list, one entry per line.
sub InUCSCyrillicSupplementary {
    return "0500 052F\n";
}
246
# InUCSDeseret: hex code point range list, one entry per line.
sub InUCSDeseret {
    return "010400 01044F\n";
}
252
# InUCSDevanagari: hex code points / ranges, one entry per line.
sub InUCSDevanagari {
    return join "\n", '0900 097F', '200C', '200D', '';
}
260
# InUCSDingbats: hex code point range list, one entry per line.
sub InUCSDingbats {
    return "2700 27BF\n";
}
266
# InUCSEnclosedAlphanumerics: hex code point range list, one entry per line.
sub InUCSEnclosedAlphanumerics {
    return "2460 24FF\n";
}
272
# InUCSEnclosedCJKLettersAndMonths: hex code point range list, one entry per line.
sub InUCSEnclosedCJKLettersAndMonths {
    return "3200 32FF\n";
}
278
# InUCSEthiopic: hex code point range list, one entry per line.
sub InUCSEthiopic {
    return "1200 137F\n";
}
284
# InUCSEtruscan: hex code point range list, one entry per line.
sub InUCSEtruscan {
    return "010300 01032F\n";
}
290
# InUCSExtendedMyanmar: hex code point range list, one entry per line.
sub InUCSExtendedMyanmar {
    return "1050 109F\n";
}
296
# InUCSFormatSeparators: hex code point range list, one entry per line.
sub InUCSFormatSeparators {
    return "2028 2029\n";
}
302
# InUCSGeneralFormatCharacters: hex code points / ranges, one entry per line.
sub InUCSGeneralFormatCharacters {
    my @entries = (
        '200B 200D',
        'FEFF',
        '2028 2029',
        '200E 200F',
        '202A 202E',
    );
    return join '', map { "$_\n" } @entries;
}
312
# InUCSGeneralPunctuation: hex code point range list, one entry per line.
sub InUCSGeneralPunctuation {
    return "2000 206F\n";
}
318
# InUCSGeometricShapes: hex code point range list, one entry per line.
sub InUCSGeometricShapes {
    return "25A0 25FF\n";
}
324
# InUCSGeorgianExtended: hex code point range list, one entry per line.
sub InUCSGeorgianExtended {
    return "10A0 10CF\n";
}
330
# InUCSGothic: hex code point range list, one entry per line.
sub InUCSGothic {
    return "010330 01034F\n";
}
336
# InUCSGreekExtended: hex code point range list, one entry per line.
sub InUCSGreekExtended {
    return "1F00 1FFF\n";
}
342
# InUCSGreekSymbolsAndCoptic: hex code point range list, one entry per line.
sub InUCSGreekSymbolsAndCoptic {
    return "03D0 03FF\n";
}
348
# InUCSGujarati: hex code points / ranges, one entry per line.
sub InUCSGujarati {
    return join "\n", '0A80 0AFF', '200C', '200D', '';
}
356
# InUCSGurmukhi: hex code points / ranges, one entry per line.
sub InUCSGurmukhi {
    return join "\n", '0A00 0A7F', '200C', '200D', '';
}
364
# InUCSHalfwidthAndFullwidthForms: hex code point range list, one entry per line.
sub InUCSHalfwidthAndFullwidthForms {
    return "FF00 FFEF\n";
}
370
# InUCSHangulCompatibilityJamo: hex code point range list, one entry per line.
sub InUCSHangulCompatibilityJamo {
    return "3130 318F\n";
}
376
# InUCSHangulFillCharacters: hex code points, one entry per line.
sub InUCSHangulFillCharacters {
    return join "\n", '3164', 'FFA0', '';
}
383
# InUCSHangulJamo: hex code point range list, one entry per line.
sub InUCSHangulJamo {
    return "1100 11FF\n";
}
389
# InUCSHangulSyllables: hex code point range list, one entry per line.
sub InUCSHangulSyllables {
    return "AC00 D7A3\n";
}
395
# InUCSHanunoo: hex code point range list, one entry per line.
sub InUCSHanunoo {
    return "1720 173F\n";
}
401
# InUCSHebrewExtended: hex code point ranges, one entry per line.
sub InUCSHebrewExtended {
    return join "\n", '0590 05CF', '05EB 05FF', '';
}
408
# InUCSHiragana: hex code point range list, one entry per line.
sub InUCSHiragana {
    return "3040 309F\n";
}
414
# InUCSIPAExtensions: hex code point range list, one entry per line.
sub InUCSIPAExtensions {
    return "0250 02AF\n";
}
420
# InUCSIdeographicDescriptionCharacters: hex code point range list, one entry per line.
sub InUCSIdeographicDescriptionCharacters {
    return "2FF0 2FFF\n";
}
426
# InUCSKangxiRadicals: hex code point range list, one entry per line.
sub InUCSKangxiRadicals {
    return "2F00 2FDF\n";
}
432
# InUCSKannada: hex code points / ranges, one entry per line.
sub InUCSKannada {
    return join "\n", '0C80 0CFF', '200C', '200D', '';
}
440
# InUCSKatakana: hex code point range list, one entry per line.
sub InUCSKatakana {
    return "30A0 30FF\n";
}
446
# InUCSKatakanaPhoneticExtensions: hex code point range list, one entry per line.
sub InUCSKatakanaPhoneticExtensions {
    return "31F0 31FF\n";
}
452
# InUCSKhmer: hex code points / ranges, one entry per line.
sub InUCSKhmer {
    return join "\n", '1780 17FF', '200C', '200D', '';
}
460
# InUCSLao: hex code point range list, one entry per line.
sub InUCSLao {
    return "0E80 0EFF\n";
}
466
# InUCSLatin1Supplement: hex code point range list, one entry per line.
sub InUCSLatin1Supplement {
    return "00A0 00FF\n";
}
472
# InUCSLatinExtendedA: hex code point range list, one entry per line.
sub InUCSLatinExtendedA {
    return "0100 017F\n";
}
478
# InUCSLatinExtendedAdditional: hex code point range list, one entry per line.
sub InUCSLatinExtendedAdditional {
    return "1E00 1EFF\n";
}
484
# InUCSLatinExtendedB: hex code point range list, one entry per line.
sub InUCSLatinExtendedB {
    return "0180 024F\n";
}
490
# InUCSLetterlikeSymbols: hex code point range list, one entry per line.
sub InUCSLetterlikeSymbols {
    return "2100 214F\n";
}
496
# InUCSLimbu: hex code point range list, one entry per line.
sub InUCSLimbu {
    return "1900 194F\n";
}
502
# InUCSLinearBIdeograms: hex code point range list, one entry per line.
sub InUCSLinearBIdeograms {
    return "10080 100FF\n";
}
508
# InUCSLinearBSyllabary: hex code point range list, one entry per line.
sub InUCSLinearBSyllabary {
    return "10000 1007F\n";
}
514
# InUCSMalayalam: hex code points / ranges, one entry per line.
sub InUCSMalayalam {
    return join "\n", '0D00 0D7F', '200C', '200D', '';
}
522
# InUCSMathematicalOperators: hex code point range list, one entry per line.
sub InUCSMathematicalOperators {
    return "2200 22FF\n";
}
528
# InUCSMiscellaneousSymbols: hex code point range list, one entry per line.
sub InUCSMiscellaneousSymbols {
    return "2600 26FF\n";
}
534
# InUCSMiscellaneousTechnical: hex code point range list, one entry per line.
sub InUCSMiscellaneousTechnical {
    return "2300 23FF\n";
}
540
# InUCSMiscllaneousMathmaticalSymbols: hex code point range list, one entry
# per line.  (The misspelled sub name is part of the exported interface.)
sub InUCSMiscllaneousMathmaticalSymbols {
    return "2980 29FF\n";
}
546
# InUCSMongolian: hex code point range list, one entry per line.
sub InUCSMongolian {
    return "1800 18AF\n";
}
552
# InUCSNumberForms: hex code point range list, one entry per line.
sub InUCSNumberForms {
    return "2150 218F\n";
}
558
# InUCSNumericShapeSelectors: hex code point range list, one entry per line.
sub InUCSNumericShapeSelectors {
    return "206E 206F\n";
}
564
# InUCSOgham: hex code point range list, one entry per line.
sub InUCSOgham {
    return "1680 169F\n";
}
570
# InUCSOpticalCharacterRecognition: hex code point range list, one entry per line.
sub InUCSOpticalCharacterRecognition {
    return "2440 245F\n";
}
576
# InUCSOriya: hex code points / ranges, one entry per line.
sub InUCSOriya {
    return join "\n", '0B00 0B7F', '200C', '200D', '';
}
584
# InUCSOsmanya: hex code point range list, one entry per line.
sub InUCSOsmanya {
    return "10480 104AF\n";
}
590
# InUCSPart2: hex code point ranges, one entry per line.
sub InUCSPart2 {
    return join "\n", '010000 01FFFD', '020000 02FFFD', '0E0000 0EFFFD', '';
}
598
# InUCSPrivateUseArea: hex code point range list, one entry per line.
sub InUCSPrivateUseArea {
    return "E000 F8FF\n";
}
604
# InUCSPrivateUseGroups: hex code point range list, one entry per line.
#
# The generated table used to list sixteen single code points
# (0030 x7, 0036, 0037, 0046 x7), i.e. the characters '0', '6', '7' and
# 'F'.  Those are exactly the sorted characters of the two hex strings
# "60000000" and "7FFFFFFF", so the range was evidently split into
# characters by the generator instead of being emitted as a range.
# NOTE(review): the range below is reconstructed from that evidence --
# confirm against the generator's source data and fix the generator too,
# since this file is auto-generated.
sub InUCSPrivateUseGroups {
    return "60000000 7FFFFFFF\n";
}
625
# InUCSPrivateUsePlanes: hex code point ranges, one entry per line.
#
# The generated table used to list twenty-four single code points
# (0030 x11, 0031, 0045, 0046 x11), i.e. the characters '0', '1', 'E' and
# 'F'.  Those are exactly the sorted characters of "0F0000", "10FFFF",
# "E00000" and "FFFFFF", so two ranges were evidently split into
# characters by the generator instead of being emitted as ranges.
# NOTE(review): the ranges below are reconstructed from that evidence --
# confirm against the generator's source data and fix the generator too,
# since this file is auto-generated.
sub InUCSPrivateUsePlanes {
    return join "\n", '0F0000 10FFFF', 'E00000 FFFFFF', '';
}
654
# InUCSRunic: hex code point range list, one entry per line.
sub InUCSRunic {
    return "16A0 16FF\n";
}
660
# InUCSScriptSpecificFormatCharacters: hex code points / ranges, one entry per line.
sub InUCSScriptSpecificFormatCharacters {
    my @entries = (
        '3164',
        'FFA0',
        '206A 206D',
        '206E 206F',
        '2FF0 2FFF',
    );
    return join '', map { "$_\n" } @entries;
}
670
# InUCSShavian: hex code point range list, one entry per line.
sub InUCSShavian {
    return "10450 1047F\n";
}
676
# InUCSSinhala: hex code point range list, one entry per line.
sub InUCSSinhala {
    return "0D80 0DFF\n";
}
682
# InUCSSip: hex code point range list, one entry per line.
sub InUCSSip {
    return "020000 02FFFD\n";
}
688
# InUCSSmallFormVariants: hex code point range list, one entry per line.
sub InUCSSmallFormVariants {
    return "FE50 FE6F\n";
}
694
# InUCSSmp: hex code point range list, one entry per line.
sub InUCSSmp {
    return "010000 01FFFD\n";
}
700
# InUCSSpacingModifierLetters: hex code point range list, one entry per line.
sub InUCSSpacingModifierLetters {
    return "02B0 02FF\n";
}
706
# InUCSSpecials: hex code point range list, one entry per line.
sub InUCSSpecials {
    return "FFF0 FFFD\n";
}
712
# InUCSSpp: hex code point range list, one entry per line.
sub InUCSSpp {
    return "0E0000 0EFFFD\n";
}
718
# InUCSSuperscriptsAndSubscripts: hex code point range list, one entry per line.
sub InUCSSuperscriptsAndSubscripts {
    return "2070 209F\n";
}
724
# InUCSSupplementalArrows: hex code point range list, one entry per line.
sub InUCSSupplementalArrows {
    return "2900 297F\n";
}
730
# InUCSSupplementalArrowsC: hex code point range list, one entry per line.
sub InUCSSupplementalArrowsC {
    return "2B00 2B2F\n";
}
736
# InUCSSupplementalCJKCompatibility: hex code point range list, one entry per line.
sub InUCSSupplementalCJKCompatibility {
    return "31C0 31EF\n";
}
742
# InUCSSupplementalHangulA: hex code point range list, one entry per line.
sub InUCSSupplementalHangulA {
    return "3D2E 44B7\n";
}
748
# InUCSSupplementalHangulB: hex code point range list, one entry per line.
sub InUCSSupplementalHangulB {
    return "44BE 4DFF\n";
}
754
# InUCSSupplementalMathmaticalOperators: hex code point range list, one entry
# per line.  (The misspelled sub name is part of the exported interface.)
sub InUCSSupplementalMathmaticalOperators {
    return "2A00 2AFF\n";
}
760
# InUCSSyriac: hex code point range list, one entry per line.
sub InUCSSyriac {
    return "0700 074F\n";
}
766
# InUCSTagalog: hex code point range list, one entry per line.
sub InUCSTagalog {
    return "1700 171F\n";
}
772
# InUCSTagbanwa: hex code point range list, one entry per line.
sub InUCSTagbanwa {
    return "1760 177F\n";
}
778
# InUCSTags: hex code point range list, one entry per line.
sub InUCSTags {
    return "0E0000 0E007F\n";
}
784
# InUCSTaiLe: hex code point range list, one entry per line.
sub InUCSTaiLe {
    return "1950 197F\n";
}
790
# InUCSTamil: hex code points / ranges, one entry per line.
sub InUCSTamil {
    return join "\n", '0B80 0BFF', '200C', '200D', '';
}
798
# InUCSTelugu: hex code points / ranges, one entry per line.
sub InUCSTelugu {
    return join "\n", '0C00 0C7F', '200C', '200D', '';
}
806
# InUCSThaana: hex code point range list, one entry per line.
sub InUCSThaana {
    return "0780 07BF\n";
}
812
# InUCSThai: hex code point range list, one entry per line.
sub InUCSThai {
    return "0E00 0E7F\n";
}
818
# InUCSTibetan: hex code point range list, one entry per line.
sub InUCSTibetan {
    return "0F00 0FFF\n";
}
824
# InUCSUgaritic: hex code point range list, one entry per line.
sub InUCSUgaritic {
    return "10380 1039F\n";
}
830
# InUCSUnicode: hex code point ranges, one entry per line.
sub InUCSUnicode {
    my @ranges = (
        '0000 FDCF',
        'FDF0 FFFD',
        '10000 1FFFD',
        '20000 2FFFD',
        'E0000 EFFFD',
        'F0000 FFFFD',
        '100000 10FFFD',
    );
    return join '', map { "$_\n" } @ranges;
}
842
# InUCSUnifiedCanadianAboriginalSyllabics: hex code point range list, one entry per line.
sub InUCSUnifiedCanadianAboriginalSyllabics {
    return "1400 167F\n";
}
848
# InUCSVariationSelectors: hex code point range list, one entry per line.
sub InUCSVariationSelectors {
    return "FE00 FE0F\n";
}
854
# InUCSVariationSelectorsSupplement: hex code point range list, one entry per line.
sub InUCSVariationSelectorsSupplement {
    return "E0110 E01FF\n";
}
860
# InUCSWesternMusicalSymbols: hex code point range list, one entry per line.
sub InUCSWesternMusicalSymbols {
    return "01D100 01D1FF\n";
}
866
# InUCSYiRadicals: hex code point range list, one entry per line.
sub InUCSYiRadicals {
    return "A490 A4CF\n";
}
872
# InUCSYiSyllables: hex code point range list, one entry per line.
sub InUCSYiSyllables {
    return "A000 A48F\n";
}
878
# InUCSYijingHexagramSymbols: hex code point range list, one entry per line.
sub InUCSYijingHexagramSymbols {
    return "4DC0 4DFF\n";
}
884
# InUCSZeroWidthBoundaryIndicators: hex code points / ranges, one entry per line.
sub InUCSZeroWidthBoundaryIndicators {
    return join "\n", '200B 200D', 'FEFF', '';
}
891
# InUCS_BMP: hex code point ranges, one entry per line.
sub InUCS_BMP {
    return join "\n", '0000 D7FF', 'E000 FFFD', '';
}
898
# InUCS_BMPFirstEdition: hex code points / "START END" ranges, one entry
# per line.
#
# Fix: the entry "0B92 0B25" was a descending (empty/invalid) range; it is
# now "0B92 0B95", the value InUCS_BMPSecondEdition carries at the same
# position.  Since this file is auto-generated, the generator's source data
# needs the same correction.
sub InUCS_BMPFirstEdition {
    return <<'END_OF_RANGES';
0020 007E
00A0 00FF
0100 01F5
01FA 01FF
0200 0217
0250 02A8
02B0 02DE
02E0 02E9
0300 0345
0360 0361
0374 0375
037A
037E
0384 038A
038C
038E 03A1
03A3 03CE
03D0 03D6
03DA
03DC
03DE
03E0
03E2 03F3
0401 040C
040E 044F
0451 045C
045E 0486
0490 04C4
04C7 04C8
04CB 04CC
04D0 04EB
04EE 04F5
04F8 04F9
0531 0556
0559 055F
0561 0587
0589
05B0 05B9
05BB 05C3
05D0 05EA
05F0 05F4
060C
061B
061F
0621 063A
0640 0652
0660 066D
0670 06B7
06BA 06BE
06C0 06CE
06D0 06ED
06F0 06F9
0901 0903
0905 0939
093C 094D
0950 0954
0958 0970
0981 0983
0985 098C
098F 0990
0993 09A8
09AA 09B0
09B2
09B6 09B9
09BC
09BE 09C4
09C7 09C8
09CB 09CD
09D7
09DC 09DD
09DF 09E3
09E6 09FA
0A02
0A05 0A0A
0A0F 0A10
0A13 0A28
0A2A 0A30
0A32 0A33
0A35 0A36
0A38 0A39
0A3C
0A3E 0A42
0A47 0A48
0A4B 0A4D
0A59 0A5C
0A5E
0A66 0A74
0A81 0A83
0A85 0A8B
0A8D
0A8F 0A91
0A93 0AA8
0AAA 0AB0
0AB2 0AB3
0AB5 0AB9
0ABC 0AC5
0AC7 0AC9
0ACB 0ACD
0AD0
0AE0
0AE6 0AEF
0B01 0B03
0B05 0B0C
0B0F 0B10
0B13 0B28
0B2A 0B30
0B32 0B33
0B36 0B39
0B3C 0B43
0B47 0B48
0B4B 0B4D
0B56 0B57
0B5C 0B5D
0B5F 0B61
0B66 0B70
0B82 0B83
0B85 0B8A
0B8E 0B90
0B92 0B95
0B99 0B9A
0B9C
0B9E 0B9F
0BA3 0BA4
0BA8 0BAA
0BAE 0BB5
0BB7 0BB9
0BBE 0BC2
0BC6 0BC8
0BCA 0BCD
0BD7
0BE7 0BF2
0C01 0C03
0C05 0C0C
0C0E 0C10
0C12 0C28
0C2A 0C33
0C35 0C39
0C3E 0C44
0C46 0C48
0C4A 0C4D
0C55 0C56
0C60 0C61
0C66 0C6F
0C82 0C83
0C85 0C8C
0C8E 0C90
0C92 0CA8
0CAA 0CB3
0CB5 0CB9
0CBE 0CC4
0CC6 0CC8
0CCA 0CCD
0CD5 0CD6
0CDE
0CE0 0CE1
0CE6 0CEF
0D02 0D03
0D05 0D0C
0D0E 0D10
0D12 0D28
0D2A 0D39
0D3E 0D43
0D46 0D48
0D4A 0D4D
0D57
0D60 0D61
0D66 0D6F
0E01 0E3A
0E3F 0E5B
0E81 0E82
0E84
0E87 0E88
0E8A
0E8D
0E94 0E97
0E99 0E9F
0EA1 0EA3
0EA5
0EA7
0EAA 0EAB
0EAD 0EB9
0EBB 0EBD
0EC0 0EC4
0EC6
0EC8 0ECD
0ED0 0ED9
0EDC 0EDD
10A0 10C5
10D0 10F6
10FB
1100 1159
115F 11A2
11A8 11F9
1E00 1E9A
1EA0 1EF9
1F00 1F15
1F18 1F1D
1F20 1F45
1F48 1F4D
1F50 1F57
1F59
1F5B
1F5D
1F5F 1F7D
1F80 1FB4
1FB6 1FC4
1FC6 1FD3
1FD6 1FDB
1FDD 1FEF
1FF2 1FF4
1FF6 1FFE
2000 202E
2030 2046
206A 2070
2074 208E
20A0 20AA
20D0 20E1
2100 2138
2153 2182
2190 21EA
2200 22F1
2300
2302 237A
2400 2424
2440 244A
2460 24EA
2500 2595
25A0 25EF
2600 2613
261A 266F
2701 2704
2706 2709
270C 2727
2729 274B
274D
274F 2752
2756
2758 275E
2761 2767
2776 2794
2798 27AF
27B1 27BE
3000 3037
303F
3041 3094
3099 309E
30A1 30FE
3105 312C
3131 318E
3190 319F
3200 321C
3220 3243
3260 327B
327F 32B0
32C0 32CB
32D0 32FE
3300 3376
337B 33DD
33E0 33FE
FB00 FB06
FB13 FB17
FB1E FB36
FB38 FB3C
FB3E
FB40 FB41
FB43 FB44
FB46 FBB1
FBD3 FBFF
FC00 FCFF
FD00 FD3F
FD50 FD8F
FD92 FDC7
FDF0 FDFB
FE20 FE23
FE30 FE44
FE49 FE52
FE54 FE66
FE68 FE6B
FE70 FE72
FE74
FE76 FEFC
FEFF
FF01 FF5E
FF61 FFBE
FFC2 FFC7
FFCA FFCF
FFD2 FFD7
FFDA FFDC
FFE0 FFE6
FFE8 FFEE
FFFD
3400 4DFF
4E00 9FA5
E000 F8FF
F900 FA2D
END_OF_RANGES
}
1198
# InUCS_BMPSecondEdition: hex code points / "START END" ranges, one entry
# per line, returned as a single newline-terminated string.
sub InUCS_BMPSecondEdition {
    my $ranges = <<'END_OF_RANGES';
0020 007E
00A0 00FF
0100 01FF
0200 0233
0250 02AD
02B0 02EE
0300 034E
0360 0362
0374 0375
037A
037E
0384 038A
038C
038E 03A1
03A3 03CE
03D0 03D7
03DA 03F3
0400 0486
0488 0489
048C 04C4
04C7 04C8
04CB 04CC
04D0 04F5
04F8 04F9
0531 0556
0559 055F
0561 0587
0589 058A
0591 05A1
05A3 05B9
05BB 05C4
05D0 05EA
05F0 05F4
060C
061B
061F
0621 063A
0640 0655
0660 066D
0670 06ED
06F0 06FE
0700 070D
070F 072C
0730 074A
0780 07BF
0901 0903
0905 0939
093C 094D
0950 0954
0958 0970
0981 0983
0985 098C
098F 0990
0993 09A8
09AA 09B0
09B2
09B6 09B9
09BC
09BE 09C4
09C7 09C8
09CB 09CD
09D7
09DC 09DD
09DF 09E3
09E6 09FA
0A02
0A05 0A0A
0A0F 0A10
0A13 0A28
0A2A 0A30
0A32 0A33
0A35 0A36
0A38 0A39
0A3C
0A3E 0A42
0A47 0A48
0A4B 0A4D
0A59 0A5C
0A5E
0A66 0A74
0A81 0A83
0A85 0A8B
0A8D
0A8F 0A91
0A93 0AA8
0AAA 0AB0
0AB2 0AB3
0AB5 0AB9
0ABC 0AC5
0AC7 0AC9
0ACB 0ACD
0AD0
0AE0
0AE6 0AEF
0B01 0B03
0B05 0B0C
0B0F 0B10
0B13 0B28
0B2A 0B30
0B32 0B33
0B36 0B39
0B3C 0B43
0B47 0B48
0B4B 0B4D
0B56 0B57
0B5C 0B5D
0B5F 0B61
0B66 0B70
0B82 0B83
0B85 0B8A
0B8E 0B90
0B92 0B95
0B99 0B9A
0B9C
0B9E 0B9F
0BA3 0BA4
0BA8 0BAA
0BAE 0BB5
0BB7 0BB9
0BBE 0BC2
0BC6 0BC8
0BCA 0BCD
0BD7
0BE7 0BF2
0C01 0C03
0C05 0C0C
0C0E 0C10
0C12 0C28
0C2A 0C33
0C35 0C39
0C3E 0C44
0C46 0C48
0C4A 0C4D
0C55 0C56
0C60 0C61
0C66 0C6F
0C82 0C83
0C85 0C8C
0C8E 0C90
0C92 0CA8
0CAA 0CB3
0CB5 0CB9
0CBE 0CC4
0CC6 0CC8
0CCA 0CCD
0CD5 0CD6
0CDE
0CE0 0CE1
0CE6 0CEF
0D02 0D03
0D05 0D0C
0D0E 0D10
0D12 0D28
0D2A 0D39
0D3E 0D43
0D46 0D48
0D4A 0D4D
0D57
0D60 0D61
0D66 0D6F
0D82 0D83
0D85 0D96
0D9A 0DB1
0DB3 0DBB
0DBD
0DC0 0DC6
0DCA
0DCF 0DD4
0DD6
0DD8 0DDF
0DF2 0DF4
0E01 0E3A
0E3F 0E5B
0E81 0E82
0E84
0E87 0E88
0E8A
0E8D
0E94 0E97
0E99 0E9F
0EA1 0EA3
0EA5
0EA7
0EAA 0EAB
0EAD 0EB9
0EBB 0EBD
0EC0 0EC4
0EC6
0EC8 0ECD
0ED0 0ED9
0EDC 0EDD
0F00 0F47
0F49 0F6A
0F71 0F8B
0F90 0F97
0F99 0FBC
0FBE 0FCC
0FCF
1000 1021
1023 1027
1029 102A
102C 1032
1036 1039
1040 1059
10A0 10C5
10D0 10F6
10FB
1100 1159
115F 11A2
11A8 11F9
1220 1226
1228 1246
1248
124A 124D
1250 1256
1258
125A 125D
1260 1286
1288
128A 128D
1290 12AE
12B0
12B2 12B5
12B8 12BE
12C0
12C2 12C5
12C8 12CE
12D0 12D6
12D8 12EE
12F0 12FF
1300 130E
1310
1312 1315
1318 131E
1320 1346
1348 135A
1361 137C
13A0 13F4
1600 1676
1680 169C
16A0 16F0
1780 17DC
17E0 17E9
1800 180E
1810 1819
1820 1877
1880 18A9
1E00 1E9B
1EA0 1EF9
1F00 1F15
1F18 1F1D
1F20 1F45
1F48 1F4D
1F50 1F57
1F59
1F5B
1F5D
1F5F 1F7D
1F80 1FB4
1FB6 1FC4
1FC6 1FD3
1FD6 1FDB
1FDD 1FEF
1FF2 1FF4
1FF6 1FFE
2000 2046
2048 204D
204F
206A 2070
2074 208E
20A0 20AF
20D0 20E3
2100 213A
2153 2183
2190 21F3
2200 22F1
2300 237B
237D 239A
2400 2426
2440 244A
2460 24EA
2500 2595
25A0 25F7
2600 2613
2619 2671
2701 2704
2706 2709
270C 2727
2729 274B
274D
274F 2752
2756
2758 275E
2761 2767
2776 2794
2798 27AF
27B1 27BE
2800 28FF
2E80 2E99
2E9B 2EF3
2F00 2FD5
2FF0 2FFB
3000 303A
303E 303F
3041 3094
3099 309E
30A1 30FE
3105 312C
3131 318E
3190 31B7
3200 321C
3220 3243
3260 327B
327F 32B0
32C0 32CB
32D0 32FE
3300 3376
337B 33DD
33E0 33FE
A400 A48C
A490 A4A1
A4A4 A4B3
A4B5 A4C0
A4C2 A4C4
A4C6
FB00 FB06
FB13 FB17
FB1D FB36
FB38 FB3C
FB3E
FB40 FB41
FB43 FB44
FB46 FBB1
FBD3 FBFF
FC00 FCFF
FD00 FD3F
FD50 FD8F
FD92 FDC7
FDF0 FDFB
FE20 FE23
FE30 FE44
FE49 FE52
FE54 FE66
FE68 FE6B
FE70 FE72
FE74
FE76 FEFC
FEFF
FF01 FF5E
FF61 FFBE
FFC2 FFC7
FFCA FFCF
FFD2 FFD7
FFDA FFDC
FFE0 FFE6
FFE8 FFEE
FFF9 FFFD
1401 15FF
4E00 9FA5
AC00 D7A3
E000 F8FF
F900 FA2D
END_OF_RANGES
    return $ranges;
}
1565
# InUCS_BMP_AMD7: hex code points / "START END" ranges, one entry per line.
#
# Fix: the entry "0B92 0B25" was a descending (empty/invalid) range; it is
# now "0B92 0B95", the value InUCS_BMPSecondEdition carries at the same
# position.  Since this file is auto-generated, the generator's source data
# needs the same correction.
sub InUCS_BMP_AMD7 {
    return <<'END_OF_RANGES';
0020 007E
00A0 00FF
0100 01F5
01FA 01FF
0200 0217
0250 02A8
02B0 02DE
02E0 02E9
0300 0345
0360 0361
0374 0375
037A
037E
0384 038A
038C
038E 03A1
03A3 03CE
03D0 03D6
03DA
03DC
03DE
03E0
03E2 03F3
0401 040C
040E 044F
0451 045C
045E 0486
0490 04C4
04C7 04C8
04CB 04CC
04D0 04EB
04EE 04F5
04F8 04F9
0531 0556
0559 055F
0561 0587
0589
0591 05A1
05A3 05B9
05BB 05C4
05D0 05EA
05F0 05F4
060C
061B
061F
0621 063A
0640 0652
0660 066D
0670 06B7
06BA 06BE
06C0 06CE
06D0 06ED
06F0 06F9
0901 0903
0905 0939
093C 094D
0950 0954
0958 0970
0981 0983
0985 098C
098F 0990
0993 09A8
09AA 09B0
09B2
09B6 09B9
09BC
09BE 09C4
09C7 09C8
09CB 09CD
09D7
09DC 09DD
09DF 09E3
09E6 09FA
0A02
0A05 0A0A
0A0F 0A10
0A13 0A28
0A2A 0A30
0A32 0A33
0A35 0A36
0A38 0A39
0A3C
0A3E 0A42
0A47 0A48
0A4B 0A4D
0A59 0A5C
0A5E
0A66 0A74
0A81 0A83
0A85 0A8B
0A8D
0A8F 0A91
0A93 0AA8
0AAA 0AB0
0AB2 0AB3
0AB5 0AB9
0ABC 0AC5
0AC7 0AC9
0ACB 0ACD
0AD0
0AE0
0AE6 0AEF
0B01 0B03
0B05 0B0C
0B0F 0B10
0B13 0B28
0B2A 0B30
0B32 0B33
0B36 0B39
0B3C 0B43
0B47 0B48
0B4B 0B4D
0B56 0B57
0B5C 0B5D
0B5F 0B61
0B66 0B70
0B82 0B83
0B85 0B8A
0B8E 0B90
0B92 0B95
0B99 0B9A
0B9C
0B9E 0B9F
0BA3 0BA4
0BA8 0BAA
0BAE 0BB5
0BB7 0BB9
0BBE 0BC2
0BC6 0BC8
0BCA 0BCD
0BD7
0BE7 0BF2
0C01 0C03
0C05 0C0C
0C0E 0C10
0C12 0C28
0C2A 0C33
0C35 0C39
0C3E 0C44
0C46 0C48
0C4A 0C4D
0C55 0C56
0C60 0C61
0C66 0C6F
0C82 0C83
0C85 0C8C
0C8E 0C90
0C92 0CA8
0CAA 0CB3
0CB5 0CB9
0CBE 0CC4
0CC6 0CC8
0CCA 0CCD
0CD5 0CD6
0CDE
0CE0 0CE1
0CE6 0CEF
0D02 0D03
0D05 0D0C
0D0E 0D10
0D12 0D28
0D2A 0D39
0D3E 0D43
0D46 0D48
0D4A 0D4D
0D57
0D60 0D61
0D66 0D6F
0E01 0E3A
0E3F 0E5B
0E81 0E82
0E84
0E87 0E88
0E8A
0E8D
0E94 0E97
0E99 0E9F
0EA1 0EA3
0EA5
0EA7
0EAA 0EAB
0EAD 0EB9
0EBB 0EBD
0EC0 0EC4
0EC6
0EC8 0ECD
0ED0 0ED9
0EDC 0EDD
0F00 0F47
0F49 0F69
0F71 0F8B
0F90 0F95
0F97
0F99 0FAD
0FB1 0FB7
0FB9
10A0 10C5
10D0 10F6
10FB
1100 1159
115F 11A2
11A8 11F9
1E00 1E9B
1EA0 1EF9
1F00 1F15
1F18 1F1D
1F20 1F45
1F48 1F4D
1F50 1F57
1F59
1F5B
1F5D
1F5F 1F7D
1F80 1FB4
1FB6 1FC4
1FC6 1FD3
1FD6 1FDB
1FDD 1FEF
1FF2 1FF4
1FF6 1FFE
2000 202E
2030 2046
206A 2070
2074 208E
20A0 20AB
20D0 20E1
2100 2138
2153 2182
2190 21EA
2200 22F1
2300
2302 237A
2400 2424
2440 244A
2460 24EA
2500 2595
25A0 25EF
2600 2613
261A 266F
2701 2704
2706 2709
270C 2727
2729 274B
274D
274F 2752
2756
2758 275E
2761 2767
2776 2794
2798 27AF
27B1 27BE
3000 3037
303F
3041 3094
3099 309E
30A1 30FE
3105 312C
3131 318E
3190 319F
3200 321C
3220 3243
3260 327B
327F 32B0
32C0 32CB
32D0 32FE
3300 3376
337B 33DD
33E0 33FE
FB00 FB06
FB13 FB17
FB1E FB36
FB38 FB3C
FB3E
FB40 FB41
FB43 FB44
FB46 FBB1
FBD3 FBFF
FC00 FCFF
FD00 FD3F
FD50 FD8F
FD92 FDC7
FDF0 FDFB
FE20 FE23
FE30 FE44
FE49 FE52
FE54 FE66
FE68 FE6B
FE70 FE72
FE74
FE76 FEFC
FEFF
FF01 FF5E
FF61 FFBE
FFC2 FFC7
FFCA FFCF
FFD2 FFD7
FFDA FFDC
FFE0 FFE6
FFE8 FFEE
FFFD
4E00 9FA5
AC00 D7A3
E000 F8FF
F900 FA2D
END_OF_RANGES
}
1874
# InUCS_CJKCompatibility: hex code point range list, one entry per line.
sub InUCS_CJKCompatibility {
    return "3300 33FF\n";
}
1880
# InUCS_CJKCompatibilityForms: hex code point range list, one entry per line.
sub InUCS_CJKCompatibilityForms {
    return "FE30 FE4F\n";
}
1886
# InUCS_CJKCompatibilityIdeographs: hex code point range list, one entry per line.
sub InUCS_CJKCompatibilityIdeographs {
    return "F900 FAFF\n";
}
1892
# InUCS_CJKCompatibilityIdeographsSupplement: hex code point range list, one entry per line.
sub InUCS_CJKCompatibilityIdeographsSupplement {
    return "02F800 02FA1F\n";
}
1898
# InUCS_CJKMiscellaneous: hex code point range list, one entry per line.
sub InUCS_CJKMiscellaneous {
    return "3190 319F\n";
}
1904
# InUCS_CJKRadicalsSupplement: hex code point range list, one entry per line.
sub InUCS_CJKRadicalsSupplement {
    return "2E80 2EFF\n";
}
1910
# InUCS_CJKSymbolsAndPunctuation: hex code point range list, one entry per line.
sub InUCS_CJKSymbolsAndPunctuation {
    return "3000 303F\n";
}
1916
# InUCS_CJKUnifiedIdeographs: hex code point range list, one entry per line.
sub InUCS_CJKUnifiedIdeographs {
    return "4E00 9FFF\n";
}
1922
# InUCS_CJKUnifiedIdeographsAll: hex code points / ranges, one entry per line.
sub InUCS_CJKUnifiedIdeographsAll {
    my @entries = (
        '3400 4DBF',
        '4E00 9FFF',
        'FA0E FA0F',
        'FA11',
        'FA14 FA14',
        'FA1F',
        'FA21',
        'FA23 FA24',
        'FA27 FA29',
        '20000 2A6DF',
    );
    return join '', map { "$_\n" } @entries;
}
1937
# InUCS_CJKUnifiedIdeographsExtensionA: hex code point range list, one entry per line.
sub InUCS_CJKUnifiedIdeographsExtensionA {
    return "3400 4DBF\n";
}
1943
# InUCS_CJKUnifiedIdeographsExtensionB: hex code point range list, one entry per line.
sub InUCS_CJKUnifiedIdeographsExtensionB {
    return "020000 02A71F\n";
}
1949
# InUCS_MES1: hex code points / "START END" ranges, one entry per line,
# returned as a single newline-terminated string.
sub InUCS_MES1 {
    my $ranges = <<'END_OF_RANGES';
0020 007E
00A0 00FF
0100 0113
0116 012B
012E 014D
0150 017E
02C7
02D8 02DB
02DD
2015
2018 2019
201C 201D
20AC
2122
2126
215B 215E
2190 2193
266A
END_OF_RANGES
    return $ranges;
}
1972
# InUCS_MES2: hex code points / "START END" ranges, one entry per line,
# returned as a single newline-terminated string.
sub InUCS_MES2 {
    my $ranges = <<'END_OF_RANGES';
0020 007E
00A0 00FF
0100 017F
018F
0192
01B7
01DE 01EF
01FA 01FF
0218 021B
021E 021F
0259
027C
0292
02BB 02BD
02C6 02C7
02C9
02D8 02DD
02EE
0374 0375
037A
037E
0384 038A
038C
038E 03A1
03A3 03CE
03D7
03DA 03E1
0400 045F
0490 04C4
04C7 04C8
04CB 04CC
04D0 04EB
04EE 04F5
04F8 04F9
1E02 1E03
1E0A 1E0B
1E1E 1E1F
1E40 1E41
1E56 1E57
1E60 1E61
1E6A 1E6B
1E80 1E85
1E9B
1EF2 1EF3
1F00 1F15
1F18 1F1D
1F20 1F45
1F48 1F4D
1F50 1F57
1F59
1F5B
1F5D
1F5F 1F7D
1F80 1FB4
1FB6 1FC4
1FC6 1FD3
1FD6 1FDB
1FDD 1FEF
1FF2 1FF4
1FF6 1FFE
2013 2015
2017 201E
2020 2022
2026
2030
2032 2033
2039 203A
203C
203E
2044
204A
207F
2082
20A3 20A4
20A7
20AC
20AF
2105
2116
2122
2126
215B 215E
2190 2195
21A8
2200
2202 2203
2206
2208 2209
220F
2211 2212
2219 221A
221E 221F
2227 222B
2248
2259
2260 2261
2264 2265
2282 2283
2295
2297
2302
2310
2320 2321
2329 232A
2500
2502
250C
2510
2514
2518
251C
2524
252C
2534
253C
2550 256C
2580
2584
2588
258C
2590 2593
25A0
25AC
25B2
25BA
25BC
25C4
25CA 25CB
25D8 25D9
263A 263C
2640
2642
2660
2663
2665 2666
266A 266B
FB01 FB02
FFFD
END_OF_RANGES
    return $ranges;
}
2115
## User-defined character property, usable in a regex as \p{InUCS_MES3A}.
## Returns a fixed list as a string, one "START END" pair of hexadecimal code
## points per line.  The list runs from U+0020 to U+FFFD.
## The numeric alias InUCS283 is bound to this sub later in this file.
## NOTE(review): "MES3A" presumably stands for Multilingual European
## Subset 3A -- confirm against the generator's source data.
2116 sub InUCS_MES3A {
2117 <<EOH;
2118 0020 007E
2119 00A0 00FF
2120 0100 017F
2121 0180 024F
2122 0250 02AF
2123 02B0 02FF
2124 0300 036F
2125 0370 03CF
2126 03D0 03FF
2127 0400 04FF
2128 0530 058F
2129 10D0 10FF
2130 1E00 1EFF
2131 1F00 1FFF
2132 2000 206F
2133 2070 209F
2134 20A0 20CF
2135 20D0 20FF
2136 2100 214F
2137 2150 218F
2138 2190 21FF
2139 2200 22FF
2140 2300 23FF
2141 2440 245F
2142 2500 257F
2143 2580 259F
2144 25A0 25FF
2145 2600 26FF
2146 FB00 FB4F
2147 FE20 FE2F
2148 FFF0 FFFD
2149 EOH
2150 }
2151
## User-defined character property, usable in a regex as \p{InUCS_MES3B}.
## Returns a fixed list as a string; each line is either a single hexadecimal
## code point or a "START END" pair.  The list runs from U+0020 to U+FFFD.
## The numeric alias InUCS284 is bound to this sub later in this file.
## NOTE(review): "MES3B" presumably stands for Multilingual European
## Subset 3B -- confirm against the generator's source data.
2152 sub InUCS_MES3B {
2153 <<EOH;
2154 0020 007E
2155 00A0 00FF
2156 0100 01FF
2157 0200 021F
2158 0222 0233
2159 0250 02AD
2160 02B0 02EE
2161 0300 034E
2162 0360 0362
2163 0374 0375
2164 037A
2165 037E
2166 0384 038A
2167 038C
2168 038E 03A1
2169 03A3 03CE
2170 03D0 03D7
2171 03DA 03F3
2172 0400 0486
2173 0488 0489
2174 048C 04C4
2175 04C7 04C8
2176 04CB 04CC
2177 04D0 04F5
2178 04F8 04F9
2179 0531 0556
2180 0559 055F
2181 0561 0587
2182 0589 058A
2183 10D0 10F6
2184 10FB
2185 1E00 1E9B
2186 1EA0 1EF9
2187 1F00 1F15
2188 1F18 1F1D
2189 1F20 1F45
2190 1F48 1F4D
2191 1F50 1F57
2192 1F59
2193 1F5B
2194 1F5D
2195 1F5F 1F7D
2196 1F80 1FB4
2197 1FB6 1FC4
2198 1FC6 1FD3
2199 1FD6 1FDB
2200 1FDD 1FEF
2201 1FF2 1FF4
2202 1FF6 1FFE
2203 2000 2046
2204 2048 204D
2205 206A 2070
2206 2074 208E
2207 20A0 20AF
2208 20D0 20E3
2209 2100 213A
2210 2153 2183
2211 2190 21F3
2212 2200 22F1
2213 2300 237B
2214 237D 239A
2215 2440 244A
2216 2500 2595
2217 25A0 25F7
2218 2600 2613
2219 2619 2671
2220 FB00 FB06
2221 FB13 FB17
2222 FE20 FE23
2223 FFF9 FFFD
2224 EOH
2225 }
2226
## Numeric aliases.  Each statement assigns the code reference of a named
## property sub to the glob InUCS<number>, so the numeric name and the
## descriptive name return the same range list.  The statements are ordered
## by the string form of the number (1, 10, 100, 1000, ...), not numerically.
## NOTE(review): the numbers are presumably ISO/IEC 10646 collection numbers
## (the POD below is headed COLLECTION NAMES) -- confirm against the
## generator's source data.
2227 *InUCS1 = \&InUCSBasicLatin;
2228
2229 *InUCS10 = \&InUCSCyrillic;
2230
2231 *InUCS100 = \&InUCSKatakanaPhoneticExtensions;
2232
2233 *InUCS1000 = \&InUCSSmp;
2234
2235 *InUCS1001 = \&InUCSEtruscan;
2236
2237 *InUCS1002 = \&InUCSGothic;
2238
2239 *InUCS1003 = \&InUCSDeseret;
2240
2241 *InUCS1004 = \&InUCSByzantineMusicalSymbols;
2242
2243 *InUCS1005 = \&InUCSWesternMusicalSymbols;
2244
2245 *InUCS1007 = \&InUCSLinearBSyllabary;
2246
2247 *InUCS1008 = \&InUCSLinearBIdeograms;
2248
2249 *InUCS1009 = \&InUCSAeganNumbers;
2250
2251 *InUCS101 = \&InUCSVariationSelectors;
2252
2253 *InUCS1010 = \&InUCSUgaritic;
2254
2255 *InUCS1011 = \&InUCSShavian;
2256
2257 *InUCS1012 = \&InUCSOsmanya;
2258
2259 *InUCS1013 = \&InUCSCypriotSyllabary;
2260
2261 *InUCS104 = \&InUCSLimbu;
2262
2263 *InUCS105 = \&InUCSTaiLe;
2264
2265 *InUCS106 = \&InUCSSupplementalArrowsC;
2266
2267 *InUCS10646 = \&InUCSUnicode;
2268
2269 *InUCS107 = \&InUCSSupplementalCJKCompatibility;
2270
2271 *InUCS108 = \&InUCSYijingHexagramSymbols;
2272
2273 *InUCS11 = \&InUCSArmenian;
2274
2275 *InUCS12 = \&InUCSBasicHebrew;
2276
2277 *InUCS13 = \&InUCSHebrewExtended;
2278
2279 *InUCS14 = \&InUCSBasicArabic;
2280
2281 *InUCS15 = \&InUCSArabicExtended;
2282
2283 *InUCS16 = \&InUCSDevanagari;
2284
2285 *InUCS17 = \&InUCSBengali;
2286
2287 *InUCS18 = \&InUCSGurmukhi;
2288
2289 *InUCS180 = \&InUCS_CJKUnifiedIdeographsAll;
2290
2291 *InUCS19 = \&InUCSGujarati;
2292
2293 *InUCS2 = \&InUCSLatin1Supplement;
2294
2295 *InUCS20 = \&InUCSOriya;
2296
2297 *InUCS200 = \&InUCSZeroWidthBoundaryIndicators;
2298
2299 *InUCS2000 = \&InUCSSip;
2300
2301 *InUCS2001 = \&InUCS_CJKUnifiedIdeographsExtensionB;
2302
2303 *InUCS2002 = \&InUCS_CJKCompatibilityIdeographsSupplement;
2304
2305 *InUCS201 = \&InUCSFormatSeparators;
2306
2307 *InUCS202 = \&InUCSBiDirectionalFormatMarks;
2308
2309 *InUCS203 = \&InUCSBiDirectionalFormatEmbeddings;
2310
2311 *InUCS204 = \&InUCSHangulFillCharacters;
2312
2313 *InUCS205 = \&InUCSCharacterShapingSelectors;
2314
2315 *InUCS206 = \&InUCSNumericShapeSelectors;
2316
2317 *InUCS207 = \&InUCSIdeographicDescriptionCharacters;
2318
2319 *InUCS21 = \&InUCSTamil;
2320
2321 *InUCS22 = \&InUCSTelugu;
2322
2323 *InUCS23 = \&InUCSKannada;
2324
2325 *InUCS24 = \&InUCSMalayalam;
2326
2327 *InUCS25 = \&InUCSThai;
2328
2329 *InUCS250 = \&InUCSGeneralFormatCharacters;
2330
2331 *InUCS251 = \&InUCSScriptSpecificFormatCharacters;
2332
2333 *InUCS26 = \&InUCSLao;
2334
2335 *InUCS27 = \&InUCSBasicGeorgian;
2336
2337 *InUCS28 = \&InUCSGeorgianExtended;
2338
2339 *InUCS281 = \&InUCS_MES1;
2340
2341 *InUCS282 = \&InUCS_MES2;
2342
2343 *InUCS283 = \&InUCS_MES3A;
2344
2345 *InUCS284 = \&InUCS_MES3B;
2346
2347 *InUCS29 = \&InUCSHangulJamo;
2348
2349 *InUCS299 = \&InUCS_BMPFirstEdition;
2350
2351 *InUCS3 = \&InUCSLatinExtendedA;
2352
2353 *InUCS30 = \&InUCSLatinExtendedAdditional;
2354
2355 *InUCS300 = \&InUCS_BMP;
2356
2357 *InUCS3000 = \&InUCSSpp;
2358
2359 *InUCS3001 = \&InUCSTags;
2360
2361 *InUCS3002 = \&InUCSVariationSelectorsSupplement;
2362
2363 *InUCS301 = \&InUCS_BMP_AMD7;
2364
2365 *InUCS302 = \&InUCS_BMPSecondEdition;
2366
2367 *InUCS31 = \&InUCSGreekExtended;
2368
2369 *InUCS32 = \&InUCSGeneralPunctuation;
2370
2371 *InUCS33 = \&InUCSSuperscriptsAndSubscripts;
2372
2373 *InUCS34 = \&InUCSCurrencySymbols;
2374
2375 *InUCS35 = \&InUCSCombiningDiacriticalMarksForSymbols;
2376
2377 *InUCS36 = \&InUCSLetterlikeSymbols;
2378
2379 *InUCS37 = \&InUCSNumberForms;
2380
2381 *InUCS38 = \&InUCSArrows;
2382
2383 *InUCS39 = \&InUCSMathematicalOperators;
2384
2385 *InUCS4 = \&InUCSLatinExtendedB;
2386
2387 *InUCS40 = \&InUCSMiscellaneousTechnical;
2388
2389 *InUCS4000 = \&InUCSPart2;
2390
2391 *InUCS41 = \&InUCSControlPictures;
2392
2393 *InUCS42 = \&InUCSOpticalCharacterRecognition;
2394
2395 *InUCS43 = \&InUCSEnclosedAlphanumerics;
2396
2397 *InUCS44 = \&InUCSBoxDrawing;
2398
2399 *InUCS45 = \&InUCSBlockElements;
2400
2401 *InUCS46 = \&InUCSGeometricShapes;
2402
2403 *InUCS47 = \&InUCSMiscellaneousSymbols;
2404
2405 *InUCS48 = \&InUCSDingbats;
2406
2407 *InUCS49 = \&InUCS_CJKSymbolsAndPunctuation;
2408
2409 *InUCS5 = \&InUCSIPAExtensions;
2410
2411 *InUCS50 = \&InUCSHiragana;
2412
2413 *InUCS500 = \&InUCSPrivateUseGroups;
2414
2415 *InUCS51 = \&InUCSKatakana;
2416
2417 *InUCS52 = \&InUCSBopomofo;
2418
2419 *InUCS53 = \&InUCSHangulCompatibilityJamo;
2420
2421 *InUCS54 = \&InUCS_CJKMiscellaneous;
2422
2423 *InUCS55 = \&InUCSEnclosedCJKLettersAndMonths;
2424
2425 *InUCS56 = \&InUCS_CJKCompatibility;
2426
2427 *InUCS57 = \&InUCSBasicHangul;
2428
## NOTE(review): InUCSSupplementalHangulA is listed in the POD below but has
## no numeric alias in this section, while 58 points at ...HangulB and there
## is no InUCS59 -- confirm the numbering in the generator's source data.
2429 *InUCS58 = \&InUCSSupplementalHangulB;
2430
2431 *InUCS6 = \&InUCSSpacingModifierLetters;
2432
2433 *InUCS60 = \&InUCS_CJKUnifiedIdeographs;
2434
2435 *InUCS61 = \&InUCSPrivateUseArea;
2436
2437 *InUCS62 = \&InUCS_CJKCompatibilityIdeographs;
2438
2439 *InUCS63 = \&InUCSAlphabeticPresentationForms;
2440
2441 *InUCS64 = \&InUCSArabicPresentationFormsA;
2442
2443 *InUCS65 = \&InUCSCombiningHalfMarks;
2444
2445 *InUCS66 = \&InUCS_CJKCompatibilityForms;
2446
2447 *InUCS67 = \&InUCSSmallFormVariants;
2448
2449 *InUCS68 = \&InUCSArabicPresentationFormsB;
2450
2451 *InUCS69 = \&InUCSHalfwidthAndFullwidthForms;
2452
2453 *InUCS7 = \&InUCSCombiningDiacriticalMarks;
2454
2455 *InUCS70 = \&InUCSSpecials;
2456
2457 *InUCS71 = \&InUCSHangulSyllables;
2458
2459 *InUCS72 = \&InUCSBasicTibetan;
2460
2461 *InUCS73 = \&InUCSEthiopic;
2462
2463 *InUCS74 = \&InUCSUnifiedCanadianAboriginalSyllabics;
2464
2465 *InUCS75 = \&InUCSCherokee;
2466
2467 *InUCS76 = \&InUCSYiSyllables;
2468
2469 *InUCS77 = \&InUCSYiRadicals;
2470
2471 *InUCS78 = \&InUCSKangxiRadicals;
2472
2473 *InUCS79 = \&InUCS_CJKRadicalsSupplement;
2474
2475 *InUCS8 = \&InUCSBasicGreek;
2476
2477 *InUCS80 = \&InUCSBraillePatterns;
2478
2479 *InUCS81 = \&InUCS_CJKUnifiedIdeographsExtensionA;
2480
2481 *InUCS82 = \&InUCSOgham;
2482
2483 *InUCS83 = \&InUCSRunic;
2484
2485 *InUCS84 = \&InUCSSinhala;
2486
2487 *InUCS85 = \&InUCSSyriac;
2488
2489 *InUCS86 = \&InUCSThaana;
2490
2491 *InUCS87 = \&InUCSBasicMyanmar;
2492
2493 *InUCS88 = \&InUCSKhmer;
2494
2495 *InUCS89 = \&InUCSMongolian;
2496
2497 *InUCS9 = \&InUCSGreekSymbolsAndCoptic;
2498
2499 *InUCS90 = \&InUCSExtendedMyanmar;
2500
2501 *InUCS91 = \&InUCSTibetan;
2502
2503 *InUCS92 = \&InUCSCyrillicSupplementary;
2504
2505 *InUCS93 = \&InUCSTagalog;
2506
2507 *InUCS94 = \&InUCSHanunoo;
2508
2509 *InUCS95 = \&InUCSBuhid;
2510
2511 *InUCS96 = \&InUCSTagbanwa;
2512
2513 *InUCS97 = \&InUCSSupplementalArrows;
2514
2515 *InUCS98 = \&InUCSMiscllaneousMathmaticalSymbols;
2516
2517 *InUCS99 = \&InUCSSupplementalMathmaticalOperators;
2518
2519 =head1 COLLECTION NAMES
2520
2521 =over 4
2522
2523 =item C<InUCS1>
2524
2525 An alias for InUCSBasicLatin.
2526
2527 =item C<InUCS10>
2528
2529 An alias for InUCSCyrillic.
2530
2531 =item C<InUCS100>
2532
2533 An alias for InUCSKatakanaPhoneticExtensions.
2534
2535 =item C<InUCS1000>
2536
2537 An alias for InUCSSmp.
2538
2539 =item C<InUCS1001>
2540
2541 An alias for InUCSEtruscan.
2542
2543 =item C<InUCS1002>
2544
2545 An alias for InUCSGothic.
2546
2547 =item C<InUCS1003>
2548
2549 An alias for InUCSDeseret.
2550
2551 =item C<InUCS1004>
2552
2553 An alias for InUCSByzantineMusicalSymbols.
2554
2555 =item C<InUCS1005>
2556
2557 An alias for InUCSWesternMusicalSymbols.
2558
2559 =item C<InUCS1007>
2560
2561 An alias for InUCSLinearBSyllabary.
2562
2563 =item C<InUCS1008>
2564
2565 An alias for InUCSLinearBIdeograms.
2566
2567 =item C<InUCS1009>
2568
2569 An alias for InUCSAeganNumbers.
2570
2571 =item C<InUCS101>
2572
2573 An alias for InUCSVariationSelectors.
2574
2575 =item C<InUCS1010>
2576
2577 An alias for InUCSUgaritic.
2578
2579 =item C<InUCS1011>
2580
2581 An alias for InUCSShavian.
2582
2583 =item C<InUCS1012>
2584
2585 An alias for InUCSOsmanya.
2586
2587 =item C<InUCS1013>
2588
2589 An alias for InUCSCypriotSyllabary.
2590
2591 =item C<InUCS104>
2592
2593 An alias for InUCSLimbu.
2594
2595 =item C<InUCS105>
2596
2597 An alias for InUCSTaiLe.
2598
2599 =item C<InUCS106>
2600
2601 An alias for InUCSSupplementalArrowsC.
2602
2603 =item C<InUCS10646>
2604
2605 An alias for InUCSUnicode.
2606
2607 =item C<InUCS107>
2608
2609 An alias for InUCSSupplementalCJKCompatibility.
2610
2611 =item C<InUCS108>
2612
2613 An alias for InUCSYijingHexagramSymbols.
2614
2615 =item C<InUCS11>
2616
2617 An alias for InUCSArmenian.
2618
2619 =item C<InUCS12>
2620
2621 An alias for InUCSBasicHebrew.
2622
2623 =item C<InUCS13>
2624
2625 An alias for InUCSHebrewExtended.
2626
2627 =item C<InUCS14>
2628
2629 An alias for InUCSBasicArabic.
2630
2631 =item C<InUCS15>
2632
2633 An alias for InUCSArabicExtended.
2634
2635 =item C<InUCS16>
2636
2637 An alias for InUCSDevanagari.
2638
2639 =item C<InUCS17>
2640
2641 An alias for InUCSBengali.
2642
2643 =item C<InUCS18>
2644
2645 An alias for InUCSGurmukhi.
2646
2647 =item C<InUCS180>
2648
2649 An alias for InUCS_CJKUnifiedIdeographsAll.
2650
2651 =item C<InUCS19>
2652
2653 An alias for InUCSGujarati.
2654
2655 =item C<InUCS2>
2656
2657 An alias for InUCSLatin1Supplement.
2658
2659 =item C<InUCS20>
2660
2661 An alias for InUCSOriya.
2662
2663 =item C<InUCS200>
2664
2665 An alias for InUCSZeroWidthBoundaryIndicators.
2666
2667 =item C<InUCS2000>
2668
2669 An alias for InUCSSip.
2670
2671 =item C<InUCS2001>
2672
2673 An alias for InUCS_CJKUnifiedIdeographsExtensionB.
2674
2675 =item C<InUCS2002>
2676
2677 An alias for InUCS_CJKCompatibilityIdeographsSupplement.
2678
2679 =item C<InUCS201>
2680
2681 An alias for InUCSFormatSeparators.
2682
2683 =item C<InUCS202>
2684
2685 An alias for InUCSBiDirectionalFormatMarks.
2686
2687 =item C<InUCS203>
2688
2689 An alias for InUCSBiDirectionalFormatEmbeddings.
2690
2691 =item C<InUCS204>
2692
2693 An alias for InUCSHangulFillCharacters.
2694
2695 =item C<InUCS205>
2696
2697 An alias for InUCSCharacterShapingSelectors.
2698
2699 =item C<InUCS206>
2700
2701 An alias for InUCSNumericShapeSelectors.
2702
2703 =item C<InUCS207>
2704
2705 An alias for InUCSIdeographicDescriptionCharacters.
2706
2707 =item C<InUCS21>
2708
2709 An alias for InUCSTamil.
2710
2711 =item C<InUCS22>
2712
2713 An alias for InUCSTelugu.
2714
2715 =item C<InUCS23>
2716
2717 An alias for InUCSKannada.
2718
2719 =item C<InUCS24>
2720
2721 An alias for InUCSMalayalam.
2722
2723 =item C<InUCS25>
2724
2725 An alias for InUCSThai.
2726
2727 =item C<InUCS250>
2728
2729 An alias for InUCSGeneralFormatCharacters.
2730
2731 =item C<InUCS251>
2732
2733 An alias for InUCSScriptSpecificFormatCharacters.
2734
2735 =item C<InUCS26>
2736
2737 An alias for InUCSLao.
2738
2739 =item C<InUCS27>
2740
2741 An alias for InUCSBasicGeorgian.
2742
2743 =item C<InUCS28>
2744
2745 An alias for InUCSGeorgianExtended.
2746
2747 =item C<InUCS281>
2748
2749 An alias for InUCS_MES1.
2750
2751 =item C<InUCS282>
2752
2753 An alias for InUCS_MES2.
2754
2755 =item C<InUCS283>
2756
2757 An alias for InUCS_MES3A.
2758
2759 =item C<InUCS284>
2760
2761 An alias for InUCS_MES3B.
2762
2763 =item C<InUCS29>
2764
2765 An alias for InUCSHangulJamo.
2766
2767 =item C<InUCS299>
2768
2769 An alias for InUCS_BMPFirstEdition.
2770
2771 =item C<InUCS3>
2772
2773 An alias for InUCSLatinExtendedA.
2774
2775 =item C<InUCS30>
2776
2777 An alias for InUCSLatinExtendedAdditional.
2778
2779 =item C<InUCS300>
2780
2781 An alias for InUCS_BMP.
2782
2783 =item C<InUCS3000>
2784
2785 An alias for InUCSSpp.
2786
2787 =item C<InUCS3001>
2788
2789 An alias for InUCSTags.
2790
2791 =item C<InUCS3002>
2792
2793 An alias for InUCSVariationSelectorsSupplement.
2794
2795 =item C<InUCS301>
2796
2797 An alias for InUCS_BMP_AMD7.
2798
2799 =item C<InUCS302>
2800
2801 An alias for InUCS_BMPSecondEdition.
2802
2803 =item C<InUCS31>
2804
2805 An alias for InUCSGreekExtended.
2806
2807 =item C<InUCS32>
2808
2809 An alias for InUCSGeneralPunctuation.
2810
2811 =item C<InUCS33>
2812
2813 An alias for InUCSSuperscriptsAndSubscripts.
2814
2815 =item C<InUCS34>
2816
2817 An alias for InUCSCurrencySymbols.
2818
2819 =item C<InUCS35>
2820
2821 An alias for InUCSCombiningDiacriticalMarksForSymbols.
2822
2823 =item C<InUCS36>
2824
2825 An alias for InUCSLetterlikeSymbols.
2826
2827 =item C<InUCS37>
2828
2829 An alias for InUCSNumberForms.
2830
2831 =item C<InUCS38>
2832
2833 An alias for InUCSArrows.
2834
2835 =item C<InUCS39>
2836
2837 An alias for InUCSMathematicalOperators.
2838
2839 =item C<InUCS4>
2840
2841 An alias for InUCSLatinExtendedB.
2842
2843 =item C<InUCS40>
2844
2845 An alias for InUCSMiscellaneousTechnical.
2846
2847 =item C<InUCS4000>
2848
2849 An alias for InUCSPart2.
2850
2851 =item C<InUCS41>
2852
2853 An alias for InUCSControlPictures.
2854
2855 =item C<InUCS42>
2856
2857 An alias for InUCSOpticalCharacterRecognition.
2858
2859 =item C<InUCS43>
2860
2861 An alias for InUCSEnclosedAlphanumerics.
2862
2863 =item C<InUCS44>
2864
2865 An alias for InUCSBoxDrawing.
2866
2867 =item C<InUCS45>
2868
2869 An alias for InUCSBlockElements.
2870
2871 =item C<InUCS46>
2872
2873 An alias for InUCSGeometricShapes.
2874
2875 =item C<InUCS47>
2876
2877 An alias for InUCSMiscellaneousSymbols.
2878
2879 =item C<InUCS48>
2880
2881 An alias for InUCSDingbats.
2882
2883 =item C<InUCS49>
2884
2885 An alias for InUCS_CJKSymbolsAndPunctuation.
2886
2887 =item C<InUCS5>
2888
2889 An alias for InUCSIPAExtensions.
2890
2891 =item C<InUCS50>
2892
2893 An alias for InUCSHiragana.
2894
2895 =item C<InUCS500>
2896
2897 An alias for InUCSPrivateUseGroups.
2898
2899 =item C<InUCS51>
2900
2901 An alias for InUCSKatakana.
2902
2903 =item C<InUCS52>
2904
2905 An alias for InUCSBopomofo.
2906
2907 =item C<InUCS53>
2908
2909 An alias for InUCSHangulCompatibilityJamo.
2910
2911 =item C<InUCS54>
2912
2913 An alias for InUCS_CJKMiscellaneous.
2914
2915 =item C<InUCS55>
2916
2917 An alias for InUCSEnclosedCJKLettersAndMonths.
2918
2919 =item C<InUCS56>
2920
2921 An alias for InUCS_CJKCompatibility.
2922
2923 =item C<InUCS57>
2924
2925 An alias for InUCSBasicHangul.
2926
2927 =item C<InUCS58>
2928
2929 An alias for InUCSSupplementalHangulB.
2930
2931 =item C<InUCS6>
2932
2933 An alias for InUCSSpacingModifierLetters.
2934
2935 =item C<InUCS60>
2936
2937 An alias for InUCS_CJKUnifiedIdeographs.
2938
2939 =item C<InUCS61>
2940
2941 An alias for InUCSPrivateUseArea.
2942
2943 =item C<InUCS62>
2944
2945 An alias for InUCS_CJKCompatibilityIdeographs.
2946
2947 =item C<InUCS63>
2948
2949 An alias for InUCSAlphabeticPresentationForms.
2950
2951 =item C<InUCS64>
2952
2953 An alias for InUCSArabicPresentationFormsA.
2954
2955 =item C<InUCS65>
2956
2957 An alias for InUCSCombiningHalfMarks.
2958
2959 =item C<InUCS66>
2960
2961 An alias for InUCS_CJKCompatibilityForms.
2962
2963 =item C<InUCS67>
2964
2965 An alias for InUCSSmallFormVariants.
2966
2967 =item C<InUCS68>
2968
2969 An alias for InUCSArabicPresentationFormsB.
2970
2971 =item C<InUCS69>
2972
2973 An alias for InUCSHalfwidthAndFullwidthForms.
2974
2975 =item C<InUCS7>
2976
2977 An alias for InUCSCombiningDiacriticalMarks.
2978
2979 =item C<InUCS70>
2980
2981 An alias for InUCSSpecials.
2982
2983 =item C<InUCS71>
2984
2985 An alias for InUCSHangulSyllables.
2986
2987 =item C<InUCS72>
2988
2989 An alias for InUCSBasicTibetan.
2990
2991 =item C<InUCS73>
2992
2993 An alias for InUCSEthiopic.
2994
2995 =item C<InUCS74>
2996
2997 An alias for InUCSUnifiedCanadianAboriginalSyllabics.
2998
2999 =item C<InUCS75>
3000
3001 An alias for InUCSCherokee.
3002
3003 =item C<InUCS76>
3004
3005 An alias for InUCSYiSyllables.
3006
3007 =item C<InUCS77>
3008
3009 An alias for InUCSYiRadicals.
3010
3011 =item C<InUCS78>
3012
3013 An alias for InUCSKangxiRadicals.
3014
3015 =item C<InUCS79>
3016
3017 An alias for InUCS_CJKRadicalsSupplement.
3018
3019 =item C<InUCS8>
3020
3021 An alias for InUCSBasicGreek.
3022
3023 =item C<InUCS80>
3024
3025 An alias for InUCSBraillePatterns.
3026
3027 =item C<InUCS81>
3028
3029 An alias for InUCS_CJKUnifiedIdeographsExtensionA.
3030
3031 =item C<InUCS82>
3032
3033 An alias for InUCSOgham.
3034
3035 =item C<InUCS83>
3036
3037 An alias for InUCSRunic.
3038
3039 =item C<InUCS84>
3040
3041 An alias for InUCSSinhala.
3042
3043 =item C<InUCS85>
3044
3045 An alias for InUCSSyriac.
3046
3047 =item C<InUCS86>
3048
3049 An alias for InUCSThaana.
3050
3051 =item C<InUCS87>
3052
3053 An alias for InUCSBasicMyanmar.
3054
3055 =item C<InUCS88>
3056
3057 An alias for InUCSKhmer.
3058
3059 =item C<InUCS89>
3060
3061 An alias for InUCSMongolian.
3062
3063 =item C<InUCS9>
3064
3065 An alias for InUCSGreekSymbolsAndCoptic.
3066
3067 =item C<InUCS90>
3068
3069 An alias for InUCSExtendedMyanmar.
3070
3071 =item C<InUCS91>
3072
3073 An alias for InUCSTibetan.
3074
3075 =item C<InUCS92>
3076
3077 An alias for InUCSCyrillicSupplementary.
3078
3079 =item C<InUCS93>
3080
3081 An alias for InUCSTagalog.
3082
3083 =item C<InUCS94>
3084
3085 An alias for InUCSHanunoo.
3086
3087 =item C<InUCS95>
3088
3089 An alias for InUCSBuhid.
3090
3091 =item C<InUCS96>
3092
3093 An alias for InUCSTagbanwa.
3094
3095 =item C<InUCS97>
3096
3097 An alias for InUCSSupplementalArrows.
3098
3099 =item C<InUCS98>
3100
3101 An alias for InUCSMiscllaneousMathmaticalSymbols.
3102
3103 =item C<InUCS99>
3104
3105 An alias for InUCSSupplementalMathmaticalOperators.
3106
3107 =item C<InUCSAeganNumbers>
3108
3109 =item C<InUCSAlphabeticPresentationForms>
3110
3111 =item C<InUCSAlternateFormatCharactersExtended>
3112
3113 =item C<InUCSArabicExtended>
3114
3115 =item C<InUCSArabicPresentationFormsA>
3116
3117 =item C<InUCSArabicPresentationFormsB>
3118
3119 =item C<InUCSArmenian>
3120
3121 =item C<InUCSArrows>
3122
3123 =item C<InUCSBasicArabic>
3124
3125 =item C<InUCSBasicGeorgian>
3126
3127 =item C<InUCSBasicGreek>
3128
3129 =item C<InUCSBasicHangul>
3130
3131 =item C<InUCSBasicHebrew>
3132
3133 =item C<InUCSBasicLatin>
3134
3135 =item C<InUCSBasicMyanmar>
3136
3137 =item C<InUCSBasicTibetan>
3138
3139 =item C<InUCSBengali>
3140
3141 =item C<InUCSBiDirectionalFormatEmbeddings>
3142
3143 =item C<InUCSBiDirectionalFormatMarks>
3144
3145 =item C<InUCSBlockElements>
3146
3147 =item C<InUCSBopomofo>
3148
3149 =item C<InUCSBoxDrawing>
3150
3151 =item C<InUCSBraillePatterns>
3152
3153 =item C<InUCSBuhid>
3154
3155 =item C<InUCSByzantineMusicalSymbols>
3156
3157 =item C<InUCSCharacterShapingSelectors>
3158
3159 =item C<InUCSCherokee>
3160
3161 =item C<InUCSCombiningDiacriticalMarks>
3162
3163 =item C<InUCSCombiningDiacriticalMarksForSymbols>
3164
3165 =item C<InUCSCombiningHalfMarks>
3166
3167 =item C<InUCSControlPictures>
3168
3169 =item C<InUCSCurrencySymbols>
3170
3171 =item C<InUCSCypriotSyllabary>
3172
3173 =item C<InUCSCyrillic>
3174
3175 =item C<InUCSCyrillicSupplementary>
3176
3177 =item C<InUCSDeseret>
3178
3179 =item C<InUCSDevanagari>
3180
3181 =item C<InUCSDingbats>
3182
3183 =item C<InUCSEnclosedAlphanumerics>
3184
3185 =item C<InUCSEnclosedCJKLettersAndMonths>
3186
3187 =item C<InUCSEthiopic>
3188
3189 =item C<InUCSEtruscan>
3190
3191 =item C<InUCSExtendedMyanmar>
3192
3193 =item C<InUCSFormatSeparators>
3194
3195 =item C<InUCSGeneralFormatCharacters>
3196
3197 =item C<InUCSGeneralPunctuation>
3198
3199 =item C<InUCSGeometricShapes>
3200
3201 =item C<InUCSGeorgianExtended>
3202
3203 =item C<InUCSGothic>
3204
3205 =item C<InUCSGreekExtended>
3206
3207 =item C<InUCSGreekSymbolsAndCoptic>
3208
3209 =item C<InUCSGujarati>
3210
3211 =item C<InUCSGurmukhi>
3212
3213 =item C<InUCSHalfwidthAndFullwidthForms>
3214
3215 =item C<InUCSHangulCompatibilityJamo>
3216
3217 =item C<InUCSHangulFillCharacters>
3218
3219 =item C<InUCSHangulJamo>
3220
3221 =item C<InUCSHangulSyllables>
3222
3223 =item C<InUCSHanunoo>
3224
3225 =item C<InUCSHebrewExtended>
3226
3227 =item C<InUCSHiragana>
3228
3229 =item C<InUCSIPAExtensions>
3230
3231 =item C<InUCSIdeographicDescriptionCharacters>
3232
3233 =item C<InUCSKangxiRadicals>
3234
3235 =item C<InUCSKannada>
3236
3237 =item C<InUCSKatakana>
3238
3239 =item C<InUCSKatakanaPhoneticExtensions>
3240
3241 =item C<InUCSKhmer>
3242
3243 =item C<InUCSLao>
3244
3245 =item C<InUCSLatin1Supplement>
3246
3247 =item C<InUCSLatinExtendedA>
3248
3249 =item C<InUCSLatinExtendedAdditional>
3250
3251 =item C<InUCSLatinExtendedB>
3252
3253 =item C<InUCSLetterlikeSymbols>
3254
3255 =item C<InUCSLimbu>
3256
3257 =item C<InUCSLinearBIdeograms>
3258
3259 =item C<InUCSLinearBSyllabary>
3260
3261 =item C<InUCSMalayalam>
3262
3263 =item C<InUCSMathematicalOperators>
3264
3265 =item C<InUCSMiscellaneousSymbols>
3266
3267 =item C<InUCSMiscellaneousTechnical>
3268
3269 =item C<InUCSMiscllaneousMathmaticalSymbols>
3270
3271 =item C<InUCSMongolian>
3272
3273 =item C<InUCSNumberForms>
3274
3275 =item C<InUCSNumericShapeSelectors>
3276
3277 =item C<InUCSOgham>
3278
3279 =item C<InUCSOpticalCharacterRecognition>
3280
3281 =item C<InUCSOriya>
3282
3283 =item C<InUCSOsmanya>
3284
3285 =item C<InUCSPart2>
3286
3287 =item C<InUCSPrivateUseArea>
3288
3289 =item C<InUCSPrivateUseGroups>
3290
3291 =item C<InUCSPrivateUsePlanes>
3292
3293 =item C<InUCSRunic>
3294
3295 =item C<InUCSScriptSpecificFormatCharacters>
3296
3297 =item C<InUCSShavian>
3298
3299 =item C<InUCSSinhala>
3300
3301 =item C<InUCSSip>
3302
3303 =item C<InUCSSmallFormVariants>
3304
3305 =item C<InUCSSmp>
3306
3307 =item C<InUCSSpacingModifierLetters>
3308
3309 =item C<InUCSSpecials>
3310
3311 =item C<InUCSSpp>
3312
3313 =item C<InUCSSuperscriptsAndSubscripts>
3314
3315 =item C<InUCSSupplementalArrows>
3316
3317 =item C<InUCSSupplementalArrowsC>
3318
3319 =item C<InUCSSupplementalCJKCompatibility>
3320
3321 =item C<InUCSSupplementalHangulA>
3322
3323 =item C<InUCSSupplementalHangulB>
3324
3325 =item C<InUCSSupplementalMathmaticalOperators>
3326
3327 =item C<InUCSSyriac>
3328
3329 =item C<InUCSTagalog>
3330
3331 =item C<InUCSTagbanwa>
3332
3333 =item C<InUCSTags>
3334
3335 =item C<InUCSTaiLe>
3336
3337 =item C<InUCSTamil>
3338
3339 =item C<InUCSTelugu>
3340
3341 =item C<InUCSThaana>
3342
3343 =item C<InUCSThai>
3344
3345 =item C<InUCSTibetan>
3346
3347 =item C<InUCSUgaritic>
3348
3349 =item C<InUCSUnicode>
3350
3351 =item C<InUCSUnifiedCanadianAboriginalSyllabics>
3352
3353 =item C<InUCSVariationSelectors>
3354
3355 =item C<InUCSVariationSelectorsSupplement>
3356
3357 =item C<InUCSWesternMusicalSymbols>
3358
3359 =item C<InUCSYiRadicals>
3360
3361 =item C<InUCSYiSyllables>
3362
3363 =item C<InUCSYijingHexagramSymbols>
3364
3365 =item C<InUCSZeroWidthBoundaryIndicators>
3366
3367 =item C<InUCS_BMP>
3368
3369 =item C<InUCS_BMPFirstEdition>
3370
3371 =item C<InUCS_BMPSecondEdition>
3372
3373 =item C<InUCS_BMP_AMD7>
3374
3375 =item C<InUCS_CJKCompatibility>
3376
3377 =item C<InUCS_CJKCompatibilityForms>
3378
3379 =item C<InUCS_CJKCompatibilityIdeographs>
3380
3381 =item C<InUCS_CJKCompatibilityIdeographsSupplement>
3382
3383 =item C<InUCS_CJKMiscellaneous>
3384
3385 =item C<InUCS_CJKRadicalsSupplement>
3386
3387 =item C<InUCS_CJKSymbolsAndPunctuation>
3388
3389 =item C<InUCS_CJKUnifiedIdeographs>
3390
3391 =item C<InUCS_CJKUnifiedIdeographsAll>
3392
3393 =item C<InUCS_CJKUnifiedIdeographsExtensionA>
3394
3395 =item C<InUCS_CJKUnifiedIdeographsExtensionB>
3396
3397 =item C<InUCS_MES1>
3398
3399 =item C<InUCS_MES2>
3400
3401 =item C<InUCS_MES3A>
3402
3403 =item C<InUCS_MES3B>
3404
3405 =back
3406
3407 =cut
3408
3409
3410 =head1 EXAMPLE
3411
3412 use Char::Class::UCS qw(InUCSIPAExtensions);
3413 if ($s =~ /\p{InUCSIPAExtensions}/) {
3414 print "Match!\n";
3415 }
3416
3417 =head1 SEE ALSO
3418
3419 L<Char::Class::JISX0221>
3420
3421 L<Char::Class::RFC1815>
3422
3423 =head1 LICENSE
3424
3425 Copyright 2008 Wakaba <w@suika.fam.cx>
3426
3427 This library and the library generated by it is free software;
3428 you can redistribute them and/or modify them under the same
3429 terms as Perl itself.
3430
3431 =cut
3432
3433 1;
3434 ### UCS.pm ends here

admin@suikawiki.org
ViewVC Help
Powered by ViewVC 1.1.24