/[suikacvs]/perl/charclass/lib/Char/Class/JISX4051.pm
Suika

Contents of /perl/charclass/lib/Char/Class/JISX4051.pm

Parent Directory Parent Directory | Revision Log Revision Log


Revision 1.2 - (hide annotations) (download)
Mon Nov 24 04:25:10 2008 UTC (16 years ago) by wakaba
Branch: MAIN
CVS Tags: HEAD
Changes since 1.1: +2 -2 lines
++ ChangeLog	24 Nov 2008 04:24:23 -0000
2008-11-24  Wakaba  <wakaba@suika.fam.cx>

	* mkcommitfeed.pl: New script (copied from Harusame).

	* cvscommit.sh: New script (copied from Harusame).

	* Makefile.PL: Version changed to 2.0.

++ charclass/lib/Char/ChangeLog	24 Nov 2008 01:52:26 -0000
2008-11-24  Wakaba  <wakaba@suika.fam.cx>

	* Normalize/: New directory.

++ charclass/lib/Char/Normalize/ChangeLog	24 Nov 2008 04:20:30 -0000
2008-11-24  Wakaba  <wakaba@suika.fam.cx>

	* FullwidthHalfwidth.pod: New documentation.

	* FullwidthHalfwidth.pm: New module (content from SuikaWiki4
	sw.cgi).

	* ChangeLog: New file.

1 wakaba 1.2 ## This file is auto-generated (at 2008-11-24T04:21:26Z).
2 wakaba 1.1 ## Do not edit by hand!
3     use strict;
4    
5     package Char::Class::JISX4051;
6     our $VERSION = '1.01';
7    
8     use Exporter;
9     use vars qw(@EXPORT_OK @ISA $VERSION);
10     @ISA = qw(Exporter);
11    
12     =head1 NAME
13    
14     Char::Class::JISX4051 - Regular Expression Character Classes - C<JISX4051>
15    
16     =head1 DESCRIPTION
17    
18     JIS X 4051 character classes represented in UCS,
19     defined by JIS X 4051 Appendix
20    
21    
22     =cut
23    
# import - make the requested property subs visible to the caller.
#
# Invoked implicitly by `use Char::Class::JISX4051 qw(NAME ...)`.
#
# Parameters:
#   $class     - the package name the method was invoked on.
#   @requested - names of the property subs to export.
#
# Each requested name that is listed in @EXPORT_OK is aliased into main::
# (NOTE(review): presumably so that an unqualified \p{NAME} resolves no
# matter which package compiles the regex - confirm against perlunicode),
# and the whole list is then handed to Exporter so the subs are also
# installed in the calling package.  Names Exporter does not know are
# rejected by Exporter itself, exactly as before.
sub import {
    my ($class, @requested) = @_;
    our @EXPORT_OK;

    # Validate before touching main:: so that a misspelt name does not
    # leave a stub glob behind when Exporter croaks further down.
    my %is_exportable = map { $_ => 1 } @EXPORT_OK;
    for my $name (@requested) {
        (my $bare = $name) =~ s/\A&//;    # Exporter accepts an optional '&'
        next unless $is_exportable{$bare};
        no strict 'refs';
        *{"main::$bare"} = \&{ __PACKAGE__ . "::$bare" };
    }

    # `local` restores the previous level even when Exporter dies; a manual
    # reset would be skipped and would skew every later Exporter-based
    # import in the process.
    local $Exporter::ExportLevel = 1;
    $class->SUPER::import(@requested);
    return;
}
34    
# Property subs that may be requested by name on the `use` line.
# Nothing is exported by default.
@EXPORT_OK = qw(
    InJISX4051AlphabeticExceptSpace
    InJISX4051AlphabeticSpace
    InJISX4051CharacterInDigits
    InJISX4051CharacterInUnitSymbol
    InJISX4051CloseBracket
    InJISX4051FullStop
    InJISX4051Hiragana
    InJISX4051JapaneseSpace
    InJISX4051LineStartKinsokuJapaneseCharacter
    InJISX4051MiddleDot
    InJISX4051MiscJapaneseCharacter
    InJISX4051OpenBracket
    InJISX4051PostShortenedSymbol
    InJISX4051PreShortenedSymbol
    InJISX4051SeparationSymbol
    InJISX4051UnseparatableCharacter
    InJISX4051WarichuuCloseBracket
    InJISX4051WarichuuOpenBracket
);
36    
# JIS X 4051 class (18): Western-text characters other than the Western
# word space.
#
# Returns the class as text: one newline-terminated entry per line, each
# entry being a hexadecimal code point or a "START END" pair.
sub InJISX4051AlphabeticExceptSpace {
    my @entries = (
        '0021 007E',
        '00A1 00FF',
        '0100 017F',
        '0250 02A8',
        '0374 0375',
        '037A',
        '037E',
        '0384 038A',
        '038C',
        '038E 03A1',
        '03A3 03CE',
        '0401 040C',
        '040E 044F',
        '0451 045C',
        '045E 047F',
        '0480 0486',
        '0490 04C4',
        '04C7 04C8',
        '04CB 04CC',
        '04D0 04EB',
        '04EE 04F5',
        '04F8 04F9',
        '2000 202E',
        '2030 2046',
        '2070',
        '2074 208E',
        '20A0 20AA',
        '2100 2138',
        '2153 2182',
        '2190 21EA',
        '2200 227F',
        '2280 22F1',
        '2312',
        '2460 24EA',
        '2500 257F',
        '2580 2595',
        '25A0 25EF',
        '2600 2613',
        '261A 266F',
        '2701 2704',
        '2706 2709',
        '270C 2727',
        '2729 274B',
        '274D',
        '274F 2752',
        '2756',
        '2758 275E',
        '2761 2767',
        '2776 2794',
        '2798 27AF',
        '27B1 27BE',
    );
    return join q{}, map { "$_\n" } @entries;
}
92    
# JIS X 4051 class (17): Western word space.
#
# Returns the class as newline-terminated hexadecimal code point entries.
sub InJISX4051AlphabeticSpace {
    my @entries = qw(0020);
    return join q{}, map { "$_\n" } @entries;
}
98    
# JIS X 4051 class (15): characters that may appear inside a run of digits.
#
# Returns the class as text: one newline-terminated entry per line, each
# entry being a hexadecimal code point or a "START END" pair.
sub InJISX4051CharacterInDigits {
    my @entries = (
        '0030 0039',
        '002C',
        '002E',
    );
    return join q{}, map { "$_\n" } @entries;
}
106    
# JIS X 4051 class (16): characters that may appear inside a unit symbol.
#
# Returns the class as text: one newline-terminated entry per line, each
# entry being a hexadecimal code point or a "START END" pair.
sub InJISX4051CharacterInUnitSymbol {
    my @entries = (
        '0041 005A',
        '0061 007A',
        '2126',
    );
    return join q{}, map { "$_\n" } @entries;
}
114    
# JIS X 4051 class (2): closing brackets.
#
# Returns the class as newline-terminated hexadecimal code point entries.
sub InJISX4051CloseBracket {
    my @entries = qw(
        0029 002C 005D 007D
        2019 201A 201D 201E
        3001 3009 300B 300D 300F
        3011 3015 3017 3019 301B
        301E 301F
    );
    return join q{}, map { "$_\n" } @entries;
}
139    
# JIS X 4051 class (6): full stops.
#
# Returns the class as newline-terminated hexadecimal code point entries.
sub InJISX4051FullStop {
    my @entries = qw(002E 3002);
    return join q{}, map { "$_\n" } @entries;
}
146    
# JIS X 4051 class (11): hiragana.
#
# Returns the class as text: one newline-terminated entry per line, each
# entry being a hexadecimal code point or a "START END" pair.
sub InJISX4051Hiragana {
    my @entries = (
        '3042',
        '3044',
        '3046',
        '3048',
        '304A 3062',
        '3064 3082',
        '3084',
        '3086',
        '3088 308D',
        '308F 3094',
    );
    return join q{}, map { "$_\n" } @entries;
}
161    
# JIS X 4051 class (10): Japanese space.
#
# Returns the class as newline-terminated hexadecimal code point entries.
sub InJISX4051JapaneseSpace {
    my @entries = qw(3000);
    return join q{}, map { "$_\n" } @entries;
}
167    
# JIS X 4051 class (3): Japanese characters that are prohibited at the
# start of a line (line-start kinsoku).
#
# Returns the class as newline-terminated hexadecimal code point entries.
sub InJISX4051LineStartKinsokuJapaneseCharacter {
    my @entries = qw(
        203C 2044 301C
        3041 3043 3045 3047 3049
        3063 3083 3085 3087 308E
        309D 309E
        30A1 30A3 30A5 30A7 30A9
        30C3 30E3 30E5 30E7 30EE
        30F5 30F6
        30FC 30FD 30FE
    );
    return join q{}, map { "$_\n" } @entries;
}
202    
# JIS X 4051 class (5): middle dots.
#
# Returns the class as newline-terminated hexadecimal code point entries.
#
# The last entry used to read 00FB (LATIN SMALL LETTER U WITH CIRCUMFLEX),
# which is not a middle dot; it is corrected to 30FB (KATAKANA MIDDLE DOT),
# which no other table in this module covers.
# NOTE: this file is marked as auto-generated, so the same correction has
# to be made in the table the generator reads, or it will be lost.
sub InJISX4051MiddleDot {
    my @entries = qw(003A 003B 30FB);
    return join q{}, map { "$_\n" } @entries;
}
210    
# JIS X 4051 class (12): Japanese characters that belong to none of the
# classes (1) to (11).
#
# Returns the class as text: one newline-terminated entry per line, each
# entry being a hexadecimal code point or a "START END" pair.
sub InJISX4051MiscJapaneseCharacter {
    my @entries = (
        '002B',
        '002D',
        '003C',
        '003D',
        '003E',
        '00A7',
        '00A9',
        '00AE',
        '00B1',
        '00B6',
        '00D7',
        '00F7',
        '203B',
        '2160 217F',
        '2190 21EA',
        '2460 24EA',
        '2500 257F',
        '2580 2595',
        '25A0 25EF',
        '2600 2613',
        '261A 266E',
        '2701 2704',
        '2706 2709',
        '270C 2727',
        '2729 274B',
        '274D',
        '274F 2752',
        '2756',
        '2758 275E',
        '2761 2767',
        '2776 2794',
        '2798 27AF',
        '27B1 27BE',
        '3003',
        '3004',
        '3006',
        '3007',
        '3012',
        '3013',
        '3020',
        '3036',
        '30A2',
        '30A4',
        '30A6',
        '30A8',
        '30AA 30C2',
        '30C4 30E2',
        '30E4',
        '30E6',
        '30E8 30ED',
        '30EF 30F4',
        '30F7 30FA',
        '3220 3243',
        '3280 32B0',
        '32D0 32FE',
        '3300 3357',
        '3371 3376',
        '3380 33DD',
        '4E00 9FA5',
    );
    return join q{}, map { "$_\n" } @entries;
}
274    
# JIS X 4051 class (1): opening brackets.
#
# Returns the class as newline-terminated hexadecimal code point entries.
sub InJISX4051OpenBracket {
    my @entries = qw(
        0028 005B 007B
        2018 201B 201C 201F
        3008 300A 300C 300E
        3010 3014 3016 3018 301A
        301D
    );
    return join q{}, map { "$_\n" } @entries;
}
296    
# JIS X 4051 class (9): postfix abbreviation symbols.
#
# Returns the class as text: one newline-terminated entry per line, each
# entry being a hexadecimal code point or a "START END" pair.
sub InJISX4051PostShortenedSymbol {
    my @entries = (
        '0025',
        '00A2',
        '00B0',
        '2030 2033',
    );
    return join q{}, map { "$_\n" } @entries;
}
305    
# JIS X 4051 class (8): prefix abbreviation symbols.
#
# Returns the class as newline-terminated hexadecimal code point entries.
sub InJISX4051PreShortenedSymbol {
    my @entries = qw(0024 00A3 00A5 2116);
    return join q{}, map { "$_\n" } @entries;
}
314    
# JIS X 4051 class (4): dividing punctuation marks.
#
# Returns the class as newline-terminated hexadecimal code point entries.
sub InJISX4051SeparationSymbol {
    my @entries = qw(0021 003F);
    return join q{}, map { "$_\n" } @entries;
}
321    
# JIS X 4051 class (7): inseparable characters.
#
# Returns the class as text: one newline-terminated entry per line, each
# entry being a hexadecimal code point or a "START END" pair.
sub InJISX4051UnseparatableCharacter {
    my @entries = (
        '2014',
        '2024 2026',
    );
    return join q{}, map { "$_\n" } @entries;
}
328    
# JIS X 4051 class (20): closing brackets for warichu.
#
# Returns the class as newline-terminated hexadecimal code point entries.
sub InJISX4051WarichuuCloseBracket {
    my @entries = qw(0029 005D 3015);
    return join q{}, map { "$_\n" } @entries;
}
336    
# JIS X 4051 class (19): opening brackets for warichu.
#
# Returns the class as newline-terminated hexadecimal code point entries.
sub InJISX4051WarichuuOpenBracket {
    my @entries = qw(0028 005B 3014);
    return join q{}, map { "$_\n" } @entries;
}
344    
345     =head1 COLLECTION NAMES
346    
347     =over 4
348    
349     =item C<InJISX4051AlphabeticExceptSpace>
350    
351     (18) 欧文間隔以外の欧文用文字
352    
353     =item C<InJISX4051AlphabeticSpace>
354    
355     (17) 欧文間隔
356    
357     =item C<InJISX4051CharacterInDigits>
358    
359     (15) 連数字中の文字
360    
361     =item C<InJISX4051CharacterInUnitSymbol>
362    
363     (16) 単位記号中の文字
364    
365     =item C<InJISX4051CloseBracket>
366    
367     (2) 終わり括弧類
368    
369     =item C<InJISX4051FullStop>
370    
371     (6) 句点類
372    
373     =item C<InJISX4051Hiragana>
374    
375     (11) 平仮名
376    
377     =item C<InJISX4051JapaneseSpace>
378    
379     (10) 和字間隔
380    
381     =item C<InJISX4051LineStartKinsokuJapaneseCharacter>
382    
383     (3) 行頭禁則和字
384    
385     =item C<InJISX4051MiddleDot>
386    
387     (5) 中点類
388    
389     =item C<InJISX4051MiscJapaneseCharacter>
390    
391     (12) (1)〜(11)以外の和字
392    
393     =item C<InJISX4051OpenBracket>
394    
395     (1) 始め括弧類
396    
397     =item C<InJISX4051PostShortenedSymbol>
398    
399     (9) 後置省略記号
400    
401     =item C<InJISX4051PreShortenedSymbol>
402    
403     (8) 前置省略記号
404    
405     =item C<InJISX4051SeparationSymbol>
406    
407     (4) 区切り約物
408    
409     =item C<InJISX4051UnseparatableCharacter>
410    
411     (7) 分離禁止文字
412    
413     =item C<InJISX4051WarichuuCloseBracket>
414    
415     (20) 割注終わり括弧類
416    
417     =item C<InJISX4051WarichuuOpenBracket>
418    
419     (19) 割注始め括弧類
420    
421     =back
422    
423     =cut
424    
425    
426     =head1 EXAMPLE
427    
428     use Char::Class::JISX4051 qw(InJISX4051CharacterInUnitSymbol);
429     if ($s =~ /\p{InJISX4051CharacterInUnitSymbol}/) {
430     print "Match!\n";
431     }
432    
433     =head1 SEE ALSO
434    
435     JIS X 4051-1995, 『日本語文書の行組版方法 Line composition rules
436     for Japanese documents』, 日本工業標準調査会 Japanese Industrial
437     Standard Committee (JISC <http://www.jisc.go.jp/>), 1995.
438    
439     =head1 LICENSE
440    
441 wakaba 1.2 Copyright 2008 わかば Wakaba <w@suika.fam.cx>
442 wakaba 1.1
443     This library and the library generated by it is free software;
444     you can redistribute them and/or modify them under the same
445     terms as Perl itself.
446    
447     =cut
448    
449     1;
450     ### JISX4051.pm ends here

admin@suikawiki.org
ViewVC Help
Powered by ViewVC 1.1.24