18 |
unless defined $lang; |
unless defined $lang; |
19 |
$lang =~ tr/A-Z/a-z/; ## ASCII case-insensitive. |
$lang =~ tr/A-Z/a-z/; ## ASCII case-insensitive. |
20 |
|
|
21 |
use Message::DOM::DOMImplementation; |
require Message::DOM::DOMImplementation; |
22 |
my $dom = Message::DOM::DOMImplementation->new; |
my $dom = Message::DOM::DOMImplementation->new; |
23 |
|
|
24 |
my $doc = $dom->create_document; |
my $doc = $dom->create_document; |
93 |
return $c_el; |
return $c_el; |
94 |
} # get_content_element |
} # get_content_element |
95 |
|
|
96 |
|
__END__ |
97 |
|
|
98 |
|
=head1 NAME |
99 |
|
|
100 |
|
harusame.pl - Multilingual Web page management tool |
101 |
|
|
102 |
|
=head1 SYNOPSIS |
103 |
|
|
104 |
|
perl harusame.pl --lang LANGCODE < input.html > output.html |
105 |
|
|
106 |
|
perl harusame.pl --help |
107 |
|
|
108 |
|
=head1 DESCRIPTION |
109 |
|
|
110 |
|
The C<harusame.pl> script extracts a version of the HTML document |
111 |
|
written in the specified natural language, from a source HTML document |
112 |
|
that contains paragraphs in multiple natural languages. |
113 |
|
|
114 |
|
The document management of a multilingual Web site where there are |
115 |
|
multiple versions of a (conceptually same) document is somewhat |
116 |
|
difficult in general. If the author of an HTML document wants to edit |
117 |
|
a part of the document, then he or she has to ensure not to forget |
118 |
|
updating translations at the same time, otherwise documents in |
119 |
|
different language versions also differ in their content versions. |
120 |
|
|
121 |
|
Using the C<harusame.pl>, one can generate versions of an HTML |
122 |
|
document in different language from one source HTML document that |
123 |
|
contains paragraphs written in all of those languages, such that |
124 |
|
authors no longer have to manage different content versions and |
125 |
|
different language versions in separate files. |
126 |
|
|
127 |
|
=head1 ARGUMENTS |
128 |
|
|
129 |
|
The source document must be provided to the script using the |
130 |
|
I<standard input>. It must be encoded in UTF-8. |
131 |
|
|
132 |
|
The script outputs the generated document encoded in UTF-8 to the |
133 |
|
I<standard output>. |
134 |
|
|
135 |
|
Following command-line options are available to this script: |
136 |
|
|
137 |
|
=over 4 |
138 |
|
|
139 |
|
=item C<--help> |
140 |
|
|
141 |
|
Show the help message and exit. |
142 |
|
|
143 |
|
=item C<--lang I<LANGCODE>> (B<REQUIRED>) |
144 |
|
|
145 |
|
The language of the version to generate. This option must be |
146 |
|
specified. The value must be a value that is valid for HTML |
147 |
|
C<lang=""> attribute. |
148 |
|
|
149 |
|
=back |
150 |
|
|
151 |
|
=head1 SEE ALSO |
152 |
|
|
153 |
|
Readme L<http://suika.fam.cx/www/harusame/readme>. How to mark up the |
154 |
|
source HTML document is described in this document. |
155 |
|
|
156 |
|
=head1 AUTHOR |
157 |
|
|
158 |
|
Wakaba <w@suika.fam.cx>. |
159 |
|
|
160 |
|
=head1 LICENSE |
161 |
|
|
162 |
|
Copyright 2008 Wakaba <w@suika.fam.cx>. |
163 |
|
|
164 |
|
This library is free software; you can redistribute it and/or modify |
165 |
|
it under the same terms as Perl itself. |
166 |
|
|
167 |
|
=cut |
168 |
|
|
169 |
## $Date$ |
## $Date$ |