/[suikacvs]/markup/html/html5/spec-ja/common.pl
Suika

Diff of /markup/html/html5/spec-ja/common.pl

Parent Directory | Revision Log | View Patch

revision 1.4 by wakaba, Wed Aug 13 10:00:09 2008 UTC revision 1.19 by wakaba, Wed Nov 5 01:29:08 2008 UTC
# Line 1  Line 1 
1  use strict;  use strict;
2    use utf8;
3    
 my $data_suffix = q[.dat];  
4  my $data_dir_name = q[data/];  my $data_dir_name = q[data/];
5    my $data2_dir_name = q[data2/];
6    my $data2_suffix = q[.dat];
7    my $lock_suffix = q[.lock];
8    
9    ## SEE ALSO: |Makefile|.
10    my $fallback_file_name = $data2_dir_name . 'fallback' . $data2_suffix;
11    
12    ## SEE ALSO: |Makefile|.
13    my $patch_file_name = $data2_dir_name . 'modified.txt';
14    
15    our $UseCVS //= 1;
16    
17  sub normalize ($) {  sub normalize ($) {
18    my $s = shift;    my $s = shift;
# Line 11  sub normalize ($) { Line 22  sub normalize ($) {
22    return $s;    return $s;
23  } # normalize  } # normalize
24    
## Returns the hexadecimal MD5 digest of the normalized form of the
## given text.  The text is passed through |normalize| and encoded with
## the |utf8| encoding before it is digested.
sub get_hash ($) {
  my ($text) = @_;

  require Encode;
  require Digest::MD5;

  my $octets = Encode::encode ('utf8', normalize ($text));
  return Digest::MD5::md5_hex ($octets);
} # get_hash
30    
31  sub create_pattern1 ($) {  sub create_pattern1 ($) {
32    my $s = quotemeta shift;    my $s = quotemeta shift;
33    $s =~ s/\\\*/(.+)/g;    $s =~ s/\\\*/(.+)/g;
# Line 24  sub replace_pattern2 ($@) { Line 41  sub replace_pattern2 ($@) {
41    return $s;    return $s;
42  } # replace_pattern2  } # replace_pattern2
43    
## Loads the Perl data file |$file_name| and returns the value the file
## evaluates to.
##
## If |$file_name| is not a plain file, a warning is emitted and a
## reference to a new empty hash is returned.  If the file exists but
## cannot be read or compiled, or does not evaluate to a defined value,
## the sub dies instead of returning |undef|, such that a broken file is
## never mistaken for an empty one.
sub read_data_file ($) {
  my $file_name = shift;

  unless (-f $file_name) {
    warn "File $file_name not found\n";
    return {};
  }

  warn "Loading $file_name...\n";

  ## |do FILE| searches |@INC| when the path is relative and does not
  ## begin with |./| or |../|, and |.| is not in |@INC| as of Perl 5.26.
  ## An absolute path is always loaded directly.
  require File::Spec;
  my $path = File::Spec->rel2abs ($file_name);

  my ($data, $error);
  {
    local $@;
    $data = do $path;
    unless (defined $data) {
      ## |$@| is set for a compilation error, |$!| for a read error.
      $error = $@ || "$!" || 'file did not return a value';
    }
  }
  die "$0: $file_name: $error" if defined $error;

  return $data;
} # read_data_file
54      my ($en, $ja) = split /\n#ja\n/, $_;  
## Serializes |$data| with |Data::Dumper| and writes it to |$file_name|
## as a UTF-8 encoded Perl file beginning with |use utf8;|.
##
## Hash keys are sorted.  Strings are emitted through a replacement
## |qquote| that only escapes |$|, |'|, |@| and |\| (as |\xHH|) and wraps
## the result in |qq'...'|, such that other characters are written
## literally.
##
## If the file did not exist before the call and |$UseCVS| is true, the
## new file is registered by |cvs add|.  Dies if the file cannot be
## opened, written or closed.
sub write_data_file ($$) {
  my ($file_name, $data) = @_;

  require Data::Dumper;
  local $Data::Dumper::Sortkeys = 1;
  local $Data::Dumper::Useqq = 1;
  ## The |qquote| override below is only consulted by the pure Perl
  ## implementation; force it in case the XS implementation would
  ## otherwise be selected.
  local $Data::Dumper::Useperl = 1;
  local *Data::Dumper::qquote = sub {
    my $s = shift;
    $s =~ s/([\x24\x27\x40\x5C])/sprintf '\x%02X', ord $1/ge;
    return q<qq'> . $s . q<'>;
  }; # Data::Dumper::qquote

  my $had_file = -f $file_name;
  open my $file, '>:encoding(utf8)', $file_name or die "$0: $file_name: $!";
  print $file "use utf8;\n" or die "$0: $file_name: $!";
  print $file Data::Dumper::Dumper ($data) or die "$0: $file_name: $!";
  ## Buffered write errors are only reported when the handle is closed.
  close $file or die "$0: $file_name: $!";

  unless ($had_file) {
    system_ ('cvs', 'add', $file_name) if $UseCVS;
  }
} # write_data_file
76    
## Returns the name of the data file for the given hash: the data
## directory name, the first two characters of the hash and the data
## file suffix, concatenated.
sub hash_to_file_name ($) {
  my ($hash) = @_;
  my $prefix = substr ($hash, 0, 2);
  return $data2_dir_name . $prefix . $data2_suffix;
} # hash_to_file_name
80    
81    my $Entry = {};
82    my $ModifiedHash = {};
83    
## Looks up the entry for |$hash| in its data file, loading and caching
## the file in |$Entry| on first use.
##
## Returns |(0, $entry)| if a true value is found in the |exact| table,
## |(1, $entry)| if one is found in the |pattern| table, or
## |(undef, undef)| otherwise.
sub get_entry ($) {
  my ($hash) = @_;

  my $file_name = hash_to_file_name ($hash);
  $Entry->{$file_name} ||= read_data_file ($file_name);

  ## The |exact| table takes precedence over the |pattern| table.
  for my $kind ([0, 'exact'], [1, 'pattern']) {
    my ($is_pattern, $table_name) = @$kind;
    my $found = $Entry->{$file_name}->{$table_name}->{$hash};
    return ($is_pattern, $found) if $found;
  }

  return (undef, undef);
} # get_entry
100    
## Stores |$value| as the entry for |$hash| in the cached copy of its
## data file, loading the file first if it is not cached yet.
##
## A false |$value| removes the entry from both tables.  Otherwise the
## entry is stored in the |pattern| table if |$is_pattern| is true, or
## in the |exact| table if not, and removed from the other table.  The
## file is flagged as |modified| and the hash is recorded in
## |$ModifiedHash|.
sub set_entry ($$$) {
  my ($hash, $is_pattern, $value) = @_;

  my $file_name = hash_to_file_name ($hash);
  $Entry->{$file_name} ||= read_data_file ($file_name);

  if (not $value) {
    delete $Entry->{$file_name}->{$_}->{$hash} for qw(exact pattern);
  } else {
    my ($keep, $drop) = $is_pattern ? qw(pattern exact) : qw(exact pattern);
    $Entry->{$file_name}->{$keep}->{$hash} = $value;
    delete $Entry->{$file_name}->{$drop}->{$hash};
  }

  $Entry->{$file_name}->{modified} = 1;
  $ModifiedHash->{$hash} = 1;
} # set_entry
122    
123    use Fcntl ':flock';
124    my $Lock;
125    
## Takes an exclusive |flock| lock on the lock file that corresponds to
## the data file of |$hash| (the data file name followed by the lock
## suffix).  The lock file handle is kept in |$Lock|.
##
## Dies if a lock handle is already held, if the lock file cannot be
## opened, or if the lock cannot be obtained.
sub lock_entry ($) {
  if ($Lock) {
    die "$0: lock_entry: Another entry is locked";
  }

  my $hash = shift;
  my $file_name = hash_to_file_name ($hash) . $lock_suffix;

  ## |$Lock| is only set once the lock is really held, such that a
  ## failure here does not leave a stale "locked" state behind.
  open my $lock_file, '>', $file_name or die "$0: $file_name: $!";
  flock ($lock_file, LOCK_EX) or die "$0: $file_name: $!";
  $Lock = $lock_file;
} # lock_entry
136    
## Writes back every cached data file flagged as |modified| (the flag is
## removed before the file is written), appends the hashes recorded in
## |$ModifiedHash| to the patch file, one per line, and, if |$UseCVS| is
## true, runs |cvs commit| on the data directory.
##
## The argument is the commit message; if it is not defined, |$0| is
## used.  Dies if the patch file cannot be opened, written or closed.
sub commit_entries ($) {
  for my $file_name (keys %{$Entry}) {
    if ($Entry->{$file_name}->{modified}) {
      delete $Entry->{$file_name}->{modified};
      write_data_file ($file_name => $Entry->{$file_name});
    }
  }

  open my $file, '>>', $patch_file_name or die "$0: $patch_file_name: $!";
  for (keys %$ModifiedHash) {
    print $file "$_\n" or die "$0: $patch_file_name: $!";
  }
  ## Buffered write errors are only reported when the handle is closed.
  close $file or die "$0: $patch_file_name: $!";

  my $msg = shift // $0;
  system_ ('cvs', 'commit', -m => $msg, $data2_dir_name) if $UseCVS;
} # commit_entries
154    
## Loads every file in the data directory whose name ends with the data
## file suffix and is not cached in |$Entry| yet, then returns |$Entry|.
## Dies if the data directory cannot be opened.
sub get_all_entries () {
  opendir my $dir, $data2_dir_name or die "$0: $data2_dir_name: $!";
  my @data_names = grep { /\Q$data2_suffix\E$/ } readdir $dir;

  for my $name (@data_names) {
    my $file_name = $data2_dir_name . $name;
    $Entry->{$file_name} ||= read_data_file ($file_name);
  }

  return $Entry;
} # get_all_entries
167    
## Invokes |$code->($file_name, $entry_set)| for every file in the data
## directory whose name ends with the data file suffix, except for the
## fallback file.
##
## An entry set already cached in |$Entry| is passed as is.  Otherwise
## the file is loaded; the loaded set is cached in |$Entry| unless the
## second argument, |$on_the_fly|, is true.  Dies if the data directory
## cannot be opened.
sub for_each_entry_set ($;$) {
  my ($code, $on_the_fly) = @_;

  opendir my $dir, $data2_dir_name or die "$0: $data2_dir_name: $!";
  for (readdir $dir) {
    next unless /\Q$data2_suffix\E$/;
    my $file_name = $data2_dir_name . $_;
    next if $file_name eq $fallback_file_name;

    my $entry_set = $Entry->{$file_name};
    unless ($entry_set) {
      $entry_set = read_data_file ($file_name);
      $Entry->{$file_name} = $entry_set unless $on_the_fly;
    }
    $code->($file_name, $entry_set);
  }
} # for_each_entry_set
188    
189    my $FallbackEntry;
## Returns the fallback entry for |$hash|, or a reference to a new empty
## hash if there is no defined entry.  The fallback file is loaded into
## |$FallbackEntry| on first use.
sub get_fallback_entry ($) {
  my ($hash) = @_;

  $FallbackEntry //= read_data_file ($fallback_file_name);

  my $entry = $FallbackEntry->{$hash};
  return defined $entry ? $entry : {};
} # get_fallback_entry
197    
## Returns the entry for |$hash| obtained by |get_entry|, or the
## fallback entry if that entry has no defined |en| value.
##
## The returned hash always has a true |tags| value (a new empty array
## reference is set if necessary), and its |isPattern| is set to 1 if
## |get_entry| reported a pattern entry.
sub get_entry_or_fallback_entry ($) {
  my ($hash) = @_;

  my ($is_pattern, $entry) = get_entry ($hash);
  $entry = get_fallback_entry ($hash) if not defined $entry->{en};

  $entry->{tags} = [] unless $entry->{tags};
  if ($is_pattern) {
    $entry->{isPattern} = 1;
  }

  return $entry;
} # get_entry_or_fallback_entry
210    
## Sets |$value| as the fallback entry for |$hash| in the in-memory
## fallback table, loading the fallback file first if it has not been
## loaded yet.  Nothing is written to the file here.
sub set_fallback_entry ($$) {
  my ($hash, $value) = @_;

  $FallbackEntry //= read_data_file ($fallback_file_name);
  $FallbackEntry->{$hash} = $value;
} # set_fallback_entry
218    
## Returns the in-memory fallback table, loading the fallback file
## first if it has not been loaded yet.
sub get_fallback_entries () {
  $FallbackEntry //= read_data_file ($fallback_file_name);
  return $FallbackEntry;
} # get_fallback_entries
226    
## Writes the in-memory fallback table back to the fallback file.  Does
## nothing if the fallback table has not been loaded.
sub save_fallback_entries () {
  defined $FallbackEntry
      and write_data_file ($fallback_file_name => $FallbackEntry);
} # save_fallback_entries
231    
## Returns the lines of the patch file as a list, with any CR and LF
## characters removed from each line.  Dies if the patch file cannot be
## opened.
sub get_modified_hashes () {
  open my $patch_file, '<', $patch_file_name
      or die "$0: $patch_file_name: $!";

  my @hashes;
  for my $line (<$patch_file>) {
    $line =~ tr/\x0D\x0A//d;
    push @hashes, $line;
  }

  return @hashes;
} # get_modified_hashes
236    
## Returns a copy of the given string in which width variants are
## replaced character by character:
##
##   - U+3000 and U+FF01..U+FF5E by U+0020 and U+0021..U+007E;
##   - U+FF61..U+FF9F by the corresponding fullwidth punctuation and
##     katakana, with U+FF9E and U+FF9F replaced by the combining marks
##     U+3099 and U+309A;
##   - U+FFE0..U+FFE6 by U+00A2, U+00A3, U+00AC, U+00AF, U+00A6, U+00A5
##     and U+20A9.
##
## The replacement list contains literal non-ASCII characters, so this
## code relies on the |use utf8| pragma of the file.
sub normalize_width ($) {
  my ($text) = @_;

  $text =~ tr{\x{3000}\x{FF01}-\x{FF5E}\x{FF61}-\x{FF9F}\x{FFE0}-\x{FFE6}}
             { !-~。「」、・ヲァィゥェォャュョッーアイウエオカキクケコサシスセソタチツテトナニヌネノハヒフヘホマミムメモヤユヨラリルレロワン\x{3099}\x{309A}\xA2\xA3\xAC\xAF\xA6\xA5\x{20A9}};

  return $text;
} # normalize_width
243    
## Returns a copy of the given string in which |&|, |<| and |"| are
## replaced by |&amp;|, |&lt;| and |&quot;| respectively.  Other
## characters, including |>| and |'|, are left as they are.
sub htescape ($) {
  my ($text) = @_;

  my %entity_for = (
    '&' => '&amp;',
    '<' => '&lt;',
    '"' => '&quot;',
  );
  $text =~ s/([&<"])/$entity_for{$1}/g;

  return $text;
} # htescape
251    
## Runs the command given as a list (program name followed by its
## arguments) with its standard output discarded, and waits for it.
## Returns 1 if the command exits with status zero; dies with a message
## containing |$?| otherwise.
##
## The command is executed directly, without a shell, such that every
## argument reaches the program exactly as given.  (Building a shell
## command line by |quotemeta| drops empty arguments and turns a newline
## in an argument into a line continuation that the shell removes.)
sub system_ (@) {
  my @command = @_;
  return 1 unless @command;

  require POSIX;

  my $pid = fork;
  defined $pid or die "$0: fork: $!";

  if ($pid == 0) {
    ## Child process: only its own standard output is redirected, so
    ## the handles of the parent process are left alone.
    if (open STDOUT, '>', '/dev/null') {
      exec {$command[0]} @command;
    }
    warn "$0: $command[0]: $!\n";
    ## Leave without running |END| blocks or destructors of the parent.
    ## 127 is the status a shell reports for a command it cannot run.
    POSIX::_exit (127);
  }

  waitpid $pid, 0;
  $? == 0 or die "$0: $?";
  return 1;
} # system_
256    
257  1;  1;
258    
259    ## Author: Wakaba <w@suika.fam.cx>.
260    ## License: Copyright 2008 Wakaba.  You are granted a license to use,
261    ##     reproduce and create derivative works of this script.
262    ## $Date$

Legend:
Removed from v.1.4  
changed lines
  Added in v.1.19

admin@suikawiki.org
ViewVC Help
Powered by ViewVC 1.1.24