1 |
wakaba |
1.1 |
package Whatpm::HTMLTable; |
2 |
|
|
use strict; |
3 |
|
|
|
4 |
|
|
## An implementation of "Forming a table" algorithm in HTML5 |
5 |
wakaba |
1.9 |
sub form_table ($$$;$) { |
6 |
wakaba |
1.15 |
my (undef, $table_el, $onerror, $levels) = @_; |
7 |
wakaba |
1.2 |
$onerror ||= sub { }; |
8 |
wakaba |
1.15 |
$levels ||= {must => 'm'}; |
9 |
wakaba |
1.1 |
|
10 |
|
|
## Step 1 |
11 |
wakaba |
1.7 |
my $x_width = 0; |
12 |
wakaba |
1.1 |
|
13 |
|
|
## Step 2 |
14 |
wakaba |
1.7 |
my $y_height = 0; |
15 |
wakaba |
1.1 |
my $y_max_node; |
16 |
wakaba |
1.8 |
|
17 |
|
|
## Step 3 |
18 |
|
|
my $pending_tfoot = []; |
19 |
wakaba |
1.1 |
|
20 |
wakaba |
1.8 |
## Step 4 |
21 |
wakaba |
1.1 |
my $table = { |
22 |
|
|
#caption |
23 |
|
|
column => [], |
24 |
|
|
column_group => [], |
25 |
wakaba |
1.9 |
row => [], ## NOTE: HTML5 algorithm doesn't associate rows with <tr>s. |
26 |
wakaba |
1.1 |
row_group => [], |
27 |
|
|
cell => [], |
28 |
wakaba |
1.11 |
height => 0, |
29 |
|
|
width => 0, |
30 |
wakaba |
1.12 |
element => $table_el, |
31 |
wakaba |
1.1 |
}; |
32 |
|
|
|
33 |
wakaba |
1.9 |
my @column_has_anchored_cell; |
34 |
|
|
my @row_has_anchored_cell; |
35 |
wakaba |
1.1 |
my @column_generated_by; |
36 |
wakaba |
1.9 |
my @row_generated_by; |
37 |
|
|
|
38 |
|
|
## Step 5 |
39 |
|
|
my @table_child = @{$table_el->child_nodes}; |
40 |
|
|
return $table unless @table_child; |
41 |
|
|
|
42 |
wakaba |
1.10 |
## Step 6 |
43 |
|
|
for (0..$#table_child) { |
44 |
|
|
my $el = $table_child[$_]; |
45 |
|
|
next unless $el->node_type == 1; # ELEMENT_NODE |
46 |
|
|
next unless $el->manakai_local_name eq 'caption'; |
47 |
|
|
my $nsuri = $el->namespace_uri; |
48 |
|
|
next unless defined $nsuri; |
49 |
|
|
next unless $nsuri eq q<http://www.w3.org/1999/xhtml>; |
50 |
|
|
$table->{caption} = {element => $el}; |
51 |
|
|
splice @table_child, $_, 1, (); |
52 |
|
|
last; |
53 |
|
|
} |
54 |
|
|
|
55 |
wakaba |
1.9 |
my $process_row_group; |
56 |
|
|
my $end = sub { |
57 |
wakaba |
1.10 |
## Step 19 (End) |
58 |
wakaba |
1.9 |
for (@$pending_tfoot) { |
59 |
|
|
$process_row_group->($_); |
60 |
|
|
} |
61 |
|
|
|
62 |
wakaba |
1.10 |
## Step 20 |
63 |
wakaba |
1.7 |
for (0 .. $x_width - 1) { |
64 |
wakaba |
1.9 |
unless ($column_has_anchored_cell[$_]) { |
65 |
wakaba |
1.1 |
if ($table->{column}->[$_]) { |
66 |
|
|
$onerror->(type => 'column with no anchored cell', |
67 |
wakaba |
1.9 |
node => $table->{column}->[$_]->{element}, |
68 |
wakaba |
1.15 |
level => $levels->{must}); |
69 |
wakaba |
1.1 |
} else { |
70 |
wakaba |
1.4 |
$onerror->(type => 'colspan creates column with no anchored cell', |
71 |
wakaba |
1.9 |
node => $column_generated_by[$_], |
72 |
wakaba |
1.15 |
level => $levels->{must}); |
73 |
wakaba |
1.1 |
} |
74 |
wakaba |
1.9 |
last; # only one error. |
75 |
wakaba |
1.1 |
} |
76 |
|
|
} |
77 |
wakaba |
1.9 |
for (0 .. $y_height - 1) { |
78 |
|
|
unless ($row_has_anchored_cell[$_]) { |
79 |
|
|
if ($table->{row}->[$_]) { |
80 |
|
|
$onerror->(type => 'row with no anchored cell', |
81 |
|
|
node => $table->{row}->[$_]->{element}, |
82 |
wakaba |
1.15 |
level => $levels->{must}); |
83 |
wakaba |
1.9 |
} else { |
84 |
|
|
$onerror->(type => 'rowspan creates row with no anchored cell', |
85 |
|
|
node => $row_generated_by[$_], |
86 |
wakaba |
1.15 |
level => $levels->{must}); |
87 |
wakaba |
1.9 |
} |
88 |
|
|
last; # only one error. |
89 |
|
|
} |
90 |
|
|
} |
91 |
|
|
|
92 |
wakaba |
1.10 |
## Step 21 |
93 |
wakaba |
1.9 |
#return $table; |
94 |
|
|
}; # $end |
95 |
wakaba |
1.1 |
|
96 |
wakaba |
1.10 |
## Step 7, 8 |
97 |
wakaba |
1.1 |
my $current_element; |
98 |
|
|
my $current_ln; |
99 |
|
|
NEXT_CHILD: { |
100 |
|
|
$current_element = shift @table_child; |
101 |
|
|
if (defined $current_element) { |
102 |
|
|
redo NEXT_CHILD unless $current_element->node_type == 1; |
103 |
|
|
my $nsuri = $current_element->namespace_uri; |
104 |
|
|
redo NEXT_CHILD unless defined $nsuri and |
105 |
|
|
$nsuri eq q<http://www.w3.org/1999/xhtml>; |
106 |
|
|
$current_ln = $current_element->manakai_local_name; |
107 |
|
|
|
108 |
|
|
redo NEXT_CHILD unless { |
109 |
|
|
colgroup => 1, |
110 |
|
|
thead => 1, |
111 |
|
|
tbody => 1, |
112 |
|
|
tfoot => 1, |
113 |
|
|
tr => 1, |
114 |
|
|
}->{$current_ln}; |
115 |
|
|
} else { |
116 |
wakaba |
1.8 |
## Step 6 2nd paragraph |
117 |
wakaba |
1.9 |
$end->(); |
118 |
wakaba |
1.11 |
$table->{width} = $x_width; |
119 |
|
|
$table->{height} = $y_height; |
120 |
wakaba |
1.9 |
return $table; |
121 |
wakaba |
1.1 |
} |
122 |
|
|
} # NEXT_CHILD |
123 |
|
|
|
124 |
wakaba |
1.10 |
## Step 9 |
125 |
|
|
while ($current_ln eq 'colgroup') { # Step 9, Step 9.4 |
126 |
|
|
## Step 9.1: column groups |
127 |
wakaba |
1.1 |
my @col = grep { |
128 |
|
|
$_->node_type == 1 and |
129 |
|
|
defined $_->namespace_uri and |
130 |
|
|
$_->namespace_uri eq q<http://www.w3.org/1999/xhtml> and |
131 |
|
|
$_->manakai_local_name eq 'col' |
132 |
|
|
} @{$current_element->child_nodes}; |
133 |
|
|
if (@col) { |
134 |
|
|
## Step 1 |
135 |
wakaba |
1.7 |
my $x_start = $x_width; |
136 |
wakaba |
1.1 |
|
137 |
|
|
## Step 2, 6 |
138 |
|
|
while (@col) { |
139 |
|
|
my $current_column = shift @col; |
140 |
|
|
|
141 |
|
|
## Step 3: columns |
142 |
|
|
my $span = 1; |
143 |
|
|
my $col_span = $current_column->get_attribute_ns (undef, 'span'); |
144 |
|
|
## Parse non-negative integer |
145 |
|
|
if (defined $col_span and $col_span =~ /^[\x09-\x0D\x20]*([0-9]+)/) { |
146 |
|
|
$span = $1 || 1; |
147 |
|
|
} |
148 |
|
|
|
149 |
|
|
## Step 4, 5 |
150 |
wakaba |
1.11 |
$table->{column}->[$x_width++] = {element => $current_column} |
151 |
wakaba |
1.7 |
for 1..$span; |
152 |
wakaba |
1.1 |
} |
153 |
|
|
|
154 |
|
|
## Step 7 |
155 |
|
|
my $cg = {element => $current_element, |
156 |
wakaba |
1.7 |
x => $x_start, y => 0, |
157 |
|
|
width => $x_width - $x_start}; |
158 |
|
|
$table->{column_group}->[$_] = $cg for $x_start .. $x_width - 1; |
159 |
wakaba |
1.1 |
} else { # no <col> children |
160 |
|
|
## Step 1 |
161 |
|
|
my $span = 1; |
162 |
|
|
my $col_span = $current_element->get_attribute_ns (undef, 'span'); |
163 |
|
|
## Parse non-negative integer |
164 |
|
|
if (defined $col_span and $col_span =~ /^[\x09-\x0D\x20]*([0-9]+)/) { |
165 |
|
|
$span = $1 || 1; |
166 |
|
|
} |
167 |
|
|
|
168 |
|
|
## Step 2 |
169 |
wakaba |
1.7 |
$x_width += $span; |
170 |
wakaba |
1.1 |
|
171 |
|
|
## Step 3 |
172 |
|
|
my $cg = {element => $current_element, |
173 |
wakaba |
1.7 |
x => $x_width - $span, y => 0, |
174 |
wakaba |
1.1 |
width => $span}; |
175 |
wakaba |
1.7 |
$table->{column_group}->[$_] = $cg for $cg->{x} .. $x_width - 1; |
176 |
wakaba |
1.1 |
} |
177 |
|
|
|
178 |
wakaba |
1.10 |
## Step 9.2, 9.3 |
179 |
wakaba |
1.1 |
NEXT_CHILD: { |
180 |
|
|
$current_element = shift @table_child; |
181 |
|
|
if (defined $current_element) { |
182 |
|
|
redo NEXT_CHILD unless $current_element->node_type == 1; |
183 |
|
|
my $nsuri = $current_element->namespace_uri; |
184 |
|
|
redo NEXT_CHILD unless defined $nsuri and |
185 |
|
|
$nsuri eq q<http://www.w3.org/1999/xhtml>; |
186 |
|
|
$current_ln = $current_element->manakai_local_name; |
187 |
|
|
|
188 |
|
|
redo NEXT_CHILD unless { |
189 |
|
|
colgroup => 1, |
190 |
|
|
thead => 1, |
191 |
|
|
tbody => 1, |
192 |
|
|
tfoot => 1, |
193 |
|
|
tr => 1, |
194 |
|
|
}->{$current_ln}; |
195 |
|
|
} else { |
196 |
|
|
## End of subsection |
197 |
wakaba |
1.9 |
|
198 |
wakaba |
1.1 |
## Step 5 of overall steps 2nd paragraph |
199 |
wakaba |
1.9 |
$end->(); |
200 |
wakaba |
1.11 |
$table->{width} = $x_width; |
201 |
|
|
$table->{height} = $y_height; |
202 |
wakaba |
1.9 |
return $table; |
203 |
wakaba |
1.1 |
} |
204 |
|
|
} # NEXT_CHILD |
205 |
|
|
} |
206 |
|
|
|
207 |
wakaba |
1.10 |
## Step 10 |
208 |
wakaba |
1.1 |
my $y_current = 0; |
209 |
|
|
|
210 |
wakaba |
1.10 |
## Step 11 |
211 |
wakaba |
1.1 |
my @downward_growing_cells; |
212 |
|
|
|
213 |
|
|
my $growing_downward_growing_cells = sub { |
214 |
|
|
for (@downward_growing_cells) { |
215 |
|
|
for my $x ($_->[1] .. ($_->[1] + $_->[2] - 1)) { |
216 |
|
|
$table->{cell}->[$x]->[$y_current] = [$_->[0]]; |
217 |
|
|
$_->[0]->{height}++; |
218 |
|
|
} |
219 |
|
|
} |
220 |
|
|
}; # $growing_downward_growing_cells |
221 |
|
|
|
222 |
|
|
my $process_row = sub { |
223 |
|
|
## Step 1 |
224 |
wakaba |
1.7 |
$y_height++ if $y_height == $y_current; |
225 |
wakaba |
1.1 |
|
226 |
|
|
## Step 2 |
227 |
wakaba |
1.7 |
my $x_current = 0; |
228 |
|
|
|
229 |
wakaba |
1.1 |
## Step 3 |
230 |
|
|
my $tr = shift; |
231 |
wakaba |
1.9 |
$table->{row}->[$y_current] = {element => $tr}; |
232 |
wakaba |
1.1 |
my @tdth = grep { |
233 |
|
|
$_->node_type == 1 and |
234 |
|
|
defined $_->namespace_uri and |
235 |
|
|
$_->namespace_uri eq q<http://www.w3.org/1999/xhtml> and |
236 |
|
|
{td => 1, th => 1}->{$_->manakai_local_name} |
237 |
|
|
} @{$tr->child_nodes}; |
238 |
wakaba |
1.7 |
my $current_cell = shift @tdth; |
239 |
|
|
|
240 |
|
|
## Step 4 |
241 |
|
|
$growing_downward_growing_cells->(); |
242 |
wakaba |
1.1 |
|
243 |
wakaba |
1.9 |
return unless $current_cell; |
244 |
|
|
## ISSUE: Support for empty <tr></tr> (removed at revision 1376). |
245 |
|
|
|
246 |
wakaba |
1.7 |
CELL: while (1) { |
247 |
|
|
## Step 5: cells |
248 |
wakaba |
1.1 |
$x_current++ |
249 |
wakaba |
1.7 |
while ($x_current < $x_width and |
250 |
wakaba |
1.1 |
$table->{cell}->[$x_current]->[$y_current]); |
251 |
|
|
|
252 |
wakaba |
1.7 |
## Step 6 |
253 |
|
|
$x_width++ if $x_current == $x_width; |
254 |
|
|
|
255 |
wakaba |
1.1 |
## Step 7 |
256 |
|
|
my $colspan = 1; |
257 |
|
|
my $attr_value = $current_cell->get_attribute_ns (undef, 'colspan'); |
258 |
|
|
if (defined $attr_value and $attr_value =~ /^[\x09-\x0D\x20]*([0-9]+)/) { |
259 |
|
|
$colspan = $1 || 1; |
260 |
|
|
} |
261 |
|
|
|
262 |
wakaba |
1.7 |
## Step 8 |
263 |
wakaba |
1.1 |
my $rowspan = 1; |
264 |
|
|
my $attr_value = $current_cell->get_attribute_ns (undef, 'rowspan'); |
265 |
|
|
if (defined $attr_value and $attr_value =~ /^[\x09-\x0D\x20]*([0-9]+)/) { |
266 |
|
|
$rowspan = $1; |
267 |
|
|
} |
268 |
|
|
|
269 |
wakaba |
1.7 |
## Step 9 |
270 |
wakaba |
1.1 |
my $cell_grows_downward; |
271 |
|
|
if ($rowspan == 0) { |
272 |
|
|
$cell_grows_downward = 1; |
273 |
|
|
$rowspan = 1; |
274 |
|
|
} |
275 |
|
|
|
276 |
wakaba |
1.7 |
## Step 10 |
277 |
|
|
if ($x_width < $x_current + $colspan) { |
278 |
wakaba |
1.1 |
@column_generated_by[$_] = $current_cell |
279 |
wakaba |
1.7 |
for $x_width .. $x_current + $colspan - 1; |
280 |
|
|
$x_width = $x_current + $colspan; |
281 |
wakaba |
1.1 |
} |
282 |
|
|
|
283 |
wakaba |
1.7 |
## Step 11 |
284 |
|
|
if ($y_height < $y_current + $rowspan) { |
285 |
wakaba |
1.9 |
@row_generated_by[$_] = $current_cell |
286 |
|
|
for $y_height .. $y_current + $rowspan - 1; |
287 |
wakaba |
1.7 |
$y_height = $y_current + $rowspan; |
288 |
wakaba |
1.1 |
$y_max_node = $current_cell; |
289 |
|
|
} |
290 |
|
|
|
291 |
wakaba |
1.7 |
## Step 12 |
292 |
wakaba |
1.1 |
my $cell = { |
293 |
wakaba |
1.2 |
is_header => ($current_cell->manakai_local_name eq 'th'), |
294 |
wakaba |
1.1 |
element => $current_cell, |
295 |
|
|
x => $x_current, y => $y_current, |
296 |
|
|
width => $colspan, height => $rowspan, |
297 |
|
|
}; |
298 |
wakaba |
1.9 |
$column_has_anchored_cell[$x_current] = 1; |
299 |
|
|
$row_has_anchored_cell[$y_current] = 1; |
300 |
wakaba |
1.1 |
for my $x ($x_current .. ($x_current + $colspan - 1)) { |
301 |
|
|
for my $y ($y_current .. ($y_current + $rowspan - 1)) { |
302 |
|
|
unless ($table->{cell}->[$x]->[$y]) { |
303 |
|
|
$table->{cell}->[$x]->[$y] = [$cell]; |
304 |
|
|
} else { |
305 |
wakaba |
1.15 |
$onerror->(type => 'cell overlapping', |
306 |
|
|
text => "$x,$y", |
307 |
|
|
node => $current_cell, |
308 |
|
|
level => $levels->{must}); |
309 |
wakaba |
1.1 |
push @{$table->{cell}->[$x]->[$y]}, $cell; |
310 |
|
|
} |
311 |
|
|
} |
312 |
|
|
} |
313 |
wakaba |
1.11 |
|
314 |
|
|
## Whether the cell is an empty data cell or not |
315 |
|
|
if (not $cell->{is_header}) { |
316 |
|
|
$cell->{is_empty} = 1; |
317 |
|
|
for my $node (@{$current_cell->child_nodes}) { |
318 |
|
|
my $nt = $node->node_type; |
319 |
|
|
if ($nt == 3 or $nt == 4) { # TEXT_NODE / CDATA_SECTION_NODE |
320 |
wakaba |
1.16 |
if ($node->data =~ /\P{WhiteSpace}/) { |
321 |
wakaba |
1.11 |
delete $cell->{is_empty}; |
322 |
|
|
last; |
323 |
|
|
} |
324 |
|
|
} elsif ($nt == 1) { # ELEMENT_NODE |
325 |
|
|
delete $cell->{is_empty}; |
326 |
|
|
last; |
327 |
|
|
} |
328 |
|
|
} |
329 |
|
|
## NOTE: Entity references are not supported |
330 |
|
|
} |
331 |
wakaba |
1.1 |
|
332 |
wakaba |
1.7 |
## Step 13 |
333 |
wakaba |
1.1 |
if ($cell_grows_downward) { |
334 |
|
|
push @downward_growing_cells, [$cell, $x_current, $colspan]; |
335 |
|
|
} |
336 |
|
|
|
337 |
wakaba |
1.7 |
## Step 14 |
338 |
wakaba |
1.1 |
$x_current += $colspan; |
339 |
wakaba |
1.7 |
|
340 |
|
|
## Step 15-17 |
341 |
|
|
$current_cell = shift @tdth; |
342 |
|
|
if (defined $current_cell) { |
343 |
|
|
## Step 16-17 |
344 |
|
|
# |
345 |
|
|
} else { |
346 |
|
|
## Step 15 |
347 |
|
|
$y_current++; |
348 |
|
|
last CELL; |
349 |
|
|
} |
350 |
|
|
} # CELL |
351 |
wakaba |
1.1 |
}; # $process_row |
352 |
|
|
|
353 |
wakaba |
1.9 |
$process_row_group = sub ($) { |
354 |
wakaba |
1.8 |
## Step 1 |
355 |
|
|
my $y_start = $y_height; |
356 |
|
|
|
357 |
|
|
## Step 2 |
358 |
|
|
for (grep { |
359 |
|
|
$_->node_type == 1 and |
360 |
|
|
defined $_->namespace_uri and |
361 |
|
|
$_->namespace_uri eq q<http://www.w3.org/1999/xhtml> and |
362 |
|
|
$_->manakai_local_name eq 'tr' |
363 |
|
|
} @{$_[0]->child_nodes}) { |
364 |
|
|
$process_row->($_); |
365 |
|
|
} |
366 |
|
|
|
367 |
|
|
## Step 3 |
368 |
|
|
if ($y_height > $y_start) { |
369 |
wakaba |
1.14 |
my $rg = {element => $current_element, ## ISSUE: "element being processed"? Otherwise, $current_element may be a thead element while the element being processed is a tfoot element, for example. |
370 |
wakaba |
1.8 |
x => 0, y => $y_start, |
371 |
|
|
height => $y_height - $y_start}; |
372 |
|
|
$table->{row_group}->[$_] = $rg for $y_start .. $y_height - 1; |
373 |
|
|
} |
374 |
|
|
|
375 |
|
|
## Step 4 |
376 |
|
|
## Ending a row group |
377 |
|
|
## Step 1 |
378 |
|
|
while ($y_current < $y_height) { |
379 |
|
|
## Step 1 |
380 |
|
|
$growing_downward_growing_cells->(); |
381 |
|
|
|
382 |
|
|
## Step 2 |
383 |
|
|
$y_current++; |
384 |
|
|
} |
385 |
wakaba |
1.9 |
## Step 2 |
386 |
wakaba |
1.8 |
@downward_growing_cells = (); |
387 |
|
|
}; # $process_row_group |
388 |
|
|
|
389 |
wakaba |
1.10 |
## Step 12: rows |
390 |
wakaba |
1.1 |
unshift @table_child, $current_element; |
391 |
|
|
ROWS: { |
392 |
|
|
NEXT_CHILD: { |
393 |
|
|
$current_element = shift @table_child; |
394 |
|
|
if (defined $current_element) { |
395 |
|
|
redo NEXT_CHILD unless $current_element->node_type == 1; |
396 |
|
|
my $nsuri = $current_element->namespace_uri; |
397 |
|
|
redo NEXT_CHILD unless defined $nsuri and |
398 |
|
|
$nsuri eq q<http://www.w3.org/1999/xhtml>; |
399 |
|
|
$current_ln = $current_element->manakai_local_name; |
400 |
|
|
|
401 |
|
|
redo NEXT_CHILD unless { |
402 |
|
|
thead => 1, |
403 |
|
|
tbody => 1, |
404 |
|
|
tfoot => 1, |
405 |
|
|
tr => 1, |
406 |
|
|
}->{$current_ln}; |
407 |
|
|
} else { |
408 |
wakaba |
1.8 |
## Step 6 2nd paragraph |
409 |
wakaba |
1.9 |
$end->(); |
410 |
wakaba |
1.11 |
$table->{width} = $x_width; |
411 |
|
|
$table->{height} = $y_height; |
412 |
wakaba |
1.9 |
return $table; |
413 |
wakaba |
1.1 |
} |
414 |
|
|
} # NEXT_CHILD |
415 |
|
|
|
416 |
wakaba |
1.10 |
## Step 13 |
417 |
wakaba |
1.1 |
if ($current_ln eq 'tr') { |
418 |
|
|
$process_row->($current_element); |
419 |
wakaba |
1.8 |
# advance (done at the first of ROWS) |
420 |
wakaba |
1.1 |
redo ROWS; |
421 |
|
|
} |
422 |
|
|
|
423 |
wakaba |
1.10 |
## Step 14 |
424 |
wakaba |
1.1 |
## Ending a row group |
425 |
|
|
## Step 1 |
426 |
wakaba |
1.7 |
while ($y_current < $y_height) { |
427 |
wakaba |
1.1 |
## Step 1 |
428 |
wakaba |
1.9 |
$growing_downward_growing_cells->(); |
429 |
|
|
|
430 |
|
|
## Step 2 |
431 |
wakaba |
1.1 |
$y_current++; |
432 |
|
|
} |
433 |
wakaba |
1.9 |
## Step 2 |
434 |
wakaba |
1.1 |
@downward_growing_cells = (); |
435 |
|
|
|
436 |
wakaba |
1.10 |
## Step 15 |
437 |
wakaba |
1.8 |
if ($current_ln eq 'tfoot') { |
438 |
|
|
push @$pending_tfoot, $current_element; |
439 |
|
|
# advance (done at the top of ROWS) |
440 |
|
|
redo ROWS; |
441 |
wakaba |
1.1 |
} |
442 |
|
|
|
443 |
wakaba |
1.10 |
## Step 16 |
444 |
wakaba |
1.8 |
# thead or tbody |
445 |
|
|
$process_row_group->($current_element); |
446 |
wakaba |
1.1 |
|
447 |
wakaba |
1.10 |
## Step 17 |
448 |
wakaba |
1.8 |
# Advance (done at the top of ROWS). |
449 |
wakaba |
1.1 |
|
450 |
wakaba |
1.10 |
## Step 18 |
451 |
wakaba |
1.8 |
redo ROWS; |
452 |
wakaba |
1.1 |
} # ROWS |
453 |
wakaba |
1.8 |
|
454 |
wakaba |
1.9 |
$end->(); |
455 |
wakaba |
1.11 |
$table->{width} = $x_width; |
456 |
|
|
$table->{height} = $y_height; |
457 |
wakaba |
1.8 |
return $table; |
458 |
wakaba |
1.1 |
} # form_table |
459 |
|
|
|
460 |
wakaba |
1.11 |
sub assign_header ($$;$$) { |
461 |
wakaba |
1.15 |
my (undef, $table, $onerror, $levels) = @_; |
462 |
wakaba |
1.11 |
$onerror ||= sub { }; |
463 |
wakaba |
1.15 |
$levels ||= {must => 'm'}; |
464 |
wakaba |
1.11 |
|
465 |
|
|
my $assign_header = sub ($$$) { |
466 |
|
|
my $_cell = shift; |
467 |
|
|
my ($x, $y) = @_; |
468 |
|
|
|
469 |
|
|
for my $__cell (@{$_cell or []}) { |
470 |
|
|
if ($__cell and $__cell->{element} and |
471 |
|
|
not $__cell->{is_header} and |
472 |
|
|
not $__cell->{element}->has_attribute_ns (undef, 'headers')) { |
473 |
|
|
$__cell->{header}->{$x}->{$y} = 1; |
474 |
|
|
} |
475 |
|
|
} |
476 |
|
|
}; # $assign_header |
477 |
|
|
|
478 |
wakaba |
1.12 |
my @headers_cell; |
479 |
|
|
my $id_to_cell = {}; |
480 |
|
|
## ISSUE: ID duplication, non-TH reference |
481 |
|
|
|
482 |
wakaba |
1.11 |
for my $x (0 .. $table->{width} - 1) { |
483 |
|
|
for my $y (0 .. $table->{height} - 1) { |
484 |
|
|
my $cell = $table->{cell}->[$x]->[$y]; |
485 |
|
|
$cell = $cell->[0] if $cell; # anchored cell is always ->{cell}[][][0]. |
486 |
|
|
next if $cell->{x} != $x; |
487 |
|
|
next if $cell->{y} != $y; |
488 |
|
|
if ($cell) { |
489 |
|
|
if ($cell->{is_header}) { |
490 |
wakaba |
1.12 |
my $id = $cell->{element}->get_attribute_ns (undef, 'id'); |
491 |
|
|
if (defined $id and not $id_to_cell->{$id}) { |
492 |
|
|
$id_to_cell->{$id} = $cell; |
493 |
|
|
} |
494 |
|
|
|
495 |
wakaba |
1.11 |
my $scope = $cell->{element}->get_attribute_ns (undef, 'scope'); |
496 |
|
|
$scope = $scope ? lc $scope : ''; ## TODO: case |
497 |
|
|
if ($scope eq 'row') { |
498 |
|
|
for my $_x ($x + $cell->{width} .. $table->{width} - 1) { |
499 |
|
|
for my $_y ($y .. $y + $cell->{height} - 1) { |
500 |
|
|
$assign_header->($table->{cell}->[$_x]->[$_y] => $x, $y); |
501 |
|
|
} |
502 |
|
|
} |
503 |
|
|
} elsif ($scope eq 'col') { |
504 |
|
|
for my $_x ($x .. $x + $cell->{width} - 1) { |
505 |
|
|
for my $_y ($y .. $table->{height} - 1) { |
506 |
|
|
$assign_header->($table->{cell}->[$_x]->[$_y] => $x, $y); |
507 |
|
|
} |
508 |
|
|
} |
509 |
|
|
} elsif ($scope eq 'rowgroup') { |
510 |
|
|
## NOTE: A cell cannot exceed across a row group boundary. |
511 |
|
|
if ($table->{row_group}->[$y] and |
512 |
|
|
$table->{row_group}->[$y]->{height}) { |
513 |
|
|
for my $_x ($x .. $table->{width} - 1) { |
514 |
|
|
for my $_y ($y .. |
515 |
|
|
$table->{row_group}->[$y]->{y} + |
516 |
|
|
$table->{row_group}->[$y]->{height} - 1) { |
517 |
|
|
$assign_header->($table->{cell}->[$_x]->[$_y] => $x, $y); |
518 |
|
|
} |
519 |
|
|
} |
520 |
|
|
} |
521 |
|
|
## TODO: Should we raise a warning? |
522 |
|
|
} elsif ($scope eq 'colgroup') { |
523 |
|
|
if ($table->{column_group}->[$x] and |
524 |
|
|
$table->{column_group}->{width} and |
525 |
|
|
$table->{column_group}->[$x]->{x} == $x) { # anchored |
526 |
|
|
for my $_x ($x .. |
527 |
|
|
$table->{column_group}->[$x]->{x} + |
528 |
|
|
$table->{column_group}->[$x]->{width} - 1) { |
529 |
|
|
for my $_y ($y .. $table->{height} - 1) { |
530 |
|
|
$assign_header->($table->{cell}->[$_x]->[$_y] => $x, $y); |
531 |
|
|
} |
532 |
|
|
} |
533 |
|
|
} |
534 |
|
|
## TODO: Warning? |
535 |
|
|
} else { # auto |
536 |
|
|
## 1. |
537 |
|
|
my $header_width = $cell->{width}; |
538 |
|
|
W: for ($x + $cell->{width} .. $table->{width} - 1) { |
539 |
|
|
my $_cell = $table->{cell}->[$_]->[$y]; |
540 |
|
|
for (@{$_cell or []}) { |
541 |
|
|
if ($_->{element} and not $_->{is_empty}) { |
542 |
|
|
last W; # not empty |
543 |
|
|
} |
544 |
|
|
} |
545 |
|
|
$header_width++; |
546 |
|
|
} # W |
547 |
|
|
|
548 |
|
|
## 2. |
549 |
|
|
my $_x = $x + $header_width; |
550 |
|
|
|
551 |
|
|
## 3. |
552 |
|
|
HORIZONTAL: { |
553 |
|
|
last HORIZONTAL if $_x == $table->{width}; # goto Vertical |
554 |
|
|
|
555 |
|
|
## 4. # goto Vertical |
556 |
|
|
last HORIZONTAL |
557 |
|
|
if $table->{cell}->[$_x]->[$y] and |
558 |
|
|
$table->{cell}->[$_x]->[$y]->[0] and # anchored |
559 |
|
|
$table->{cell}->[$_x]->[$y]->[0]->{is_header}; |
560 |
|
|
|
561 |
|
|
## 5. |
562 |
|
|
for my $_y ($y .. $y + $cell->{height} - 1) { |
563 |
|
|
$assign_header->($table->{cell}->[$_x]->[$_y] => $x, $y); |
564 |
|
|
} |
565 |
|
|
|
566 |
|
|
## 6. |
567 |
|
|
$_x++; |
568 |
|
|
|
569 |
|
|
## 7. |
570 |
|
|
redo HORIZONTAL; |
571 |
|
|
} # HORIZONTAL |
572 |
|
|
|
573 |
|
|
## 8. Vertical |
574 |
|
|
my $_y = $y + $cell->{height}; |
575 |
|
|
|
576 |
|
|
VERTICAL: { |
577 |
|
|
## 9. # goto END |
578 |
|
|
last VERTICAL if $_y == $table->{height}; |
579 |
|
|
|
580 |
|
|
## 10. |
581 |
|
|
if ($table->{cell}->[$x]->[$_y]) { |
582 |
|
|
my $h_cell = $table->{cell}->[$x]->[$_y]->[0]; # anchored cell |
583 |
|
|
if ($h_cell and $h_cell->{is_header}) { |
584 |
|
|
## 10.1. |
585 |
|
|
my $width = $h_cell->{width}; |
586 |
|
|
W: for ($h_cell->{x} + $width .. $table->{width} - 1) { |
587 |
|
|
my $_cell = $table->{cell}->[$_]->[$y]; |
588 |
|
|
for (@{$_cell or []}) { |
589 |
|
|
if ($_->{element} and not $_->{is_empty}) { |
590 |
|
|
last W; # not empty |
591 |
|
|
} |
592 |
|
|
} |
593 |
|
|
$width++; |
594 |
|
|
} # W |
595 |
|
|
|
596 |
|
|
## 10.2. # goto end |
597 |
|
|
last VERTICAL if $width == $header_width; |
598 |
|
|
} # 10. |
599 |
|
|
} |
600 |
|
|
|
601 |
|
|
## 11. |
602 |
|
|
for my $_x ($x .. $x + $header_width - 1) { |
603 |
|
|
$assign_header->($table->{cell}->[$_x]->[$_y] => $x, $y); |
604 |
|
|
} |
605 |
|
|
|
606 |
|
|
## 12. |
607 |
|
|
$_y++; |
608 |
|
|
|
609 |
|
|
## 13. # goto vertical (wrong) |
610 |
|
|
redo VERTICAL; |
611 |
|
|
} # VERTICAL |
612 |
|
|
|
613 |
|
|
## 14. End |
614 |
|
|
# (we have already done) |
615 |
|
|
} |
616 |
|
|
} else { # data cell |
617 |
wakaba |
1.12 |
if ($cell->{element} and |
618 |
|
|
$cell->{element}->has_attribute_ns (undef, 'headers')) { |
619 |
|
|
push @headers_cell, $cell; |
620 |
|
|
} |
621 |
wakaba |
1.11 |
} |
622 |
|
|
} |
623 |
|
|
} |
624 |
|
|
} |
625 |
|
|
|
626 |
wakaba |
1.12 |
for my $headers_cell (@headers_cell) { |
627 |
|
|
my @headers = split /[\x09-\x0D\x20]+/, |
628 |
|
|
$headers_cell->{element}->get_attribute_ns (undef, 'headers'); |
629 |
|
|
my %headers; |
630 |
|
|
for my $header_id (@headers) { |
631 |
|
|
next unless length $header_id; |
632 |
|
|
if ($headers{$header_id}) { |
633 |
|
|
$onerror->(type => 'duplicate token', value => $header_id, |
634 |
|
|
node => $headers_cell->{element}->get_attribute_node_ns |
635 |
|
|
(undef, 'headers'), |
636 |
wakaba |
1.15 |
level => $levels->{must}); |
637 |
wakaba |
1.12 |
next; |
638 |
|
|
} |
639 |
|
|
$headers{$header_id} = 1; |
640 |
|
|
|
641 |
|
|
if ($id_to_cell->{$header_id}) { |
642 |
|
|
my $header_cell = $id_to_cell->{$header_id}; |
643 |
|
|
$headers_cell->{header}->{$header_cell->{x}}->{$header_cell->{y}} = 1; |
644 |
|
|
} else { |
645 |
wakaba |
1.15 |
$onerror->(type => 'no referenced header cell', value => $header_id, |
646 |
wakaba |
1.12 |
node => $headers_cell->{element}->get_attribute_node_ns |
647 |
|
|
(undef, 'headers'), |
648 |
wakaba |
1.15 |
level => $levels->{must}); |
649 |
wakaba |
1.12 |
} |
650 |
|
|
} |
651 |
|
|
} |
652 |
wakaba |
1.11 |
|
653 |
|
|
## NOTE: The "tree order" constraints in the spec algorithm are irrelevant |
654 |
|
|
## in fact. |
655 |
wakaba |
1.12 |
|
656 |
|
|
## NOTE: We does not support ID attributes other than HTML "id" attribute. |
657 |
wakaba |
1.11 |
} # assign_header |
658 |
wakaba |
1.1 |
|
659 |
|
|
1; |
660 |
wakaba |
1.16 |
## $Date: 2008/08/15 14:13:42 $ |