218 |
print_listing_section ({ |
print_listing_section ({ |
219 |
id => 'classes', label => 'Classes', heading => 'Classes', |
id => 'classes', label => 'Classes', heading => 'Classes', |
220 |
}, $input, $elements->{class}) if keys %{$elements->{class}}; |
}, $input, $elements->{class}) if keys %{$elements->{class}}; |
221 |
|
print_uri_section ($input, $elements->{uri}) if keys %{$elements->{uri}}; |
222 |
print_rdf_section ($input, $elements->{rdf}) if @{$elements->{rdf}}; |
print_rdf_section ($input, $elements->{rdf}) if @{$elements->{rdf}}; |
223 |
} elsif (defined $cssom) { |
} elsif (defined $cssom) { |
224 |
print_structure_dump_cssom_section ($input, $cssom); |
print_structure_dump_cssom_section ($input, $cssom); |
323 |
if (defined $inner_html_element and length $inner_html_element) { |
if (defined $inner_html_element and length $inner_html_element) { |
324 |
$input->{charset} ||= 'windows-1252'; ## TODO: for now. |
$input->{charset} ||= 'windows-1252'; ## TODO: for now. |
325 |
my $time1 = time; |
my $time1 = time; |
326 |
my $t = Encode::decode ($input->{charset}, $input->{s}); |
my $t = \($input->{s}); |
327 |
|
unless ($input->{is_char_string}) { |
328 |
|
$t = \(Encode::decode ($input->{charset}, $$t)); |
329 |
|
} |
330 |
$time{decode} = time - $time1; |
$time{decode} = time - $time1; |
331 |
|
|
332 |
$el = $doc->create_element_ns |
$el = $doc->create_element_ns |
333 |
('http://www.w3.org/1999/xhtml', [undef, $inner_html_element]); |
('http://www.w3.org/1999/xhtml', [undef, $inner_html_element]); |
334 |
$time1 = time; |
$time1 = time; |
335 |
Whatpm::HTML->set_inner_html ($el, $t, $onerror); |
Whatpm::HTML->set_inner_html ($el, $$t, $onerror); |
336 |
$time{parse} = time - $time1; |
$time{parse} = time - $time1; |
337 |
} else { |
} else { |
338 |
my $time1 = time; |
my $time1 = time; |
339 |
Whatpm::HTML->parse_byte_string |
if ($input->{is_char_string}) { |
340 |
($input->{charset}, $input->{s} => $doc, $onerror); |
Whatpm::HTML->parse_char_string ($input->{s} => $doc, $onerror); |
341 |
|
} else { |
342 |
|
Whatpm::HTML->parse_byte_string |
343 |
|
($input->{charset}, $input->{s} => $doc, $onerror); |
344 |
|
} |
345 |
$time{parse_html} = time - $time1; |
$time{parse_html} = time - $time1; |
346 |
} |
} |
347 |
$doc->manakai_charset ($input->{official_charset}) |
$doc->manakai_charset ($input->{official_charset}) |
381 |
return 1; |
return 1; |
382 |
}; |
}; |
383 |
|
|
384 |
|
my $t = \($input->{s}); |
385 |
|
if ($input->{is_char_string}) { |
386 |
|
require Encode; |
387 |
|
$t = \(Encode::encode ('utf8', $$t)); |
388 |
|
$input->{charset} = 'utf-8'; |
389 |
|
} |
390 |
|
|
391 |
my $time1 = time; |
my $time1 = time; |
392 |
open my $fh, '<', \($input->{s}); |
open my $fh, '<', $t; |
393 |
my $doc = Message::DOM::XMLParserTemp->parse_byte_stream |
my $doc = Message::DOM::XMLParserTemp->parse_byte_stream |
394 |
($fh => $dom, $onerror, charset => $input->{charset}); |
($fh => $dom, $onerror, charset => $input->{charset}); |
395 |
$time{parse_xml} = time - $time1; |
$time{parse_xml} = time - $time1; |
662 |
add_error ('syntax', \%opt => $result); |
add_error ('syntax', \%opt => $result); |
663 |
}; |
}; |
664 |
|
|
665 |
|
my $m = $input->{is_char_string} ? 'parse_char_string' : 'parse_byte_string'; |
666 |
my $time1 = time; |
my $time1 = time; |
667 |
my $manifest = Whatpm::CacheManifest->parse_byte_string |
my $manifest = Whatpm::CacheManifest->$m |
668 |
($input->{s}, $input->{uri}, $input->{base_uri}, $onerror); |
($input->{s}, $input->{uri}, $input->{base_uri}, $onerror); |
669 |
$time{parse_manifest} = time - $time1; |
$time{parse_manifest} = time - $time1; |
670 |
|
|
677 |
my $input = shift; |
my $input = shift; |
678 |
my $s; |
my $s; |
679 |
unless ($input->{is_char_string}) { |
unless ($input->{is_char_string}) { |
680 |
require Encode; |
open my $byte_stream, '<', $_[0]; |
681 |
my $enc = Encode::find_encoding ($_[1]); ## TODO: charset name -> Perl name |
require Message::Charset::Info; |
682 |
return unless $enc; |
my $charset = Message::Charset::Info->get_by_iana_name ($_[1]); |
683 |
|
my ($char_stream, $e_status) = $charset->get_decode_handle |
684 |
|
($byte_stream, allow_error_reporting => 1, allow_fallback => 1); |
685 |
|
return unless $char_stream; |
686 |
|
|
687 |
|
$char_stream->onerror (sub { |
688 |
|
my (undef, $type, %opt) = @_; |
689 |
|
if ($opt{octets}) { |
690 |
|
${$opt{octets}} = "\x{FFFD}"; |
691 |
|
} |
692 |
|
}); |
693 |
|
|
694 |
$s = \($enc->decode (${$_[0]})); |
my $t = ''; |
695 |
|
while (1) { |
696 |
|
my $c = $char_stream->getc; |
697 |
|
last unless defined $c; |
698 |
|
$t .= $c; |
699 |
|
} |
700 |
|
$s = \$t; |
701 |
|
## TODO: Output for each line, don't concat all of lines. |
702 |
} else { |
} else { |
703 |
$s = $_[0]; |
$s = $_[0]; |
704 |
} |
} |
973 |
require JSON; |
require JSON; |
974 |
|
|
975 |
my $i = 0; |
my $i = 0; |
976 |
for my $table_el (@$tables) { |
for my $table (@$tables) { |
977 |
$i++; |
$i++; |
978 |
print STDOUT qq[<div class="section" id="$input->{id_prefix}table-$i"><h3>] . |
print STDOUT qq[<div class="section" id="$input->{id_prefix}table-$i"><h3>] . |
979 |
get_node_link ($input, $table_el) . q[</h3>]; |
get_node_link ($input, $table->{element}) . q[</h3>]; |
980 |
|
|
981 |
## TODO: Make |ContentChecker| return |form_table| result |
delete $table->{element}; |
982 |
## so that this script don't have to run the algorithm twice. |
|
983 |
my $table = Whatpm::HTMLTable->form_table ($table_el); |
for (@{$table->{column_group}}, @{$table->{column}}, $table->{caption}, |
984 |
|
@{$table->{row}}) { |
|
for (@{$table->{column_group}}, @{$table->{column}}, $table->{caption}) { |
|
985 |
next unless $_; |
next unless $_; |
986 |
delete $_->{element}; |
delete $_->{element}; |
987 |
} |
} |
1034 |
print STDOUT qq[</dl></div>]; |
print STDOUT qq[</dl></div>]; |
1035 |
} # print_listing_section |
} # print_listing_section |
1036 |
|
|
1037 |
|
sub print_uri_section ($$$) { |
1038 |
|
my ($input, $uris) = @_; |
1039 |
|
|
1040 |
|
## NOTE: URIs contained in the DOM (i.e. in HTML or XML documents), |
1041 |
|
## except for those in RDF triples. |
1042 |
|
## TODO: URIs in CSS |
1043 |
|
|
1044 |
|
push @nav, ['#' . $input->{id_prefix} . 'uris' => 'URIs'] |
1045 |
|
unless $input->{nested}; |
1046 |
|
print STDOUT qq[ |
1047 |
|
<div id="$input->{id_prefix}uris" class="section"> |
1048 |
|
<h2>URIs</h2> |
1049 |
|
|
1050 |
|
<dl>]; |
1051 |
|
for my $uri (sort {$a cmp $b} keys %$uris) { |
1052 |
|
my $euri = htescape ($uri); |
1053 |
|
print STDOUT qq[<dt><code class=uri><<a href="$euri">$euri</a>></code>]; |
1054 |
|
my $eccuri = htescape (get_cc_uri ($uri)); |
1055 |
|
print STDOUT qq[<dd><a href="$eccuri">Check conformance of this document</a>]; |
1056 |
|
print STDOUT qq[<dd>Found at: <ul>]; |
1057 |
|
for my $entry (@{$uris->{$uri}}) { |
1058 |
|
print STDOUT qq[<li>], get_node_link ($input, $entry->{node}); |
1059 |
|
if (keys %{$entry->{type} or {}}) { |
1060 |
|
print STDOUT ' ('; |
1061 |
|
print STDOUT join ', ', map { |
1062 |
|
{ |
1063 |
|
hyperlink => 'Hyperlink', |
1064 |
|
resource => 'Link to an external resource', |
1065 |
|
namespace => 'Namespace URI', |
1066 |
|
cite => 'Citation or link to a long description', |
1067 |
|
embedded => 'Link to an embedded content', |
1068 |
|
base => 'Base URI', |
1069 |
|
action => 'Submission URI', |
1070 |
|
}->{$_} |
1071 |
|
or |
1072 |
|
htescape ($_) |
1073 |
|
} keys %{$entry->{type}}; |
1074 |
|
print STDOUT ')'; |
1075 |
|
} |
1076 |
|
} |
1077 |
|
print STDOUT qq[</ul>]; |
1078 |
|
} |
1079 |
|
print STDOUT qq[</dl></div>]; |
1080 |
|
} # print_uri_section |
1081 |
|
|
1082 |
sub print_rdf_section ($$$) { |
sub print_rdf_section ($$$) { |
1083 |
my ($input, $rdfs) = @_; |
my ($input, $rdfs) = @_; |
1084 |
|
|
1109 |
|
|
1110 |
sub get_rdf_resource_html ($) { |
sub get_rdf_resource_html ($) { |
1111 |
my $resource = shift; |
my $resource = shift; |
1112 |
if ($resource->{uri}) { |
if (defined $resource->{uri}) { |
1113 |
my $euri = htescape ($resource->{uri}); |
my $euri = htescape ($resource->{uri}); |
1114 |
return '<code class=uri><<a href="' . $euri . '">' . $euri . |
return '<code class=uri><<a href="' . $euri . '">' . $euri . |
1115 |
'</a>></code>'; |
'</a>></code>'; |
1116 |
} elsif ($resource->{bnodeid}) { |
} elsif (defined $resource->{bnodeid}) { |
1117 |
return htescape ('_:' . $resource->{bnodeid}); |
return htescape ('_:' . $resource->{bnodeid}); |
1118 |
} elsif ($resource->{nodes}) { |
} elsif ($resource->{nodes}) { |
1119 |
return '(rdf:XMLLiteral)'; |
return '(rdf:XMLLiteral)'; |
1199 |
|
|
1200 |
print STDOUT qq[<tr class="@{[$uncertain ? 'uncertain' : '']}"><th scope=row>$label</th><td class="@{[$result->{$_->[1]}->{must} ? 'FAIL' : '']}">$result->{$_->[1]}->{must}$uncertain</td><td class="@{[$result->{$_->[1]}->{should} ? 'SEE-RESULT' : '']}">$result->{$_->[1]}->{should}$uncertain</td><td>$result->{$_->[1]}->{warning}$uncertain</td>]; |
print STDOUT qq[<tr class="@{[$uncertain ? 'uncertain' : '']}"><th scope=row>$label</th><td class="@{[$result->{$_->[1]}->{must} ? 'FAIL' : '']}">$result->{$_->[1]}->{must}$uncertain</td><td class="@{[$result->{$_->[1]}->{should} ? 'SEE-RESULT' : '']}">$result->{$_->[1]}->{should}$uncertain</td><td>$result->{$_->[1]}->{warning}$uncertain</td>]; |
1201 |
if ($uncertain) { |
if ($uncertain) { |
1202 |
print qq[<td class="@{[$result->{$_->[1]}->{must} ? 'FAIL' : $result->{$_->[1]}->{should} ? 'SEE-RESULT' : '']}">−∞..$result->{$_->[1]}->{score_max}</td>]; |
print qq[<td class="@{[$result->{$_->[1]}->{must} ? 'FAIL' : $result->{$_->[1]}->{should} ? 'SEE-RESULT' : '']}">−∞..$result->{$_->[1]}->{score_max}]; |
1203 |
} elsif ($result->{$_->[1]}->{score_min} != $result->{$_->[1]}->{score_max}) { |
} elsif ($result->{$_->[1]}->{score_min} != $result->{$_->[1]}->{score_max}) { |
1204 |
print qq[<td class="@{[$result->{$_->[1]}->{must} ? 'FAIL' : 'SEE-RESULT']}">$result->{$_->[1]}->{score_min}..$result->{$_->[1]}->{score_max}</td></tr>]; |
print qq[<td class="@{[$result->{$_->[1]}->{must} ? 'FAIL' : 'SEE-RESULT']}">$result->{$_->[1]}->{score_min}..$result->{$_->[1]}->{score_max}]; |
1205 |
} else { |
} else { |
1206 |
print qq[<td class="@{[$result->{$_->[1]}->{must} ? 'FAIL' : '']}">$result->{$_->[1]}->{score_min}</td></tr>]; |
print qq[<td class="@{[$result->{$_->[1]}->{must} ? 'FAIL' : '']}">$result->{$_->[1]}->{score_min}]; |
1207 |
} |
} |
1208 |
|
print qq[ / 20]; |
1209 |
} |
} |
1210 |
|
|
1211 |
$score_max += $score_base; |
$score_max += $score_base; |
1212 |
|
|
1213 |
print STDOUT qq[ |
print STDOUT qq[ |
1214 |
<tr class=uncertain><th scope=row>Semantics</th><td>0?</td><td>0?</td><td>0?</td><td>−∞..$score_base</td></tr> |
<tr class=uncertain><th scope=row>Semantics</th><td>0?</td><td>0?</td><td>0?</td><td>−∞..$score_base / 20 |
1215 |
</tbody> |
</tbody> |
1216 |
<tfoot><tr class=uncertain><th scope=row>Total</th> |
<tfoot><tr class=uncertain><th scope=row>Total</th> |
1217 |
<td class="@{[$must_error ? 'FAIL' : '']}">$must_error?</td> |
<td class="@{[$must_error ? 'FAIL' : '']}">$must_error?</td> |
1218 |
<td class="@{[$should_error ? 'SEE-RESULT' : '']}">$should_error?</td> |
<td class="@{[$should_error ? 'SEE-RESULT' : '']}">$should_error?</td> |
1219 |
<td>$warning?</td> |
<td>$warning?</td> |
1220 |
<td class="@{[$must_error ? 'FAIL' : $should_error ? 'SEE-RESULT' : '']}"><strong>−∞..$score_max</strong></td></tr></tfoot> |
<td class="@{[$must_error ? 'FAIL' : $should_error ? 'SEE-RESULT' : '']}"><strong>−∞..$score_max</strong> / 100 |
1221 |
</table> |
</table> |
1222 |
|
|
1223 |
<p><strong>Important</strong>: This conformance checking service |
<p><strong>Important</strong>: This conformance checking service |
1360 |
while (defined $node) { |
while (defined $node) { |
1361 |
my $rs; |
my $rs; |
1362 |
if ($node->node_type == 1) { |
if ($node->node_type == 1) { |
1363 |
$rs = $node->manakai_local_name; |
$rs = $node->node_name; |
1364 |
$node = $node->parent_node; |
$node = $node->parent_node; |
1365 |
} elsif ($node->node_type == 2) { |
} elsif ($node->node_type == 2) { |
1366 |
$rs = '@' . $node->manakai_local_name; |
$rs = '@' . $node->node_name; |
1367 |
$node = $node->owner_element; |
$node = $node->owner_element; |
1368 |
} elsif ($node->node_type == 3) { |
} elsif ($node->node_type == 3) { |
1369 |
$rs = '"' . $node->data . '"'; |
$rs = '"' . $node->data . '"'; |
1441 |
|
|
1442 |
} |
} |
1443 |
|
|
1444 |
|
sub encode_uri_component ($) { |
1445 |
|
require Encode; |
1446 |
|
my $s = Encode::encode ('utf8', shift); |
1447 |
|
$s =~ s/([^0-9A-Za-z_.~-])/sprintf '%%%02X', ord $1/ge; |
1448 |
|
return $s; |
1449 |
|
} # encode_uri_component |
1450 |
|
|
1451 |
|
sub get_cc_uri ($) { |
1452 |
|
return './?uri=' . encode_uri_component ($_[0]); |
1453 |
|
} # get_cc_uri |
1454 |
|
|
1455 |
sub get_input_document ($$) { |
sub get_input_document ($$) { |
1456 |
my ($http, $dom) = @_; |
my ($http, $dom) = @_; |
1457 |
|
|