1 |
wakaba |
1.1 |
use strict; |
2 |
|
|
|
3 |
|
|
## ISSUE: Currently we require manakai XML parser to test arbitrary XML tree. |
4 |
|
|
use lib qw[/home/wakaba/work/manakai2/lib]; |
5 |
|
|
|
6 |
|
|
use Test; |
7 |
|
|
require Whatpm::ContentChecker; |
8 |
|
|
require Message::DOM::DOMImplementation; |
9 |
|
|
require Message::DOM::XMLParserTemp; |
10 |
|
|
require Whatpm::HTML; |
11 |
|
|
require Whatpm::NanoDOM; |
12 |
|
|
|
13 |
|
|
sub test_files (@) { |
14 |
|
|
my @FILES = @_; |
15 |
|
|
|
16 |
|
|
for my $file_name (@FILES) { |
17 |
|
|
open my $file, '<', $file_name or die "$0: $file_name: $!"; |
18 |
|
|
print "# $file_name\n"; |
19 |
|
|
|
20 |
|
|
my $test; |
21 |
|
|
my $mode = 'data'; |
22 |
|
|
while (<$file>) { |
23 |
|
|
s/\x0D\x0A/\x0A/; |
24 |
|
|
if (/^#data$/) { |
25 |
|
|
undef $test; |
26 |
|
|
$test->{data} = ''; |
27 |
|
|
$mode = 'data'; |
28 |
|
|
$test->{parse_as} = 'xml'; |
29 |
|
|
} elsif (/^#data html$/) { |
30 |
|
|
undef $test; |
31 |
|
|
$test->{data} = ''; |
32 |
|
|
$mode = 'data'; |
33 |
|
|
$test->{parse_as} = 'html'; |
34 |
|
|
} elsif (/^#errors$/) { |
35 |
|
|
$test->{errors} = []; |
36 |
|
|
$mode = 'errors'; |
37 |
|
|
$test->{data} =~ s/\x0D?\x0A\z//; |
38 |
|
|
} elsif (defined $test->{errors} and /^$/) { |
39 |
|
|
test ($test); |
40 |
|
|
undef $test; |
41 |
|
|
} else { |
42 |
|
|
if ($mode eq 'data') { |
43 |
|
|
$test->{$mode} .= $_; |
44 |
|
|
} elsif ($mode eq 'errors') { |
45 |
|
|
tr/\x0D\x0A//d; |
46 |
|
|
push @{$test->{errors}}, $_; |
47 |
|
|
} |
48 |
|
|
} |
49 |
|
|
} |
50 |
|
|
} # @FILES |
51 |
|
|
} # test_files |
52 |
|
|
|
53 |
|
|
my $dom = Message::DOM::DOMImplementation->new; |
54 |
|
|
sub test ($) { |
55 |
|
|
my $test = shift; |
56 |
|
|
|
57 |
|
|
my $doc; |
58 |
|
|
if ($test->{parse_as} eq 'xml') { |
59 |
|
|
open my $fh, '<', \($test->{data}); |
60 |
|
|
$doc = Message::DOM::XMLParserTemp->parse_byte_stream |
61 |
|
|
($fh => $dom, sub { }, charset => 'utf-8'); |
62 |
|
|
$doc->input_encoding (undef); |
63 |
|
|
## NOTE: There should be no well-formedness error; if there is, |
64 |
|
|
## then it is an error of the test case itself. |
65 |
|
|
} else { |
66 |
|
|
$doc = Whatpm::NanoDOM::Document->new; |
67 |
|
|
Whatpm::HTML->parse_string ($test->{data} => $doc); |
68 |
|
|
} |
69 |
|
|
|
70 |
|
|
my @error; |
71 |
|
|
Whatpm::ContentChecker->check_element |
72 |
|
|
($doc->document_element, sub { |
73 |
|
|
my %opt = @_; |
74 |
|
|
if ($opt{type} =~ /^status:/ and $opt{level} eq 'i') { |
75 |
|
|
# |
76 |
|
|
} else { |
77 |
|
|
push @error, get_node_path ($opt{node}) . ';' . $opt{type} . |
78 |
|
|
(defined $opt{text} ? ';' . $opt{text} : '') . |
79 |
|
|
(defined $opt{level} ? ';'.$opt{level} : ''); |
80 |
|
|
} |
81 |
|
|
}, sub { |
82 |
|
|
my $opt = shift; |
83 |
|
|
push @error, get_node_path ($opt->{container_node}) . ';SUBDOC'; |
84 |
|
|
}); |
85 |
|
|
|
86 |
|
|
ok join ("\n", sort {$a cmp $b} @error), |
87 |
|
|
join ("\n", sort {$a cmp $b} @{$test->{errors}}), $test->{data}; |
88 |
|
|
} # test |
89 |
|
|
|
90 |
|
|
sub get_node_path ($) { |
91 |
|
|
my $node = shift; |
92 |
|
|
my @r; |
93 |
|
|
while (defined $node) { |
94 |
|
|
my $rs; |
95 |
|
|
if ($node->node_type == 1) { |
96 |
|
|
$rs = $node->manakai_local_name; |
97 |
|
|
$node = $node->parent_node; |
98 |
|
|
} elsif ($node->node_type == 2) { |
99 |
|
|
$rs = '@' . $node->manakai_local_name; |
100 |
|
|
$node = $node->owner_element; |
101 |
|
|
} elsif ($node->node_type == 3) { |
102 |
|
|
$rs = '"' . $node->data . '"'; |
103 |
|
|
$node = $node->parent_node; |
104 |
|
|
} elsif ($node->node_type == 9) { |
105 |
|
|
$rs = ''; |
106 |
|
|
$node = $node->parent_node; |
107 |
|
|
} else { |
108 |
|
|
$rs = '#' . $node->node_type; |
109 |
|
|
$node = $node->parent_node; |
110 |
|
|
} |
111 |
|
|
unshift @r, $rs; |
112 |
|
|
} |
113 |
|
|
return join '/', @r; |
114 |
|
|
} # get_node_path |
115 |
|
|
|
116 |
|
|
=head1 NAME |
117 |
|
|
|
118 |
|
|
content-checker.pl - Test engine for document conformance checking |
119 |
|
|
|
120 |
|
|
=head1 DESCRIPTION |
121 |
|
|
|
122 |
|
|
The C<content-checker.pl> script implements a test engine for the |
123 |
|
|
conformance checking modules, directly or indirectly referenced from |
124 |
|
|
L<Whatpm::ContentChecker>. |
125 |
|
|
|
126 |
|
|
This script is C<require>d by various test scripts, including |
127 |
|
|
C<ContentCheker.t>, C<ContentChecker-Atom.t>, C<HTML-tokenizer-2.t>, |
128 |
|
|
and C<LangTag.t>. |
129 |
|
|
|
130 |
|
|
=head1 AUTHOR |
131 |
|
|
|
132 |
|
|
Wakaba <w@suika.fam.cx>. |
133 |
|
|
|
134 |
|
|
=head1 LICENSE |
135 |
|
|
|
136 |
|
|
Public Domain. |
137 |
|
|
|
138 |
|
|
=cut |
139 |
|
|
|
140 |
|
|
1; ## $Date: 2008/08/31 06:57:32 $ |