/[suikacvs]/markup/html/whatpm/t/HTML-tree.t

Diff of /markup/html/whatpm/t/HTML-tree.t

Parent Directory | Revision Log | View Patch

-revision 1.17 by wakaba,
Sat Jun 30 14:13:20 2007 UTC
+revision 1.40 by wakaba,
Tue Oct 14 06:08:26 2008 UTC
 Line 1
  #!/usr/bin/perl
  use strict;
+ my $DEBUG = $ENV{DEBUG};
+ use lib qw[/home/wakaba/work/manakai2/lib];
  my $dir_name;
  my $test_dir_name;
  BEGIN {
-Line 20 
 BEGIN {
+Line 24 
 BEGIN {
  }
  use Test;
- BEGIN { plan tests => 632 }
+ BEGIN { plan tests => 3105 }
  use Data::Dumper;
  $Data::Dumper::Useqq = 1;
-Line 30 
 sub Data::Dumper::qquote {
+Line 34 
 sub Data::Dumper::qquote {
    return q<qq'> . $s . q<'>;
  } # Data::Dumper::qquote
- for my $file_name (grep {$_} split /\s+/, qq[
+ if ($DEBUG) {
+   my $not_found = {%{$Whatpm::HTML::Debug::cp or {}}};
+   $Whatpm::HTML::Debug::cp_pass = sub {
+     my $id = shift;
+     delete $not_found->{$id};
+   };
+   END {
+     for my $id (sort {$a <=> $b || $a cmp $b} keys %$not_found) {
+       print "# checkpoint $id is not reached\n";
+     }
+   }
+ }
+ my @FILES = grep {$_} split /\s+/, qq[
                        ${test_dir_name}tokenizer-test-2.dat
+                       ${test_dir_name}tokenizer-test-3.dat
                        ${dir_name}tests1.dat
                        ${dir_name}tests2.dat
                        ${dir_name}tests3.dat
                        ${dir_name}tests4.dat
                        ${dir_name}tests5.dat
                        ${dir_name}tests6.dat
+                       ${dir_name}tests7.dat
+                       ${dir_name}tests8.dat
+                       ${dir_name}tests9.dat
+                       ${dir_name}tests10.dat
+                       ${dir_name}tests11.dat
+                       ${dir_name}tests12.dat
                        ${test_dir_name}tree-test-1.dat
                        ${test_dir_name}tree-test-2.dat
-                      ]) {
+                       ${test_dir_name}tree-test-3.dat
-   open my $file, '<', $file_name
+                       ${test_dir_name}tree-test-void.dat
-     or die "$0: $file_name: $!";
+                       ${test_dir_name}tree-test-flow.dat
-   print "# $file_name\n";
+                       ${test_dir_name}tree-test-phrasing.dat
+                       ${test_dir_name}tree-test-form.dat
-   my $test;
+                       ${test_dir_name}tree-test-foreign.dat
-   my $mode = 'data';
+                      ];
-   my $escaped;
-   while (<$file>) {
+ require 't/testfiles.pl';
-     s/\x0D\x0A/\x0A/;
+ execute_test ($_, {
-     if (/^#data$/) {
+   errors => {is_list => 1},
-       undef $test;
+   shoulds => {is_list => 1},
-       $test->{data} = '';
+   document => {is_prefixed => 1},
-       $mode = 'data';
+   'document-fragment' => {is_prefixed => 1},
-       undef $escaped;
+ }, \&test) for @FILES;
-     } elsif (/^#data escaped$/) {
-       undef $test;
-       $test->{data} = '';
-       $mode = 'data';
-       $escaped = 1;
-     } elsif (/^#errors$/) {
-       $test->{errors} = [];
-       $mode = 'errors';
-       $test->{data} =~ s/\x0D?\x0A\z//;
-       $test->{data} =~ s/\\u([0-9A-Fa-f]{4})/chr hex $1/ge if $escaped;
-       undef $escaped;
-     } elsif (/^#document$/) {
-       $test->{document} = '';
-       $mode = 'document';
-       undef $escaped;
-     } elsif (/^#document escaped$/) {
-       $test->{document} = '';
-       $mode = 'document';
-       $escaped = 1;
-     } elsif (/^#document-fragment (\S+)$/) {
-       $test->{document} = '';
-       $mode = 'document';
-       $test->{element} = $1;
-       undef $escaped;
-     } elsif (/^#document-fragment (\S+) escaped$/) {
-       $test->{document} = '';
-       $mode = 'document';
-       $test->{element} = $1;
-       $escaped = 1;
-     } elsif (defined $test->{document} and /^$/) {
-       $test->{document} =~ s/\\u([0-9A-Fa-f]{4})/chr hex $1/ge if $escaped;
-       test ($test);
-       undef $test;
-     } else {
-       if ($mode eq 'data' or $mode eq 'document') {
-         $test->{$mode} .= $_;
-       } elsif ($mode eq 'errors') {
-         tr/\x0D\x0A//d;
-         push @{$test->{errors}}, $_;
-       }
-     }
-   }
-   test ($test) if $test->{errors};
- }
  use Whatpm::HTML;
  use Whatpm::NanoDOM;
+ use Whatpm::Charset::UnicodeChecker;
  sub test ($) {
    my $test = shift;
+   if ($test->{'document-fragment'}) {
+     if (@{$test->{'document-fragment'}->[1]}) {
+       ## NOTE: Old format.
+       $test->{element} = $test->{'document-fragment'}->[1]->[0];
+       $test->{document} ||= $test->{'document-fragment'};
+     } else {
+       ## NOTE: New format.
+       $test->{element} = $test->{'document-fragment'}->[0];
+     }
+   }
    my $doc = Whatpm::NanoDOM::Document->new;
    my @errors;
+   my @shoulds;
    $SIG{INT} = sub {
      print scalar serialize ($doc);
-Line 116 
 sub test ($) {
+Line 111 
 sub test ($) {
    my $onerror = sub {
      my %opt = @_;
-     push @errors, join ':', $opt{line}, $opt{column}, $opt{type};
+     if ($opt{level} eq 's') {
+       push @shoulds, join ':', $opt{line}, $opt{column}, $opt{type};
+     } else {
+       push @errors, join ':', $opt{line}, $opt{column}, $opt{type};
+     }
    };
+   my $chk = sub {
+     return Whatpm::Charset::UnicodeChecker->new_handle ($_[0], 'html5');
+   }; # $chk
    my $result;
    unless (defined $test->{element}) {
-     Whatpm::HTML->parse_string ($test->{data} => $doc, $onerror);
+     Whatpm::HTML->parse_char_string
+         ($test->{data}->[0] => $doc, $onerror, $chk);
      $result = serialize ($doc);
    } else {
      my $el = $doc->create_element_ns
        ('http://www.w3.org/1999/xhtml', [undef, $test->{element}]);
-     Whatpm::HTML->set_inner_html ($el, $test->{data}, $onerror);
+     Whatpm::HTML->set_inner_html ($el, $test->{data}->[0], $onerror, $chk);
      $result = serialize ($el);
    }
+   warn "No #errors section" unless $test->{errors};
-   ok scalar @errors, scalar @{$test->{errors}},
+   ok scalar @errors, scalar @{$test->{errors}->[0] or []},
-     'Parse error: ' . $test->{data} . '; ' .
+     'Parse error: ' . Data::Dumper::qquote ($test->{data}->[0]) . '; ' .
-     join (', ', @errors) . ';' . join (', ', @{$test->{errors}});
+     join (', ', @errors) . ';' . join (', ', @{$test->{errors}->[0] or []});
+   ok scalar @shoulds, scalar @{$test->{shoulds}->[0] or []},
+     'SHOULD-level error: ' . Data::Dumper::qquote ($test->{data}->[0]) . '; ' .
+     join (', ', @shoulds) . ';' . join (', ', @{$test->{shoulds}->[0] or []});
-   ok $result, $test->{document}, 'Document tree: ' . $test->{data};
+   ok $result, $test->{document}->[0] . "\x0A",
+       'Document tree: ' . Data::Dumper::qquote ($test->{data}->[0]);
  } # test
+ ## NOTE: Spec: <http://wiki.whatwg.org/wiki/Parser_tests>.
  sub serialize ($) {
    my $node = shift;
    my $r = '';
-Line 145 
 sub serialize ($) {
+Line 157 
 sub serialize ($) {
      my $child = shift @node;
      my $nt = $child->[0]->node_type;
      if ($nt == $child->[0]->ELEMENT_NODE) {
-       $r .= '| ' . $child->[1] . '<' . $child->[0]->tag_name . ">\x0A"; ## ISSUE: case?
+       $r .= $child->[1] . '<' . $child->[0]->tag_name . ">\x0A"; ## ISSUE: case?
        for my $attr (sort {$a->[0] cmp $b->[0]} map { [$_->name, $_->value] }
                      @{$child->[0]->attributes}) {
-         $r .= '| ' . $child->[1] . '  ' . $attr->[0] . '="'; ## ISSUE: case?
+         $r .= $child->[1] . '  ' . $attr->[0] . '="'; ## ISSUE: case?
          $r .= $attr->[1] . '"' . "\x0A";
        }
        unshift @node,
          map { [$_, $child->[1] . '  '] } @{$child->[0]->child_nodes};
      } elsif ($nt == $child->[0]->TEXT_NODE) {
-       $r .= '| ' . $child->[1] . '"' . $child->[0]->data . '"' . "\x0A";
+       $r .= $child->[1] . '"' . $child->[0]->data . '"' . "\x0A";
      } elsif ($nt == $child->[0]->COMMENT_NODE) {
-       $r .= '| ' . $child->[1] . '<!-- ' . $child->[0]->data . " -->\x0A";
+       $r .= $child->[1] . '<!-- ' . $child->[0]->data . " -->\x0A";
      } elsif ($nt == $child->[0]->DOCUMENT_TYPE_NODE) {
-       $r .= '| ' . $child->[1] . '<!DOCTYPE ' . $child->[0]->name . ">\x0A";
+       $r .= $child->[1] . '<!DOCTYPE ' . $child->[0]->name;
+       my $pubid = $child->[0]->public_id;
+       my $sysid = $child->[0]->system_id;
+       if (length $pubid or length $sysid) {
+         $r .= ' "' . $pubid . '"';
+         $r .= ' "' . $sysid . '"';
+       }
+       $r .= ">\x0A";
      } else {
-       $r .= '| ' . $child->[1] . $child->[0]->node_type . "\x0A"; # error
+       $r .= $child->[1] . $child->[0]->node_type . "\x0A"; # error
      }
    }

 Legend:
-Removed from v.1.17
 changed lines
+Added in v.1.40

admin@suikawiki.org	ViewVC Help
Powered by ViewVC 1.1.24