/[pub]/test/html-webhacc/cc.cgi

Diff of /test/html-webhacc/cc.cgi

Parent Directory | Revision Log | View Patch

-revision 1.2 by wakaba,
Wed Jun 27 12:35:24 2007 UTC
+revision 1.66 by wakaba,
Mon Sep 15 02:55:12 2008 UTC
 Line 1
- #!/usr/bin/perl
+ #!/usr/bin/perl -d:DProf
  use strict;
  use lib qw[/home/httpd/html/www/markup/html/whatpm
-            /home/wakaba/work/manakai/lib
+            /home/wakaba/work/manakai2/lib];
-            /home/wakaba/public_html/-temp/wiki/lib];
  use CGI::Carp qw[fatalsToBrowser];
- use Scalar::Util qw[refaddr];
- use SuikaWiki::Input::HTTP; ## TODO: Use some better CGI module
+   require WebHACC::Input;
- sub htescape ($) {
+ {
-   my $s = $_[0];
+   require Message::CGI::HTTP;
-   $s =~ s/&/&amp;/g;
+   my $http = Message::CGI::HTTP->new;
-   $s =~ s/</&lt;/g;
-   $s =~ s/>/&gt;/g;
+   require WebHACC::Output;
-   $s =~ s/"/&quot;/g;
+   my $out = WebHACC::Output->new;
-   $s =~ s!([\x00-\x09\x0B-\x1F\x7F-\x80])!sprintf '<var>U+%04X</var>', ord $1!ge;
+   $out->handle (*STDOUT);
-   return $s;
+   $out->set_utf8;
- } # htescape
- my $http = SuikaWiki::Input::HTTP->new;
- ## TODO: _charset_
-   my $input_format = $http->parameter ('i') || 'text/html';
-   my $inner_html_element = $http->parameter ('e');
-   my $input_uri = 'thismessage:/';
-   my $s = $http->parameter ('s');
-   if (length $s > 1000_000) {
-     print STDOUT "Status: 400 Document Too Long\nContent-Type: text/plain; charset=us-ascii\n\nToo long";
-     exit;
-   }
-   print STDOUT qq[Content-Type: text/html; charset=utf-8
- <!DOCTYPE html>
- <html lang="en">
- <head>
- <title>Web Document Conformance Checker (BETA)</title>
- <link rel="stylesheet" href="/www/style/html/xhtml">
- <style>
-   q {
-     white-space: pre;
-     white-space: -moz-pre-wrap;
-     white-space: pre-wrap;
-   }
- </style>
- </head>
- <body>
- <h1>Web Document Conformance Checker (<em>beta</em>)</h1>
- <dl>
- <dt>Document URI</dt>
-     <dd><code class="URI" lang="">&lt;<a href="@{[htescape $input_uri]}">@{[htescape $input_uri]}</a>&gt;</code></dd>
- <dt>Internet Media Type</dt>
-     <dd><code class="MIME" lang="en">@{[htescape $input_format]}</code></dd>
- ]; # no </dl> yet
-   require Message::DOM::DOMImplementation;
-   my $dom = Message::DOM::DOMImplementation->____new;
-   my $doc;
-   my $el;
-   if ($input_format eq 'text/html') {
-     require Encode;
-     require Whatpm::HTML;
-     $s = Encode::decode ('utf-8', $s);
-     print STDOUT qq[
- <dt>Character Encoding</dt>
-     <dd>(none)</dd>
- </dl>
- <div id="source-string" class="section">
- ];
-     print_source_string (\$s);
-     print STDOUT qq[
- </div>
- <div id="parse-errors" class="section">
- <h2>Parse Errors</h2>
- <ul>
- ];
-   my $onerror = sub {
-     my (%opt) = @_;
-     if ($opt{column} > 0) {
-       print STDOUT qq[<li><a href="#line-$opt{line}">Line $opt{line}</a> column $opt{column}: ];
-     } else {
-       $opt{line}--;
-       print STDOUT qq[<li><a href="#line-$opt{line}">Line $opt{line}</a>: ];
-     }
-     print STDOUT qq[@{[htescape $opt{type}]}</li>\n];
-   };
-   $doc = $dom->create_document;
-   if (defined $inner_html_element and length $inner_html_element) {
-     $el = $doc->create_element_ns
-         ('http://www.w3.org/1999/xhtml', [undef, $inner_html_element]);
-     Whatpm::HTML->set_inner_html ($el, $s, $onerror);
-   } else {
-     Whatpm::HTML->parse_string ($s => $doc, $onerror);
-   }
-   print STDOUT qq[
- </ul>
- </div>
- ];
-   } elsif ($input_format eq 'application/xhtml+xml') {
-     require Message::DOM::XMLParserTemp;
-     require Encode;
-     my $t = Encode::decode ('utf-8', $s);
-     print STDOUT qq[
- <dt>Character Encoding</dt>
-     <dd>(none)</dd>
- </dl>
- <div id="source-string" class="section">
- ];
-     print_source_string (\$t);
-     print STDOUT qq[
- </div>
- <div id="parse-errors" class="section">
- <h2>Parse Errors</h2>
- <ul>
- ];
-   my $onerror = sub {
-     my $err = shift;
-     my $line = $err->location->line_number;
-     print STDOUT qq[<li><a href="#line-$line">Line $line</a> column ];
-     print STDOUT $err->location->column_number, ": ";
-     print STDOUT htescape $err->text, "</li>\n";
-     return 1;
-   };
-   open my $fh, '<', \$s;
-   $doc = Message::DOM::XMLParserTemp->parse_byte_stream
-       ($fh => $dom, $onerror, charset => 'utf-8');
-     print STDOUT qq[
- </ul>
- </div>
- ];
-   } else {
-     print STDOUT qq[
- </dl>
- <p><em>Media type <code class="MIME" lang="en">@{[htescape $input_format]}</code> is not supported!</em></p>
+   if ($http->get_meta_variable ('PATH_INFO') ne '/') {
- ];
+     $out->http_error (404);
+     exit;
    }
+   ## TODO: We need real conneg support...
-   if (defined $doc or defined $el) {
+   my $primary_language = 'en';
-     print STDOUT qq[
+   if ($ENV{HTTP_ACCEPT_LANGUAGE} =~ /ja/) {
- <div id="document-tree" class="section">
+     $primary_language = 'ja';
- <h2>Document Tree</h2>
+   }
- ];
+   $out->load_text_catalog ($primary_language);
-     print_document_tree ($el || $doc);
+   $out->set_flush;
+   $out->http_header;
-     print STDOUT qq[
+   $out->html_header;
- </div>
+   $out->unset_flush;
- <div id="document-errors" class="section">
+   $out->generate_input_section ($http);
- <h2>Document Errors</h2>
+   my $u = $http->get_parameter ('uri');
- <ul>
+   my $s = $http->get_parameter ('s');
- ];
+   if ((not defined $u or not length $u) and
+       (not defined $s or not length $s)) {
-     require Whatpm::ContentChecker;
+     exit;
-     my $onerror = sub {
-       my %opt = @_;
-       print STDOUT qq[<li><a href="#node-@{[refaddr $opt{node}]}">],
-           htescape get_node_path ($opt{node}),
-           "</a>: ", htescape $opt{type}, "</li>\n";
-     };
-     if ($el) {
-       Whatpm::ContentChecker->check_element ($el, $onerror);
-     } else {
-       Whatpm::ContentChecker->check_document ($doc, $onerror);
-     }
-     print STDOUT qq[
- </ul>
- </div>
- ];
    }
-   ## TODO: Show result
+   require WebHACC::Result;
-   print STDOUT qq[
+   my $result = WebHACC::Result->new;
- </body>
+   $result->output ($out);
- </html>
- ];
+   require WebHACC::Input;
+   my $input = WebHACC::Input->get_document ($http => $result => $out);
- exit;
+   check_and_print ($input => $result => $out);
- sub print_source_string ($) {
-   my $s = $_[0];
+   $out->nav_list;
-   my $i = 1;
-   print STDOUT qq[<ol lang="">\n];
+   exit;
-   while ($$s =~ /\G([^\x0A]*?)\x0D?\x0A/gc) {
+ }
-     print STDOUT qq[<li id="line-$i">], htescape $1, "</li>\n";
-     $i++;
+ sub check_and_print ($$$) {
+   my ($input, $result, $out) = @_;
+   my $original_input = $out->input;
+   $out->input ($input);
+   $input->generate_info_section ($result);
+   $input->generate_transfer_sections ($result);
+   unless (defined $input->{s}) {
+     ## NOTE: This is an error of the implementation.
+     $result->layer_uncertain ('transfer');
+     $result->generate_result_section;
+     $out->input ($original_input);
+     return;
+   }
+   my $checker_class = {
+     'text/cache-manifest' => 'WebHACC::Language::CacheManifest',
+     'text/css' => 'WebHACC::Language::CSS',
+     'text/html' => 'WebHACC::Language::HTML',
+     'text/x-h2h' => 'WebHACC::Language::H2H',
+     'text/x-webidl' => 'WebHACC::Language::WebIDL',
+     'text/xml' => 'WebHACC::Language::XML',
+     'application/atom+xml' => 'WebHACC::Language::XML',
+     'application/rss+xml' => 'WebHACC::Language::XML',
+     'image/svg+xml' => 'WebHACC::Language::XML',
+     'application/xhtml+xml' => 'WebHACC::Language::XML',
+     'application/xml' => 'WebHACC::Language::XML',
+     ## TODO: Should we make all XML MIME Types fall
+     ## into this category?
+     ## NOTE: This type has different model from normal XML types.
+     'application/rdf+xml' => 'WebHACC::Language::XML',
+   }->{$input->{media_type}} || 'WebHACC::Language::Default';
+   eval qq{ require $checker_class } or die "$0: Loading $checker_class: $@";
+   my $checker = $checker_class->new;
+   $checker->input ($input);
+   $checker->output ($out);
+   $checker->result ($result);
+   ## TODO: A cache manifest MUST be text/cache-manifest
+   ## TODO: WebIDL media type "text/x-webidl"
+   $checker->generate_syntax_error_section;
+   $checker->generate_source_string_section;
+   my @subdoc;
+   $checker->onsubdoc (sub {
+     push @subdoc, shift;
+   });
+   $checker->generate_structure_dump_section;
+   $checker->generate_structure_error_section;
+   $checker->generate_additional_sections;
+   my $id_prefix = 0;
+   for my $_subinput (@subdoc) {
+     my $subinput = WebHACC::Input::Subdocument->new (++$id_prefix);
+     $subinput->{$_} = $_subinput->{$_} for keys %$_subinput;
+     $subinput->{base_uri} = $subinput->{container_node}->base_uri
+         unless defined $subinput->{base_uri};
+     $subinput->{parent_input} = $input;
+     my $subresult = WebHACC::Result->new;
+     $subresult->output ($out);
+     $subresult->parent_result ($result);
+     $subinput->start_section ($subresult);
+     check_and_print ($subinput => $subresult => $out);
+     $subinput->end_section ($subresult);
    }
-   if ($$s =~ /\G([^\x0A]+)/gc) {
-     print STDOUT qq[<li id="line-$i">], htescape $1, "</li>\n";
-   }
-   print STDOUT "</ol>";
- } # print_input_string
- sub print_document_tree ($) {
+   $result->generate_result_section;
-   my $node = shift;
-   my $r = '<ol class="xoxo">';
-   my @node = ($node);
-   while (@node) {
-     my $child = shift @node;
-     unless (ref $child) {
-       $r .= $child;
-       next;
-     }
-     my $node_id = 'node-'.refaddr $child;
-     my $nt = $child->node_type;
-     if ($nt == $child->ELEMENT_NODE) {
-       $r .= qq'<li id="$node_id"><code>' . htescape ($child->tag_name) .
-           '</code>'; ## ISSUE: case
-       if ($child->has_attributes) {
-         $r .= '<ul class="attributes">';
-         for my $attr (sort {$a->[0] cmp $b->[0]} map { [$_->name, $_->value, 'node-'.refaddr $_] }
-                       @{$child->attributes}) {
-           $r .= qq'<li id="$attr->[2]"><code>' . htescape ($attr->[0]) . '</code> = '; ## ISSUE: case?
-           $r .= '<q>' . htescape ($attr->[1]) . '</q></li>'; ## TODO: children
-         }
-         $r .= '</ul>';
-       }
-       if ($node->has_child_nodes) {
-         $r .= '<ol class="children">';
-         unshift @node, @{$child->child_nodes}, '</ol>';
-       }
-     } elsif ($nt == $child->TEXT_NODE) {
-       $r .= qq'<li id="$node_id"><q>' . htescape ($child->data) . '</q></li>';
-     } elsif ($nt == $child->CDATA_SECTION_NODE) {
-       $r .= qq'<li id="$node_id"><code>&lt;[CDATA[</code><q>' . htescape ($child->data) . '</q><code>]]&gt;</code></li>';
-     } elsif ($nt == $child->COMMENT_NODE) {
-       $r .= qq'<li id="$node_id"><code>&lt;!--</code><q>' . htescape ($child->data) . '</q><code>--&gt;</code></li>';
-     } elsif ($nt == $child->DOCUMENT_NODE) {
-       $r .= qq'<li id="$node_id">Document</li>';
-       if ($child->has_child_nodes) {
-         $r .= '<ol>';
-         unshift @node, @{$child->child_nodes}, '</ol>';
-       }
-     } elsif ($nt == $child->DOCUMENT_TYPE_NODE) {
-       $r .= qq'<li id="$node_id"><code>&lt;!DOCTYPE&gt;</code><ul>';
-       $r .= '<li>Name = <q>@{[htescape ($child->name)]}</q></li>';
-       $r .= '<li>Public identifier = <q>@{[htescape ($child->public_id)]}</q></li>';
-       $r .= '<li>System identifier = <q>@{[htescape ($child->system_id)]}</q></li>';
-       $r .= '</ul></li>';
-     } elsif ($nt == $child->PROCESSING_INSTRUCTION_NODE) {
-       $r .= qq'<li id="$node_id"><code>&lt;?@{[htescape ($child->target)]}?&gt;</code>';
-       $r .= '<ul><li>@{[htescape ($child->data)]}</li></ul></li>';
-     } else {
-       $r .= qq'<li id="$node_id">@{[$child->node_type]} @{[htescape ($child->node_name)]}</li>'; # error
-     }
-   }
-   $r .= '</ol>';
+   $out->input ($original_input);
-   print STDOUT $r;
+ } # check_and_print
- } # print_document_tree
- sub get_node_path ($) {
-   my $node = shift;
-   my @r;
-   while (defined $node) {
-     my $rs;
-     if ($node->node_type == 1) {
-       $rs = $node->manakai_local_name;
-       $node = $node->parent_node;
-     } elsif ($node->node_type == 2) {
-       $rs = '@' . $node->manakai_local_name;
-       $node = $node->owner_element;
-     } elsif ($node->node_type == 3) {
-       $rs = '"' . $node->data . '"';
-       $node = $node->parent_node;
-     } elsif ($node->node_type == 9) {
-       $rs = '';
-       $node = $node->parent_node;
-     } else {
-       $rs = '#' . $node->node_type;
-       $node = $node->parent_node;
-     }
-     unshift @r, $rs;
-   }
-   return join '/', @r;
- } # get_node_path
  =head1 AUTHOR
 Line 312 (v.1.2) / Line 143 (v.1.66)
 Wakaba <w@suika.fam.cx>.
  =head1 LICENSE
- Copyright 2007 Wakaba <w@suika.fam.cx>
+ Copyright 2007-2008 Wakaba <w@suika.fam.cx>
  This library is free software; you can redistribute it
  and/or modify it under the same terms as Perl itself.

Legend:
- Removed from v.1.2
  changed lines
+ Added in v.1.66

admin@suikawiki.org	ViewVC Help
Powered by ViewVC 1.1.24