/[suikacvs]/test/html-webhacc/WebHACC/Language/HTML.pm
Suika

Contents of /test/html-webhacc/WebHACC/Language/HTML.pm

Parent Directory Parent Directory | Revision Log Revision Log


Revision 1.7 - (show annotations) (download)
Fri Aug 15 08:36:41 2008 UTC (16 years, 10 months ago) by wakaba
Branch: MAIN
Changes since 1.6: +18 -4 lines
++ ChangeLog	15 Aug 2008 08:33:38 -0000
	* error-description-source.xml: Missing entries for Whatpm::HTML
	error types are added.  Error entries used by Whatpm::HTML
	are marked as "HTML::Parser".

2008-08-15  Wakaba  <wakaba@suika.fam.cx>

++ html/WebHACC/Language/ChangeLog	15 Aug 2008 08:36:35 -0000
	* HTML.pm: Set flags for encoding layer errors appropriately.
	Save link to the document root for the parsed document
	for garbage collection safety.

2008-08-15  Wakaba  <wakaba@suika.fam.cx>

++ html/WebHACC/ChangeLog	15 Aug 2008 08:35:36 -0000
	* Output.pm: |fieldset| end tag no longer necessary.

	* Result.pm: Link to "#parse-errors" if there are
	encoding layer errors.

2008-08-15  Wakaba  <wakaba@suika.fam.cx>

1 package WebHACC::Language::HTML;
2 use strict;
3 require WebHACC::Language::DOM;
4 push our @ISA, 'WebHACC::Language::DOM';
5
6 sub new ($) {
7 return bless {}, shift;
8 } # new
9
10 sub generate_syntax_error_section ($) {
11 my $self = shift;
12
13 require Message::DOM::DOMImplementation;
14 require Encode;
15 require Whatpm::HTML;
16
17 $self->result->layer_uncertain ('charset');
18
19 my $out = $self->output;
20 $out->start_section (role => 'parse-errors');
21 $out->start_error_list (role => 'parse-errors');
22 $self->result->layer_applicable ('syntax');
23
24 my $input = $self->input;
25 my $result = $self->result;
26
27 my $onerror = sub {
28 my %opt = @_;
29 $result->add_error (layer => 'syntax', %opt);
30
31 if ($opt{type} eq 'chardecode:no error') {
32 $self->result->layer_uncertain ('encode');
33 } elsif ($opt{type} eq 'chardecode:fallback') {
34 $self->result->layer_uncertain ('charset');
35 $self->result->layer_uncertain ('syntax');
36 $self->result->layer_uncertain ('structure');
37 $self->result->layer_uncertain ('semantics');
38 }
39 };
40
41 my $dom = Message::DOM::DOMImplementation->new;
42 my $doc = $dom->create_document;
43 my $el;
44 my $inner_html_element = $input->{inner_html_element};
45 if (defined $inner_html_element and length $inner_html_element) {
46 $input->{charset} ||= 'utf-8';
47 my $t = \($input->{s});
48 unless ($input->{is_char_string}) {
49 $t = \(Encode::decode ($input->{charset}, $$t));
50 $self->result->layer_applicable ('encode');
51 }
52
53 $el = $doc->create_element_ns
54 ('http://www.w3.org/1999/xhtml', [undef, $inner_html_element]);
55 Whatpm::HTML->set_inner_html ($el, $$t, $onerror);
56
57 $self->{structure} = $el;
58 $self->{_structure_root} = $doc;
59 ## NOTE: This is necessary, otherwise it would be garbage collected
60 ## before $el is useless, since $el->owner_document is only a weak
61 ## reference.
62 } else {
63 if ($input->{is_char_string}) {
64 Whatpm::HTML->parse_char_string ($input->{s} => $doc, $onerror);
65 } else {
66 $self->result->layer_applicable ('encode');
67 Whatpm::HTML->parse_byte_string
68 ($input->{charset}, $input->{s} => $doc, $onerror);
69 }
70
71 $self->{structure} = $doc;
72 }
73 $doc->manakai_charset ($input->{official_charset})
74 if defined $input->{official_charset};
75
76 $doc->document_uri ($input->{uri});
77 $doc->manakai_entity_base_uri ($input->{base_uri});
78
79 $out->end_error_list (role => 'parse-errors');
80 $out->end_section;
81 } # generate_syntax_error_section
82
83 sub source_charset ($) {
84 my $self = shift;
85 return $self->input->{charset} || ($self->{structure}->owner_document || $self->{structure})->input_encoding;
86 ## TODO: Can we always use input_encoding?
87 } # source_charset
88
89 1;

admin@suikawiki.org
ViewVC Help
Powered by ViewVC 1.1.24