1 |
wakaba |
1.1 |
package WebHACC::Language::XML; |
2 |
|
|
use strict; |
3 |
|
|
require WebHACC::Language::DOM; |
4 |
|
|
push our @ISA, 'WebHACC::Language::DOM'; |
5 |
|
|
|
6 |
|
|
## Constructor: creates an empty hash-based object blessed into the
## class on which |new| was invoked.
sub new ($) {
  my $class = shift;
  my $self = {};
  return bless $self, $class;
} # new
9 |
|
|
|
10 |
|
|
## Parses the input entity as XML and reports every parse error to the
## result object as a |syntax| layer error.  The report is wrapped in a
## "Parse Errors" section (containing a |dl| element) of the output.
##
## Reads |s|, |is_char_string|, |charset|, |official_charset|, |uri|,
## and |base_uri| from the input object.  If the input is a character
## string, it is encoded as UTF-8 before parsing and the input's
## |charset| is overwritten with |utf-8|.
##
## The parsed document is kept in |$self->{structure}|, which is the
## slot |source_charset| reads.
##
## Dies if the in-memory file handle for the input cannot be opened.
sub generate_syntax_error_section ($) {
  my $self = shift;

  require Message::DOM::DOMImplementation;
  require Message::DOM::XMLParserTemp;

  my $out = $self->output;
  $out->start_section (id => 'parse-errors', title => 'Parse Errors');
  $out->start_tag ('dl', class => 'parse-errors-list');

  my $input = $self->input;
  my $result = $self->result;

  my $onerror = sub {
    my $err = shift;

    ## Severity -> error level.  This has to be a hash keyed by the
    ## severity constant: the same pairs placed in an array and indexed
    ## by severity pick a wrong element (a key instead of a level) for
    ## most severities.
    my %level_for = (
      $err->SEVERITY_FATAL_ERROR => 'm',
      $err->SEVERITY_ERROR => 'm',
      $err->SEVERITY_WARNING => 's',
    );

    $result->add_error (line => $err->location->line_number,
                        column => $err->location->column_number,
                        type => 'xml parse error',
                        value => $err->text,
                        level => $level_for{$err->severity},
                        layer => 'syntax');

    ## NOTE(review): A true return value presumably asks the parser to
    ## continue after the error - confirm against the parser.
    return 1;
  };

  ## The parser consumes a byte stream, so a character string has to be
  ## encoded first and the charset label updated accordingly.
  my $t = \($input->{s});
  if ($input->{is_char_string}) {
    require Encode;
    $t = \(Encode::encode ('utf8', $$t));
    $input->{charset} = 'utf-8';
  }

  open my $fh, '<', $t
      or die "Can't open in-memory file handle for the input: $!";

  ## |$dom| was previously used without being declared, which does not
  ## compile under |use strict|.
  my $dom = Message::DOM::DOMImplementation->new;
  my $doc = Message::DOM::XMLParserTemp->parse_byte_stream
      ($fh => $dom, $onerror, charset => $input->{charset});
  $doc->manakai_charset ($input->{official_charset})
      if defined $input->{official_charset};

  $doc->document_uri ($input->{uri});
  $doc->manakai_entity_base_uri ($input->{base_uri});

  ## Keep the document; otherwise the parse result would be discarded
  ## when this method returns.
  $self->{structure} = $doc;

  $out->end_tag ('dl');
  $out->end_section;
} # generate_syntax_error_section
56 |
|
|
|
57 |
|
|
## Returns the charset of the source: the input object's |charset| if
## it is a true value, or otherwise the |input_encoding| of the owner
## document of |$self->{structure}| (or of |$self->{structure}| itself
## when it has no owner document).
sub source_charset ($) {
  my $self = shift;

  my $declared = $self->input->{charset};
  return $declared if $declared;

  my $node = $self->{structure};
  my $document = $node->owner_document || $node;
  return $document->input_encoding;
  ## TODO: Can we always use input_encoding?
} # source_charset
62 |
|
|
|
63 |
|
|
1; |