| 8 |
## doc.write (''); |
## doc.write (''); |
| 9 |
## alert (doc.compatMode); |
## alert (doc.compatMode); |
| 10 |
|
|
|
## TODO: 1252 parse error (revision 1264) |
|
|
## TODO: 8859-11 = 874 (revision 1271) |
|
|
|
|
| 11 |
require IO::Handle; |
require IO::Handle; |
| 12 |
|
|
| 13 |
my $HTML_NS = q<http://www.w3.org/1999/xhtml>; |
my $HTML_NS = q<http://www.w3.org/1999/xhtml>; |
| 3139 |
} elsif (defined $token->{public_identifier}) { |
} elsif (defined $token->{public_identifier}) { |
| 3140 |
my $pubid = $token->{public_identifier}; |
my $pubid = $token->{public_identifier}; |
| 3141 |
$pubid =~ tr/a-z/A-z/; |
$pubid =~ tr/a-z/A-z/; |
| 3142 |
if ({ |
my $prefix = [ |
| 3143 |
"+//SILMARIL//DTD HTML PRO V0R11 19970101//EN" => 1, |
"+//SILMARIL//DTD HTML PRO V0R11 19970101//", |
| 3144 |
"-//ADVASOFT LTD//DTD HTML 3.0 ASWEDIT + EXTENSIONS//EN" => 1, |
"-//ADVASOFT LTD//DTD HTML 3.0 ASWEDIT + EXTENSIONS//", |
| 3145 |
"-//AS//DTD HTML 3.0 ASWEDIT + EXTENSIONS//EN" => 1, |
"-//AS//DTD HTML 3.0 ASWEDIT + EXTENSIONS//", |
| 3146 |
"-//IETF//DTD HTML 2.0 LEVEL 1//EN" => 1, |
"-//IETF//DTD HTML 2.0 LEVEL 1//", |
| 3147 |
"-//IETF//DTD HTML 2.0 LEVEL 2//EN" => 1, |
"-//IETF//DTD HTML 2.0 LEVEL 2//", |
| 3148 |
"-//IETF//DTD HTML 2.0 STRICT LEVEL 1//EN" => 1, |
"-//IETF//DTD HTML 2.0 STRICT LEVEL 1//", |
| 3149 |
"-//IETF//DTD HTML 2.0 STRICT LEVEL 2//EN" => 1, |
"-//IETF//DTD HTML 2.0 STRICT LEVEL 2//", |
| 3150 |
"-//IETF//DTD HTML 2.0 STRICT//EN" => 1, |
"-//IETF//DTD HTML 2.0 STRICT//", |
| 3151 |
"-//IETF//DTD HTML 2.0//EN" => 1, |
"-//IETF//DTD HTML 2.0//", |
| 3152 |
"-//IETF//DTD HTML 2.1E//EN" => 1, |
"-//IETF//DTD HTML 2.1E//", |
| 3153 |
"-//IETF//DTD HTML 3.0//EN" => 1, |
"-//IETF//DTD HTML 3.0//", |
| 3154 |
"-//IETF//DTD HTML 3.0//EN//" => 1, |
"-//IETF//DTD HTML 3.2 FINAL//", |
| 3155 |
"-//IETF//DTD HTML 3.2 FINAL//EN" => 1, |
"-//IETF//DTD HTML 3.2//", |
| 3156 |
"-//IETF//DTD HTML 3.2//EN" => 1, |
"-//IETF//DTD HTML 3//", |
| 3157 |
"-//IETF//DTD HTML 3//EN" => 1, |
"-//IETF//DTD HTML LEVEL 0//", |
| 3158 |
"-//IETF//DTD HTML LEVEL 0//EN" => 1, |
"-//IETF//DTD HTML LEVEL 1//", |
| 3159 |
"-//IETF//DTD HTML LEVEL 0//EN//2.0" => 1, |
"-//IETF//DTD HTML LEVEL 2//", |
| 3160 |
"-//IETF//DTD HTML LEVEL 1//EN" => 1, |
"-//IETF//DTD HTML LEVEL 3//", |
| 3161 |
"-//IETF//DTD HTML LEVEL 1//EN//2.0" => 1, |
"-//IETF//DTD HTML STRICT LEVEL 0//", |
| 3162 |
"-//IETF//DTD HTML LEVEL 2//EN" => 1, |
"-//IETF//DTD HTML STRICT LEVEL 1//", |
| 3163 |
"-//IETF//DTD HTML LEVEL 2//EN//2.0" => 1, |
"-//IETF//DTD HTML STRICT LEVEL 2//", |
| 3164 |
"-//IETF//DTD HTML LEVEL 3//EN" => 1, |
"-//IETF//DTD HTML STRICT LEVEL 3//", |
| 3165 |
"-//IETF//DTD HTML LEVEL 3//EN//3.0" => 1, |
"-//IETF//DTD HTML STRICT//", |
| 3166 |
"-//IETF//DTD HTML STRICT LEVEL 0//EN" => 1, |
"-//IETF//DTD HTML//", |
| 3167 |
"-//IETF//DTD HTML STRICT LEVEL 0//EN//2.0" => 1, |
"-//METRIUS//DTD METRIUS PRESENTATIONAL//", |
| 3168 |
"-//IETF//DTD HTML STRICT LEVEL 1//EN" => 1, |
"-//MICROSOFT//DTD INTERNET EXPLORER 2.0 HTML STRICT//", |
| 3169 |
"-//IETF//DTD HTML STRICT LEVEL 1//EN//2.0" => 1, |
"-//MICROSOFT//DTD INTERNET EXPLORER 2.0 HTML//", |
| 3170 |
"-//IETF//DTD HTML STRICT LEVEL 2//EN" => 1, |
"-//MICROSOFT//DTD INTERNET EXPLORER 2.0 TABLES//", |
| 3171 |
"-//IETF//DTD HTML STRICT LEVEL 2//EN//2.0" => 1, |
"-//MICROSOFT//DTD INTERNET EXPLORER 3.0 HTML STRICT//", |
| 3172 |
"-//IETF//DTD HTML STRICT LEVEL 3//EN" => 1, |
"-//MICROSOFT//DTD INTERNET EXPLORER 3.0 HTML//", |
| 3173 |
"-//IETF//DTD HTML STRICT LEVEL 3//EN//3.0" => 1, |
"-//MICROSOFT//DTD INTERNET EXPLORER 3.0 TABLES//", |
| 3174 |
"-//IETF//DTD HTML STRICT//EN" => 1, |
"-//NETSCAPE COMM. CORP.//DTD HTML//", |
| 3175 |
"-//IETF//DTD HTML STRICT//EN//2.0" => 1, |
"-//NETSCAPE COMM. CORP.//DTD STRICT HTML//", |
| 3176 |
"-//IETF//DTD HTML STRICT//EN//3.0" => 1, |
"-//O'REILLY AND ASSOCIATES//DTD HTML 2.0//", |
| 3177 |
"-//IETF//DTD HTML//EN" => 1, |
"-//O'REILLY AND ASSOCIATES//DTD HTML EXTENDED 1.0//", |
| 3178 |
"-//IETF//DTD HTML//EN//2.0" => 1, |
"-//O'REILLY AND ASSOCIATES//DTD HTML EXTENDED RELAXED 1.0//", |
| 3179 |
"-//IETF//DTD HTML//EN//3.0" => 1, |
"-//SOFTQUAD SOFTWARE//DTD HOTMETAL PRO 6.0::19990601::EXTENSIONS TO HTML 4.0//", |
| 3180 |
"-//METRIUS//DTD METRIUS PRESENTATIONAL//EN" => 1, |
"-//SOFTQUAD//DTD HOTMETAL PRO 4.0::19971010::EXTENSIONS TO HTML 4.0//", |
| 3181 |
"-//MICROSOFT//DTD INTERNET EXPLORER 2.0 HTML STRICT//EN" => 1, |
"-//SPYGLASS//DTD HTML 2.0 EXTENDED//", |
| 3182 |
"-//MICROSOFT//DTD INTERNET EXPLORER 2.0 HTML//EN" => 1, |
"-//SQ//DTD HTML 2.0 HOTMETAL + EXTENSIONS//", |
| 3183 |
"-//MICROSOFT//DTD INTERNET EXPLORER 2.0 TABLES//EN" => 1, |
"-//SUN MICROSYSTEMS CORP.//DTD HOTJAVA HTML//", |
| 3184 |
"-//MICROSOFT//DTD INTERNET EXPLORER 3.0 HTML STRICT//EN" => 1, |
"-//SUN MICROSYSTEMS CORP.//DTD HOTJAVA STRICT HTML//", |
| 3185 |
"-//MICROSOFT//DTD INTERNET EXPLORER 3.0 HTML//EN" => 1, |
"-//W3C//DTD HTML 3 1995-03-24//", |
| 3186 |
"-//MICROSOFT//DTD INTERNET EXPLORER 3.0 TABLES//EN" => 1, |
"-//W3C//DTD HTML 3.2 DRAFT//", |
| 3187 |
"-//NETSCAPE COMM. CORP.//DTD HTML//EN" => 1, |
"-//W3C//DTD HTML 3.2 FINAL//", |
| 3188 |
"-//NETSCAPE COMM. CORP.//DTD STRICT HTML//EN" => 1, |
"-//W3C//DTD HTML 3.2//", |
| 3189 |
"-//O'REILLY AND ASSOCIATES//DTD HTML 2.0//EN" => 1, |
"-//W3C//DTD HTML 3.2S DRAFT//", |
| 3190 |
"-//O'REILLY AND ASSOCIATES//DTD HTML EXTENDED 1.0//EN" => 1, |
"-//W3C//DTD HTML 4.0 FRAMESET//", |
| 3191 |
"-//O'REILLY AND ASSOCIATES//DTD HTML EXTENDED RELAXED 1.0//EN" => 1, |
"-//W3C//DTD HTML 4.0 TRANSITIONAL//", |
| 3192 |
"-//SOFTQUAD SOFTWARE//DTD HOTMETAL PRO 6.0::19990601::EXTENSIONS TO HTML 4.0//EN" => 1, |
"-//W3C//DTD HTML EXPERIMETNAL 19960712//", |
| 3193 |
"-//SOFTQUAD//DTD HOTMETAL PRO 4.0::19971010::EXTENSIONS TO HTML 4.0//EN" => 1, |
"-//W3C//DTD HTML EXPERIMENTAL 970421//", |
| 3194 |
"-//SPYGLASS//DTD HTML 2.0 EXTENDED//EN" => 1, |
"-//W3C//DTD W3 HTML//", |
| 3195 |
"-//SQ//DTD HTML 2.0 HOTMETAL + EXTENSIONS//EN" => 1, |
"-//W3O//DTD W3 HTML 3.0//", |
| 3196 |
"-//SUN MICROSYSTEMS CORP.//DTD HOTJAVA HTML//EN" => 1, |
"-//WEBTECHS//DTD MOZILLA HTML 2.0//", |
| 3197 |
"-//SUN MICROSYSTEMS CORP.//DTD HOTJAVA STRICT HTML//EN" => 1, |
"-//WEBTECHS//DTD MOZILLA HTML//", |
| 3198 |
"-//W3C//DTD HTML 3 1995-03-24//EN" => 1, |
]; # $prefix |
| 3199 |
"-//W3C//DTD HTML 3.2 DRAFT//EN" => 1, |
my $match; |
| 3200 |
"-//W3C//DTD HTML 3.2 FINAL//EN" => 1, |
for (@$prefix) { |
| 3201 |
"-//W3C//DTD HTML 3.2//EN" => 1, |
if (substr ($prefix, 0, length $_) eq $_) { |
| 3202 |
"-//W3C//DTD HTML 3.2S DRAFT//EN" => 1, |
$match = 1; |
| 3203 |
"-//W3C//DTD HTML 4.0 FRAMESET//EN" => 1, |
last; |
| 3204 |
"-//W3C//DTD HTML 4.0 TRANSITIONAL//EN" => 1, |
} |
| 3205 |
"-//W3C//DTD HTML EXPERIMETNAL 19960712//EN" => 1, |
} |
| 3206 |
"-//W3C//DTD HTML EXPERIMENTAL 970421//EN" => 1, |
if ($match or |
| 3207 |
"-//W3C//DTD W3 HTML//EN" => 1, |
$pubid eq "-//W3O//DTD W3 HTML STRICT 3.0//EN//" or |
| 3208 |
"-//W3O//DTD W3 HTML 3.0//EN" => 1, |
$pubid eq "-/W3C/DTD HTML 4.0 TRANSITIONAL/EN" or |
| 3209 |
"-//W3O//DTD W3 HTML 3.0//EN//" => 1, |
$pubid eq "HTML") { |
|
"-//W3O//DTD W3 HTML STRICT 3.0//EN//" => 1, |
|
|
"-//WEBTECHS//DTD MOZILLA HTML 2.0//EN" => 1, |
|
|
"-//WEBTECHS//DTD MOZILLA HTML//EN" => 1, |
|
|
"-/W3C/DTD HTML 4.0 TRANSITIONAL/EN" => 1, |
|
|
"HTML" => 1, |
|
|
}->{$pubid}) { |
|
| 3210 |
!!!cp ('t5'); |
!!!cp ('t5'); |
| 3211 |
$self->{document}->manakai_compat_mode ('quirks'); |
$self->{document}->manakai_compat_mode ('quirks'); |
| 3212 |
} elsif ($pubid eq "-//W3C//DTD HTML 4.01 FRAMESET//EN" or |
} elsif ($pubid =~ m[^-//W3C//DTD HTML 4.01 FRAMESET//] or |
| 3213 |
$pubid eq "-//W3C//DTD HTML 4.01 TRANSITIONAL//EN") { |
$pubid =~ m[^-//W3C//DTD HTML 4.01 TRANSITIONAL//]) { |
| 3214 |
if (defined $token->{system_identifier}) { |
if (defined $token->{system_identifier}) { |
| 3215 |
!!!cp ('t6'); |
!!!cp ('t6'); |
| 3216 |
$self->{document}->manakai_compat_mode ('quirks'); |
$self->{document}->manakai_compat_mode ('quirks'); |
| 3218 |
!!!cp ('t7'); |
!!!cp ('t7'); |
| 3219 |
$self->{document}->manakai_compat_mode ('limited quirks'); |
$self->{document}->manakai_compat_mode ('limited quirks'); |
| 3220 |
} |
} |
| 3221 |
} elsif ($pubid eq "-//W3C//DTD XHTML 1.0 FRAMESET//EN" or |
} elsif ($pubid =~ m[^-//W3C//DTD XHTML 1.0 FRAMESET//] or |
| 3222 |
$pubid eq "-//W3C//DTD XHTML 1.0 TRANSITIONAL//EN") { |
$pubid =~ m[^-//W3C//DTD XHTML 1.0 TRANSITIONAL//]) { |
| 3223 |
!!!cp ('t8'); |
!!!cp ('t8'); |
| 3224 |
$self->{document}->manakai_compat_mode ('limited quirks'); |
$self->{document}->manakai_compat_mode ('limited quirks'); |
| 3225 |
} else { |
} else { |
| 3232 |
my $sysid = $token->{system_identifier}; |
my $sysid = $token->{system_identifier}; |
| 3233 |
$sysid =~ tr/A-Z/a-z/; |
$sysid =~ tr/A-Z/a-z/; |
| 3234 |
if ($sysid eq "http://www.ibm.com/data/dtd/v11/ibmxhtml1-transitional.dtd") { |
if ($sysid eq "http://www.ibm.com/data/dtd/v11/ibmxhtml1-transitional.dtd") { |
| 3235 |
## TODO: Check the spec: PUBLIC "(limited quirks)" "(quirks)" |
## NOTE: Ensure that |PUBLIC "(limited quirks)" "(quirks)"| is |
| 3236 |
|
## marked as quirks. |
| 3237 |
$self->{document}->manakai_compat_mode ('quirks'); |
$self->{document}->manakai_compat_mode ('quirks'); |
| 3238 |
!!!cp ('t11'); |
!!!cp ('t11'); |
| 3239 |
} else { |
} else { |
| 4292 |
->{has_reference}); |
->{has_reference}); |
| 4293 |
} elsif ($token->{attributes}->{content}) { |
} elsif ($token->{attributes}->{content}) { |
| 4294 |
if ($token->{attributes}->{content}->{value} |
if ($token->{attributes}->{content}->{value} |
| 4295 |
=~ /\A[^;]*;[\x09-\x0D\x20]*[Cc][Hh][Aa][Rr][Ss][Ee][Tt] |
=~ /[Cc][Hh][Aa][Rr][Ss][Ee][Tt] |
| 4296 |
[\x09-\x0D\x20]*= |
[\x09-\x0D\x20]*= |
| 4297 |
[\x09-\x0D\x20]*(?>"([^"]*)"|'([^']*)'| |
[\x09-\x0D\x20]*(?>"([^"]*)"|'([^']*)'| |
| 4298 |
([^"'\x09-\x0D\x20][^\x09-\x0D\x20]*))/x) { |
([^"'\x09-\x0D\x20][^\x09-\x0D\x20\x3B]*))/x) { |
| 4299 |
!!!cp ('t107'); |
!!!cp ('t107'); |
| 4300 |
## NOTE: Whether the encoding is supported or not is handled |
## NOTE: Whether the encoding is supported or not is handled |
| 4301 |
## in the {change_encoding} callback. |
## in the {change_encoding} callback. |
| 6355 |
->{has_reference}); |
->{has_reference}); |
| 6356 |
} elsif ($token->{attributes}->{content}) { |
} elsif ($token->{attributes}->{content}) { |
| 6357 |
if ($token->{attributes}->{content}->{value} |
if ($token->{attributes}->{content}->{value} |
| 6358 |
=~ /\A[^;]*;[\x09-\x0D\x20]*[Cc][Hh][Aa][Rr][Ss][Ee][Tt] |
=~ /[Cc][Hh][Aa][Rr][Ss][Ee][Tt] |
| 6359 |
[\x09-\x0D\x20]*= |
[\x09-\x0D\x20]*= |
| 6360 |
[\x09-\x0D\x20]*(?>"([^"]*)"|'([^']*)'| |
[\x09-\x0D\x20]*(?>"([^"]*)"|'([^']*)'| |
| 6361 |
([^"'\x09-\x0D\x20][^\x09-\x0D\x20]*))/x) { |
([^"'\x09-\x0D\x20][^\x09-\x0D\x20\x3B]*))/x) { |
| 6362 |
!!!cp ('t336'); |
!!!cp ('t336'); |
| 6363 |
## NOTE: Whether the encoding is supported or not is handled |
## NOTE: Whether the encoding is supported or not is handled |
| 6364 |
## in the {change_encoding} callback. |
## in the {change_encoding} callback. |