/[suikacvs]/markup/html/whatpm/Whatpm/HTML.pm.src

Diff of /markup/html/whatpm/Whatpm/HTML.pm.src

Parent Directory | Revision Log | View Patch Patch

-revision 1.106 by wakaba,
Sun Mar  9 10:31:19 2008 UTC
+revision 1.170 by wakaba,
Sat Sep 13 12:25:44 2008 UTC
 Line 8 
 use Error qw(:try);
  ## doc.write ('');
  ## alert (doc.compatMode);
- ## TODO: Control charcters and noncharacters are not allowed (HTML5 revision 1263)
+ require IO::Handle;
- ## TODO: 1252 parse error (revision 1264)
- ## TODO: 8859-11 = 874 (revision 1271)
+ my $HTML_NS = q<http://www.w3.org/1999/xhtml>;
+ my $MML_NS = q<http://www.w3.org/1998/Math/MathML>;
- my $permitted_slash_tag_name = {
+ my $SVG_NS = q<http://www.w3.org/2000/svg>;
-   base => 1,
+ my $XLINK_NS = q<http://www.w3.org/1999/xlink>;
-   link => 1,
+ my $XML_NS = q<http://www.w3.org/XML/1998/namespace>;
-   meta => 1,
+ my $XMLNS_NS = q<http://www.w3.org/2000/xmlns/>;
-   hr => 1,
-   br => 1,
+ sub A_EL () { 0b1 }
-   img => 1,
+ sub ADDRESS_EL () { 0b10 }
-   embed => 1,
+ sub BODY_EL () { 0b100 }
-   param => 1,
+ sub BUTTON_EL () { 0b1000 }
-   area => 1,
+ sub CAPTION_EL () { 0b10000 }
-   col => 1,
+ sub DD_EL () { 0b100000 }
-   input => 1,
+ sub DIV_EL () { 0b1000000 }
+ sub DT_EL () { 0b10000000 }
+ sub FORM_EL () { 0b100000000 }
+ sub FORMATTING_EL () { 0b1000000000 }
+ sub FRAMESET_EL () { 0b10000000000 }
+ sub HEADING_EL () { 0b100000000000 }
+ sub HTML_EL () { 0b1000000000000 }
+ sub LI_EL () { 0b10000000000000 }
+ sub NOBR_EL () { 0b100000000000000 }
+ sub OPTION_EL () { 0b1000000000000000 }
+ sub OPTGROUP_EL () { 0b10000000000000000 }
+ sub P_EL () { 0b100000000000000000 }
+ sub SELECT_EL () { 0b1000000000000000000 }
+ sub TABLE_EL () { 0b10000000000000000000 }
+ sub TABLE_CELL_EL () { 0b100000000000000000000 }
+ sub TABLE_ROW_EL () { 0b1000000000000000000000 }
+ sub TABLE_ROW_GROUP_EL () { 0b10000000000000000000000 }
+ sub MISC_SCOPING_EL () { 0b100000000000000000000000 }
+ sub MISC_SPECIAL_EL () { 0b1000000000000000000000000 }
+ sub FOREIGN_EL () { 0b10000000000000000000000000 }
+ sub FOREIGN_FLOW_CONTENT_EL () { 0b100000000000000000000000000 }
+ sub MML_AXML_EL () { 0b1000000000000000000000000000 }
+ sub RUBY_EL () { 0b10000000000000000000000000000 }
+ sub RUBY_COMPONENT_EL () { 0b100000000000000000000000000000 }
+ sub TABLE_ROWS_EL () {
+   TABLE_EL |
+   TABLE_ROW_EL |
+   TABLE_ROW_GROUP_EL
+ }
+ ## NOTE: Used in "generate implied end tags" algorithm.
+ ## NOTE: A modified version of END_TAG_OPTIONAL_EL is also used by the
+ ## implementation of the "generate implied end tags" algorithm (search
+ ## for the function mae).
+ sub END_TAG_OPTIONAL_EL () {
+   DD_EL |
+   DT_EL |
+   LI_EL |
+   P_EL |
+   RUBY_COMPONENT_EL
+ }
+ ## NOTE: Used in </body> and EOF algorithms.
+ sub ALL_END_TAG_OPTIONAL_EL () {
+   DD_EL |
+   DT_EL |
+   LI_EL |
+   P_EL |
+   BODY_EL |
+   HTML_EL |
+   TABLE_CELL_EL |
+   TABLE_ROW_EL |
+   TABLE_ROW_GROUP_EL
+ }
+ sub SCOPING_EL () {
+   BUTTON_EL |
+   CAPTION_EL |
+   HTML_EL |
+   TABLE_EL |
+   TABLE_CELL_EL |
+   MISC_SCOPING_EL
+ }
+ sub TABLE_SCOPING_EL () {
+   HTML_EL |
+   TABLE_EL
+ }
+ sub TABLE_ROWS_SCOPING_EL () {
+   HTML_EL |
+   TABLE_ROW_GROUP_EL
+ }
+ sub TABLE_ROW_SCOPING_EL () {
+   HTML_EL |
+   TABLE_ROW_EL
+ }
+ sub SPECIAL_EL () {
+   ADDRESS_EL |
+   BODY_EL |
+   DIV_EL |
+   DD_EL |
+   DT_EL |
+   LI_EL |
+   P_EL |
+   FORM_EL |
+   FRAMESET_EL |
+   HEADING_EL |
+   OPTION_EL |
+   OPTGROUP_EL |
+   SELECT_EL |
+   TABLE_ROW_EL |
+   TABLE_ROW_GROUP_EL |
+   MISC_SPECIAL_EL
+ }
+ my $el_category = {
+   a => A_EL | FORMATTING_EL,
+   address => ADDRESS_EL,
+   applet => MISC_SCOPING_EL,
+   area => MISC_SPECIAL_EL,
+   b => FORMATTING_EL,
+   base => MISC_SPECIAL_EL,
+   basefont => MISC_SPECIAL_EL,
+   bgsound => MISC_SPECIAL_EL,
+   big => FORMATTING_EL,
+   blockquote => MISC_SPECIAL_EL,
+   body => BODY_EL,
+   br => MISC_SPECIAL_EL,
+   button => BUTTON_EL,
+   caption => CAPTION_EL,
+   center => MISC_SPECIAL_EL,
+   col => MISC_SPECIAL_EL,
+   colgroup => MISC_SPECIAL_EL,
+   dd => DD_EL,
+   dir => MISC_SPECIAL_EL,
+   div => DIV_EL,
+   dl => MISC_SPECIAL_EL,
+   dt => DT_EL,
+   em => FORMATTING_EL,
+   embed => MISC_SPECIAL_EL,
+   fieldset => MISC_SPECIAL_EL,
+   font => FORMATTING_EL,
+   form => FORM_EL,
+   frame => MISC_SPECIAL_EL,
+   frameset => FRAMESET_EL,
+   h1 => HEADING_EL,
+   h2 => HEADING_EL,
+   h3 => HEADING_EL,
+   h4 => HEADING_EL,
+   h5 => HEADING_EL,
+   h6 => HEADING_EL,
+   head => MISC_SPECIAL_EL,
+   hr => MISC_SPECIAL_EL,
+   html => HTML_EL,
+   i => FORMATTING_EL,
+   iframe => MISC_SPECIAL_EL,
+   img => MISC_SPECIAL_EL,
+   input => MISC_SPECIAL_EL,
+   isindex => MISC_SPECIAL_EL,
+   li => LI_EL,
+   link => MISC_SPECIAL_EL,
+   listing => MISC_SPECIAL_EL,
+   marquee => MISC_SCOPING_EL,
+   menu => MISC_SPECIAL_EL,
+   meta => MISC_SPECIAL_EL,
+   nobr => NOBR_EL | FORMATTING_EL,
+   noembed => MISC_SPECIAL_EL,
+   noframes => MISC_SPECIAL_EL,
+   noscript => MISC_SPECIAL_EL,
+   object => MISC_SCOPING_EL,
+   ol => MISC_SPECIAL_EL,
+   optgroup => OPTGROUP_EL,
+   option => OPTION_EL,
+   p => P_EL,
+   param => MISC_SPECIAL_EL,
+   plaintext => MISC_SPECIAL_EL,
+   pre => MISC_SPECIAL_EL,
+   rp => RUBY_COMPONENT_EL,
+   rt => RUBY_COMPONENT_EL,
+   ruby => RUBY_EL,
+   s => FORMATTING_EL,
+   script => MISC_SPECIAL_EL,
+   select => SELECT_EL,
+   small => FORMATTING_EL,
+   spacer => MISC_SPECIAL_EL,
+   strike => FORMATTING_EL,
+   strong => FORMATTING_EL,
+   style => MISC_SPECIAL_EL,
+   table => TABLE_EL,
+   tbody => TABLE_ROW_GROUP_EL,
+   td => TABLE_CELL_EL,
+   textarea => MISC_SPECIAL_EL,
+   tfoot => TABLE_ROW_GROUP_EL,
+   th => TABLE_CELL_EL,
+   thead => TABLE_ROW_GROUP_EL,
+   title => MISC_SPECIAL_EL,
+   tr => TABLE_ROW_EL,
+   tt => FORMATTING_EL,
+   u => FORMATTING_EL,
+   ul => MISC_SPECIAL_EL,
+   wbr => MISC_SPECIAL_EL,
+ };
+ my $el_category_f = {
+   $MML_NS => {
+     'annotation-xml' => MML_AXML_EL,
+     mi => FOREIGN_FLOW_CONTENT_EL,
+     mo => FOREIGN_FLOW_CONTENT_EL,
+     mn => FOREIGN_FLOW_CONTENT_EL,
+     ms => FOREIGN_FLOW_CONTENT_EL,
+     mtext => FOREIGN_FLOW_CONTENT_EL,
+   },
+   $SVG_NS => {
+     foreignObject => FOREIGN_FLOW_CONTENT_EL,
+     desc => FOREIGN_FLOW_CONTENT_EL,
+     title => FOREIGN_FLOW_CONTENT_EL,
+   },
+   ## NOTE: In addition, FOREIGN_EL is set to non-HTML elements.
+ };
+ my $svg_attr_name = {
+   attributename => 'attributeName',
+   attributetype => 'attributeType',
+   basefrequency => 'baseFrequency',
+   baseprofile => 'baseProfile',
+   calcmode => 'calcMode',
+   clippathunits => 'clipPathUnits',
+   contentscripttype => 'contentScriptType',
+   contentstyletype => 'contentStyleType',
+   diffuseconstant => 'diffuseConstant',
+   edgemode => 'edgeMode',
+   externalresourcesrequired => 'externalResourcesRequired',
+   filterres => 'filterRes',
+   filterunits => 'filterUnits',
+   glyphref => 'glyphRef',
+   gradienttransform => 'gradientTransform',
+   gradientunits => 'gradientUnits',
+   kernelmatrix => 'kernelMatrix',
+   kernelunitlength => 'kernelUnitLength',
+   keypoints => 'keyPoints',
+   keysplines => 'keySplines',
+   keytimes => 'keyTimes',
+   lengthadjust => 'lengthAdjust',
+   limitingconeangle => 'limitingConeAngle',
+   markerheight => 'markerHeight',
+   markerunits => 'markerUnits',
+   markerwidth => 'markerWidth',
+   maskcontentunits => 'maskContentUnits',
+   maskunits => 'maskUnits',
+   numoctaves => 'numOctaves',
+   pathlength => 'pathLength',
+   patterncontentunits => 'patternContentUnits',
+   patterntransform => 'patternTransform',
+   patternunits => 'patternUnits',
+   pointsatx => 'pointsAtX',
+   pointsaty => 'pointsAtY',
+   pointsatz => 'pointsAtZ',
+   preservealpha => 'preserveAlpha',
+   preserveaspectratio => 'preserveAspectRatio',
+   primitiveunits => 'primitiveUnits',
+   refx => 'refX',
+   refy => 'refY',
+   repeatcount => 'repeatCount',
+   repeatdur => 'repeatDur',
+   requiredextensions => 'requiredExtensions',
+   requiredfeatures => 'requiredFeatures',
+   specularconstant => 'specularConstant',
+   specularexponent => 'specularExponent',
+   spreadmethod => 'spreadMethod',
+   startoffset => 'startOffset',
+   stddeviation => 'stdDeviation',
+   stitchtiles => 'stitchTiles',
+   surfacescale => 'surfaceScale',
+   systemlanguage => 'systemLanguage',
+   tablevalues => 'tableValues',
+   targetx => 'targetX',
+   targety => 'targetY',
+   textlength => 'textLength',
+   viewbox => 'viewBox',
+   viewtarget => 'viewTarget',
+   xchannelselector => 'xChannelSelector',
+   ychannelselector => 'yChannelSelector',
+   zoomandpan => 'zoomAndPan',
  };
+ my $foreign_attr_xname = {
+   'xlink:actuate' => [$XLINK_NS, ['xlink', 'actuate']],
+   'xlink:arcrole' => [$XLINK_NS, ['xlink', 'arcrole']],
+   'xlink:href' => [$XLINK_NS, ['xlink', 'href']],
+   'xlink:role' => [$XLINK_NS, ['xlink', 'role']],
+   'xlink:show' => [$XLINK_NS, ['xlink', 'show']],
+   'xlink:title' => [$XLINK_NS, ['xlink', 'title']],
+   'xlink:type' => [$XLINK_NS, ['xlink', 'type']],
+   'xml:base' => [$XML_NS, ['xml', 'base']],
+   'xml:lang' => [$XML_NS, ['xml', 'lang']],
+   'xml:space' => [$XML_NS, ['xml', 'space']],
+   'xmlns' => [$XMLNS_NS, [undef, 'xmlns']],
+   'xmlns:xlink' => [$XMLNS_NS, ['xmlns', 'xlink']],
+ };
+ ## ISSUE: xmlns:xlink="non-xlink-ns" is not an error.
  my $c1_entity_char = {
   0x80 => 0x20AC,
   0x81 => 0xFFFD,
-Line 61 
 my $c1_entity_char = {
+Line 347 
 my $c1_entity_char = {
   0x9F => 0x0178,
  }; # $c1_entity_char
- my $special_category = {
-   address => 1, area => 1, base => 1, basefont => 1, bgsound => 1,
-   blockquote => 1, body => 1, br => 1, center => 1, col => 1, colgroup => 1,
-   dd => 1, dir => 1, div => 1, dl => 1, dt => 1, embed => 1, fieldset => 1,
-   form => 1, frame => 1, frameset => 1, h1 => 1, h2 => 1, h3 => 1,
-   h4 => 1, h5 => 1, h6 => 1, head => 1, hr => 1, iframe => 1, image => 1,
-   img => 1, input => 1, isindex => 1, li => 1, link => 1, listing => 1,
-   menu => 1, meta => 1, noembed => 1, noframes => 1, noscript => 1,
-   ol => 1, optgroup => 1, option => 1, p => 1, param => 1, plaintext => 1,
-   pre => 1, script => 1, select => 1, spacer => 1, style => 1, tbody => 1,
-   textarea => 1, tfoot => 1, thead => 1, title => 1, tr => 1, ul => 1, wbr => 1,
- };
- my $scoping_category = {
-   applet => 1, button => 1, caption => 1, html => 1, marquee => 1, object => 1,
-   table => 1, td => 1, th => 1,
- };
- my $formatting_category = {
-   a => 1, b => 1, big => 1, em => 1, font => 1, i => 1, nobr => 1,
-   s => 1, small => 1, strile => 1, strong => 1, tt => 1, u => 1,
- };
- # $phrasing_category: all other elements
  sub parse_byte_string ($$$$;$) {
+   my $self = shift;
+   my $charset_name = shift;
+   open my $input, '<', ref $_[0] ? $_[0] : \($_[0]);
+   return $self->parse_byte_stream ($charset_name, $input, @_[1..$#_]);
+ } # parse_byte_string
+ sub parse_byte_stream ($$$$;$$) {
+   # my ($self, $charset_name, $byte_stream, $doc, $onerror, $get_wrapper) = @_;
    my $self = ref $_[0] ? shift : shift->new;
-   my $charset = shift;
+   my $charset_name = shift;
-   my $bytes_s = ref $_[0] ? $_[0] : \($_[0]);
+   my $byte_stream = $_[0];
-   my $s;
-   if (defined $charset) {
-     require Encode; ## TODO: decode(utf8) don't delete BOM
-     $s = \ (Encode::decode ($charset, $$bytes_s));
-     $self->{input_encoding} = lc $charset; ## TODO: normalize name
-     $self->{confident} = 1;
-   } else {
-     ## TODO: Implement HTML5 detection algorithm
-     require Whatpm::Charset::UniversalCharDet;
-     $charset = Whatpm::Charset::UniversalCharDet->detect_byte_string
-         (substr ($$bytes_s, 0, 1024));
-     $charset ||= 'windows-1252';
-     $s = \ (Encode::decode ($charset, $$bytes_s));
-     $self->{input_encoding} = $charset;
-     $self->{confident} = 0;
-   }
-   $self->{change_encoding} = sub {
+   my $onerror = $_[2] || sub {
-     my $self = shift;
+     my (%opt) = @_;
-     my $charset = lc shift;
+     warn "Parse error ($opt{type})\n";
-     ## TODO: if $charset is supported
+   };
-     ## TODO: normalize charset name
+   $self->{parse_error} = $onerror; # updated later by parse_char_string
-     ## "Change the encoding" algorithm:
+   my $get_wrapper = $_[3] || sub ($) {
+     return $_[0]; # $_[0] = byte stream handle, returned = arg to char handle
-     ## Step 1
+   };
-     if ($charset eq 'utf-16') { ## ISSUE: UTF-16BE -> UTF-8? UTF-16LE -> UTF-8?
-       $charset = 'utf-8';
+   ## HTML5 encoding sniffing algorithm
+   require Message::Charset::Info;
+   my $charset;
+   my $buffer;
+   my ($char_stream, $e_status);
+   SNIFFING: {
+     ## NOTE: By setting |allow_fallback| option true when the
+     ## |get_decode_handle| method is invoked, we ignore what the HTML5
+     ## spec requires, i.e. unsupported encoding should be ignored.
+       ## TODO: We should not do this unless the parser is invoked
+       ## in the conformance checking mode, in which this behavior
+       ## would be useful.
+     ## Step 1
+     if (defined $charset_name) {
+       $charset = Message::Charset::Info->get_by_html_name ($charset_name);
+           ## TODO: Is this ok?  Transfer protocol's parameter should be
+           ## interpreted in its semantics?
+       ## ISSUE: Contrary to the spec, an unsupported encoding is not ignored here.
+       ($char_stream, $e_status) = $charset->get_decode_handle
+           ($byte_stream, allow_error_reporting => 1,
+            allow_fallback => 1);
+       if ($char_stream) {
+         $self->{confident} = 1;
+         last SNIFFING;
+       } else {
+         ## TODO: unsupported error
+       }
      }
      ## Step 2
-     if (defined $self->{input_encoding} and
+     my $byte_buffer = '';
-         $self->{input_encoding} eq $charset) {
+     for (1..1024) {
+       my $char = $byte_stream->getc;
+       last unless defined $char;
+       $byte_buffer .= $char;
+     } ## TODO: timeout
+     ## Step 3
+     if ($byte_buffer =~ /^\xFE\xFF/) {
+       $charset = Message::Charset::Info->get_by_html_name ('utf-16be');
+       ($char_stream, $e_status) = $charset->get_decode_handle
+           ($byte_stream, allow_error_reporting => 1,
+            allow_fallback => 1, byte_buffer => \$byte_buffer);
        $self->{confident} = 1;
-       return;
+       last SNIFFING;
+     } elsif ($byte_buffer =~ /^\xFF\xFE/) {
+       $charset = Message::Charset::Info->get_by_html_name ('utf-16le');
+       ($char_stream, $e_status) = $charset->get_decode_handle
+           ($byte_stream, allow_error_reporting => 1,
+            allow_fallback => 1, byte_buffer => \$byte_buffer);
+       $self->{confident} = 1;
+       last SNIFFING;
+     } elsif ($byte_buffer =~ /^\xEF\xBB\xBF/) {
+       $charset = Message::Charset::Info->get_by_html_name ('utf-8');
+       ($char_stream, $e_status) = $charset->get_decode_handle
+           ($byte_stream, allow_error_reporting => 1,
+            allow_fallback => 1, byte_buffer => \$byte_buffer);
+       $self->{confident} = 1;
+       last SNIFFING;
      }
-     !!!parse-error (type => 'charset label detected:'.$self->{input_encoding}.
+     ## Step 4
-         ':'.$charset, level => 'w');
+     ## TODO: <meta charset>
-     ## Step 3
+     ## Step 5
-     # if (can) {
+     ## TODO: from history
-       ## change the encoding on the fly.
-       #$self->{confident} = 1;
-       #return;
-     # }
-     ## Step 4
+     ## Step 6
-     throw Whatpm::HTML::RestartParser (charset => $charset);
+     require Whatpm::Charset::UniversalCharDet;
+     $charset_name = Whatpm::Charset::UniversalCharDet->detect_byte_string
+         ($byte_buffer);
+     if (defined $charset_name) {
+       $charset = Message::Charset::Info->get_by_html_name ($charset_name);
+       ## ISSUE: Contrary to the spec, an unsupported encoding is not ignored here.
+       require Whatpm::Charset::DecodeHandle;
+       $buffer = Whatpm::Charset::DecodeHandle::ByteBuffer->new
+           ($byte_stream);
+       ($char_stream, $e_status) = $charset->get_decode_handle
+           ($buffer, allow_error_reporting => 1,
+            allow_fallback => 1, byte_buffer => \$byte_buffer);
+       if ($char_stream) {
+         $buffer->{buffer} = $byte_buffer;
+         !!!parse-error (type => 'sniffing:chardet',
+                         text => $charset_name,
+                         level => $self->{level}->{info},
+                         layer => 'encode',
+                         line => 1, column => 1);
+         $self->{confident} = 0;
+         last SNIFFING;
+       }
+     }
+     ## Step 7: default
+     ## TODO: Make this configurable.
+     $charset = Message::Charset::Info->get_by_html_name ('windows-1252');
+         ## NOTE: We choose |windows-1252| here, since |utf-8| should be
+         ## detectable in the step 6.
+     require Whatpm::Charset::DecodeHandle;
+     $buffer = Whatpm::Charset::DecodeHandle::ByteBuffer->new
+         ($byte_stream);
+     ($char_stream, $e_status)
+         = $charset->get_decode_handle ($buffer,
+                                        allow_error_reporting => 1,
+                                        allow_fallback => 1,
+                                        byte_buffer => \$byte_buffer);
+     $buffer->{buffer} = $byte_buffer;
+     !!!parse-error (type => 'sniffing:default',
+                     text => 'windows-1252',
+                     level => $self->{level}->{info},
+                     line => 1, column => 1,
+                     layer => 'encode');
+     $self->{confident} = 0;
+   } # SNIFFING
+   if ($e_status & Message::Charset::Info::FALLBACK_ENCODING_IMPL ()) {
+     $self->{input_encoding} = $charset->get_iana_name; ## TODO: Should we set actual charset decoder's encoding name?
+     !!!parse-error (type => 'chardecode:fallback',
+                     #text => $self->{input_encoding},
+                     level => $self->{level}->{uncertain},
+                     line => 1, column => 1,
+                     layer => 'encode');
+   } elsif (not ($e_status &
+                 Message::Charset::Info::ERROR_REPORTING_ENCODING_IMPL())) {
+     $self->{input_encoding} = $charset->get_iana_name;
+     !!!parse-error (type => 'chardecode:no error',
+                     text => $self->{input_encoding},
+                     level => $self->{level}->{uncertain},
+                     line => 1, column => 1,
+                     layer => 'encode');
+   } else {
+     $self->{input_encoding} = $charset->get_iana_name;
+   }
+   $self->{change_encoding} = sub {
+     my $self = shift;
+     $charset_name = shift;
+     my $token = shift;
+     $charset = Message::Charset::Info->get_by_html_name ($charset_name);
+     ($char_stream, $e_status) = $charset->get_decode_handle
+         ($byte_stream, allow_error_reporting => 1, allow_fallback => 1,
+          byte_buffer => \ $buffer->{buffer});
+     if ($char_stream) { # if supported
+       ## "Change the encoding" algorithm:
+       ## Step 1
+       if ($charset->{category} &
+           Message::Charset::Info::CHARSET_CATEGORY_UTF16 ()) {
+         $charset = Message::Charset::Info->get_by_html_name ('utf-8');
+         ($char_stream, $e_status) = $charset->get_decode_handle
+             ($byte_stream,
+              byte_buffer => \ $buffer->{buffer});
+       }
+       $charset_name = $charset->get_iana_name;
+       ## Step 2
+       if (defined $self->{input_encoding} and
+           $self->{input_encoding} eq $charset_name) {
+         !!!parse-error (type => 'charset label:matching',
+                         text => $charset_name,
+                         level => $self->{level}->{info});
+         $self->{confident} = 1;
+         return;
+       }
+       !!!parse-error (type => 'charset label detected',
+                       text => $self->{input_encoding},
+                       value => $charset_name,
+                       level => $self->{level}->{warn},
+                       token => $token);
+       ## Step 3
+       # if (can) {
+         ## change the encoding on the fly.
+         #$self->{confident} = 1;
+         #return;
+       # }
+       ## Step 4
+       throw Whatpm::HTML::RestartParser ();
+     }
    }; # $self->{change_encoding}
+   my $char_onerror = sub {
+     my (undef, $type, %opt) = @_;
+     !!!parse-error (layer => 'encode',
+                     %opt, type => $type,
+                     line => $self->{line}, column => $self->{column} + 1);
+     if ($opt{octets}) {
+       ${$opt{octets}} = "\x{FFFD}"; # replacement character
+     }
+   };
+   my $wrapped_char_stream = $get_wrapper->($char_stream);
+   $wrapped_char_stream->onerror ($char_onerror);
    my @args = @_; shift @args; # $s
    my $return;
    try {
-     $return = $self->parse_char_string ($s, @args);
+     $return = $self->parse_char_stream ($wrapped_char_stream, @args);
    } catch Whatpm::HTML::RestartParser with {
-     my $charset = shift->{charset};
+     ## NOTE: Invoked after {change_encoding}.
-     $s = \ (Encode::decode ($charset, $$bytes_s));
-     $self->{input_encoding} = $charset; ## TODO: normalize
+     if ($e_status & Message::Charset::Info::FALLBACK_ENCODING_IMPL ()) {
+       $self->{input_encoding} = $charset->get_iana_name; ## TODO: Should we set actual charset decoder's encoding name?
+       !!!parse-error (type => 'chardecode:fallback',
+                       level => $self->{level}->{uncertain},
+                       #text => $self->{input_encoding},
+                       line => 1, column => 1,
+                       layer => 'encode');
+     } elsif (not ($e_status &
+                   Message::Charset::Info::ERROR_REPORTING_ENCODING_IMPL())) {
+       $self->{input_encoding} = $charset->get_iana_name;
+       !!!parse-error (type => 'chardecode:no error',
+                       text => $self->{input_encoding},
+                       level => $self->{level}->{uncertain},
+                       line => 1, column => 1,
+                       layer => 'encode');
+     } else {
+       $self->{input_encoding} = $charset->get_iana_name;
+     }
      $self->{confident} = 1;
-     $return = $self->parse_char_string ($s, @args);
+     $wrapped_char_stream = $get_wrapper->($char_stream);
+     $wrapped_char_stream->onerror ($char_onerror);
+     $return = $self->parse_char_stream ($wrapped_char_stream, @args);
    };
    return $return;
- } # parse_byte_string
+ } # parse_byte_stream
  ## NOTE: HTML5 spec says that the encoding layer MUST NOT strip BOM
  ## and the HTML layer MUST ignore it.  However, we do strip the BOM in
-Line 162 
 sub parse_byte_string ($$$$;$) {
+Line 615 
 sub parse_byte_string ($$$$;$) {
  ## such as |parse_byte_string| in this module, must ensure that it does
  ## strip the BOM and never strip any ZWNBSP.
- *parse_char_string = \&parse_string;
+ sub parse_char_string ($$$;$$) {
+   #my ($self, $s, $doc, $onerror, $get_wrapper) = @_;
+   my $self = shift;
+   require utf8;
+   my $s = ref $_[0] ? $_[0] : \($_[0]);
+   open my $input, '<' . (utf8::is_utf8 ($$s) ? ':utf8' : ''), $s;
+   if ($_[3]) {
+     $input = $_[3]->($input);
+   }
+   return $self->parse_char_stream ($input, @_[1..$#_]);
+ } # parse_char_string
+ *parse_string = \&parse_char_string; ## NOTE: Alias for backward compatibility.
- sub parse_string ($$$;$) {
+ sub parse_char_stream ($$$;$) {
    my $self = ref $_[0] ? shift : shift->new;
-   my $s = ref $_[0] ? $_[0] : \($_[0]);
+   my $input = $_[0];
    $self->{document} = $_[1];
    @{$self->{document}->child_nodes} = ();
-Line 177 
 sub parse_string ($$$;$) {
+Line 641 
 sub parse_string ($$$;$) {
        if defined $self->{input_encoding};
    my $i = 0;
-   my $line = 1;
+   $self->{line_prev} = $self->{line} = 1;
-   my $column = 0;
+   $self->{column_prev} = $self->{column} = 0;
    $self->{set_next_char} = sub {
      my $self = shift;
      pop @{$self->{prev_char}};
      unshift @{$self->{prev_char}}, $self->{next_char};
-     $self->{next_char} = -1 and return if $i >= length $$s;
+     my $char;
-     $self->{next_char} = ord substr $$s, $i++, 1;
+     if (defined $self->{next_next_char}) {
-     $column++;
+       $char = $self->{next_next_char};
+       delete $self->{next_next_char};
+     } else {
+       $char = $input->getc;
+     }
+     $self->{next_char} = -1 and return unless defined $char;
+     $self->{next_char} = ord $char;
+     ($self->{line_prev}, $self->{column_prev})
+         = ($self->{line}, $self->{column});
+     $self->{column}++;
      if ($self->{next_char} == 0x000A) { # LF
-       $line++;
+       !!!cp ('j1');
-       $column = 0;
+       $self->{line}++;
+       $self->{column} = 0;
      } elsif ($self->{next_char} == 0x000D) { # CR
-       $i++ if substr ($$s, $i, 1) eq "\x0A";
+       !!!cp ('j2');
+ ## TODO: support for abort/streaming
+       my $next = $input->getc;
+       if (defined $next and $next ne "\x0A") {
+         $self->{next_next_char} = $next;
+       }
        $self->{next_char} = 0x000A; # LF # MUST
-       $line++;
+       $self->{line}++;
-       $column = 0;
+       $self->{column} = 0;
      } elsif ($self->{next_char} > 0x10FFFF) {
+       !!!cp ('j3');
        $self->{next_char} = 0xFFFD; # REPLACEMENT CHARACTER # MUST
      } elsif ($self->{next_char} == 0x0000) { # NULL
+       !!!cp ('j4');
        !!!parse-error (type => 'NULL');
        $self->{next_char} = 0xFFFD; # REPLACEMENT CHARACTER # MUST
+     } elsif ($self->{next_char} <= 0x0008 or
+              (0x000E <= $self->{next_char} and $self->{next_char} <= 0x001F) or
+              (0x007F <= $self->{next_char} and $self->{next_char} <= 0x009F) or
+              (0xD800 <= $self->{next_char} and $self->{next_char} <= 0xDFFF) or
+              (0xFDD0 <= $self->{next_char} and $self->{next_char} <= 0xFDDF) or
+              {
+                0xFFFE => 1, 0xFFFF => 1, 0x1FFFE => 1, 0x1FFFF => 1,
+                0x2FFFE => 1, 0x2FFFF => 1, 0x3FFFE => 1, 0x3FFFF => 1,
+                0x4FFFE => 1, 0x4FFFF => 1, 0x5FFFE => 1, 0x5FFFF => 1,
+                0x6FFFE => 1, 0x6FFFF => 1, 0x7FFFE => 1, 0x7FFFF => 1,
+                0x8FFFE => 1, 0x8FFFF => 1, 0x9FFFE => 1, 0x9FFFF => 1,
+                0xAFFFE => 1, 0xAFFFF => 1, 0xBFFFE => 1, 0xBFFFF => 1,
+                0xCFFFE => 1, 0xCFFFF => 1, 0xDFFFE => 1, 0xDFFFF => 1,
+                0xEFFFE => 1, 0xEFFFF => 1, 0xFFFFE => 1, 0xFFFFF => 1,
+                0x10FFFE => 1, 0x10FFFF => 1,
+              }->{$self->{next_char}}) {
+       !!!cp ('j5');
+       if ($self->{next_char} < 0x10000) {
+         !!!parse-error (type => 'control char',
+                         text => (sprintf 'U+%04X', $self->{next_char}));
+       } else {
+         !!!parse-error (type => 'control char',
+                         text => (sprintf 'U-%08X', $self->{next_char}));
+       }
      }
    };
    $self->{prev_char} = [-1, -1, -1];
-Line 209 
 sub parse_string ($$$;$) {
+Line 715 
 sub parse_string ($$$;$) {
    my $onerror = $_[2] || sub {
      my (%opt) = @_;
-     warn "Parse error ($opt{type}) at line $opt{line} column $opt{column}\n";
+     my $line = $opt{token} ? $opt{token}->{line} : $opt{line};
+     my $column = $opt{token} ? $opt{token}->{column} : $opt{column};
+     warn "Parse error ($opt{type}) at line $line column $column\n";
    };
    $self->{parse_error} = sub {
-     $onerror->(@_, line => $line, column => $column);
+     $onerror->(line => $self->{line}, column => $self->{column}, @_);
    };
    $self->_initialize_tokenizer;
-Line 220 
 sub parse_string ($$$;$) {
+Line 728 
 sub parse_string ($$$;$) {
    $self->_construct_tree;
    $self->_terminate_tree_constructor;
+   delete $self->{parse_error}; # remove loop
    return $self->{document};
- } # parse_string
+ } # parse_char_stream
  sub new ($) {
    my $class = shift;
-   my $self = bless {}, $class;
+   my $self = bless {
+     level => {must => 'm',
+               should => 's',
+               warn => 'w',
+               info => 'i',
+               uncertain => 'u'},
+   }, $class;
    $self->{set_next_char} = sub {
      $self->{next_char} = -1;
    };
-Line 254 
 sub RCDATA_CONTENT_MODEL () { CM_ENTITY
+Line 770 
 sub RCDATA_CONTENT_MODEL () { CM_ENTITY
  sub PCDATA_CONTENT_MODEL () { CM_ENTITY | CM_FULL_MARKUP }
  sub DATA_STATE () { 0 }
- sub ENTITY_DATA_STATE () { 1 }
+ #sub ENTITY_DATA_STATE () { 1 }
  sub TAG_OPEN_STATE () { 2 }
  sub CLOSE_TAG_OPEN_STATE () { 3 }
  sub TAG_NAME_STATE () { 4 }
-Line 265 
 sub BEFORE_ATTRIBUTE_VALUE_STATE () { 8
+Line 781 
 sub BEFORE_ATTRIBUTE_VALUE_STATE () { 8
  sub ATTRIBUTE_VALUE_DOUBLE_QUOTED_STATE () { 9 }
  sub ATTRIBUTE_VALUE_SINGLE_QUOTED_STATE () { 10 }
  sub ATTRIBUTE_VALUE_UNQUOTED_STATE () { 11 }
- sub ENTITY_IN_ATTRIBUTE_VALUE_STATE () { 12 }
+ #sub ENTITY_IN_ATTRIBUTE_VALUE_STATE () { 12 }
  sub MARKUP_DECLARATION_OPEN_STATE () { 13 }
  sub COMMENT_START_STATE () { 14 }
  sub COMMENT_START_DASH_STATE () { 15 }
-Line 287 
 sub DOCTYPE_SYSTEM_IDENTIFIER_SINGLE_QUO
+Line 803 
 sub DOCTYPE_SYSTEM_IDENTIFIER_SINGLE_QUO
  sub AFTER_DOCTYPE_SYSTEM_IDENTIFIER_STATE () { 31 }
  sub BOGUS_DOCTYPE_STATE () { 32 }
  sub AFTER_ATTRIBUTE_VALUE_QUOTED_STATE () { 33 }
+ sub SELF_CLOSING_START_TAG_STATE () { 34 }
+ sub CDATA_SECTION_STATE () { 35 }
+ sub MD_HYPHEN_STATE () { 36 } # "markup declaration open state" in the spec
+ sub MD_DOCTYPE_STATE () { 37 } # "markup declaration open state" in the spec
+ sub MD_CDATA_STATE () { 38 } # "markup declaration open state" in the spec
+ sub CDATA_PCDATA_CLOSE_TAG_STATE () { 39 } # "close tag open state" in the spec
+ sub CDATA_SECTION_MSE1_STATE () { 40 } # "CDATA section state" in the spec
+ sub CDATA_SECTION_MSE2_STATE () { 41 } # "CDATA section state" in the spec
+ sub PUBLIC_STATE () { 42 } # "after DOCTYPE name state" in the spec
+ sub SYSTEM_STATE () { 43 } # "after DOCTYPE name state" in the spec
+ ## NOTE: "Entity data state", "entity in attribute value state", and
+ ## "consume a character reference" algorithm are jointly implemented
+ ## using the following six states:
+ sub ENTITY_STATE () { 44 }
+ sub ENTITY_HASH_STATE () { 45 }
+ sub NCR_NUM_STATE () { 46 }
+ sub HEXREF_X_STATE () { 47 }
+ sub HEXREF_HEX_STATE () { 48 }
+ sub ENTITY_NAME_STATE () { 49 }
  sub DOCTYPE_TOKEN () { 1 }
  sub COMMENT_TOKEN () { 2 }
-Line 304 
 sub ROW_IMS ()        { 0b10000000 }
+Line 839 
 sub ROW_IMS ()        { 0b10000000 }
  sub BODY_AFTER_IMS () { 0b100000000 }
  sub FRAME_IMS ()      { 0b1000000000 }
  sub SELECT_IMS ()     { 0b10000000000 }
+ sub IN_FOREIGN_CONTENT_IM () { 0b100000000000 }
+     ## NOTE: "in foreign content" insertion mode is special; it is combined
+     ## with the secondary insertion mode.  In this parser, they are stored
+     ## together in the bit-or'ed form.
  ## NOTE: "initial" and "before html" insertion modes have no constants.
-Line 335 
 sub IN_COLUMN_GROUP_IM () { 0b10 }
+Line 874 
 sub IN_COLUMN_GROUP_IM () { 0b10 }
  sub _initialize_tokenizer ($) {
    my $self = shift;
    $self->{state} = DATA_STATE; # MUST
+   #$self->{state_keyword}; # initialized when used
+   #$self->{entity__value}; # initialized when used
+   #$self->{entity__match}; # initialized when used
    $self->{content_model} = PCDATA_CONTENT_MODEL; # be
-   undef $self->{current_token}; # start tag, end tag, comment, or DOCTYPE
+   undef $self->{current_token};
    undef $self->{current_attribute};
    undef $self->{last_emitted_start_tag_name};
-   undef $self->{last_attribute_value_state};
+   #$self->{prev_state}; # initialized when used
-   $self->{char} = [];
+   delete $self->{self_closing};
    # $self->{next_char}
    !!!next-input-character;
    $self->{token} = [];
-Line 360 
 sub _initialize_tokenizer ($) {
+Line 902 
 sub _initialize_tokenizer ($) {
  ##        ->{value}
  ##        ->{has_reference} == 1 or 0
  ##   ->{data} (COMMENT_TOKEN, CHARACTER_TOKEN)
+ ## NOTE: The "self-closing flag" is held as |$self->{self_closing}|.
+ ##     |->{self_closing}| is used to save the value of |$self->{self_closing}|
+ ##     while the token is pushed back to the stack.
  ## Emitted token MUST immediately be handled by the tree construction state.
-Line 369 
 sub _initialize_tokenizer ($) {
+Line 914 
 sub _initialize_tokenizer ($) {
  ## has completed loading.  If one has, then it MUST be executed
  ## and removed from the list.
- ## NOTE: HTML5 "Writing HTML documents" section, applied to
+ ## TODO: Polytheistic slash SHOULD NOT be used. (Applied only to atheists.)
- ## documents and not to user agents and conformance checkers,
+ ## (This requirement was dropped from HTML5 spec, unfortunately.)
- ## contains some requirements that are not detected by the
- ## parsing algorithm:
- ## - Some requirements on character encoding declarations. ## TODO
- ## - "Elements MUST NOT contain content that their content model disallows."
- ##   ... Some are parse error, some are not (will be reported by c.c.).
- ## - Polytheistic slash SHOULD NOT be used. (Applied only to atheists.) ## TODO
- ## - Text (in elements, attributes, and comments) SHOULD NOT contain
- ##   control characters other than space characters. ## TODO: (what is control character? C0, C1 and DEL?  Unicode control character?)
- ## TODO: HTML5 poses authors two SHOULD-level requirements that cannot
- ## be detected by the HTML5 parsing algorithm:
- ## - Text,
  sub _get_next_token ($) {
    my $self = shift;
+   if ($self->{self_closing}) {
+     !!!parse-error (type => 'nestc', token => $self->{current_token});
+     ## NOTE: The |self_closing| flag is only set by a start tag token.
+     ## In addition, when a start tag token is emitted, it is always set to
+     ## |current_token|.
+     delete $self->{self_closing};
+   }
    if (@{$self->{token}}) {
+     $self->{self_closing} = $self->{token}->[0]->{self_closing};
      return shift @{$self->{token}};
    }
-Line 396 
 sub _get_next_token ($) {
+Line 939 
 sub _get_next_token ($) {
          if ($self->{content_model} & CM_ENTITY and # PCDATA | RCDATA
              not $self->{escape}) {
            !!!cp (1);
-           $self->{state} = ENTITY_DATA_STATE;
+           ## NOTE: In the spec, the tokenizer is switched to the
+           ## "entity data state".  In this implementation, the tokenizer
+           ## is switched to the |ENTITY_STATE|, which is an implementation
+           ## of the "consume a character reference" algorithm.
+           $self->{entity_additional} = -1;
+           $self->{prev_state} = DATA_STATE;
+           $self->{state} = ENTITY_STATE;
            !!!next-input-character;
            redo A;
          } else {
-Line 449 
 sub _get_next_token ($) {
+Line 998 
 sub _get_next_token ($) {
          #
        } elsif ($self->{next_char} == -1) {
          !!!cp (11);
-         !!!emit ({type => END_OF_FILE_TOKEN});
+         !!!emit ({type => END_OF_FILE_TOKEN,
+                   line => $self->{line}, column => $self->{column}});
          last A; ## TODO: ok?
        } else {
          !!!cp (12);
        }
        # Anything else
        my $token = {type => CHARACTER_TOKEN,
-                    data => chr $self->{next_char}};
+                    data => chr $self->{next_char},
+                    line => $self->{line}, column => $self->{column},
+                   };
        ## Stay in the data state
        !!!next-input-character;
        !!!emit ($token);
        redo A;
-     } elsif ($self->{state} == ENTITY_DATA_STATE) {
-       ## (cannot happen in CDATA state)
-       my $token = $self->_tokenize_attempt_to_consume_an_entity (0, -1);
-       $self->{state} = DATA_STATE;
-       # next-input-character is already done
-       unless (defined $token) {
-         !!!cp (13);
-         !!!emit ({type => CHARACTER_TOKEN, data => '&'});
-       } else {
-         !!!cp (14);
-         !!!emit ($token);
-       }
-       redo A;
      } elsif ($self->{state} == TAG_OPEN_STATE) {
        if ($self->{content_model} & CM_LIMITED_MARKUP) { # RCDATA | CDATA
          if ($self->{next_char} == 0x002F) { # /
-Line 492 
 sub _get_next_token ($) {
+Line 1027 
 sub _get_next_token ($) {
            ## reconsume
            $self->{state} = DATA_STATE;
-           !!!emit ({type => CHARACTER_TOKEN, data => '<'});
+           !!!emit ({type => CHARACTER_TOKEN, data => '<',
+                     line => $self->{line_prev},
+                     column => $self->{column_prev},
+                    });
            redo A;
          }
-Line 512 
 sub _get_next_token ($) {
+Line 1050 
 sub _get_next_token ($) {
            !!!cp (19);
            $self->{current_token}
              = {type => START_TAG_TOKEN,
-                tag_name => chr ($self->{next_char} + 0x0020)};
+                tag_name => chr ($self->{next_char} + 0x0020),
+                line => $self->{line_prev},
+                column => $self->{column_prev}};
            $self->{state} = TAG_NAME_STATE;
            !!!next-input-character;
            redo A;
-Line 520 
 sub _get_next_token ($) {
+Line 1060 
 sub _get_next_token ($) {
                   $self->{next_char} <= 0x007A) { # a..z
            !!!cp (20);
            $self->{current_token} = {type => START_TAG_TOKEN,
-                             tag_name => chr ($self->{next_char})};
+                                     tag_name => chr ($self->{next_char}),
+                                     line => $self->{line_prev},
+                                     column => $self->{column_prev}};
            $self->{state} = TAG_NAME_STATE;
            !!!next-input-character;
            redo A;
          } elsif ($self->{next_char} == 0x003E) { # >
            !!!cp (21);
-           !!!parse-error (type => 'empty start tag');
+           !!!parse-error (type => 'empty start tag',
+                           line => $self->{line_prev},
+                           column => $self->{column_prev});
            $self->{state} = DATA_STATE;
            !!!next-input-character;
-           !!!emit ({type => CHARACTER_TOKEN, data => '<>'});
+           !!!emit ({type => CHARACTER_TOKEN, data => '<>',
+                     line => $self->{line_prev},
+                     column => $self->{column_prev},
+                    });
            redo A;
          } elsif ($self->{next_char} == 0x003F) { # ?
            !!!cp (22);
-           !!!parse-error (type => 'pio');
+           !!!parse-error (type => 'pio',
+                           line => $self->{line_prev},
+                           column => $self->{column_prev});
            $self->{state} = BOGUS_COMMENT_STATE;
+           $self->{current_token} = {type => COMMENT_TOKEN, data => '',
+                                     line => $self->{line_prev},
+                                     column => $self->{column_prev},
+                                    };
            ## $self->{next_char} is intentionally left as is
            redo A;
          } else {
            !!!cp (23);
-           !!!parse-error (type => 'bare stago');
+           !!!parse-error (type => 'bare stago',
+                           line => $self->{line_prev},
+                           column => $self->{column_prev});
            $self->{state} = DATA_STATE;
            ## reconsume
-           !!!emit ({type => CHARACTER_TOKEN, data => '<'});
+           !!!emit ({type => CHARACTER_TOKEN, data => '<',
+                     line => $self->{line_prev},
+                     column => $self->{column_prev},
+                    });
            redo A;
          }
-Line 553 
 sub _get_next_token ($) {
+Line 1111 
 sub _get_next_token ($) {
          die "$0: $self->{content_model} in tag open";
        }
      } elsif ($self->{state} == CLOSE_TAG_OPEN_STATE) {
+       ## NOTE: The "close tag open state" in the spec is implemented as
+       ## |CLOSE_TAG_OPEN_STATE| and |CDATA_PCDATA_CLOSE_TAG_STATE|.
+       my ($l, $c) = ($self->{line_prev}, $self->{column_prev} - 1); # "<"of"</"
        if ($self->{content_model} & CM_LIMITED_MARKUP) { # RCDATA | CDATA
          if (defined $self->{last_emitted_start_tag_name}) {
-           ## NOTE: <http://krijnhoetmer.nl/irc-logs/whatwg/20070626#l-564>
+           $self->{state} = CDATA_PCDATA_CLOSE_TAG_STATE;
-           my @next_char;
+           $self->{state_keyword} = '';
-           TAGNAME: for (my $i = 0; $i < length $self->{last_emitted_start_tag_name}; $i++) {
+           ## Reconsume.
-             push @next_char, $self->{next_char};
+           redo A;
-             my $c = ord substr ($self->{last_emitted_start_tag_name}, $i, 1);
-             my $C = 0x0061 <= $c && $c <= 0x007A ? $c - 0x0020 : $c;
-             if ($self->{next_char} == $c or $self->{next_char} == $C) {
-               !!!cp (24);
-               !!!next-input-character;
-               next TAGNAME;
-             } else {
-               !!!cp (25);
-               $self->{next_char} = shift @next_char; # reconsume
-               !!!back-next-input-character (@next_char);
-               $self->{state} = DATA_STATE;
-               !!!emit ({type => CHARACTER_TOKEN, data => '</'});
-               redo A;
-             }
-           }
-           push @next_char, $self->{next_char};
-           unless ($self->{next_char} == 0x0009 or # HT
-                   $self->{next_char} == 0x000A or # LF
-                   $self->{next_char} == 0x000B or # VT
-                   $self->{next_char} == 0x000C or # FF
-                   $self->{next_char} == 0x0020 or # SP
-                   $self->{next_char} == 0x003E or # >
-                   $self->{next_char} == 0x002F or # /
-                   $self->{next_char} == -1) {
-             !!!cp (26);
-             $self->{next_char} = shift @next_char; # reconsume
-             !!!back-next-input-character (@next_char);
-             $self->{state} = DATA_STATE;
-             !!!emit ({type => CHARACTER_TOKEN, data => '</'});
-             redo A;
-           } else {
-             !!!cp (27);
-             $self->{next_char} = shift @next_char;
-             !!!back-next-input-character (@next_char);
-             # and consume...
-           }
          } else {
            ## No start tag token has ever been emitted
+           ## NOTE: See <http://krijnhoetmer.nl/irc-logs/whatwg/20070626#l-564>.
            !!!cp (28);
-           # next-input-character is already done
            $self->{state} = DATA_STATE;
-           !!!emit ({type => CHARACTER_TOKEN, data => '</'});
+           ## Reconsume.
+           !!!emit ({type => CHARACTER_TOKEN, data => '</',
+                     line => $l, column => $c,
+                    });
            redo A;
          }
        }
        if (0x0041 <= $self->{next_char} and
            $self->{next_char} <= 0x005A) { # A..Z
          !!!cp (29);
-         $self->{current_token} = {type => END_TAG_TOKEN,
+         $self->{current_token}
-                           tag_name => chr ($self->{next_char} + 0x0020)};
+             = {type => END_TAG_TOKEN,
+                tag_name => chr ($self->{next_char} + 0x0020),
+                line => $l, column => $c};
          $self->{state} = TAG_NAME_STATE;
          !!!next-input-character;
          redo A;
-Line 620 
 sub _get_next_token ($) {
+Line 1148 
 sub _get_next_token ($) {
                 $self->{next_char} <= 0x007A) { # a..z
          !!!cp (30);
          $self->{current_token} = {type => END_TAG_TOKEN,
-                           tag_name => chr ($self->{next_char})};
+                                   tag_name => chr ($self->{next_char}),
+                                   line => $l, column => $c};
          $self->{state} = TAG_NAME_STATE;
          !!!next-input-character;
          redo A;
        } elsif ($self->{next_char} == 0x003E) { # >
          !!!cp (31);
-         !!!parse-error (type => 'empty end tag');
+         !!!parse-error (type => 'empty end tag',
+                         line => $self->{line_prev}, ## "<" in "</>"
+                         column => $self->{column_prev} - 1);
          $self->{state} = DATA_STATE;
          !!!next-input-character;
          redo A;
-Line 636 
 sub _get_next_token ($) {
+Line 1167 
 sub _get_next_token ($) {
          $self->{state} = DATA_STATE;
          # reconsume
-         !!!emit ({type => CHARACTER_TOKEN, data => '</'});
+         !!!emit ({type => CHARACTER_TOKEN, data => '</',
+                   line => $l, column => $c,
+                  });
          redo A;
        } else {
          !!!cp (33);
          !!!parse-error (type => 'bogus end tag');
          $self->{state} = BOGUS_COMMENT_STATE;
-         ## $self->{next_char} is intentionally left as is
+         $self->{current_token} = {type => COMMENT_TOKEN, data => '',
-         redo A;
+                                   line => $self->{line_prev}, # "<" of "</"
+                                   column => $self->{column_prev} - 1,
+                                  };
+         ## NOTE: $self->{next_char} is intentionally left as is.
+         ## Although the "anything else" case of the spec does not explicitly
+         ## state that the next input character is to be reconsumed,
+         ## it will be included in the |data| of the comment token
+         ## generated from the bogus end tag, as defined in the
+         ## "bogus comment state" entry.
+         redo A;
+       }
+     } elsif ($self->{state} == CDATA_PCDATA_CLOSE_TAG_STATE) {
+       my $ch = substr $self->{last_emitted_start_tag_name}, length $self->{state_keyword}, 1;
+       if (length $ch) {
+         my $CH = $ch;
+         $ch =~ tr/a-z/A-Z/;
+         my $nch = chr $self->{next_char};
+         if ($nch eq $ch or $nch eq $CH) {
+           !!!cp (24);
+           ## Stay in the state.
+           $self->{state_keyword} .= $nch;
+           !!!next-input-character;
+           redo A;
+         } else {
+           !!!cp (25);
+           $self->{state} = DATA_STATE;
+           ## Reconsume.
+           !!!emit ({type => CHARACTER_TOKEN,
+                     data => '</' . $self->{state_keyword},
+                     line => $self->{line_prev},
+                     column => $self->{column_prev} - 1 - length $self->{state_keyword},
+                    });
+           redo A;
+         }
+       } else { # after "<{tag-name}"
+         unless ({
+                  0x0009 => 1, # HT
+                  0x000A => 1, # LF
+                  0x000B => 1, # VT
+                  0x000C => 1, # FF
+                  0x0020 => 1, # SP
+                  0x003E => 1, # >
+                  0x002F => 1, # /
+                  -1 => 1, # EOF
+                 }->{$self->{next_char}}) {
+           !!!cp (26);
+           ## Reconsume.
+           $self->{state} = DATA_STATE;
+           !!!emit ({type => CHARACTER_TOKEN,
+                     data => '</' . $self->{state_keyword},
+                     line => $self->{line_prev},
+                     column => $self->{column_prev} - 1 - length $self->{state_keyword},
+                    });
+           redo A;
+         } else {
+           !!!cp (27);
+           $self->{current_token}
+               = {type => END_TAG_TOKEN,
+                  tag_name => $self->{last_emitted_start_tag_name},
+                  line => $self->{line_prev},
+                  column => $self->{column_prev} - 1 - length $self->{state_keyword}};
+           $self->{state} = TAG_NAME_STATE;
+           ## Reconsume.
+           redo A;
+         }
        }
      } elsif ($self->{state} == TAG_NAME_STATE) {
        if ($self->{next_char} == 0x0009 or # HT
-Line 659 
 sub _get_next_token ($) {
+Line 1256 
 sub _get_next_token ($) {
        } elsif ($self->{next_char} == 0x003E) { # >
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (35);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 692 
 sub _get_next_token ($) {
+Line 1287 
 sub _get_next_token ($) {
          !!!parse-error (type => 'unclosed tag');
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (39);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 714 
 sub _get_next_token ($) {
+Line 1307 
 sub _get_next_token ($) {
          redo A;
        } elsif ($self->{next_char} == 0x002F) { # /
+         !!!cp (42);
+         $self->{state} = SELF_CLOSING_START_TAG_STATE;
          !!!next-input-character;
-         if ($self->{next_char} == 0x003E and # >
-             $self->{current_token}->{type} == START_TAG_TOKEN and
-             $permitted_slash_tag_name->{$self->{current_token}->{tag_name}}) {
-           # permitted slash
-           !!!cp (42);
-           #
-         } else {
-           !!!cp (43);
-           !!!parse-error (type => 'nestc');
-         }
-         $self->{state} = BEFORE_ATTRIBUTE_NAME_STATE;
-         # next-input-character is already done
          redo A;
        } else {
          !!!cp (44);
-Line 749 
 sub _get_next_token ($) {
+Line 1332 
 sub _get_next_token ($) {
        } elsif ($self->{next_char} == 0x003E) { # >
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (46);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 772 
 sub _get_next_token ($) {
+Line 1353 
 sub _get_next_token ($) {
        } elsif (0x0041 <= $self->{next_char} and
                 $self->{next_char} <= 0x005A) { # A..Z
          !!!cp (49);
-         $self->{current_attribute} = {name => chr ($self->{next_char} + 0x0020),
+         $self->{current_attribute}
-                               value => ''};
+             = {name => chr ($self->{next_char} + 0x0020),
+                value => '',
+                line => $self->{line}, column => $self->{column}};
          $self->{state} = ATTRIBUTE_NAME_STATE;
          !!!next-input-character;
          redo A;
        } elsif ($self->{next_char} == 0x002F) { # /
+         !!!cp (50);
+         $self->{state} = SELF_CLOSING_START_TAG_STATE;
          !!!next-input-character;
-         if ($self->{next_char} == 0x003E and # >
-             $self->{current_token}->{type} == START_TAG_TOKEN and
-             $permitted_slash_tag_name->{$self->{current_token}->{tag_name}}) {
-           # permitted slash
-           !!!cp (50);
-           #
-         } else {
-           !!!cp (51);
-           !!!parse-error (type => 'nestc');
-         }
-         ## Stay in the state
-         # next-input-character is already done
          redo A;
        } elsif ($self->{next_char} == -1) {
          !!!parse-error (type => 'unclosed tag');
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (52);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 827 
 sub _get_next_token ($) {
+Line 1398 
 sub _get_next_token ($) {
          } else {
            !!!cp (56);
          }
-         $self->{current_attribute} = {name => chr ($self->{next_char}),
+         $self->{current_attribute}
-                               value => ''};
+             = {name => chr ($self->{next_char}),
+                value => '',
+                line => $self->{line}, column => $self->{column}};
          $self->{state} = ATTRIBUTE_NAME_STATE;
          !!!next-input-character;
          redo A;
-Line 838 
 sub _get_next_token ($) {
+Line 1411 
 sub _get_next_token ($) {
          if (exists $self->{current_token}->{attributes} # start tag or end tag
              ->{$self->{current_attribute}->{name}}) { # MUST
            !!!cp (57);
-           !!!parse-error (type => 'duplicate attribute:'.$self->{current_attribute}->{name});
+           !!!parse-error (type => 'duplicate attribute', text => $self->{current_attribute}->{name}, line => $self->{current_attribute}->{line}, column => $self->{current_attribute}->{column});
            ## Discard $self->{current_attribute} # MUST
          } else {
            !!!cp (58);
-Line 867 
 sub _get_next_token ($) {
+Line 1440 
 sub _get_next_token ($) {
          $before_leave->();
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (61);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            !!!cp (62);
-Line 893 
 sub _get_next_token ($) {
+Line 1464 
 sub _get_next_token ($) {
          !!!next-input-character;
          redo A;
        } elsif ($self->{next_char} == 0x002F) { # /
+         !!!cp (64);
          $before_leave->();
+         $self->{state} = SELF_CLOSING_START_TAG_STATE;
          !!!next-input-character;
-         if ($self->{next_char} == 0x003E and # >
-             $self->{current_token}->{type} == START_TAG_TOKEN and
-             $permitted_slash_tag_name->{$self->{current_token}->{tag_name}}) {
-           # permitted slash
-           !!!cp (64);
-           #
-         } else {
-           !!!cp (65);
-           !!!parse-error (type => 'nestc');
-         }
-         $self->{state} = BEFORE_ATTRIBUTE_NAME_STATE;
-         # next-input-character is already done
          redo A;
        } elsif ($self->{next_char} == -1) {
          !!!parse-error (type => 'unclosed tag');
          $before_leave->();
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (66);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 965 
 sub _get_next_token ($) {
+Line 1524 
 sub _get_next_token ($) {
        } elsif ($self->{next_char} == 0x003E) { # >
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (73);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 989 
 sub _get_next_token ($) {
+Line 1546 
 sub _get_next_token ($) {
        } elsif (0x0041 <= $self->{next_char} and
                 $self->{next_char} <= 0x005A) { # A..Z
          !!!cp (76);
-         $self->{current_attribute} = {name => chr ($self->{next_char} + 0x0020),
+         $self->{current_attribute}
-                               value => ''};
+             = {name => chr ($self->{next_char} + 0x0020),
+                value => '',
+                line => $self->{line}, column => $self->{column}};
          $self->{state} = ATTRIBUTE_NAME_STATE;
          !!!next-input-character;
          redo A;
        } elsif ($self->{next_char} == 0x002F) { # /
+         !!!cp (77);
+         $self->{state} = SELF_CLOSING_START_TAG_STATE;
          !!!next-input-character;
-         if ($self->{next_char} == 0x003E and # >
-             $self->{current_token}->{type} == START_TAG_TOKEN and
-             $permitted_slash_tag_name->{$self->{current_token}->{tag_name}}) {
-           # permitted slash
-           !!!cp (77);
-           #
-         } else {
-           !!!cp (78);
-           !!!parse-error (type => 'nestc');
-           ## TODO: Different error type for <aa / bb> than <aa/>
-         }
-         $self->{state} = BEFORE_ATTRIBUTE_NAME_STATE;
-         # next-input-character is already done
          redo A;
        } elsif ($self->{next_char} == -1) {
          !!!parse-error (type => 'unclosed tag');
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (79);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 1036 
 sub _get_next_token ($) {
+Line 1582 
 sub _get_next_token ($) {
          redo A;
        } else {
-         !!!cp (82);
+         if ($self->{next_char} == 0x0022 or # "
-         $self->{current_attribute} = {name => chr ($self->{next_char}),
+             $self->{next_char} == 0x0027) { # '
-                               value => ''};
+           !!!cp (78);
+           !!!parse-error (type => 'bad attribute name');
+         } else {
+           !!!cp (82);
+         }
+         $self->{current_attribute}
+             = {name => chr ($self->{next_char}),
+                value => '',
+                line => $self->{line}, column => $self->{column}};
          $self->{state} = ATTRIBUTE_NAME_STATE;
          !!!next-input-character;
          redo A;
-Line 1069 
 sub _get_next_token ($) {
+Line 1623 
 sub _get_next_token ($) {
          !!!next-input-character;
          redo A;
        } elsif ($self->{next_char} == 0x003E) { # >
+         !!!parse-error (type => 'empty unquoted attribute value');
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (87);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 1096 
 sub _get_next_token ($) {
+Line 1649 
 sub _get_next_token ($) {
          !!!parse-error (type => 'unclosed tag');
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (90);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 1137 
 sub _get_next_token ($) {
+Line 1688 
 sub _get_next_token ($) {
          redo A;
        } elsif ($self->{next_char} == 0x0026) { # &
          !!!cp (96);
-         $self->{last_attribute_value_state} = $self->{state};
+         ## NOTE: In the spec, the tokenizer is switched to the
-         $self->{state} = ENTITY_IN_ATTRIBUTE_VALUE_STATE;
+         ## "entity in attribute value state".  In this implementation, the
+         ## tokenizer is switched to the |ENTITY_STATE|, which is an
+         ## implementation of the "consume a character reference" algorithm.
+         $self->{prev_state} = $self->{state};
+         $self->{entity_additional} = 0x0022; # "
+         $self->{state} = ENTITY_STATE;
          !!!next-input-character;
          redo A;
        } elsif ($self->{next_char} == -1) {
          !!!parse-error (type => 'unclosed attribute value');
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (97);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 1181 
 sub _get_next_token ($) {
+Line 1735 
 sub _get_next_token ($) {
          redo A;
        } elsif ($self->{next_char} == 0x0026) { # &
          !!!cp (102);
-         $self->{last_attribute_value_state} = $self->{state};
+         ## NOTE: In the spec, the tokenizer is switched to the
-         $self->{state} = ENTITY_IN_ATTRIBUTE_VALUE_STATE;
+         ## "entity in attribute value state".  In this implementation, the
+         ## tokenizer is switched to the |ENTITY_STATE|, which is an
+         ## implementation of the "consume a character reference" algorithm.
+         $self->{entity_additional} = 0x0027; # '
+         $self->{prev_state} = $self->{state};
+         $self->{state} = ENTITY_STATE;
          !!!next-input-character;
          redo A;
        } elsif ($self->{next_char} == -1) {
          !!!parse-error (type => 'unclosed attribute value');
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (103);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 1229 
 sub _get_next_token ($) {
+Line 1786 
 sub _get_next_token ($) {
          redo A;
        } elsif ($self->{next_char} == 0x0026) { # &
          !!!cp (108);
-         $self->{last_attribute_value_state} = $self->{state};
+         ## NOTE: In the spec, the tokenizer is switched to the
-         $self->{state} = ENTITY_IN_ATTRIBUTE_VALUE_STATE;
+         ## "entity in attribute value state".  In this implementation, the
+         ## tokenizer is switched to the |ENTITY_STATE|, which is an
+         ## implementation of the "consume a character reference" algorithm.
+         $self->{entity_additional} = -1;
+         $self->{prev_state} = $self->{state};
+         $self->{state} = ENTITY_STATE;
          !!!next-input-character;
          redo A;
        } elsif ($self->{next_char} == 0x003E) { # >
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (109);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 1261 
 sub _get_next_token ($) {
+Line 1821 
 sub _get_next_token ($) {
          !!!parse-error (type => 'unclosed tag');
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (112);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 1298 
 sub _get_next_token ($) {
+Line 1856 
 sub _get_next_token ($) {
          !!!next-input-character;
          redo A;
        }
-     } elsif ($self->{state} == ENTITY_IN_ATTRIBUTE_VALUE_STATE) {
-       my $token = $self->_tokenize_attempt_to_consume_an_entity
-           (1,
-            $self->{last_attribute_value_state}
-              == ATTRIBUTE_VALUE_DOUBLE_QUOTED_STATE ? 0x0022 : # "
-            $self->{last_attribute_value_state}
-              == ATTRIBUTE_VALUE_SINGLE_QUOTED_STATE ? 0x0027 : # '
-            -1);
-       unless (defined $token) {
-         !!!cp (117);
-         $self->{current_attribute}->{value} .= '&';
-       } else {
-         !!!cp (118);
-         $self->{current_attribute}->{value} .= $token->{data};
-         $self->{current_attribute}->{has_reference} = $token->{has_reference};
-         ## ISSUE: spec says "append the returned character token to the current attribute's value"
-       }
-       $self->{state} = $self->{last_attribute_value_state};
-       # next-input-character is already done
-       redo A;
      } elsif ($self->{state} == AFTER_ATTRIBUTE_VALUE_QUOTED_STATE) {
        if ($self->{next_char} == 0x0009 or # HT
            $self->{next_char} == 0x000A or # LF
-Line 1333 
 sub _get_next_token ($) {
+Line 1869 
 sub _get_next_token ($) {
        } elsif ($self->{next_char} == 0x003E) { # >
          if ($self->{current_token}->{type} == START_TAG_TOKEN) {
            !!!cp (119);
-           $self->{current_token}->{first_start_tag}
-               = not defined $self->{last_emitted_start_tag_name};
            $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
          } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
            $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-Line 1355 
 sub _get_next_token ($) {
+Line 1889 
 sub _get_next_token ($) {
          redo A;
        } elsif ($self->{next_char} == 0x002F) { # /
+         !!!cp (122);
+         $self->{state} = SELF_CLOSING_START_TAG_STATE;
          !!!next-input-character;
-         if ($self->{next_char} == 0x003E and # >
+         redo A;
-             $self->{current_token}->{type} == START_TAG_TOKEN and
+       } elsif ($self->{next_char} == -1) {
-             $permitted_slash_tag_name->{$self->{current_token}->{tag_name}}) {
+         !!!parse-error (type => 'unclosed tag');
-           # permitted slash
+         if ($self->{current_token}->{type} == START_TAG_TOKEN) {
-           !!!cp (122);
+           !!!cp (122.3);
-           #
+           $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
+         } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
+           if ($self->{current_token}->{attributes}) {
+             !!!cp (122.1);
+             !!!parse-error (type => 'end tag attribute');
+           } else {
+             ## NOTE: This state should never be reached.
+             !!!cp (122.2);
+           }
          } else {
-           !!!cp (123);
+           die "$0: $self->{current_token}->{type}: Unknown token type";
-           !!!parse-error (type => 'nestc');
          }
-         $self->{state} = BEFORE_ATTRIBUTE_NAME_STATE;
+         $self->{state} = DATA_STATE;
-         # next-input-character is already done
+         ## Reconsume.
+         !!!emit ($self->{current_token}); # start tag or end tag
          redo A;
        } else {
-         !!!cp (124);
+         !!!cp ('124.1');
          !!!parse-error (type => 'no space between attributes');
          $self->{state} = BEFORE_ATTRIBUTE_NAME_STATE;
          ## reconsume
          redo A;
        }
-     } elsif ($self->{state} == BOGUS_COMMENT_STATE) {
+     } elsif ($self->{state} == SELF_CLOSING_START_TAG_STATE) {
-       ## (only happen if PCDATA state)
+       if ($self->{next_char} == 0x003E) { # >
+         if ($self->{current_token}->{type} == END_TAG_TOKEN) {
-       my $token = {type => COMMENT_TOKEN, data => ''};
+           !!!cp ('124.2');
+           !!!parse-error (type => 'nestc', token => $self->{current_token});
-       BC: {
+           ## TODO: Different type than slash in start tag
-         if ($self->{next_char} == 0x003E) { # >
+           $self->{content_model} = PCDATA_CONTENT_MODEL; # MUST
-           !!!cp (124);
+           if ($self->{current_token}->{attributes}) {
-           $self->{state} = DATA_STATE;
+             !!!cp ('124.4');
-           !!!next-input-character;
+             !!!parse-error (type => 'end tag attribute');
+           } else {
-           !!!emit ($token);
+             !!!cp ('124.5');
+           }
+           ## TODO: Test |<title></title/>|
+         } else {
+           !!!cp ('124.3');
+           $self->{self_closing} = 1;
+         }
-           redo A;
+         $self->{state} = DATA_STATE;
-         } elsif ($self->{next_char} == -1) {
+         !!!next-input-character;
-           !!!cp (125);
-           $self->{state} = DATA_STATE;
-           ## reconsume
-           !!!emit ($token);
+         !!!emit ($self->{current_token}); # start tag or end tag
-           redo A;
+         redo A;
+       } elsif ($self->{next_char} == -1) {
+         !!!parse-error (type => 'unclosed tag');
+         if ($self->{current_token}->{type} == START_TAG_TOKEN) {
+           !!!cp (124.7);
+           $self->{last_emitted_start_tag_name} = $self->{current_token}->{tag_name};
+         } elsif ($self->{current_token}->{type} == END_TAG_TOKEN) {
+           if ($self->{current_token}->{attributes}) {
+             !!!cp (124.5);
+             !!!parse-error (type => 'end tag attribute');
+           } else {
+             ## NOTE: This state should never be reached.
+             !!!cp (124.6);
+           }
          } else {
-           !!!cp (126);
+           die "$0: $self->{current_token}->{type}: Unknown token type";
-           $token->{data} .= chr ($self->{next_char});
-           !!!next-input-character;
-           redo BC;
          }
-       } # BC
+         $self->{state} = DATA_STATE;
+         ## Reconsume.
+         !!!emit ($self->{current_token}); # start tag or end tag
+         redo A;
+       } else {
+         !!!cp ('124.4');
+         !!!parse-error (type => 'nestc');
+         ## TODO: This error type is wrong.
+         $self->{state} = BEFORE_ATTRIBUTE_NAME_STATE;
+         ## Reconsume.
+         redo A;
+       }
+     } elsif ($self->{state} == BOGUS_COMMENT_STATE) {
+       ## (only happen if PCDATA state)
-       die "$0: _get_next_token: unexpected case [BC]";
+       ## NOTE: Unlike the spec's "bogus comment state", this implementation
+       ## consumes characters one at a time.
+       if ($self->{next_char} == 0x003E) { # >
+         !!!cp (124);
+         $self->{state} = DATA_STATE;
+         !!!next-input-character;
+         !!!emit ($self->{current_token}); # comment
+         redo A;
+       } elsif ($self->{next_char} == -1) {
+         !!!cp (125);
+         $self->{state} = DATA_STATE;
+         ## reconsume
+         !!!emit ($self->{current_token}); # comment
+         redo A;
+       } else {
+         !!!cp (126);
+         $self->{current_token}->{data} .= chr ($self->{next_char}); # comment
+         ## Stay in the state.
+         !!!next-input-character;
+         redo A;
+       }
      } elsif ($self->{state} == MARKUP_DECLARATION_OPEN_STATE) {
        ## (only happen if PCDATA state)
-       my @next_char;
-       push @next_char, $self->{next_char};
        if ($self->{next_char} == 0x002D) { # -
+         !!!cp (133);
+         $self->{state} = MD_HYPHEN_STATE;
          !!!next-input-character;
-         push @next_char, $self->{next_char};
+         redo A;
-         if ($self->{next_char} == 0x002D) { # -
-           !!!cp (127);
-           $self->{current_token} = {type => COMMENT_TOKEN, data => ''};
-           $self->{state} = COMMENT_START_STATE;
-           !!!next-input-character;
-           redo A;
-         } else {
-           !!!cp (128);
-         }
        } elsif ($self->{next_char} == 0x0044 or # D
                 $self->{next_char} == 0x0064) { # d
+         ## ASCII case-insensitive.
+         !!!cp (130);
+         $self->{state} = MD_DOCTYPE_STATE;
+         $self->{state_keyword} = chr $self->{next_char};
          !!!next-input-character;
-         push @next_char, $self->{next_char};
+         redo A;
-         if ($self->{next_char} == 0x004F or # O
+       } elsif ($self->{insertion_mode} & IN_FOREIGN_CONTENT_IM and
-             $self->{next_char} == 0x006F) { # o
+                $self->{open_elements}->[-1]->[1] & FOREIGN_EL and
-           !!!next-input-character;
+                $self->{next_char} == 0x005B) { # [
-           push @next_char, $self->{next_char};
+         !!!cp (135.4);
-           if ($self->{next_char} == 0x0043 or # C
+         $self->{state} = MD_CDATA_STATE;
-               $self->{next_char} == 0x0063) { # c
+         $self->{state_keyword} = '[';
-             !!!next-input-character;
+         !!!next-input-character;
-             push @next_char, $self->{next_char};
+         redo A;
-             if ($self->{next_char} == 0x0054 or # T
-                 $self->{next_char} == 0x0074) { # t
-               !!!next-input-character;
-               push @next_char, $self->{next_char};
-               if ($self->{next_char} == 0x0059 or # Y
-                   $self->{next_char} == 0x0079) { # y
-                 !!!next-input-character;
-                 push @next_char, $self->{next_char};
-                 if ($self->{next_char} == 0x0050 or # P
-                     $self->{next_char} == 0x0070) { # p
-                   !!!next-input-character;
-                   push @next_char, $self->{next_char};
-                   if ($self->{next_char} == 0x0045 or # E
-                       $self->{next_char} == 0x0065) { # e
-                     !!!cp (129);
-                     ## TODO: What a stupid code this is!
-                     $self->{state} = DOCTYPE_STATE;
-                     !!!next-input-character;
-                     redo A;
-                   } else {
-                     !!!cp (130);
-                   }
-                 } else {
-                   !!!cp (131);
-                 }
-               } else {
-                 !!!cp (132);
-               }
-             } else {
-               !!!cp (133);
-             }
-           } else {
-             !!!cp (134);
-           }
-         } else {
-           !!!cp (135);
-         }
        } else {
          !!!cp (136);
        }
-       !!!parse-error (type => 'bogus comment');
+       !!!parse-error (type => 'bogus comment',
-       $self->{next_char} = shift @next_char;
+                       line => $self->{line_prev},
-       !!!back-next-input-character (@next_char);
+                       column => $self->{column_prev} - 1);
+       ## Reconsume.
        $self->{state} = BOGUS_COMMENT_STATE;
+       $self->{current_token} = {type => COMMENT_TOKEN, data => '',
+                                 line => $self->{line_prev},
+                                 column => $self->{column_prev} - 1,
+                                };
        redo A;
+     } elsif ($self->{state} == MD_HYPHEN_STATE) {
-       ## ISSUE: typos in spec: chacacters, is is a parse error
+       if ($self->{next_char} == 0x002D) { # -
-       ## ISSUE: spec is somewhat unclear on "is the first character that will be in the comment"; what is "that will be in the comment" is what the algorithm defines, isn't it?
+         !!!cp (127);
+         $self->{current_token} = {type => COMMENT_TOKEN, data => '',
+                                   line => $self->{line_prev},
+                                   column => $self->{column_prev} - 2,
+                                  };
+         $self->{state} = COMMENT_START_STATE;
+         !!!next-input-character;
+         redo A;
+       } else {
+         !!!cp (128);
+         !!!parse-error (type => 'bogus comment',
+                         line => $self->{line_prev},
+                         column => $self->{column_prev} - 2);
+         $self->{state} = BOGUS_COMMENT_STATE;
+         ## Reconsume.
+         $self->{current_token} = {type => COMMENT_TOKEN,
+                                   data => '-',
+                                   line => $self->{line_prev},
+                                   column => $self->{column_prev} - 2,
+                                  };
+         redo A;
+       }
+     } elsif ($self->{state} == MD_DOCTYPE_STATE) {
+       ## ASCII case-insensitive.
+       if ($self->{next_char} == [
+             undef,
+x004F, # O
+x0043, # C
+x0054, # T
+x0059, # Y
+x0050, # P
+           ]->[length $self->{state_keyword}] or
+           $self->{next_char} == [
+             undef,
+x006F, # o
+x0063, # c
+x0074, # t
+x0079, # y
+x0070, # p
+           ]->[length $self->{state_keyword}]) {
+         !!!cp (131);
+         ## Stay in the state.
+         $self->{state_keyword} .= chr $self->{next_char};
+         !!!next-input-character;
+         redo A;
+       } elsif ((length $self->{state_keyword}) == 6 and
+                ($self->{next_char} == 0x0045 or # E
+                 $self->{next_char} == 0x0065)) { # e
+         !!!cp (129);
+         $self->{state} = DOCTYPE_STATE;
+         $self->{current_token} = {type => DOCTYPE_TOKEN,
+                                   quirks => 1,
+                                   line => $self->{line_prev},
+                                   column => $self->{column_prev} - 7,
+                                  };
+         !!!next-input-character;
+         redo A;
+       } else {
+         !!!cp (132);
+         !!!parse-error (type => 'bogus comment',
+                         line => $self->{line_prev},
+                         column => $self->{column_prev} - 1 - length $self->{state_keyword});
+         $self->{state} = BOGUS_COMMENT_STATE;
+         ## Reconsume.
+         $self->{current_token} = {type => COMMENT_TOKEN,
+                                   data => $self->{state_keyword},
+                                   line => $self->{line_prev},
+                                   column => $self->{column_prev} - 1 - length $self->{state_keyword},
+                                  };
+         redo A;
+       }
+     } elsif ($self->{state} == MD_CDATA_STATE) {
+       if ($self->{next_char} == {
+             '[' => 0x0043, # C
+             '[C' => 0x0044, # D
+             '[CD' => 0x0041, # A
+             '[CDA' => 0x0054, # T
+             '[CDAT' => 0x0041, # A
+           }->{$self->{state_keyword}}) {
+         !!!cp (135.1);
+         ## Stay in the state.
+         $self->{state_keyword} .= chr $self->{next_char};
+         !!!next-input-character;
+         redo A;
+       } elsif ($self->{state_keyword} eq '[CDATA' and
+                $self->{next_char} == 0x005B) { # [
+         !!!cp (135.2);
+         $self->{current_token} = {type => CHARACTER_TOKEN,
+                                   data => '',
+                                   line => $self->{line_prev},
+                                   column => $self->{column_prev} - 7};
+         $self->{state} = CDATA_SECTION_STATE;
+         !!!next-input-character;
+         redo A;
+       } else {
+         !!!cp (135.3);
+         !!!parse-error (type => 'bogus comment',
+                         line => $self->{line_prev},
+                         column => $self->{column_prev} - 1 - length $self->{state_keyword});
+         $self->{state} = BOGUS_COMMENT_STATE;
+         ## Reconsume.
+         $self->{current_token} = {type => COMMENT_TOKEN,
+                                   data => $self->{state_keyword},
+                                   line => $self->{line_prev},
+                                   column => $self->{column_prev} - 1 - length $self->{state_keyword},
+                                  };
+         redo A;
+       }
      } elsif ($self->{state} == COMMENT_START_STATE) {
        if ($self->{next_char} == 0x002D) { # -
          !!!cp (137);
-Line 1605 
 sub _get_next_token ($) {
+Line 2267 
 sub _get_next_token ($) {
          redo A;
        } elsif ($self->{next_char} == 0x002D) { # -
          !!!cp (152);
-         !!!parse-error (type => 'dash in comment');
+         !!!parse-error (type => 'dash in comment',
+                         line => $self->{line_prev},
+                         column => $self->{column_prev});
          $self->{current_token}->{data} .= '-'; # comment
          ## Stay in the state
          !!!next-input-character;
-Line 1621 
 sub _get_next_token ($) {
+Line 2285 
 sub _get_next_token ($) {
          redo A;
        } else {
          !!!cp (154);
-         !!!parse-error (type => 'dash in comment');
+         !!!parse-error (type => 'dash in comment',
+                         line => $self->{line_prev},
+                         column => $self->{column_prev});
          $self->{current_token}->{data} .= '--' . chr ($self->{next_char}); # comment
          $self->{state} = COMMENT_STATE;
          !!!next-input-character;
-Line 1660 
 sub _get_next_token ($) {
+Line 2326 
 sub _get_next_token ($) {
          $self->{state} = DATA_STATE;
          !!!next-input-character;
-         !!!emit ({type => DOCTYPE_TOKEN, quirks => 1});
+         !!!emit ($self->{current_token}); # DOCTYPE (quirks)
          redo A;
        } elsif ($self->{next_char} == -1) {
-Line 1669 
 sub _get_next_token ($) {
+Line 2335 
 sub _get_next_token ($) {
          $self->{state} = DATA_STATE;
          ## reconsume
-         !!!emit ({type => DOCTYPE_TOKEN, quirks => 1});
+         !!!emit ($self->{current_token}); # DOCTYPE (quirks)
          redo A;
        } else {
          !!!cp (160);
-         $self->{current_token}
+         $self->{current_token}->{name} = chr $self->{next_char};
-             = {type => DOCTYPE_TOKEN,
+         delete $self->{current_token}->{quirks};
-                name => chr ($self->{next_char}),
-                #quirks => 0,
-               };
  ## ISSUE: "Set the token's name name to the" in the spec
          $self->{state} = DOCTYPE_NAME_STATE;
          !!!next-input-character;
-Line 1751 
 sub _get_next_token ($) {
+Line 2414 
 sub _get_next_token ($) {
          redo A;
        } elsif ($self->{next_char} == 0x0050 or # P
                 $self->{next_char} == 0x0070) { # p
+         $self->{state} = PUBLIC_STATE;
+         $self->{state_keyword} = chr $self->{next_char};
          !!!next-input-character;
-         if ($self->{next_char} == 0x0055 or # U
+         redo A;
-             $self->{next_char} == 0x0075) { # u
-           !!!next-input-character;
-           if ($self->{next_char} == 0x0042 or # B
-               $self->{next_char} == 0x0062) { # b
-             !!!next-input-character;
-             if ($self->{next_char} == 0x004C or # L
-                 $self->{next_char} == 0x006C) { # l
-               !!!next-input-character;
-               if ($self->{next_char} == 0x0049 or # I
-                   $self->{next_char} == 0x0069) { # i
-                 !!!next-input-character;
-                 if ($self->{next_char} == 0x0043 or # C
-                     $self->{next_char} == 0x0063) { # c
-                   !!!cp (168);
-                   $self->{state} = BEFORE_DOCTYPE_PUBLIC_IDENTIFIER_STATE;
-                   !!!next-input-character;
-                   redo A;
-                 } else {
-                   !!!cp (169);
-                 }
-               } else {
-                 !!!cp (170);
-               }
-             } else {
-               !!!cp (171);
-             }
-           } else {
-             !!!cp (172);
-           }
-         } else {
-           !!!cp (173);
-         }
-         #
        } elsif ($self->{next_char} == 0x0053 or # S
                 $self->{next_char} == 0x0073) { # s
+         $self->{state} = SYSTEM_STATE;
+         $self->{state_keyword} = chr $self->{next_char};
          !!!next-input-character;
-         if ($self->{next_char} == 0x0059 or # Y
+         redo A;
-             $self->{next_char} == 0x0079) { # y
-           !!!next-input-character;
-           if ($self->{next_char} == 0x0053 or # S
-               $self->{next_char} == 0x0073) { # s
-             !!!next-input-character;
-             if ($self->{next_char} == 0x0054 or # T
-                 $self->{next_char} == 0x0074) { # t
-               !!!next-input-character;
-               if ($self->{next_char} == 0x0045 or # E
-                   $self->{next_char} == 0x0065) { # e
-                 !!!next-input-character;
-                 if ($self->{next_char} == 0x004D or # M
-                     $self->{next_char} == 0x006D) { # m
-                   !!!cp (174);
-                   $self->{state} = BEFORE_DOCTYPE_SYSTEM_IDENTIFIER_STATE;
-                   !!!next-input-character;
-                   redo A;
-                 } else {
-                   !!!cp (175);
-                 }
-               } else {
-                 !!!cp (176);
-               }
-             } else {
-               !!!cp (177);
-             }
-           } else {
-             !!!cp (178);
-           }
-         } else {
-           !!!cp (179);
-         }
-         #
        } else {
          !!!cp (180);
+         !!!parse-error (type => 'string after DOCTYPE name');
+         $self->{current_token}->{quirks} = 1;
+         $self->{state} = BOGUS_DOCTYPE_STATE;
          !!!next-input-character;
-         #
+         redo A;
        }
+     } elsif ($self->{state} == PUBLIC_STATE) {
+       ## ASCII case-insensitive
+       if ($self->{next_char} == [
+             undef,
+x0055, # U
+x0042, # B
+x004C, # L
+x0049, # I
+           ]->[length $self->{state_keyword}] or
+           $self->{next_char} == [
+             undef,
+x0075, # u
+x0062, # b
+x006C, # l
+x0069, # i
+           ]->[length $self->{state_keyword}]) {
+         !!!cp (175);
+         ## Stay in the state.
+         $self->{state_keyword} .= chr $self->{next_char};
+         !!!next-input-character;
+         redo A;
+       } elsif ((length $self->{state_keyword}) == 5 and
+                ($self->{next_char} == 0x0043 or # C
+                 $self->{next_char} == 0x0063)) { # c
+         !!!cp (168);
+         $self->{state} = BEFORE_DOCTYPE_PUBLIC_IDENTIFIER_STATE;
+         !!!next-input-character;
+         redo A;
+       } else {
+         !!!cp (169);
+         !!!parse-error (type => 'string after DOCTYPE name',
+                         line => $self->{line_prev},
+                         column => $self->{column_prev} + 1 - length $self->{state_keyword});
+         $self->{current_token}->{quirks} = 1;
-       !!!parse-error (type => 'string after DOCTYPE name');
+         $self->{state} = BOGUS_DOCTYPE_STATE;
-       $self->{current_token}->{quirks} = 1;
+         ## Reconsume.
+         redo A;
+       }
+     } elsif ($self->{state} == SYSTEM_STATE) {
+       ## ASCII case-insensitive
+       if ($self->{next_char} == [
+             undef,
+x0059, # Y
+x0053, # S
+x0054, # T
+x0045, # E
+           ]->[length $self->{state_keyword}] or
+           $self->{next_char} == [
+             undef,
+x0079, # y
+x0073, # s
+x0074, # t
+x0065, # e
+           ]->[length $self->{state_keyword}]) {
+         !!!cp (170);
+         ## Stay in the state.
+         $self->{state_keyword} .= chr $self->{next_char};
+         !!!next-input-character;
+         redo A;
+       } elsif ((length $self->{state_keyword}) == 5 and
+                ($self->{next_char} == 0x004D or # M
+                 $self->{next_char} == 0x006D)) { # m
+         !!!cp (171);
+         $self->{state} = BEFORE_DOCTYPE_SYSTEM_IDENTIFIER_STATE;
+         !!!next-input-character;
+         redo A;
+       } else {
+         !!!cp (172);
+         !!!parse-error (type => 'string after DOCTYPE name',
+                         line => $self->{line_prev},
+                         column => $self->{column_prev} + 1 - length $self->{state_keyword});
+         $self->{current_token}->{quirks} = 1;
-       $self->{state} = BOGUS_DOCTYPE_STATE;
+         $self->{state} = BOGUS_DOCTYPE_STATE;
-       # next-input-character is already done
+         ## Reconsume.
-       redo A;
+         redo A;
+       }
      } elsif ($self->{state} == BEFORE_DOCTYPE_PUBLIC_IDENTIFIER_STATE) {
        if ({
 x0009 => 1, 0x000A => 1, 0x000B => 1, 0x000C => 1, 0x0020 => 1,
-Line 2069 
 sub _get_next_token ($) {
+Line 2743 
 sub _get_next_token ($) {
          redo A;
        } elsif ($self->{next_char} == 0x003E) { # >
          !!!cp (208);
-         !!!parse-error (type => 'unclosed PUBLIC literal');
+         !!!parse-error (type => 'unclosed SYSTEM literal');
          $self->{state} = DATA_STATE;
          !!!next-input-character;
-Line 2105 
 sub _get_next_token ($) {
+Line 2779 
 sub _get_next_token ($) {
          redo A;
        } elsif ($self->{next_char} == 0x003E) { # >
          !!!cp (212);
-         !!!parse-error (type => 'unclosed PUBLIC literal');
+         !!!parse-error (type => 'unclosed SYSTEM literal');
          $self->{state} = DATA_STATE;
          !!!next-input-character;
-Line 2153 
 sub _get_next_token ($) {
+Line 2827 
 sub _get_next_token ($) {
        } elsif ($self->{next_char} == -1) {
          !!!cp (217);
          !!!parse-error (type => 'unclosed DOCTYPE');
          $self->{state} = DATA_STATE;
          ## reconsume
-Line 2194 
 sub _get_next_token ($) {
+Line 2867 
 sub _get_next_token ($) {
          !!!next-input-character;
          redo A;
        }
-     } else {
+     } elsif ($self->{state} == CDATA_SECTION_STATE) {
-       die "$0: $self->{state}: Unknown state";
+       ## NOTE: "CDATA section state" in the spec is jointly implemented
-     }
+       ## by three states, |CDATA_SECTION_STATE|, |CDATA_SECTION_MSE1_STATE|,
-   } # A
+       ## and |CDATA_SECTION_MSE2_STATE|.
-   die "$0: _get_next_token: unexpected case";
+       if ($self->{next_char} == 0x005D) { # ]
- } # _get_next_token
+         !!!cp (221.1);
+         $self->{state} = CDATA_SECTION_MSE1_STATE;
- sub _tokenize_attempt_to_consume_an_entity ($$$) {
+         !!!next-input-character;
-   my ($self, $in_attr, $additional) = @_;
+         redo A;
+       } elsif ($self->{next_char} == -1) {
+         $self->{state} = DATA_STATE;
+         !!!next-input-character;
+         if (length $self->{current_token}->{data}) { # character
+           !!!cp (221.2);
+           !!!emit ($self->{current_token}); # character
+         } else {
+           !!!cp (221.3);
+           ## No token to emit. $self->{current_token} is discarded.
+         }
+         redo A;
+       } else {
+         !!!cp (221.4);
+         $self->{current_token}->{data} .= chr $self->{next_char};
+         ## Stay in the state.
+         !!!next-input-character;
+         redo A;
+       }
-   if ({
+       ## ISSUE: "text tokens" in spec.
-x0009 => 1, 0x000A => 1, 0x000B => 1, 0x000C => 1, # HT, LF, VT, FF,
+     } elsif ($self->{state} == CDATA_SECTION_MSE1_STATE) {
-x0020 => 1, 0x003C => 1, 0x0026 => 1, -1 => 1, # SP, <, & # 0x000D # CR
+       if ($self->{next_char} == 0x005D) { # ]
-        $additional => 1,
+         !!!cp (221.5);
-       }->{$self->{next_char}}) {
+         $self->{state} = CDATA_SECTION_MSE2_STATE;
-     !!!cp (1001);
+         !!!next-input-character;
-     ## Don't consume
+         redo A;
-     ## No error
+       } else {
-     return undef;
+         !!!cp (221.6);
-   } elsif ($self->{next_char} == 0x0023) { # #
+         $self->{current_token}->{data} .= ']';
-     !!!next-input-character;
+         $self->{state} = CDATA_SECTION_STATE;
-     if ($self->{next_char} == 0x0078 or # x
+         ## Reconsume.
-         $self->{next_char} == 0x0058) { # X
+         redo A;
-       my $code;
+       }
-       X: {
+     } elsif ($self->{state} == CDATA_SECTION_MSE2_STATE) {
-         my $x_char = $self->{next_char};
+       if ($self->{next_char} == 0x003E) { # >
-         !!!next-input-character;
+         $self->{state} = DATA_STATE;
-         if (0x0030 <= $self->{next_char} and
+         !!!next-input-character;
-             $self->{next_char} <= 0x0039) { # 0..9
+         if (length $self->{current_token}->{data}) { # character
-           !!!cp (1002);
+           !!!cp (221.7);
-           $code ||= 0;
+           !!!emit ($self->{current_token}); # character
-           $code *= 0x10;
-           $code += $self->{next_char} - 0x0030;
-           redo X;
-         } elsif (0x0061 <= $self->{next_char} and
-                  $self->{next_char} <= 0x0066) { # a..f
-           !!!cp (1003);
-           $code ||= 0;
-           $code *= 0x10;
-           $code += $self->{next_char} - 0x0060 + 9;
-           redo X;
-         } elsif (0x0041 <= $self->{next_char} and
-                  $self->{next_char} <= 0x0046) { # A..F
-           !!!cp (1004);
-           $code ||= 0;
-           $code *= 0x10;
-           $code += $self->{next_char} - 0x0040 + 9;
-           redo X;
-         } elsif (not defined $code) { # no hexadecimal digit
-           !!!cp (1005);
-           !!!parse-error (type => 'bare hcro');
-           !!!back-next-input-character ($x_char, $self->{next_char});
-           $self->{next_char} = 0x0023; # #
-           return undef;
-         } elsif ($self->{next_char} == 0x003B) { # ;
-           !!!cp (1006);
-           !!!next-input-character;
          } else {
-           !!!cp (1007);
+           !!!cp (221.8);
-           !!!parse-error (type => 'no refc');
+           ## No token to emit. $self->{current_token} is discarded.
          }
+         redo A;
+       } elsif ($self->{next_char} == 0x005D) { # ]
+         !!!cp (221.9); # character
+         $self->{current_token}->{data} .= ']'; ## Add first "]" of "]]]".
+         ## Stay in the state.
+         !!!next-input-character;
+         redo A;
+       } else {
+         !!!cp (221.11);
+         $self->{current_token}->{data} .= ']]'; # character
+         $self->{state} = CDATA_SECTION_STATE;
+         ## Reconsume.
+         redo A;
+       }
+     } elsif ($self->{state} == ENTITY_STATE) {
+       if ({
+x0009 => 1, 0x000A => 1, 0x000B => 1, 0x000C => 1, # HT, LF, VT, FF,
+x0020 => 1, 0x003C => 1, 0x0026 => 1, -1 => 1, # SP, <, &
+         $self->{entity_additional} => 1,
+       }->{$self->{next_char}}) {
+         !!!cp (1001);
+         ## Don't consume
+         ## No error
+         ## Return nothing.
+         #
+       } elsif ($self->{next_char} == 0x0023) { # #
+         !!!cp (999);
+         $self->{state} = ENTITY_HASH_STATE;
+         $self->{state_keyword} = '#';
+         !!!next-input-character;
+         redo A;
+       } elsif ((0x0041 <= $self->{next_char} and
+                 $self->{next_char} <= 0x005A) or # A..Z
+                (0x0061 <= $self->{next_char} and
+                 $self->{next_char} <= 0x007A)) { # a..z
+         !!!cp (998);
+         require Whatpm::_NamedEntityList;
+         $self->{state} = ENTITY_NAME_STATE;
+         $self->{state_keyword} = chr $self->{next_char};
+         $self->{entity__value} = $self->{state_keyword};
+         $self->{entity__match} = 0;
+         !!!next-input-character;
+         redo A;
+       } else {
+         !!!cp (1027);
+         !!!parse-error (type => 'bare ero');
+         ## Return nothing.
+         #
+       }
-         if ($code == 0 or (0xD800 <= $code and $code <= 0xDFFF)) {
+       ## NOTE: No character is consumed by the "consume a character
-           !!!cp (1008);
+       ## reference" algorithm.  In other words, there is an "&" character
-           !!!parse-error (type => sprintf 'invalid character reference:U+%04X', $code);
+       ## that does not introduce a character reference, which would be
-           $code = 0xFFFD;
+       ## appended to the parent element or the attribute value in later
-         } elsif ($code > 0x10FFFF) {
+       ## process of the tokenizer.
-           !!!cp (1009);
-           !!!parse-error (type => sprintf 'invalid character reference:U-%08X', $code);
+       if ($self->{prev_state} == DATA_STATE) {
-           $code = 0xFFFD;
+         !!!cp (997);
-         } elsif ($code == 0x000D) {
+         $self->{state} = $self->{prev_state};
-           !!!cp (1010);
+         ## Reconsume.
-           !!!parse-error (type => 'CR character reference');
+         !!!emit ({type => CHARACTER_TOKEN, data => '&',
-           $code = 0x000A;
+                   line => $self->{line_prev},
-         } elsif (0x80 <= $code and $code <= 0x9F) {
+                   column => $self->{column_prev},
-           !!!cp (1011);
+                  });
-           !!!parse-error (type => sprintf 'C1 character reference:U+%04X', $code);
+         redo A;
-           $code = $c1_entity_char->{$code};
+       } else {
-         }
+         !!!cp (996);
+         $self->{current_attribute}->{value} .= '&';
-         return {type => CHARACTER_TOKEN, data => chr $code,
+         $self->{state} = $self->{prev_state};
-                 has_reference => 1};
+         ## Reconsume.
-       } # X
+         redo A;
-     } elsif (0x0030 <= $self->{next_char} and
+       }
-              $self->{next_char} <= 0x0039) { # 0..9
+     } elsif ($self->{state} == ENTITY_HASH_STATE) {
-       my $code = $self->{next_char} - 0x0030;
+       if ($self->{next_char} == 0x0078 or # x
-       !!!next-input-character;
+           $self->{next_char} == 0x0058) { # X
+         !!!cp (995);
-       while (0x0030 <= $self->{next_char} and
+         $self->{state} = HEXREF_X_STATE;
-                 $self->{next_char} <= 0x0039) { # 0..9
+         $self->{state_keyword} .= chr $self->{next_char};
+         !!!next-input-character;
+         redo A;
+       } elsif (0x0030 <= $self->{next_char} and
+                $self->{next_char} <= 0x0039) { # 0..9
+         !!!cp (994);
+         $self->{state} = NCR_NUM_STATE;
+         $self->{state_keyword} = $self->{next_char} - 0x0030;
+         !!!next-input-character;
+         redo A;
+       } else {
+         !!!parse-error (type => 'bare nero',
+                         line => $self->{line_prev},
+                         column => $self->{column_prev} - 1);
+         ## NOTE: According to the spec algorithm, nothing is returned,
+         ## and then "&#" is appended to the parent element or the attribute
+         ## value in the later processing.
+         if ($self->{prev_state} == DATA_STATE) {
+           !!!cp (1019);
+           $self->{state} = $self->{prev_state};
+           ## Reconsume.
+           !!!emit ({type => CHARACTER_TOKEN,
+                     data => '&#',
+                     line => $self->{line_prev},
+                     column => $self->{column_prev} - 1,
+                    });
+           redo A;
+         } else {
+           !!!cp (993);
+           $self->{current_attribute}->{value} .= '&#';
+           $self->{state} = $self->{prev_state};
+           ## Reconsume.
+           redo A;
+         }
+       }
+     } elsif ($self->{state} == NCR_NUM_STATE) {
+       if (0x0030 <= $self->{next_char} and
+           $self->{next_char} <= 0x0039) { # 0..9
          !!!cp (1012);
-         $code *= 10;
+         $self->{state_keyword} *= 10;
-         $code += $self->{next_char} - 0x0030;
+         $self->{state_keyword} += $self->{next_char} - 0x0030;
+         ## Stay in the state.
          !!!next-input-character;
-       }
+         redo A;
+       } elsif ($self->{next_char} == 0x003B) { # ;
-       if ($self->{next_char} == 0x003B) { # ;
          !!!cp (1013);
          !!!next-input-character;
+         #
        } else {
          !!!cp (1014);
          !!!parse-error (type => 'no refc');
+         ## Reconsume.
+         #
        }
+       my $code = $self->{state_keyword};
+       my $l = $self->{line_prev};
+       my $c = $self->{column_prev};
        if ($code == 0 or (0xD800 <= $code and $code <= 0xDFFF)) {
          !!!cp (1015);
-         !!!parse-error (type => sprintf 'invalid character reference:U+%04X', $code);
+         !!!parse-error (type => 'invalid character reference',
+                         text => (sprintf 'U+%04X', $code),
+                         line => $l, column => $c);
          $code = 0xFFFD;
        } elsif ($code > 0x10FFFF) {
          !!!cp (1016);
-         !!!parse-error (type => sprintf 'invalid character reference:U-%08X', $code);
+         !!!parse-error (type => 'invalid character reference',
+                         text => (sprintf 'U-%08X', $code),
+                         line => $l, column => $c);
          $code = 0xFFFD;
        } elsif ($code == 0x000D) {
          !!!cp (1017);
-         !!!parse-error (type => 'CR character reference');
+         !!!parse-error (type => 'CR character reference',
+                         line => $l, column => $c);
          $code = 0x000A;
        } elsif (0x80 <= $code and $code <= 0x9F) {
          !!!cp (1018);
-         !!!parse-error (type => sprintf 'C1 character reference:U+%04X', $code);
+         !!!parse-error (type => 'C1 character reference',
+                         text => (sprintf 'U+%04X', $code),
+                         line => $l, column => $c);
          $code = $c1_entity_char->{$code};
        }
-       return {type => CHARACTER_TOKEN, data => chr $code, has_reference => 1};
+       if ($self->{prev_state} == DATA_STATE) {
-     } else {
+         !!!cp (992);
-       !!!cp (1019);
+         $self->{state} = $self->{prev_state};
-       !!!parse-error (type => 'bare nero');
+         ## Reconsume.
-       !!!back-next-input-character ($self->{next_char});
+         !!!emit ({type => CHARACTER_TOKEN, data => chr $code,
-       $self->{next_char} = 0x0023; # #
+                   line => $l, column => $c,
-       return undef;
+                  });
-     }
+         redo A;
-   } elsif ((0x0041 <= $self->{next_char} and
+       } else {
-             $self->{next_char} <= 0x005A) or
+         !!!cp (991);
-            (0x0061 <= $self->{next_char} and
+         $self->{current_attribute}->{value} .= chr $code;
-             $self->{next_char} <= 0x007A)) {
+         $self->{current_attribute}->{has_reference} = 1;
-     my $entity_name = chr $self->{next_char};
+         $self->{state} = $self->{prev_state};
-     !!!next-input-character;
+         ## Reconsume.
+         redo A;
-     my $value = $entity_name;
+       }
-     my $match = 0;
+     } elsif ($self->{state} == HEXREF_X_STATE) {
-     require Whatpm::_NamedEntityList;
+       if ((0x0030 <= $self->{next_char} and $self->{next_char} <= 0x0039) or
-     our $EntityChar;
+           (0x0041 <= $self->{next_char} and $self->{next_char} <= 0x0046) or
+           (0x0061 <= $self->{next_char} and $self->{next_char} <= 0x0066)) {
-     while (length $entity_name < 10 and
+         # 0..9, A..F, a..f
-            ## NOTE: Some number greater than the maximum length of entity name
+         !!!cp (990);
-            ((0x0041 <= $self->{next_char} and # a
+         $self->{state} = HEXREF_HEX_STATE;
-              $self->{next_char} <= 0x005A) or # x
+         $self->{state_keyword} = 0;
-             (0x0061 <= $self->{next_char} and # a
+         ## Reconsume.
-              $self->{next_char} <= 0x007A) or # z
+         redo A;
-             (0x0030 <= $self->{next_char} and # 0
+       } else {
-              $self->{next_char} <= 0x0039) or # 9
+         !!!parse-error (type => 'bare hcro',
-             $self->{next_char} == 0x003B)) { # ;
+                         line => $self->{line_prev},
-       $entity_name .= chr $self->{next_char};
+                         column => $self->{column_prev} - 2);
-       if (defined $EntityChar->{$entity_name}) {
-         if ($self->{next_char} == 0x003B) { # ;
+         ## NOTE: According to the spec algorithm, nothing is returned,
-           !!!cp (1020);
+         ## and then "&#" followed by "X" or "x" is appended to the parent
-           $value = $EntityChar->{$entity_name};
+         ## element or the attribute value in the later processing.
-           $match = 1;
-           !!!next-input-character;
+         if ($self->{prev_state} == DATA_STATE) {
-           last;
+           !!!cp (1005);
+           $self->{state} = $self->{prev_state};
+           ## Reconsume.
+           !!!emit ({type => CHARACTER_TOKEN,
+                     data => '&' . $self->{state_keyword},
+                     line => $self->{line_prev},
+                     column => $self->{column_prev} - length $self->{state_keyword},
+                    });
+           redo A;
          } else {
-           !!!cp (1021);
+           !!!cp (989);
-           $value = $EntityChar->{$entity_name};
+           $self->{current_attribute}->{value} .= '&' . $self->{state_keyword};
-           $match = -1;
+           $self->{state} = $self->{prev_state};
-           !!!next-input-character;
+           ## Reconsume.
+           redo A;
          }
-       } else {
+       }
-         !!!cp (1022);
+     } elsif ($self->{state} == HEXREF_HEX_STATE) {
-         $value .= chr $self->{next_char};
+       if (0x0030 <= $self->{next_char} and $self->{next_char} <= 0x0039) {
-         $match *= 2;
+         # 0..9
+         !!!cp (1002);
+         $self->{state_keyword} *= 0x10;
+         $self->{state_keyword} += $self->{next_char} - 0x0030;
+         ## Stay in the state.
+         !!!next-input-character;
+         redo A;
+       } elsif (0x0061 <= $self->{next_char} and
+                $self->{next_char} <= 0x0066) { # a..f
+         !!!cp (1003);
+         $self->{state_keyword} *= 0x10;
+         $self->{state_keyword} += $self->{next_char} - 0x0060 + 9;
+         ## Stay in the state.
          !!!next-input-character;
+         redo A;
+       } elsif (0x0041 <= $self->{next_char} and
+                $self->{next_char} <= 0x0046) { # A..F
+         !!!cp (1004);
+         $self->{state_keyword} *= 0x10;
+         $self->{state_keyword} += $self->{next_char} - 0x0040 + 9;
+         ## Stay in the state.
+         !!!next-input-character;
+         redo A;
+       } elsif ($self->{next_char} == 0x003B) { # ;
+         !!!cp (1006);
+         !!!next-input-character;
+         #
+       } else {
+         !!!cp (1007);
+         !!!parse-error (type => 'no refc',
+                         line => $self->{line},
+                         column => $self->{column});
+         ## Reconsume.
+         #
        }
-     }
+       my $code = $self->{state_keyword};
-     if ($match > 0) {
+       my $l = $self->{line_prev};
-       !!!cp (1023);
+       my $c = $self->{column_prev};
-       return {type => CHARACTER_TOKEN, data => $value, has_reference => 1};
+       if ($code == 0 or (0xD800 <= $code and $code <= 0xDFFF)) {
-     } elsif ($match < 0) {
+         !!!cp (1008);
-       !!!parse-error (type => 'no refc');
+         !!!parse-error (type => 'invalid character reference',
-       if ($in_attr and $match < -1) {
+                         text => (sprintf 'U+%04X', $code),
-         !!!cp (1024);
+                         line => $l, column => $c);
-         return {type => CHARACTER_TOKEN, data => '&'.$entity_name};
+         $code = 0xFFFD;
+       } elsif ($code > 0x10FFFF) {
+         !!!cp (1009);
+         !!!parse-error (type => 'invalid character reference',
+                         text => (sprintf 'U-%08X', $code),
+                         line => $l, column => $c);
+         $code = 0xFFFD;
+       } elsif ($code == 0x000D) {
+         !!!cp (1010);
+         !!!parse-error (type => 'CR character reference', line => $l, column => $c);
+         $code = 0x000A;
+       } elsif (0x80 <= $code and $code <= 0x9F) {
+         !!!cp (1011);
+         !!!parse-error (type => 'C1 character reference', text => (sprintf 'U+%04X', $code), line => $l, column => $c);
+         $code = $c1_entity_char->{$code};
+       }
+       if ($self->{prev_state} == DATA_STATE) {
+         !!!cp (988);
+         $self->{state} = $self->{prev_state};
+         ## Reconsume.
+         !!!emit ({type => CHARACTER_TOKEN, data => chr $code,
+                   line => $l, column => $c,
+                  });
+         redo A;
+       } else {
+         !!!cp (987);
+         $self->{current_attribute}->{value} .= chr $code;
+         $self->{current_attribute}->{has_reference} = 1;
+         $self->{state} = $self->{prev_state};
+         ## Reconsume.
+         redo A;
+       }
+     } elsif ($self->{state} == ENTITY_NAME_STATE) {
+       if (length $self->{state_keyword} < 30 and
+           ## NOTE: Some number greater than the maximum length of entity name
+           ((0x0041 <= $self->{next_char} and # a
+             $self->{next_char} <= 0x005A) or # x
+            (0x0061 <= $self->{next_char} and # a
+             $self->{next_char} <= 0x007A) or # z
+            (0x0030 <= $self->{next_char} and # 0
+             $self->{next_char} <= 0x0039) or # 9
+            $self->{next_char} == 0x003B)) { # ;
+         our $EntityChar;
+         $self->{state_keyword} .= chr $self->{next_char};
+         if (defined $EntityChar->{$self->{state_keyword}}) {
+           if ($self->{next_char} == 0x003B) { # ;
+             !!!cp (1020);
+             $self->{entity__value} = $EntityChar->{$self->{state_keyword}};
+             $self->{entity__match} = 1;
+             !!!next-input-character;
+             #
+           } else {
+             !!!cp (1021);
+             $self->{entity__value} = $EntityChar->{$self->{state_keyword}};
+             $self->{entity__match} = -1;
+             ## Stay in the state.
+             !!!next-input-character;
+             redo A;
+           }
+         } else {
+           !!!cp (1022);
+           $self->{entity__value} .= chr $self->{next_char};
+           $self->{entity__match} *= 2;
+           ## Stay in the state.
+           !!!next-input-character;
+           redo A;
+         }
+       }
+       my $data;
+       my $has_ref;
+       if ($self->{entity__match} > 0) {
+         !!!cp (1023);
+         $data = $self->{entity__value};
+         $has_ref = 1;
+         #
+       } elsif ($self->{entity__match} < 0) {
+         !!!parse-error (type => 'no refc');
+         if ($self->{prev_state} != DATA_STATE and # in attribute
+             $self->{entity__match} < -1) {
+           !!!cp (1024);
+           $data = '&' . $self->{state_keyword};
+           #
+         } else {
+           !!!cp (1025);
+           $data = $self->{entity__value};
+           $has_ref = 1;
+           #
+         }
        } else {
-         !!!cp (1025);
+         !!!cp (1026);
-         return {type => CHARACTER_TOKEN, data => $value, has_reference => 1};
+         !!!parse-error (type => 'bare ero',
+                         line => $self->{line_prev},
+                         column => $self->{column_prev});
+         $data = '&' . $self->{state_keyword};
+         #
+       }
+       ## NOTE: In these cases, when a character reference is found,
+       ## it is consumed and a character token is returned, or, otherwise,
+       ## nothing is consumed and returned, according to the spec algorithm.
+       ## In this implementation, anything that has been examined by the
+       ## tokenizer is appended to the parent element or the attribute value
+       ## as string, either literal string when no character reference or
+       ## entity-replaced string otherwise, in this stage, since any characters
+       ## that would not be consumed are appended in the data state or in an
+       ## appropriate attribute value state anyway.
+       if ($self->{prev_state} == DATA_STATE) {
+         !!!cp (986);
+         $self->{state} = $self->{prev_state};
+         ## Reconsume.
+         !!!emit ({type => CHARACTER_TOKEN,
+                   data => $data,
+                   line => $self->{line_prev},
+                   column => $self->{column_prev} + 1 - length $self->{state_keyword},
+                  });
+         redo A;
+       } else {
+         !!!cp (985);
+         $self->{current_attribute}->{value} .= $data;
+         $self->{current_attribute}->{has_reference} = 1 if $has_ref;
+         $self->{state} = $self->{prev_state};
+         ## Reconsume.
+         redo A;
        }
      } else {
-       !!!cp (1026);
+       die "$0: $self->{state}: Unknown state";
-       !!!parse-error (type => 'bare ero');
-       ## NOTE: "No characters are consumed" in the spec.
-       return {type => CHARACTER_TOKEN, data => '&'.$value};
      }
-   } else {
+   } # A
-     !!!cp (1027);
-     ## no characters are consumed
+   die "$0: _get_next_token: unexpected case";
-     !!!parse-error (type => 'bare ero');
+ } # _get_next_token
-     return undef;
-   }
- } # _tokenize_attempt_to_consume_an_entity
  sub _initialize_tree_constructor ($) {
    my $self = shift;
-Line 2402 
 sub _initialize_tree_constructor ($) {
+Line 3325 
 sub _initialize_tree_constructor ($) {
    ## TODO: Turn mutation events off # MUST
    ## TODO: Turn loose Document option (manakai extension) on
    $self->{document}->manakai_is_html (1); # MUST
+   $self->{document}->set_user_data (manakai_source_line => 1);
+   $self->{document}->set_user_data (manakai_source_column => 1);
  } # _initialize_tree_constructor
  sub _terminate_tree_constructor ($) {
-Line 2456 
 sub _tree_construction_initial ($) {
+Line 3381 
 sub _tree_construction_initial ($) {
        ## language.
        my $doctype_name = $token->{name};
        $doctype_name = '' unless defined $doctype_name;
-       $doctype_name =~ tr/a-z/A-Z/;
+       $doctype_name =~ tr/a-z/A-Z/; # ASCII case-insensitive
        if (not defined $token->{name} or # <!DOCTYPE>
-           defined $token->{public_identifier} or
            defined $token->{system_identifier}) {
          !!!cp ('t1');
-         !!!parse-error (type => 'not HTML5');
+         !!!parse-error (type => 'not HTML5', token => $token);
        } elsif ($doctype_name ne 'HTML') {
          !!!cp ('t2');
-         ## ISSUE: ASCII case-insensitive? (in fact it does not matter)
+         !!!parse-error (type => 'not HTML5', token => $token);
-         !!!parse-error (type => 'not HTML5');
+       } elsif (defined $token->{public_identifier}) {
+         if ($token->{public_identifier} eq 'XSLT-compat') {
+           !!!cp ('t1.2');
+           !!!parse-error (type => 'XSLT-compat', token => $token,
+                           level => $self->{level}->{should});
+         } else {
+           !!!parse-error (type => 'not HTML5', token => $token);
+         }
        } else {
          !!!cp ('t3');
+         #
        }
        my $doctype = $self->{document}->create_document_type_definition
          ($token->{name}); ## ISSUE: If name is missing (e.g. <!DOCTYPE>)?
+       ## NOTE: Default values for both |public_id| and |system_id| attributes
+       ## are empty strings, so that we don't set any value in missing cases.
        $doctype->public_id ($token->{public_identifier})
            if defined $token->{public_identifier};
        $doctype->system_id ($token->{system_identifier})
-Line 2486 
 sub _tree_construction_initial ($) {
+Line 3420 
 sub _tree_construction_initial ($) {
        } elsif (defined $token->{public_identifier}) {
          my $pubid = $token->{public_identifier};
          $pubid =~ tr/a-z/A-z/;
-         if ({
+         my $prefix = [
-           "+//SILMARIL//DTD HTML PRO V0R11 19970101//EN" => 1,
+           "+//SILMARIL//DTD HTML PRO V0R11 19970101//",
-           "-//ADVASOFT LTD//DTD HTML 3.0 ASWEDIT + EXTENSIONS//EN" => 1,
+           "-//ADVASOFT LTD//DTD HTML 3.0 ASWEDIT + EXTENSIONS//",
-           "-//AS//DTD HTML 3.0 ASWEDIT + EXTENSIONS//EN" => 1,
+           "-//AS//DTD HTML 3.0 ASWEDIT + EXTENSIONS//",
-           "-//IETF//DTD HTML 2.0 LEVEL 1//EN" => 1,
+           "-//IETF//DTD HTML 2.0 LEVEL 1//",
-           "-//IETF//DTD HTML 2.0 LEVEL 2//EN" => 1,
+           "-//IETF//DTD HTML 2.0 LEVEL 2//",
-           "-//IETF//DTD HTML 2.0 STRICT LEVEL 1//EN" => 1,
+           "-//IETF//DTD HTML 2.0 STRICT LEVEL 1//",
-           "-//IETF//DTD HTML 2.0 STRICT LEVEL 2//EN" => 1,
+           "-//IETF//DTD HTML 2.0 STRICT LEVEL 2//",
-           "-//IETF//DTD HTML 2.0 STRICT//EN" => 1,
+           "-//IETF//DTD HTML 2.0 STRICT//",
-           "-//IETF//DTD HTML 2.0//EN" => 1,
+           "-//IETF//DTD HTML 2.0//",
-           "-//IETF//DTD HTML 2.1E//EN" => 1,
+           "-//IETF//DTD HTML 2.1E//",
-           "-//IETF//DTD HTML 3.0//EN" => 1,
+           "-//IETF//DTD HTML 3.0//",
-           "-//IETF//DTD HTML 3.0//EN//" => 1,
+           "-//IETF//DTD HTML 3.2 FINAL//",
-           "-//IETF//DTD HTML 3.2 FINAL//EN" => 1,
+           "-//IETF//DTD HTML 3.2//",
-           "-//IETF//DTD HTML 3.2//EN" => 1,
+           "-//IETF//DTD HTML 3//",
-           "-//IETF//DTD HTML 3//EN" => 1,
+           "-//IETF//DTD HTML LEVEL 0//",
-           "-//IETF//DTD HTML LEVEL 0//EN" => 1,
+           "-//IETF//DTD HTML LEVEL 1//",
-           "-//IETF//DTD HTML LEVEL 0//EN//2.0" => 1,
+           "-//IETF//DTD HTML LEVEL 2//",
-           "-//IETF//DTD HTML LEVEL 1//EN" => 1,
+           "-//IETF//DTD HTML LEVEL 3//",
-           "-//IETF//DTD HTML LEVEL 1//EN//2.0" => 1,
+           "-//IETF//DTD HTML STRICT LEVEL 0//",
-           "-//IETF//DTD HTML LEVEL 2//EN" => 1,
+           "-//IETF//DTD HTML STRICT LEVEL 1//",
-           "-//IETF//DTD HTML LEVEL 2//EN//2.0" => 1,
+           "-//IETF//DTD HTML STRICT LEVEL 2//",
-           "-//IETF//DTD HTML LEVEL 3//EN" => 1,
+           "-//IETF//DTD HTML STRICT LEVEL 3//",
-           "-//IETF//DTD HTML LEVEL 3//EN//3.0" => 1,
+           "-//IETF//DTD HTML STRICT//",
-           "-//IETF//DTD HTML STRICT LEVEL 0//EN" => 1,
+           "-//IETF//DTD HTML//",
-           "-//IETF//DTD HTML STRICT LEVEL 0//EN//2.0" => 1,
+           "-//METRIUS//DTD METRIUS PRESENTATIONAL//",
-           "-//IETF//DTD HTML STRICT LEVEL 1//EN" => 1,
+           "-//MICROSOFT//DTD INTERNET EXPLORER 2.0 HTML STRICT//",
-           "-//IETF//DTD HTML STRICT LEVEL 1//EN//2.0" => 1,
+           "-//MICROSOFT//DTD INTERNET EXPLORER 2.0 HTML//",
-           "-//IETF//DTD HTML STRICT LEVEL 2//EN" => 1,
+           "-//MICROSOFT//DTD INTERNET EXPLORER 2.0 TABLES//",
-           "-//IETF//DTD HTML STRICT LEVEL 2//EN//2.0" => 1,
+           "-//MICROSOFT//DTD INTERNET EXPLORER 3.0 HTML STRICT//",
-           "-//IETF//DTD HTML STRICT LEVEL 3//EN" => 1,
+           "-//MICROSOFT//DTD INTERNET EXPLORER 3.0 HTML//",
-           "-//IETF//DTD HTML STRICT LEVEL 3//EN//3.0" => 1,
+           "-//MICROSOFT//DTD INTERNET EXPLORER 3.0 TABLES//",
-           "-//IETF//DTD HTML STRICT//EN" => 1,
+           "-//NETSCAPE COMM. CORP.//DTD HTML//",
-           "-//IETF//DTD HTML STRICT//EN//2.0" => 1,
+           "-//NETSCAPE COMM. CORP.//DTD STRICT HTML//",
-           "-//IETF//DTD HTML STRICT//EN//3.0" => 1,
+           "-//O'REILLY AND ASSOCIATES//DTD HTML 2.0//",
-           "-//IETF//DTD HTML//EN" => 1,
+           "-//O'REILLY AND ASSOCIATES//DTD HTML EXTENDED 1.0//",
-           "-//IETF//DTD HTML//EN//2.0" => 1,
+           "-//O'REILLY AND ASSOCIATES//DTD HTML EXTENDED RELAXED 1.0//",
-           "-//IETF//DTD HTML//EN//3.0" => 1,
+           "-//SOFTQUAD SOFTWARE//DTD HOTMETAL PRO 6.0::19990601::EXTENSIONS TO HTML 4.0//",
-           "-//METRIUS//DTD METRIUS PRESENTATIONAL//EN" => 1,
+           "-//SOFTQUAD//DTD HOTMETAL PRO 4.0::19971010::EXTENSIONS TO HTML 4.0//",
-           "-//MICROSOFT//DTD INTERNET EXPLORER 2.0 HTML STRICT//EN" => 1,
+           "-//SPYGLASS//DTD HTML 2.0 EXTENDED//",
-           "-//MICROSOFT//DTD INTERNET EXPLORER 2.0 HTML//EN" => 1,
+           "-//SQ//DTD HTML 2.0 HOTMETAL + EXTENSIONS//",
-           "-//MICROSOFT//DTD INTERNET EXPLORER 2.0 TABLES//EN" => 1,
+           "-//SUN MICROSYSTEMS CORP.//DTD HOTJAVA HTML//",
-           "-//MICROSOFT//DTD INTERNET EXPLORER 3.0 HTML STRICT//EN" => 1,
+           "-//SUN MICROSYSTEMS CORP.//DTD HOTJAVA STRICT HTML//",
-           "-//MICROSOFT//DTD INTERNET EXPLORER 3.0 HTML//EN" => 1,
+           "-//W3C//DTD HTML 3 1995-03-24//",
-           "-//MICROSOFT//DTD INTERNET EXPLORER 3.0 TABLES//EN" => 1,
+           "-//W3C//DTD HTML 3.2 DRAFT//",
-           "-//NETSCAPE COMM. CORP.//DTD HTML//EN" => 1,
+           "-//W3C//DTD HTML 3.2 FINAL//",
-           "-//NETSCAPE COMM. CORP.//DTD STRICT HTML//EN" => 1,
+           "-//W3C//DTD HTML 3.2//",
-           "-//O'REILLY AND ASSOCIATES//DTD HTML 2.0//EN" => 1,
+           "-//W3C//DTD HTML 3.2S DRAFT//",
-           "-//O'REILLY AND ASSOCIATES//DTD HTML EXTENDED 1.0//EN" => 1,
+           "-//W3C//DTD HTML 4.0 FRAMESET//",
-           "-//O'REILLY AND ASSOCIATES//DTD HTML EXTENDED RELAXED 1.0//EN" => 1,
+           "-//W3C//DTD HTML 4.0 TRANSITIONAL//",
-           "-//SOFTQUAD SOFTWARE//DTD HOTMETAL PRO 6.0::19990601::EXTENSIONS TO HTML 4.0//EN" => 1,
+           "-//W3C//DTD HTML EXPERIMETNAL 19960712//",
-           "-//SOFTQUAD//DTD HOTMETAL PRO 4.0::19971010::EXTENSIONS TO HTML 4.0//EN" => 1,
+           "-//W3C//DTD HTML EXPERIMENTAL 970421//",
-           "-//SPYGLASS//DTD HTML 2.0 EXTENDED//EN" => 1,
+           "-//W3C//DTD W3 HTML//",
-           "-//SQ//DTD HTML 2.0 HOTMETAL + EXTENSIONS//EN" => 1,
+           "-//W3O//DTD W3 HTML 3.0//",
-           "-//SUN MICROSYSTEMS CORP.//DTD HOTJAVA HTML//EN" => 1,
+           "-//WEBTECHS//DTD MOZILLA HTML 2.0//",
-           "-//SUN MICROSYSTEMS CORP.//DTD HOTJAVA STRICT HTML//EN" => 1,
+           "-//WEBTECHS//DTD MOZILLA HTML//",
-           "-//W3C//DTD HTML 3 1995-03-24//EN" => 1,
+         ]; # $prefix
-           "-//W3C//DTD HTML 3.2 DRAFT//EN" => 1,
+         my $match;
-           "-//W3C//DTD HTML 3.2 FINAL//EN" => 1,
+         for (@$prefix) {
-           "-//W3C//DTD HTML 3.2//EN" => 1,
+           if (substr ($pubid, 0, length $_) eq $_) { # test the DOCTYPE public ID (not the $prefix list ref) against each prefix
-           "-//W3C//DTD HTML 3.2S DRAFT//EN" => 1,
+             $match = 1;
-           "-//W3C//DTD HTML 4.0 FRAMESET//EN" => 1,
+             last;
-           "-//W3C//DTD HTML 4.0 TRANSITIONAL//EN" => 1,
+           }
-           "-//W3C//DTD HTML EXPERIMETNAL 19960712//EN" => 1,
+         }
-           "-//W3C//DTD HTML EXPERIMENTAL 970421//EN" => 1,
+         if ($match or
-           "-//W3C//DTD W3 HTML//EN" => 1,
+             $pubid eq "-//W3O//DTD W3 HTML STRICT 3.0//EN//" or
-           "-//W3O//DTD W3 HTML 3.0//EN" => 1,
+             $pubid eq "-/W3C/DTD HTML 4.0 TRANSITIONAL/EN" or
-           "-//W3O//DTD W3 HTML 3.0//EN//" => 1,
+             $pubid eq "HTML") {
-           "-//W3O//DTD W3 HTML STRICT 3.0//EN//" => 1,
-           "-//WEBTECHS//DTD MOZILLA HTML 2.0//EN" => 1,
-           "-//WEBTECHS//DTD MOZILLA HTML//EN" => 1,
-           "-/W3C/DTD HTML 4.0 TRANSITIONAL/EN" => 1,
-           "HTML" => 1,
-         }->{$pubid}) {
            !!!cp ('t5');
            $self->{document}->manakai_compat_mode ('quirks');
-         } elsif ($pubid eq "-//W3C//DTD HTML 4.01 FRAMESET//EN" or
+         } elsif ($pubid =~ m[^-//W3C//DTD HTML 4.01 FRAMESET//] or
-                  $pubid eq "-//W3C//DTD HTML 4.01 TRANSITIONAL//EN") {
+                  $pubid =~ m[^-//W3C//DTD HTML 4.01 TRANSITIONAL//]) {
            if (defined $token->{system_identifier}) {
              !!!cp ('t6');
              $self->{document}->manakai_compat_mode ('quirks');
-Line 2571 
 sub _tree_construction_initial ($) {
+Line 3499 
 sub _tree_construction_initial ($) {
              !!!cp ('t7');
              $self->{document}->manakai_compat_mode ('limited quirks');
            }
-         } elsif ($pubid eq "-//W3C//DTD XHTML 1.0 FRAMESET//EN" or
+         } elsif ($pubid =~ m[^-//W3C//DTD XHTML 1.0 FRAMESET//] or
-                  $pubid eq "-//W3C//DTD XHTML 1.0 TRANSITIONAL//EN") {
+                  $pubid =~ m[^-//W3C//DTD XHTML 1.0 TRANSITIONAL//]) {
            !!!cp ('t8');
            $self->{document}->manakai_compat_mode ('limited quirks');
          } else {
-Line 2585 
 sub _tree_construction_initial ($) {
+Line 3513 
 sub _tree_construction_initial ($) {
          my $sysid = $token->{system_identifier};
          $sysid =~ tr/A-Z/a-z/;
          if ($sysid eq "http://www.ibm.com/data/dtd/v11/ibmxhtml1-transitional.dtd") {
-           ## TODO: Check the spec: PUBLIC "(limited quirks)" "(quirks)"
+           ## NOTE: Ensure that |PUBLIC "(limited quirks)" "(quirks)"| is
+           ## marked as quirks.
            $self->{document}->manakai_compat_mode ('quirks');
            !!!cp ('t11');
          } else {
-Line 2604 
 sub _tree_construction_initial ($) {
+Line 3533 
 sub _tree_construction_initial ($) {
                END_OF_FILE_TOKEN, 1,
               }->{$token->{type}}) {
        !!!cp ('t14');
-       !!!parse-error (type => 'no DOCTYPE');
+       !!!parse-error (type => 'no DOCTYPE', token => $token);
        $self->{document}->manakai_compat_mode ('quirks');
        ## Go to the "before html" insertion mode.
        ## reprocess
+       !!!ack-later;
        return;
      } elsif ($token->{type} == CHARACTER_TOKEN) {
        if ($token->{data} =~ s/^([\x09\x0A\x0B\x0C\x20]+)//) { # \x0D
-Line 2625 
 sub _tree_construction_initial ($) {
+Line 3555 
 sub _tree_construction_initial ($) {
          !!!cp ('t17');
        }
-       !!!parse-error (type => 'no DOCTYPE');
+       !!!parse-error (type => 'no DOCTYPE', token => $token);
        $self->{document}->manakai_compat_mode ('quirks');
        ## Go to the "before html" insertion mode.
        ## reprocess
-Line 2654 
 sub _tree_construction_root_element ($)
+Line 3584 
 sub _tree_construction_root_element ($)
    B: {
        if ($token->{type} == DOCTYPE_TOKEN) {
          !!!cp ('t19');
-         !!!parse-error (type => 'in html:#DOCTYPE');
+         !!!parse-error (type => 'in html:#DOCTYPE', token => $token);
          ## Ignore the token
          ## Stay in the insertion mode.
          !!!next-token;
-Line 2688 
 sub _tree_construction_root_element ($)
+Line 3618 
 sub _tree_construction_root_element ($)
        } elsif ($token->{type} == START_TAG_TOKEN) {
          if ($token->{tag_name} eq 'html') {
            my $root_element;
-           !!!create-element ($root_element, $token->{tag_name}, $token->{attributes});
+           !!!create-element ($root_element, $HTML_NS, $token->{tag_name}, $token->{attributes}, $token);
            $self->{document}->append_child ($root_element);
-           push @{$self->{open_elements}}, [$root_element, 'html'];
+           push @{$self->{open_elements}},
+               [$root_element, $el_category->{html}];
            if ($token->{attributes}->{manifest}) {
              !!!cp ('t24');
              $self->{application_cache_selection}
                  ->($token->{attributes}->{manifest}->{value});
-             ## ISSUE: No relative reference resolution?
+             ## ISSUE: Spec is unclear on relative references.
+             ## According to Hixie (#whatwg 2008-03-19), it should be
+             ## resolved against the base URI of the document in HTML
+             ## or xml:base of the element in XHTML.
            } else {
              !!!cp ('t25');
              $self->{application_cache_selection}->(undef);
            }
+           !!!nack ('t25c');
            !!!next-token;
            return; ## Go to the "before head" insertion mode.
          } else {
-Line 2718 
 sub _tree_construction_root_element ($)
+Line 3654 
 sub _tree_construction_root_element ($)
          die "$0: $token->{type}: Unknown token type";
        }
-     my $root_element; !!!create-element ($root_element, 'html');
+     my $root_element;
+     !!!create-element ($root_element, $HTML_NS, 'html',, $token);
      $self->{document}->append_child ($root_element);
-     push @{$self->{open_elements}}, [$root_element, 'html'];
+     push @{$self->{open_elements}}, [$root_element, $el_category->{html}];
      $self->{application_cache_selection}->(undef);
      ## NOTE: Reprocess the token.
+     !!!ack-later;
      return; ## Go to the "before head" insertion mode.
      ## ISSUE: There is an issue in the spec
-Line 2748 
 sub _reset_insertion_mode ($) {
+Line 3686 
 sub _reset_insertion_mode ($) {
        if ($self->{open_elements}->[0]->[0] eq $node->[0]) {
          $last = 1;
          if (defined $self->{inner_html_node}) {
-           if ($self->{inner_html_node}->[1] eq 'td' or
+           !!!cp ('t28');
-               $self->{inner_html_node}->[1] eq 'th') {
+           $node = $self->{inner_html_node};
-             !!!cp ('t27');
+         } else {
-             #
+           die "_reset_insertion_mode: t27";
-           } else {
-             !!!cp ('t28');
-             $node = $self->{inner_html_node};
-           }
          }
        }
-       ## Step 4..13
+       ## Step 4..14
-       my $new_mode = {
+       my $new_mode;
+       if ($node->[1] & FOREIGN_EL) {
+         !!!cp ('t28.1');
+         ## NOTE: Strictly speaking, the line below only applies to MathML and
+         ## SVG elements.  Currently the HTML syntax supports only MathML and
+         ## SVG elements as foreigners.
+         $new_mode = IN_BODY_IM | IN_FOREIGN_CONTENT_IM;
+       } elsif ($node->[1] & TABLE_CELL_EL) {
+         if ($last) {
+           !!!cp ('t28.2');
+           #
+         } else {
+           !!!cp ('t28.3');
+           $new_mode = IN_CELL_IM;
+         }
+       } else {
+         !!!cp ('t28.4');
+         $new_mode = {
                        select => IN_SELECT_IM,
                        ## NOTE: |option| and |optgroup| do not set
                        ## insertion mode to "in select" by themselves.
-                       td => IN_CELL_IM,
-                       th => IN_CELL_IM,
                        tr => IN_ROW_IM,
                        tbody => IN_TABLE_BODY_IM,
                        thead => IN_TABLE_BODY_IM,
-Line 2776 
 sub _reset_insertion_mode ($) {
+Line 3725 
 sub _reset_insertion_mode ($) {
                        head => IN_BODY_IM, # not in head!
                        body => IN_BODY_IM,
                        frameset => IN_FRAMESET_IM,
-                      }->{$node->[1]};
+                      }->{$node->[0]->manakai_local_name};
+       }
        $self->{insertion_mode} = $new_mode and return if defined $new_mode;
-       ## Step 14
+       ## Step 15
-       if ($node->[1] eq 'html') {
+       if ($node->[1] & HTML_EL) {
          unless (defined $self->{head_element}) {
            !!!cp ('t29');
            $self->{insertion_mode} = BEFORE_HEAD_IM;
-Line 2794 
 sub _reset_insertion_mode ($) {
+Line 3744 
 sub _reset_insertion_mode ($) {
          !!!cp ('t31');
        }
-       ## Step 15
+       ## Step 16
        $self->{insertion_mode} = IN_BODY_IM and return if $last;
-       ## Step 16
+       ## Step 17
        $i--;
        $node = $self->{open_elements}->[$i];
-       ## Step 17
+       ## Step 18
        redo S3;
      } # S3
-Line 2913 
 sub _tree_construction_main ($) {
+Line 3863 
 sub _tree_construction_main ($) {
      ## Step 1
      my $start_tag_name = $token->{tag_name};
      my $el;
-     !!!create-element ($el, $start_tag_name, $token->{attributes});
+     !!!create-element ($el, $HTML_NS, $start_tag_name, $token->{attributes}, $token);
      ## Step 2
      $insert->($el);
-Line 2924 
 sub _tree_construction_main ($) {
+Line 3874 
 sub _tree_construction_main ($) {
      ## Step 4
      my $text = '';
+     !!!nack ('t40.1');
      !!!next-token;
      while ($token->{type} == CHARACTER_TOKEN) { # or until stop tokenizing
        !!!cp ('t40');
-Line 2950 
 sub _tree_construction_main ($) {
+Line 3901 
 sub _tree_construction_main ($) {
        ## NOTE: An end-of-file token.
        if ($content_model_flag == CDATA_CONTENT_MODEL) {
          !!!cp ('t43');
-         !!!parse-error (type => 'in CDATA:#'.$token->{type});
+         !!!parse-error (type => 'in CDATA:#eof', token => $token);
        } elsif ($content_model_flag == RCDATA_CONTENT_MODEL) {
          !!!cp ('t44');
-         !!!parse-error (type => 'in RCDATA:#'.$token->{type});
+         !!!parse-error (type => 'in RCDATA:#eof', token => $token);
        } else {
          die "$0: $content_model_flag in parse_rcdata";
        }
-Line 2963 
 sub _tree_construction_main ($) {
+Line 3914 
 sub _tree_construction_main ($) {
    my $script_start_tag = sub () {
      my $script_el;
-     !!!create-element ($script_el, 'script', $token->{attributes});
+     !!!create-element ($script_el, $HTML_NS, 'script', $token->{attributes}, $token);
      ## TODO: mark as "parser-inserted"
      $self->{content_model} = CDATA_CONTENT_MODEL;
      delete $self->{escape}; # MUST
      my $text = '';
+     !!!nack ('t45.1');
      !!!next-token;
      while ($token->{type} == CHARACTER_TOKEN) {
        !!!cp ('t45');
-Line 2989 
 sub _tree_construction_main ($) {
+Line 3941 
 sub _tree_construction_main ($) {
        ## Ignore the token
      } else {
        !!!cp ('t48');
-       !!!parse-error (type => 'in CDATA:#'.$token->{type});
+       !!!parse-error (type => 'in CDATA:#eof', token => $token);
        ## ISSUE: And ignore?
        ## TODO: mark as "already executed"
      }
-Line 3017 
 sub _tree_construction_main ($) {
+Line 3969 
 sub _tree_construction_main ($) {
    my $open_tables = [[$self->{open_elements}->[0]->[0]]];
    my $formatting_end_tag = sub {
-     my $tag_name = shift;
+     my $end_tag_token = shift;
+     my $tag_name = $end_tag_token->{tag_name};
      ## NOTE: The adoption agency algorithm (AAA).
-Line 3026 
 sub _tree_construction_main ($) {
+Line 3979 
 sub _tree_construction_main ($) {
        my $formatting_element;
        my $formatting_element_i_in_active;
        AFE: for (reverse 0..$#$active_formatting_elements) {
-         if ($active_formatting_elements->[$_]->[1] eq $tag_name) {
+         if ($active_formatting_elements->[$_]->[0] eq '#marker') {
+           !!!cp ('t52');
+           last AFE;
+         } elsif ($active_formatting_elements->[$_]->[0]->manakai_local_name
+                      eq $tag_name) {
            !!!cp ('t51');
            $formatting_element = $active_formatting_elements->[$_];
            $formatting_element_i_in_active = $_;
            last AFE;
-         } elsif ($active_formatting_elements->[$_]->[0] eq '#marker') {
-           !!!cp ('t52');
-           last AFE;
          }
        } # AFE
        unless (defined $formatting_element) {
          !!!cp ('t53');
-         !!!parse-error (type => 'unmatched end tag:'.$tag_name);
+         !!!parse-error (type => 'unmatched end tag', text => $tag_name, token => $end_tag_token);
          ## Ignore the token
          !!!next-token;
          return;
-Line 3055 
 sub _tree_construction_main ($) {
+Line 4009 
 sub _tree_construction_main ($) {
              last INSCOPE;
            } else { # in open elements but not in scope
              !!!cp ('t55');
-             !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+             !!!parse-error (type => 'unmatched end tag',
+                             text => $token->{tag_name},
+                             token => $end_tag_token);
              ## Ignore the token
              !!!next-token;
              return;
            }
-         } elsif ({
+         } elsif ($node->[1] & SCOPING_EL) {
-                   applet => 1, table => 1, caption => 1, td => 1, th => 1,
-                   button => 1, marquee => 1, object => 1, html => 1,
-                  }->{$node->[1]}) {
            !!!cp ('t56');
            $in_scope = 0;
          }
        } # INSCOPE
        unless (defined $formatting_element_i_in_open) {
          !!!cp ('t57');
-         !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+         !!!parse-error (type => 'unmatched end tag',
+                         text => $token->{tag_name},
+                         token => $end_tag_token);
          pop @$active_formatting_elements; # $formatting_element
          !!!next-token; ## TODO: ok?
          return;
        }
        if (not $self->{open_elements}->[-1]->[0] eq $formatting_element->[0]) {
          !!!cp ('t58');
-         !!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]);
+         !!!parse-error (type => 'not closed',
+                         text => $self->{open_elements}->[-1]->[0]
+                             ->manakai_local_name,
+                         token => $end_tag_token);
        }
        ## Step 2
-Line 3085 
 sub _tree_construction_main ($) {
+Line 4043 
 sub _tree_construction_main ($) {
        my $furthest_block_i_in_open;
        OE: for (reverse 0..$#{$self->{open_elements}}) {
          my $node = $self->{open_elements}->[$_];
-         if (not $formatting_category->{$node->[1]} and
+         if (not ($node->[1] & FORMATTING_EL) and
              #not $phrasing_category->{$node->[1]} and
-             ($special_category->{$node->[1]} or
+             ($node->[1] & SPECIAL_EL or
-              $scoping_category->{$node->[1]})) { ## Scoping is redundant, maybe
+              $node->[1] & SCOPING_EL)) { ## Scoping is redundant, maybe
            !!!cp ('t59');
            $furthest_block = $node;
            $furthest_block_i_in_open = $_;
-Line 3174 
 sub _tree_construction_main ($) {
+Line 4132 
 sub _tree_construction_main ($) {
        } # S7
        ## Step 8
-       if ({
+       if ($common_ancestor_node->[1] & TABLE_ROWS_EL) {
-            table => 1, tbody => 1, tfoot => 1, thead => 1, tr => 1,
-           }->{$common_ancestor_node->[1]}) {
          my $foster_parent_element;
          my $next_sibling;
-                          OE: for (reverse 0..$#{$self->{open_elements}}) {
+         OE: for (reverse 0..$#{$self->{open_elements}}) {
-                            if ($self->{open_elements}->[$_]->[1] eq 'table') {
+           if ($self->{open_elements}->[$_]->[1] & TABLE_EL) {
                               my $parent = $self->{open_elements}->[$_]->[0]->parent_node;
                               if (defined $parent and $parent->node_type == 1) {
                                 !!!cp ('t65.1');
-Line 3253 
 sub _tree_construction_main ($) {
+Line 4209 
 sub _tree_construction_main ($) {
    my $insert_to_foster = sub {
      my $child = shift;
-     if ({
+     if ($self->{open_elements}->[-1]->[1] & TABLE_ROWS_EL) {
-          table => 1, tbody => 1, tfoot => 1, thead => 1, tr => 1,
-         }->{$self->{open_elements}->[-1]->[1]}) {
        # MUST
        my $foster_parent_element;
        my $next_sibling;
-                          OE: for (reverse 0..$#{$self->{open_elements}}) {
+       OE: for (reverse 0..$#{$self->{open_elements}}) {
-                            if ($self->{open_elements}->[$_]->[1] eq 'table') {
+         if ($self->{open_elements}->[$_]->[1] & TABLE_EL) {
                               my $parent = $self->{open_elements}->[$_]->[0]->parent_node;
                               if (defined $parent and $parent->node_type == 1) {
                                 !!!cp ('t70');
-Line 3285 
 sub _tree_construction_main ($) {
+Line 4239 
 sub _tree_construction_main ($) {
      }
    }; # $insert_to_foster
-   B: {
+   B: while (1) {
      if ($token->{type} == DOCTYPE_TOKEN) {
        !!!cp ('t73');
-       !!!parse-error (type => 'DOCTYPE in the middle');
+       !!!parse-error (type => 'in html:#DOCTYPE', token => $token);
        ## Ignore the token
        ## Stay in the phase
        !!!next-token;
-       redo B;
+       next B;
      } elsif ($token->{type} == START_TAG_TOKEN and
               $token->{tag_name} eq 'html') {
        if ($self->{insertion_mode} == AFTER_HTML_BODY_IM) {
          !!!cp ('t79');
-         !!!parse-error (type => 'after html:html');
+         !!!parse-error (type => 'after html', text => 'html', token => $token);
          $self->{insertion_mode} = AFTER_BODY_IM;
        } elsif ($self->{insertion_mode} == AFTER_HTML_FRAMESET_IM) {
          !!!cp ('t80');
-         !!!parse-error (type => 'after html:html');
+         !!!parse-error (type => 'after html', text => 'html', token => $token);
          $self->{insertion_mode} = AFTER_FRAMESET_IM;
        } else {
          !!!cp ('t81');
        }
        !!!cp ('t82');
-       !!!parse-error (type => 'not first start tag');
+       !!!parse-error (type => 'not first start tag', token => $token);
        my $top_el = $self->{open_elements}->[0]->[0];
        for my $attr_name (keys %{$token->{attributes}}) {
          unless ($top_el->has_attribute_ns (undef, $attr_name)) {
-Line 3318 
 sub _tree_construction_main ($) {
+Line 4272 
 sub _tree_construction_main ($) {
               $token->{attributes}->{$attr_name}->{value});
          }
        }
+       !!!nack ('t84.1');
        !!!next-token;
-       redo B;
+       next B;
      } elsif ($token->{type} == COMMENT_TOKEN) {
        my $comment = $self->{document}->create_comment ($token->{data});
        if ($self->{insertion_mode} & AFTER_HTML_IMS) {
-Line 3333 
 sub _tree_construction_main ($) {
+Line 4288 
 sub _tree_construction_main ($) {
          $self->{open_elements}->[-1]->[0]->append_child ($comment);
        }
        !!!next-token;
-       redo B;
+       next B;
-     } elsif ($self->{insertion_mode} & HEAD_IMS) {
+     } elsif ($self->{insertion_mode} & IN_FOREIGN_CONTENT_IM) {
+       if ($token->{type} == CHARACTER_TOKEN) {
+         !!!cp ('t87.1');
+         $self->{open_elements}->[-1]->[0]->manakai_append_text ($token->{data});
+         !!!next-token;
+         next B;
+       } elsif ($token->{type} == START_TAG_TOKEN) {
+         if ((not {mglyph => 1, malignmark => 1}->{$token->{tag_name}} and
+              $self->{open_elements}->[-1]->[1] & FOREIGN_FLOW_CONTENT_EL) or
+             not ($self->{open_elements}->[-1]->[1] & FOREIGN_EL) or
+             ($token->{tag_name} eq 'svg' and
+              $self->{open_elements}->[-1]->[1] & MML_AXML_EL)) {
+           ## NOTE: "using the rules for secondary insertion mode" then "continue"
+           !!!cp ('t87.2');
+           #
+         } elsif ({
+                   b => 1, big => 1, blockquote => 1, body => 1, br => 1,
+                   center => 1, code => 1, dd => 1, div => 1, dl => 1, dt => 1,
+                   em => 1, embed => 1, font => 1, h1 => 1, h2 => 1, h3 => 1,
+                   h4 => 1, h5 => 1, h6 => 1, head => 1, hr => 1, i => 1,
+                   img => 1, li => 1, listing => 1, menu => 1, meta => 1,
+                   nobr => 1, ol => 1, p => 1, pre => 1, ruby => 1, s => 1,
+                   small => 1, span => 1, strong => 1, strike => 1, sub => 1,
+                   sup => 1, table => 1, tt => 1, u => 1, ul => 1, var => 1,
+                  }->{$token->{tag_name}}) {
+           !!!cp ('t87.2');
+           !!!parse-error (type => 'not closed',
+                           text => $self->{open_elements}->[-1]->[0]
+                               ->manakai_local_name,
+                           token => $token);
+           pop @{$self->{open_elements}}
+               while $self->{open_elements}->[-1]->[1] & FOREIGN_EL;
+           $self->{insertion_mode} &= ~ IN_FOREIGN_CONTENT_IM;
+           ## Reprocess.
+           next B;
+         } else {
+           my $nsuri = $self->{open_elements}->[-1]->[0]->namespace_uri;
+           my $tag_name = $token->{tag_name};
+           if ($nsuri eq $SVG_NS) {
+             $tag_name = {
+                altglyph => 'altGlyph',
+                altglyphdef => 'altGlyphDef',
+                altglyphitem => 'altGlyphItem',
+                animatecolor => 'animateColor',
+                animatemotion => 'animateMotion',
+                animatetransform => 'animateTransform',
+                clippath => 'clipPath',
+                feblend => 'feBlend',
+                fecolormatrix => 'feColorMatrix',
+                fecomponenttransfer => 'feComponentTransfer',
+                fecomposite => 'feComposite',
+                feconvolvematrix => 'feConvolveMatrix',
+                fediffuselighting => 'feDiffuseLighting',
+                fedisplacementmap => 'feDisplacementMap',
+                fedistantlight => 'feDistantLight',
+                feflood => 'feFlood',
+                fefunca => 'feFuncA',
+                fefuncb => 'feFuncB',
+                fefuncg => 'feFuncG',
+                fefuncr => 'feFuncR',
+                fegaussianblur => 'feGaussianBlur',
+                feimage => 'feImage',
+                femerge => 'feMerge',
+                femergenode => 'feMergeNode',
+                femorphology => 'feMorphology',
+                feoffset => 'feOffset',
+                fepointlight => 'fePointLight',
+                fespecularlighting => 'feSpecularLighting',
+                fespotlight => 'feSpotLight',
+                fetile => 'feTile',
+                feturbulence => 'feTurbulence',
+                foreignobject => 'foreignObject',
+                glyphref => 'glyphRef',
+                lineargradient => 'linearGradient',
+                radialgradient => 'radialGradient',
+                #solidcolor => 'solidColor', ## NOTE: Commented in spec (SVG1.2)
+                textpath => 'textPath',
+             }->{$tag_name} || $tag_name;
+           }
+           ## "adjust SVG attributes" (SVG only) - done in insert-element-f
+           ## "adjust foreign attributes" - done in insert-element-f
+           !!!insert-element-f ($nsuri, $tag_name, $token->{attributes}, $token);
+           if ($self->{self_closing}) {
+             pop @{$self->{open_elements}};
+             !!!ack ('t87.3');
+           } else {
+             !!!cp ('t87.4');
+           }
+           !!!next-token;
+           next B;
+         }
+       } elsif ($token->{type} == END_TAG_TOKEN) {
+         ## NOTE: "using the rules for secondary insertion mode" then "continue"
+         !!!cp ('t87.5');
+         #
+       } elsif ($token->{type} == END_OF_FILE_TOKEN) {
+         !!!cp ('t87.6');
+         !!!parse-error (type => 'not closed',
+                         text => $self->{open_elements}->[-1]->[0]
+                             ->manakai_local_name,
+                         token => $token);
+         pop @{$self->{open_elements}}
+             while $self->{open_elements}->[-1]->[1] & FOREIGN_EL;
+         $self->{insertion_mode} &= ~ IN_FOREIGN_CONTENT_IM;
+         ## Reprocess.
+         next B;
+       } else {
+         die "$0: $token->{type}: Unknown token type";
+       }
+     }
+     if ($self->{insertion_mode} & HEAD_IMS) {
        if ($token->{type} == CHARACTER_TOKEN) {
          if ($token->{data} =~ s/^([\x09\x0A\x0B\x0C\x20]+)//) {
            unless ($self->{insertion_mode} == BEFORE_HEAD_IM) {
-Line 3344 
 sub _tree_construction_main ($) {
+Line 4419 
 sub _tree_construction_main ($) {
              !!!cp ('t88.1');
              ## Ignore the token.
              !!!next-token;
-             redo B;
+             next B;
            }
            unless (length $token->{data}) {
              !!!cp ('t88');
              !!!next-token;
-             redo B;
+             next B;
            }
          }
          if ($self->{insertion_mode} == BEFORE_HEAD_IM) {
            !!!cp ('t89');
            ## As if <head>
-           !!!create-element ($self->{head_element}, 'head');
+           !!!create-element ($self->{head_element}, $HTML_NS, 'head',, $token);
            $self->{open_elements}->[-1]->[0]->append_child ($self->{head_element});
-           push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
+           push @{$self->{open_elements}},
+               [$self->{head_element}, $el_category->{head}];
            ## Reprocess in the "in head" insertion mode...
            pop @{$self->{open_elements}};
-Line 3368 
 sub _tree_construction_main ($) {
+Line 4444 
 sub _tree_construction_main ($) {
            !!!cp ('t90');
            ## As if </noscript>
            pop @{$self->{open_elements}};
-           !!!parse-error (type => 'in noscript:#character');
+           !!!parse-error (type => 'in noscript:#text', token => $token);
            ## Reprocess in the "in head" insertion mode...
            ## As if </head>
-Line 3384 
 sub _tree_construction_main ($) {
+Line 4460 
 sub _tree_construction_main ($) {
            !!!cp ('t92');
          }
-             ## "after head" insertion mode
+         ## "after head" insertion mode
-             ## As if <body>
+         ## As if <body>
-             !!!insert-element ('body');
+         !!!insert-element ('body',, $token);
-             $self->{insertion_mode} = IN_BODY_IM;
+         $self->{insertion_mode} = IN_BODY_IM;
-             ## reprocess
+         ## reprocess
-             redo B;
+         next B;
-           } elsif ($token->{type} == START_TAG_TOKEN) {
+       } elsif ($token->{type} == START_TAG_TOKEN) {
-             if ($token->{tag_name} eq 'head') {
+         if ($token->{tag_name} eq 'head') {
-               if ($self->{insertion_mode} == BEFORE_HEAD_IM) {
+           if ($self->{insertion_mode} == BEFORE_HEAD_IM) {
-                 !!!cp ('t93');
+             !!!cp ('t93');
-                 !!!create-element ($self->{head_element}, $token->{tag_name}, $token->{attributes});
+             !!!create-element ($self->{head_element}, $HTML_NS, $token->{tag_name}, $token->{attributes}, $token);
-                 $self->{open_elements}->[-1]->[0]->append_child ($self->{head_element});
+             $self->{open_elements}->[-1]->[0]->append_child
-                 push @{$self->{open_elements}}, [$self->{head_element}, $token->{tag_name}];
+                 ($self->{head_element});
-                 $self->{insertion_mode} = IN_HEAD_IM;
+             push @{$self->{open_elements}},
-                 !!!next-token;
+                 [$self->{head_element}, $el_category->{head}];
-                 redo B;
+             $self->{insertion_mode} = IN_HEAD_IM;
-               } elsif ($self->{insertion_mode} == AFTER_HEAD_IM) {
+             !!!nack ('t93.1');
-                 !!!cp ('t94');
+             !!!next-token;
-                 #
+             next B;
-               } else {
+           } elsif ($self->{insertion_mode} == AFTER_HEAD_IM) {
-                 !!!cp ('t95');
+             !!!cp ('t93.2');
-                 !!!parse-error (type => 'in head:head'); # or in head noscript
+             !!!parse-error (type => 'after head', text => 'head',
-                 ## Ignore the token
+                             token => $token);
-                 !!!next-token;
+             ## Ignore the token
-                 redo B;
+             !!!nack ('t93.3');
-               }
+             !!!next-token;
-             } elsif ($self->{insertion_mode} == BEFORE_HEAD_IM) {
+             next B;
-               !!!cp ('t96');
+           } else {
-               ## As if <head>
+             !!!cp ('t95');
-               !!!create-element ($self->{head_element}, 'head');
+             !!!parse-error (type => 'in head:head',
-               $self->{open_elements}->[-1]->[0]->append_child ($self->{head_element});
+                             token => $token); # or in head noscript
-               push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
+             ## Ignore the token
+             !!!nack ('t95.1');
+             !!!next-token;
+             next B;
+           }
+         } elsif ($self->{insertion_mode} == BEFORE_HEAD_IM) {
+           !!!cp ('t96');
+           ## As if <head>
+           !!!create-element ($self->{head_element}, $HTML_NS, 'head',, $token);
+           $self->{open_elements}->[-1]->[0]->append_child ($self->{head_element});
+           push @{$self->{open_elements}},
+               [$self->{head_element}, $el_category->{head}];
-               $self->{insertion_mode} = IN_HEAD_IM;
+           $self->{insertion_mode} = IN_HEAD_IM;
-               ## Reprocess in the "in head" insertion mode...
+           ## Reprocess in the "in head" insertion mode...
-             } else {
+         } else {
-               !!!cp ('t97');
+           !!!cp ('t97');
-             }
+         }
              if ($token->{tag_name} eq 'base') {
                if ($self->{insertion_mode} == IN_HEAD_NOSCRIPT_IM) {
                  !!!cp ('t98');
                  ## As if </noscript>
                  pop @{$self->{open_elements}};
-                 !!!parse-error (type => 'in noscript:base');
+                 !!!parse-error (type => 'in noscript', text => 'base',
+                                 token => $token);
                  $self->{insertion_mode} = IN_HEAD_IM;
                  ## Reprocess in the "in head" insertion mode...
-Line 3439 
 sub _tree_construction_main ($) {
+Line 4527 
 sub _tree_construction_main ($) {
                ## NOTE: There is a "as if in head" code clone.
                if ($self->{insertion_mode} == AFTER_HEAD_IM) {
                  !!!cp ('t100');
-                 !!!parse-error (type => 'after head:'.$token->{tag_name});
+                 !!!parse-error (type => 'after head',
-                 push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
+                                 text => $token->{tag_name}, token => $token);
+                 push @{$self->{open_elements}},
+                     [$self->{head_element}, $el_category->{head}];
                } else {
                  !!!cp ('t101');
                }
-               !!!insert-element ($token->{tag_name}, $token->{attributes});
+               !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
                pop @{$self->{open_elements}}; ## ISSUE: This step is missing in the spec.
                pop @{$self->{open_elements}} # <head>
                    if $self->{insertion_mode} == AFTER_HEAD_IM;
+               !!!nack ('t101.1');
                !!!next-token;
-               redo B;
+               next B;
              } elsif ($token->{tag_name} eq 'link') {
                ## NOTE: There is a "as if in head" code clone.
                if ($self->{insertion_mode} == AFTER_HEAD_IM) {
                  !!!cp ('t102');
-                 !!!parse-error (type => 'after head:'.$token->{tag_name});
+                 !!!parse-error (type => 'after head',
-                 push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
+                                 text => $token->{tag_name}, token => $token);
+                 push @{$self->{open_elements}},
+                     [$self->{head_element}, $el_category->{head}];
                } else {
                  !!!cp ('t103');
                }
-               !!!insert-element ($token->{tag_name}, $token->{attributes});
+               !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
                pop @{$self->{open_elements}}; ## ISSUE: This step is missing in the spec.
                pop @{$self->{open_elements}} # <head>
                    if $self->{insertion_mode} == AFTER_HEAD_IM;
+               !!!ack ('t103.1');
                !!!next-token;
-               redo B;
+               next B;
              } elsif ($token->{tag_name} eq 'meta') {
                ## NOTE: There is a "as if in head" code clone.
                if ($self->{insertion_mode} == AFTER_HEAD_IM) {
                  !!!cp ('t104');
-                 !!!parse-error (type => 'after head:'.$token->{tag_name});
+                 !!!parse-error (type => 'after head',
-                 push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
+                                 text => $token->{tag_name}, token => $token);
+                 push @{$self->{open_elements}},
+                     [$self->{head_element}, $el_category->{head}];
                } else {
                  !!!cp ('t105');
                }
-               !!!insert-element ($token->{tag_name}, $token->{attributes});
+               !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
                my $meta_el = pop @{$self->{open_elements}}; ## ISSUE: This step is missing in the spec.
                unless ($self->{confident}) {
-                 if ($token->{attributes}->{charset}) { ## TODO: And if supported
+                 if ($token->{attributes}->{charset}) {
                    !!!cp ('t106');
+                   ## NOTE: Whether the encoding is supported or not is handled
+                   ## in the {change_encoding} callback.
                    $self->{change_encoding}
-                       ->($self, $token->{attributes}->{charset}->{value});
+                       ->($self, $token->{attributes}->{charset}->{value},
+                          $token);
                    $meta_el->[0]->get_attribute_node_ns (undef, 'charset')
                        ->set_user_data (manakai_has_reference =>
                                             $token->{attributes}->{charset}
                                                 ->{has_reference});
                  } elsif ($token->{attributes}->{content}) {
-                   ## ISSUE: Algorithm name in the spec was incorrect so that not linked to the definition.
                    if ($token->{attributes}->{content}->{value}
-                       =~ /\A[^;]*;[\x09-\x0D\x20]*[Cc][Hh][Aa][Rr][Ss][Ee][Tt]
+                       =~ /[Cc][Hh][Aa][Rr][Ss][Ee][Tt]
                            [\x09-\x0D\x20]*=
                            [\x09-\x0D\x20]*(?>"([^"]*)"|'([^']*)'|
-                           ([^"'\x09-\x0D\x20][^\x09-\x0D\x20]*))/x) {
+                           ([^"'\x09-\x0D\x20][^\x09-\x0D\x20\x3B]*))/x) {
                      !!!cp ('t107');
+                     ## NOTE: Whether the encoding is supported or not is handled
+                     ## in the {change_encoding} callback.
                      $self->{change_encoding}
-                         ->($self, defined $1 ? $1 : defined $2 ? $2 : $3);
+                         ->($self, defined $1 ? $1 : defined $2 ? $2 : $3,
+                            $token);
                      $meta_el->[0]->get_attribute_node_ns (undef, 'content')
                          ->set_user_data (manakai_has_reference =>
                                               $token->{attributes}->{content}
-Line 3524 
 sub _tree_construction_main ($) {
+Line 4625 
 sub _tree_construction_main ($) {
                pop @{$self->{open_elements}} # <head>
                    if $self->{insertion_mode} == AFTER_HEAD_IM;
+               !!!ack ('t110.1');
                !!!next-token;
-               redo B;
+               next B;
              } elsif ($token->{tag_name} eq 'title') {
                if ($self->{insertion_mode} == IN_HEAD_NOSCRIPT_IM) {
                  !!!cp ('t111');
                  ## As if </noscript>
                  pop @{$self->{open_elements}};
-                 !!!parse-error (type => 'in noscript:title');
+                 !!!parse-error (type => 'in noscript', text => 'title',
+                                 token => $token);
                  $self->{insertion_mode} = IN_HEAD_IM;
                  ## Reprocess in the "in head" insertion mode...
                } elsif ($self->{insertion_mode} == AFTER_HEAD_IM) {
                  !!!cp ('t112');
-                 !!!parse-error (type => 'after head:'.$token->{tag_name});
+                 !!!parse-error (type => 'after head',
-                 push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
+                                 text => $token->{tag_name}, token => $token);
+                 push @{$self->{open_elements}},
+                     [$self->{head_element}, $el_category->{head}];
                } else {
                  !!!cp ('t113');
                }
-Line 3549 
 sub _tree_construction_main ($) {
+Line 4654 
 sub _tree_construction_main ($) {
                $parse_rcdata->(RCDATA_CONTENT_MODEL);
                pop @{$self->{open_elements}} # <head>
                    if $self->{insertion_mode} == AFTER_HEAD_IM;
-               redo B;
+               next B;
-             } elsif ($token->{tag_name} eq 'style') {
+             } elsif ($token->{tag_name} eq 'style' or
+                      $token->{tag_name} eq 'noframes') {
                ## NOTE: Or (scripting is enabled and tag_name eq 'noscript' and
                ## insertion mode IN_HEAD_IM)
                ## NOTE: There is a "as if in head" code clone.
                if ($self->{insertion_mode} == AFTER_HEAD_IM) {
                  !!!cp ('t114');
-                 !!!parse-error (type => 'after head:'.$token->{tag_name});
+                 !!!parse-error (type => 'after head',
-                 push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
+                                 text => $token->{tag_name}, token => $token);
+                 push @{$self->{open_elements}},
+                     [$self->{head_element}, $el_category->{head}];
                } else {
                  !!!cp ('t115');
                }
                $parse_rcdata->(CDATA_CONTENT_MODEL);
                pop @{$self->{open_elements}} # <head>
                    if $self->{insertion_mode} == AFTER_HEAD_IM;
-               redo B;
+               next B;
              } elsif ($token->{tag_name} eq 'noscript') {
                if ($self->{insertion_mode} == IN_HEAD_IM) {
                  !!!cp ('t116');
                  ## NOTE: and scripting is disabled
-                 !!!insert-element ($token->{tag_name}, $token->{attributes});
+                 !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
                  $self->{insertion_mode} = IN_HEAD_NOSCRIPT_IM;
+                 !!!nack ('t116.1');
                  !!!next-token;
-                 redo B;
+                 next B;
                } elsif ($self->{insertion_mode} == IN_HEAD_NOSCRIPT_IM) {
                  !!!cp ('t117');
-                 !!!parse-error (type => 'in noscript:noscript');
+                 !!!parse-error (type => 'in noscript', text => 'noscript',
+                                 token => $token);
                  ## Ignore the token
+                 !!!nack ('t117.1');
                  !!!next-token;
-                 redo B;
+                 next B;
                } else {
                  !!!cp ('t118');
                  #
-Line 3588 
 sub _tree_construction_main ($) {
+Line 4699 
 sub _tree_construction_main ($) {
                  !!!cp ('t119');
                  ## As if </noscript>
                  pop @{$self->{open_elements}};
-                 !!!parse-error (type => 'in noscript:script');
+                 !!!parse-error (type => 'in noscript', text => 'script',
+                                 token => $token);
                  $self->{insertion_mode} = IN_HEAD_IM;
                  ## Reprocess in the "in head" insertion mode...
                } elsif ($self->{insertion_mode} == AFTER_HEAD_IM) {
                  !!!cp ('t120');
-                 !!!parse-error (type => 'after head:'.$token->{tag_name});
+                 !!!parse-error (type => 'after head',
-                 push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
+                                 text => $token->{tag_name}, token => $token);
+                 push @{$self->{open_elements}},
+                     [$self->{head_element}, $el_category->{head}];
                } else {
                  !!!cp ('t121');
                }
-Line 3604 
 sub _tree_construction_main ($) {
+Line 4718 
 sub _tree_construction_main ($) {
                $script_start_tag->();
                pop @{$self->{open_elements}} # <head>
                    if $self->{insertion_mode} == AFTER_HEAD_IM;
-               redo B;
+               next B;
              } elsif ($token->{tag_name} eq 'body' or
                       $token->{tag_name} eq 'frameset') {
                if ($self->{insertion_mode} == IN_HEAD_NOSCRIPT_IM) {
                  !!!cp ('t122');
                  ## As if </noscript>
                  pop @{$self->{open_elements}};
-                 !!!parse-error (type => 'in noscript:'.$token->{tag_name});
+                 !!!parse-error (type => 'in noscript',
+                                 text => $token->{tag_name}, token => $token);
                  ## Reprocess in the "in head" insertion mode...
                  ## As if </head>
-Line 3628 
 sub _tree_construction_main ($) {
+Line 4743 
 sub _tree_construction_main ($) {
                }
                ## "after head" insertion mode
-               !!!insert-element ($token->{tag_name}, $token->{attributes});
+               !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
                if ($token->{tag_name} eq 'body') {
                  !!!cp ('t126');
                  $self->{insertion_mode} = IN_BODY_IM;
-Line 3638 
 sub _tree_construction_main ($) {
+Line 4753 
 sub _tree_construction_main ($) {
                } else {
                  die "$0: tag name: $self->{tag_name}";
                }
+               !!!nack ('t127.1');
                !!!next-token;
-               redo B;
+               next B;
              } else {
                !!!cp ('t128');
                #
-Line 3649 
 sub _tree_construction_main ($) {
+Line 4765 
 sub _tree_construction_main ($) {
                !!!cp ('t129');
                ## As if </noscript>
                pop @{$self->{open_elements}};
-               !!!parse-error (type => 'in noscript:/'.$token->{tag_name});
+               !!!parse-error (type => 'in noscript:/',
+                               text => $token->{tag_name}, token => $token);
                ## Reprocess in the "in head" insertion mode...
                ## As if </head>
-Line 3668 
 sub _tree_construction_main ($) {
+Line 4785 
 sub _tree_construction_main ($) {
              ## "after head" insertion mode
              ## As if <body>
-             !!!insert-element ('body');
+             !!!insert-element ('body',, $token);
              $self->{insertion_mode} = IN_BODY_IM;
              ## reprocess
-             redo B;
+             !!!ack-later;
+             next B;
            } elsif ($token->{type} == END_TAG_TOKEN) {
              if ($token->{tag_name} eq 'head') {
                if ($self->{insertion_mode} == BEFORE_HEAD_IM) {
                  !!!cp ('t132');
                  ## As if <head>
-                 !!!create-element ($self->{head_element}, 'head');
+                 !!!create-element ($self->{head_element}, $HTML_NS, 'head',, $token);
                  $self->{open_elements}->[-1]->[0]->append_child ($self->{head_element});
-                 push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
+                 push @{$self->{open_elements}},
+                     [$self->{head_element}, $el_category->{head}];
                  ## Reprocess in the "in head" insertion mode...
                  pop @{$self->{open_elements}};
                  $self->{insertion_mode} = AFTER_HEAD_IM;
                  !!!next-token;
-                 redo B;
+                 next B;
                } elsif ($self->{insertion_mode} == IN_HEAD_NOSCRIPT_IM) {
                  !!!cp ('t133');
                  ## As if </noscript>
                  pop @{$self->{open_elements}};
-                 !!!parse-error (type => 'in noscript:/head');
+                 !!!parse-error (type => 'in noscript:/',
+                                 text => 'head', token => $token);
                  ## Reprocess in the "in head" insertion mode...
                  pop @{$self->{open_elements}};
                  $self->{insertion_mode} = AFTER_HEAD_IM;
                  !!!next-token;
-                 redo B;
+                 next B;
                } elsif ($self->{insertion_mode} == IN_HEAD_IM) {
                  !!!cp ('t134');
                  pop @{$self->{open_elements}};
                  $self->{insertion_mode} = AFTER_HEAD_IM;
                  !!!next-token;
-                 redo B;
+                 next B;
+               } elsif ($self->{insertion_mode} == AFTER_HEAD_IM) {
+                 !!!cp ('t134.1');
+                 !!!parse-error (type => 'unmatched end tag', text => 'head',
+                                 token => $token);
+                 ## Ignore the token
+                 !!!next-token;
+                 next B;
                } else {
-                 !!!cp ('t135');
+                 die "$0: $self->{insertion_mode}: Unknown insertion mode";
-                 #
                }
              } elsif ($token->{tag_name} eq 'noscript') {
                if ($self->{insertion_mode} == IN_HEAD_NOSCRIPT_IM) {
-Line 3713 
 sub _tree_construction_main ($) {
+Line 4839 
 sub _tree_construction_main ($) {
                  pop @{$self->{open_elements}};
                  $self->{insertion_mode} = IN_HEAD_IM;
                  !!!next-token;
-                 redo B;
+                 next B;
-               } elsif ($self->{insertion_mode} == BEFORE_HEAD_IM) {
+               } elsif ($self->{insertion_mode} == BEFORE_HEAD_IM or
+                        $self->{insertion_mode} == AFTER_HEAD_IM) {
                  !!!cp ('t137');
-                 !!!parse-error (type => 'unmatched end tag:noscript');
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => 'noscript', token => $token);
                  ## Ignore the token ## ISSUE: An issue in the spec.
                  !!!next-token;
-                 redo B;
+                 next B;
                } else {
                  !!!cp ('t138');
                  #
-Line 3727 
 sub _tree_construction_main ($) {
+Line 4855 
 sub _tree_construction_main ($) {
              } elsif ({
                        body => 1, html => 1,
                       }->{$token->{tag_name}}) {
-               if ($self->{insertion_mode} == BEFORE_HEAD_IM) {
+               if ($self->{insertion_mode} == BEFORE_HEAD_IM or
-                 !!!cp ('t139');
+                   $self->{insertion_mode} == IN_HEAD_IM or
-                 ## As if <head>
+                   $self->{insertion_mode} == IN_HEAD_NOSCRIPT_IM) {
-                 !!!create-element ($self->{head_element}, 'head');
-                 $self->{open_elements}->[-1]->[0]->append_child ($self->{head_element});
-                 push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
-                 $self->{insertion_mode} = IN_HEAD_IM;
-                 ## Reprocess in the "in head" insertion mode...
-               } elsif ($self->{insertion_mode} == IN_HEAD_NOSCRIPT_IM) {
                  !!!cp ('t140');
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => $token->{tag_name}, token => $token);
                  ## Ignore the token
                  !!!next-token;
-                 redo B;
+                 next B;
+               } elsif ($self->{insertion_mode} == AFTER_HEAD_IM) {
+                 !!!cp ('t140.1');
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => $token->{tag_name}, token => $token);
+                 ## Ignore the token
+                 !!!next-token;
+                 next B;
                } else {
-                 !!!cp ('t141');
+                 die "$0: $self->{insertion_mode}: Unknown insertion mode";
                }
+             } elsif ($token->{tag_name} eq 'p') {
-               #
+               !!!cp ('t142');
-             } elsif ({
+               !!!parse-error (type => 'unmatched end tag',
-                       p => 1, br => 1,
+                               text => $token->{tag_name}, token => $token);
-                      }->{$token->{tag_name}}) {
+               ## Ignore the token
+               !!!next-token;
+               next B;
+             } elsif ($token->{tag_name} eq 'br') {
                if ($self->{insertion_mode} == BEFORE_HEAD_IM) {
-                 !!!cp ('t142');
+                 !!!cp ('t142.2');
-                 ## As if <head>
+                 ## (before head) as if <head>, (in head) as if </head>
-                 !!!create-element ($self->{head_element}, 'head');
+                 !!!create-element ($self->{head_element}, $HTML_NS, 'head',, $token);
                  $self->{open_elements}->[-1]->[0]->append_child ($self->{head_element});
-                 push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
+                 $self->{insertion_mode} = AFTER_HEAD_IM;
+                 ## Reprocess in the "after head" insertion mode...
+               } elsif ($self->{insertion_mode} == IN_HEAD_IM) {
+                 !!!cp ('t143.2');
+                 ## As if </head>
+                 pop @{$self->{open_elements}};
+                 $self->{insertion_mode} = AFTER_HEAD_IM;
+                 ## Reprocess in the "after head" insertion mode...
+               } elsif ($self->{insertion_mode} == IN_HEAD_NOSCRIPT_IM) {
+                 !!!cp ('t143.3');
+                 ## ISSUE: Two parse errors for <head><noscript></br>
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => 'br', token => $token);
+                 ## As if </noscript>
+                 pop @{$self->{open_elements}};
                  $self->{insertion_mode} = IN_HEAD_IM;
                  ## Reprocess in the "in head" insertion mode...
-               } else {
+                 ## As if </head>
-                 !!!cp ('t143');
+                 pop @{$self->{open_elements}};
-               }
+                 $self->{insertion_mode} = AFTER_HEAD_IM;
-               #
+                 ## Reprocess in the "after head" insertion mode...
-             } else {
+               } elsif ($self->{insertion_mode} == AFTER_HEAD_IM) {
-               if ($self->{insertion_mode} == AFTER_HEAD_IM) {
+                 !!!cp ('t143.4');
-                 !!!cp ('t144');
                  #
                } else {
-                 !!!cp ('t145');
+                 die "$0: $self->{insertion_mode}: Unknown insertion mode";
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
-                 ## Ignore the token
-                 !!!next-token;
-                 redo B;
                }
+               ## ISSUE: does not agree with IE7 - it doesn't ignore </br>.
+               !!!parse-error (type => 'unmatched end tag',
+                               text => 'br', token => $token);
+               ## Ignore the token
+               !!!next-token;
+               next B;
+             } else {
+               !!!cp ('t145');
+               !!!parse-error (type => 'unmatched end tag',
+                               text => $token->{tag_name}, token => $token);
+               ## Ignore the token
+               !!!next-token;
+               next B;
              }
              if ($self->{insertion_mode} == IN_HEAD_NOSCRIPT_IM) {
                !!!cp ('t146');
                ## As if </noscript>
                pop @{$self->{open_elements}};
-               !!!parse-error (type => 'in noscript:/'.$token->{tag_name});
+               !!!parse-error (type => 'in noscript:/',
+                               text => $token->{tag_name}, token => $token);
                ## Reprocess in the "in head" insertion mode...
                ## As if </head>
-Line 3797 
 sub _tree_construction_main ($) {
+Line 4955 
 sub _tree_construction_main ($) {
              } elsif ($self->{insertion_mode} == BEFORE_HEAD_IM) {
  ## ISSUE: This case cannot be reached?
                !!!cp ('t148');
-               !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+               !!!parse-error (type => 'unmatched end tag',
+                               text => $token->{tag_name}, token => $token);
                ## Ignore the token ## ISSUE: An issue in the spec.
                !!!next-token;
-               redo B;
+               next B;
              } else {
                !!!cp ('t149');
              }
              ## "after head" insertion mode
              ## As if <body>
-             !!!insert-element ('body');
+             !!!insert-element ('body',, $token);
              $self->{insertion_mode} = IN_BODY_IM;
              ## reprocess
-             redo B;
+             next B;
        } elsif ($token->{type} == END_OF_FILE_TOKEN) {
          if ($self->{insertion_mode} == BEFORE_HEAD_IM) {
            !!!cp ('t149.1');
            ## NOTE: As if <head>
-           !!!create-element ($self->{head_element}, 'head');
+           !!!create-element ($self->{head_element}, $HTML_NS, 'head',, $token);
            $self->{open_elements}->[-1]->[0]->append_child
                ($self->{head_element});
-           #push @{$self->{open_elements}}, [$self->{head_element}, 'head'];
+           #push @{$self->{open_elements}},
+           #    [$self->{head_element}, $el_category->{head}];
            #$self->{insertion_mode} = IN_HEAD_IM;
            ## NOTE: Reprocess.
-Line 3841 
 sub _tree_construction_main ($) {
+Line 5001 
 sub _tree_construction_main ($) {
          } elsif ($self->{insertion_mode} == IN_HEAD_NOSCRIPT_IM) {
            !!!cp ('t149.3');
-           !!!parse-error (type => 'in noscript:#eof');
+           !!!parse-error (type => 'in noscript:#eof', token => $token);
            ## As if </noscript>
            pop @{$self->{open_elements}};
-Line 3860 
 sub _tree_construction_main ($) {
+Line 5020 
 sub _tree_construction_main ($) {
          }
          ## NOTE: As if <body>
-         !!!insert-element ('body');
+         !!!insert-element ('body',, $token);
          $self->{insertion_mode} = IN_BODY_IM;
          ## NOTE: Reprocess.
-         redo B;
+         next B;
        } else {
          die "$0: $token->{type}: Unknown token type";
        }
-Line 3878 
 sub _tree_construction_main ($) {
+Line 5038 
 sub _tree_construction_main ($) {
              $self->{open_elements}->[-1]->[0]->manakai_append_text ($token->{data});
              !!!next-token;
-             redo B;
+             next B;
            } elsif ($token->{type} == START_TAG_TOKEN) {
              if ({
                   caption => 1, col => 1, colgroup => 1, tbody => 1,
-Line 3886 
 sub _tree_construction_main ($) {
+Line 5046 
 sub _tree_construction_main ($) {
                  }->{$token->{tag_name}}) {
                if ($self->{insertion_mode} == IN_CELL_IM) {
                  ## have an element in table scope
-                 my $tn;
+                 for (reverse 0..$#{$self->{open_elements}}) {
-                 INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                    my $node = $self->{open_elements}->[$_];
-                   if ($node->[1] eq 'td' or $node->[1] eq 'th') {
+                   if ($node->[1] & TABLE_CELL_EL) {
                      !!!cp ('t151');
-                     $tn = $node->[1];
-                     last INSCOPE;
+                     ## Close the cell
-                   } elsif ({
+                     !!!back-token; # <x>
-                             table => 1, html => 1,
+                     $token = {type => END_TAG_TOKEN,
-                            }->{$node->[1]}) {
+                               tag_name => $node->[0]->manakai_local_name,
+                               line => $token->{line},
+                               column => $token->{column}};
+                     next B;
+                   } elsif ($node->[1] & TABLE_SCOPING_EL) {
                      !!!cp ('t152');
-                     last INSCOPE;
+                     ## ISSUE: This case can never be reached, maybe.
+                     last;
                    }
-                 } # INSCOPE
+                 }
-                   unless (defined $tn) {
-                     !!!cp ('t153');
+                 !!!cp ('t153');
- ## TODO: This error type is wrong.
+                 !!!parse-error (type => 'start tag not allowed',
-                     !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                     text => $token->{tag_name}, token => $token);
-                     ## Ignore the token
+                 ## Ignore the token
-                     !!!next-token;
+                 !!!nack ('t153.1');
-                     redo B;
+                 !!!next-token;
-                   }
+                 next B;
-                 !!!cp ('t154');
-                 ## Close the cell
-                 !!!back-token; # <?>
-                 $token = {type => END_TAG_TOKEN, tag_name => $tn};
-                 redo B;
                } elsif ($self->{insertion_mode} == IN_CAPTION_IM) {
-                 !!!parse-error (type => 'not closed:caption');
+                 !!!parse-error (type => 'not closed', text => 'caption',
+                                 token => $token);
-                 ## As if </caption>
+                 ## NOTE: As if </caption>.
                  ## have a table element in table scope
                  my $i;
-                 INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
+                 INSCOPE: {
-                   my $node = $self->{open_elements}->[$_];
+                   for (reverse 0..$#{$self->{open_elements}}) {
-                   if ($node->[1] eq 'caption') {
+                     my $node = $self->{open_elements}->[$_];
-                     !!!cp ('t155');
+                     if ($node->[1] & CAPTION_EL) {
-                     $i = $_;
+                       !!!cp ('t155');
-                     last INSCOPE;
+                       $i = $_;
-                   } elsif ({
+                       last INSCOPE;
-                             table => 1, html => 1,
+                     } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                            }->{$node->[1]}) {
+                       !!!cp ('t156');
-                     !!!cp ('t156');
+                       last;
-                     last INSCOPE;
+                     }
                    }
+                   !!!cp ('t157');
+                   !!!parse-error (type => 'start tag not allowed',
+                                   text => $token->{tag_name}, token => $token);
+                   ## Ignore the token
+                   !!!nack ('t157.1');
+                   !!!next-token;
+                   next B;
                  } # INSCOPE
-                   unless (defined $i) {
-                     !!!cp ('t157');
- ## TODO: this type is wrong.
-                     !!!parse-error (type => 'unmatched end tag:caption');
-                     ## Ignore the token
-                     !!!next-token;
-                     redo B;
-                   }
                  ## generate implied end tags
-                 while ({
+                 while ($self->{open_elements}->[-1]->[1]
-                         dd => 1, dt => 1, li => 1, p => 1,
+                            & END_TAG_OPTIONAL_EL) {
-                        }->{$self->{open_elements}->[-1]->[1]}) {
                    !!!cp ('t158');
                    pop @{$self->{open_elements}};
                  }
-                 if ($self->{open_elements}->[-1]->[1] ne 'caption') {
+                 unless ($self->{open_elements}->[-1]->[1] & CAPTION_EL) {
                    !!!cp ('t159');
-                   !!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]);
+                   !!!parse-error (type => 'not closed',
+                                   text => $self->{open_elements}->[-1]->[0]
+                                       ->manakai_local_name,
+                                   token => $token);
                  } else {
                    !!!cp ('t160');
                  }
-Line 3964 
 sub _tree_construction_main ($) {
+Line 5125 
 sub _tree_construction_main ($) {
                  $self->{insertion_mode} = IN_TABLE_IM;
                  ## reprocess
-                 redo B;
+                 !!!ack-later;
+                 next B;
                } else {
                  !!!cp ('t161');
                  #
-Line 3980 
 sub _tree_construction_main ($) {
+Line 5142 
 sub _tree_construction_main ($) {
                  my $i;
                  INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                    my $node = $self->{open_elements}->[$_];
-                   if ($node->[1] eq $token->{tag_name}) {
+                   if ($node->[0]->manakai_local_name eq $token->{tag_name}) {
                      !!!cp ('t163');
                      $i = $_;
                      last INSCOPE;
-                   } elsif ({
+                   } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                             table => 1, html => 1,
-                            }->{$node->[1]}) {
                      !!!cp ('t164');
                      last INSCOPE;
                    }
                  } # INSCOPE
                    unless (defined $i) {
                      !!!cp ('t165');
-                     !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                     !!!parse-error (type => 'unmatched end tag',
+                                     text => $token->{tag_name},
+                                     token => $token);
                      ## Ignore the token
                      !!!next-token;
-                     redo B;
+                     next B;
                    }
                  ## generate implied end tags
-                 while ({
+                 while ($self->{open_elements}->[-1]->[1]
-                         dd => 1, dt => 1, li => 1, p => 1,
+                            & END_TAG_OPTIONAL_EL) {
-                        }->{$self->{open_elements}->[-1]->[1]}) {
                    !!!cp ('t166');
                    pop @{$self->{open_elements}};
                  }
-                 if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) {
+                 if ($self->{open_elements}->[-1]->[0]->manakai_local_name
+                         ne $token->{tag_name}) {
                    !!!cp ('t167');
-                   !!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]);
+                   !!!parse-error (type => 'not closed',
+                                   text => $self->{open_elements}->[-1]->[0]
+                                       ->manakai_local_name,
+                                   token => $token);
                  } else {
                    !!!cp ('t168');
                  }
-Line 4021 
 sub _tree_construction_main ($) {
+Line 5186 
 sub _tree_construction_main ($) {
                  $self->{insertion_mode} = IN_ROW_IM;
                  !!!next-token;
-                 redo B;
+                 next B;
                } elsif ($self->{insertion_mode} == IN_CAPTION_IM) {
                  !!!cp ('t169');
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => $token->{tag_name}, token => $token);
                  ## Ignore the token
                  !!!next-token;
-                 redo B;
+                 next B;
                } else {
                  !!!cp ('t170');
                  #
-Line 4036 
 sub _tree_construction_main ($) {
+Line 5202 
 sub _tree_construction_main ($) {
                if ($self->{insertion_mode} == IN_CAPTION_IM) {
                  ## have a table element in table scope
                  my $i;
-                 INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
+                 INSCOPE: {
-                   my $node = $self->{open_elements}->[$_];
+                   for (reverse 0..$#{$self->{open_elements}}) {
-                   if ($node->[1] eq $token->{tag_name}) {
+                     my $node = $self->{open_elements}->[$_];
-                     !!!cp ('t171');
+                     if ($node->[1] & CAPTION_EL) {
-                     $i = $_;
+                       !!!cp ('t171');
-                     last INSCOPE;
+                       $i = $_;
-                   } elsif ({
+                       last INSCOPE;
-                             table => 1, html => 1,
+                     } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                            }->{$node->[1]}) {
+                       !!!cp ('t172');
-                     !!!cp ('t172');
+                       last;
-                     last INSCOPE;
+                     }
                    }
+                   !!!cp ('t173');
+                   !!!parse-error (type => 'unmatched end tag',
+                                   text => $token->{tag_name}, token => $token);
+                   ## Ignore the token
+                   !!!next-token;
+                   next B;
                  } # INSCOPE
-                   unless (defined $i) {
-                     !!!cp ('t173');
-                     !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
-                     ## Ignore the token
-                     !!!next-token;
-                     redo B;
-                   }
                  ## generate implied end tags
-                 while ({
+                 while ($self->{open_elements}->[-1]->[1]
-                         dd => 1, dt => 1, li => 1, p => 1,
+                            & END_TAG_OPTIONAL_EL) {
-                        }->{$self->{open_elements}->[-1]->[1]}) {
                    !!!cp ('t174');
                    pop @{$self->{open_elements}};
                  }
-                 if ($self->{open_elements}->[-1]->[1] ne 'caption') {
+                 unless ($self->{open_elements}->[-1]->[1] & CAPTION_EL) {
                    !!!cp ('t175');
-                   !!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]);
+                   !!!parse-error (type => 'not closed',
+                                   text => $self->{open_elements}->[-1]->[0]
+                                       ->manakai_local_name,
+                                   token => $token);
                  } else {
                    !!!cp ('t176');
                  }
-Line 4079 
 sub _tree_construction_main ($) {
+Line 5247 
 sub _tree_construction_main ($) {
                  $self->{insertion_mode} = IN_TABLE_IM;
                  !!!next-token;
-                 redo B;
+                 next B;
                } elsif ($self->{insertion_mode} == IN_CELL_IM) {
                  !!!cp ('t177');
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => $token->{tag_name}, token => $token);
                  ## Ignore the token
                  !!!next-token;
-                 redo B;
+                 next B;
                } else {
                  !!!cp ('t178');
                  #
-Line 4098 
 sub _tree_construction_main ($) {
+Line 5267 
 sub _tree_construction_main ($) {
                ## have an element in table scope
                my $i;
                my $tn;
-               INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
+               INSCOPE: {
-                 my $node = $self->{open_elements}->[$_];
+                 for (reverse 0..$#{$self->{open_elements}}) {
-                 if ($node->[1] eq $token->{tag_name}) {
+                   my $node = $self->{open_elements}->[$_];
-                   !!!cp ('t179');
+                   if ($node->[0]->manakai_local_name eq $token->{tag_name}) {
-                   $i = $_;
+                     !!!cp ('t179');
-                   last INSCOPE;
+                     $i = $_;
-                 } elsif ($node->[1] eq 'td' or $node->[1] eq 'th') {
-                   !!!cp ('t180');
+                     ## Close the cell
-                   $tn = $node->[1];
+                     !!!back-token; # </x>
-                   ## NOTE: There is exactly one |td| or |th| element
+                     $token = {type => END_TAG_TOKEN, tag_name => $tn,
-                   ## in scope in the stack of open elements by definition.
+                               line => $token->{line},
-                 } elsif ({
+                               column => $token->{column}};
-                           table => 1, html => 1,
+                     next B;
-                          }->{$node->[1]}) {
+                   } elsif ($node->[1] & TABLE_CELL_EL) {
-                   !!!cp ('t181');
+                     !!!cp ('t180');
-                   last INSCOPE;
+                     $tn = $node->[0]->manakai_local_name;
+                     ## NOTE: There is exactly one |td| or |th| element
+                     ## in scope in the stack of open elements by definition.
+                   } elsif ($node->[1] & TABLE_SCOPING_EL) {
+                     ## ISSUE: Can this be reached?
+                     !!!cp ('t181');
+                     last;
+                   }
                  }
-               } # INSCOPE
-               unless (defined $i) {
                  !!!cp ('t182');
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                 !!!parse-error (type => 'unmatched end tag',
+                     text => $token->{tag_name}, token => $token);
                  ## Ignore the token
                  !!!next-token;
-                 redo B;
+                 next B;
-               } else {
+               } # INSCOPE
-                 !!!cp ('t183');
-               }
-               ## Close the cell
-               !!!back-token; # </?>
-               $token = {type => END_TAG_TOKEN, tag_name => $tn};
-               redo B;
              } elsif ($token->{tag_name} eq 'table' and
                       $self->{insertion_mode} == IN_CAPTION_IM) {
-               !!!parse-error (type => 'not closed:caption');
+               !!!parse-error (type => 'not closed', text => 'caption',
+                               token => $token);
                ## As if </caption>
                ## have a table element in table scope
                my $i;
                INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                  my $node = $self->{open_elements}->[$_];
-                 if ($node->[1] eq 'caption') {
+                 if ($node->[1] & CAPTION_EL) {
                    !!!cp ('t184');
                    $i = $_;
                    last INSCOPE;
-                 } elsif ({
+                 } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                           table => 1, html => 1,
-                          }->{$node->[1]}) {
                    !!!cp ('t185');
                    last INSCOPE;
                  }
                } # INSCOPE
                unless (defined $i) {
                  !!!cp ('t186');
-                 !!!parse-error (type => 'unmatched end tag:caption');
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => 'caption', token => $token);
                  ## Ignore the token
                  !!!next-token;
-                 redo B;
+                 next B;
                }
                ## generate implied end tags
-               while ({
+               while ($self->{open_elements}->[-1]->[1] & END_TAG_OPTIONAL_EL) {
-                       dd => 1, dt => 1, li => 1, p => 1,
-                      }->{$self->{open_elements}->[-1]->[1]}) {
                  !!!cp ('t187');
                  pop @{$self->{open_elements}};
                }
-               if ($self->{open_elements}->[-1]->[1] ne 'caption') {
+               unless ($self->{open_elements}->[-1]->[1] & CAPTION_EL) {
                  !!!cp ('t188');
-                 !!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]);
+                 !!!parse-error (type => 'not closed',
+                                 text => $self->{open_elements}->[-1]->[0]
+                                     ->manakai_local_name,
+                                 token => $token);
                } else {
                  !!!cp ('t189');
                }
-Line 4180 
 sub _tree_construction_main ($) {
+Line 5350 
 sub _tree_construction_main ($) {
                $self->{insertion_mode} = IN_TABLE_IM;
                ## reprocess
-               redo B;
+               next B;
              } elsif ({
                        body => 1, col => 1, colgroup => 1, html => 1,
                       }->{$token->{tag_name}}) {
                if ($self->{insertion_mode} & BODY_TABLE_IMS) {
                  !!!cp ('t190');
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => $token->{tag_name}, token => $token);
                  ## Ignore the token
                  !!!next-token;
-                 redo B;
+                 next B;
                } else {
                  !!!cp ('t191');
                  #
-Line 4200 
 sub _tree_construction_main ($) {
+Line 5371 
 sub _tree_construction_main ($) {
                       }->{$token->{tag_name}} and
                       $self->{insertion_mode} == IN_CAPTION_IM) {
                !!!cp ('t192');
-               !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+               !!!parse-error (type => 'unmatched end tag',
+                               text => $token->{tag_name}, token => $token);
                ## Ignore the token
                !!!next-token;
-               redo B;
+               next B;
              } else {
                !!!cp ('t193');
                #
              }
        } elsif ($token->{type} == END_OF_FILE_TOKEN) {
          for my $entry (@{$self->{open_elements}}) {
-           if (not {
+           unless ($entry->[1] & ALL_END_TAG_OPTIONAL_EL) {
-             dd => 1, dt => 1, li => 1, p => 1, tbody => 1, td => 1, tfoot => 1,
-             th => 1, thead => 1, tr => 1, body => 1, html => 1,
-           }->{$entry->[1]}) {
              !!!cp ('t75');
-             !!!parse-error (type => 'in body:#eof');
+             !!!parse-error (type => 'in body:#eof', token => $token);
              last;
            }
          }
-Line 4237 
 sub _tree_construction_main ($) {
+Line 5406 
 sub _tree_construction_main ($) {
            unless (length $token->{data}) {
              !!!cp ('t194');
              !!!next-token;
-             redo B;
+             next B;
            } else {
              !!!cp ('t195');
            }
          }
-             !!!parse-error (type => 'in table:#character');
+         !!!parse-error (type => 'in table:#text', token => $token);
              ## As if in body, but insert into foster parent element
              ## ISSUE: Spec says that "whenever a node would be inserted
-Line 4251 
 sub _tree_construction_main ($) {
+Line 5420 
 sub _tree_construction_main ($) {
              ## result in a new Text node.
              $reconstruct_active_formatting_elements->($insert_to_foster);
-             if ({
+             if ($self->{open_elements}->[-1]->[1] & TABLE_ROWS_EL) {
-                  table => 1, tbody => 1, tfoot => 1,
-                  thead => 1, tr => 1,
-                 }->{$self->{open_elements}->[-1]->[1]}) {
                # MUST
                my $foster_parent_element;
                my $next_sibling;
                my $prev_sibling;
                OE: for (reverse 0..$#{$self->{open_elements}}) {
-                 if ($self->{open_elements}->[$_]->[1] eq 'table') {
+                 if ($self->{open_elements}->[$_]->[1] & TABLE_EL) {
                    my $parent = $self->{open_elements}->[$_]->[0]->parent_node;
                    if (defined $parent and $parent->node_type == 1) {
                      !!!cp ('t196');
-Line 4295 
 sub _tree_construction_main ($) {
+Line 5461 
 sub _tree_construction_main ($) {
          }
          !!!next-token;
-         redo B;
+         next B;
        } elsif ($token->{type} == START_TAG_TOKEN) {
-             if ({
+         if ({
-                  tr => ($self->{insertion_mode} != IN_ROW_IM),
+              tr => ($self->{insertion_mode} != IN_ROW_IM),
-                  th => 1, td => 1,
+              th => 1, td => 1,
-                 }->{$token->{tag_name}}) {
+             }->{$token->{tag_name}}) {
-               if ($self->{insertion_mode} == IN_TABLE_IM) {
+           if ($self->{insertion_mode} == IN_TABLE_IM) {
-                 ## Clear back to table context
+             ## Clear back to table context
-                 while ($self->{open_elements}->[-1]->[1] ne 'table' and
+             while (not ($self->{open_elements}->[-1]->[1]
-                        $self->{open_elements}->[-1]->[1] ne 'html') {
+                             & TABLE_SCOPING_EL)) {
-                   !!!cp ('t201');
+               !!!cp ('t201');
-                   pop @{$self->{open_elements}};
+               pop @{$self->{open_elements}};
-                 }
+             }
-                 !!!insert-element ('tbody');
+             !!!insert-element ('tbody',, $token);
-                 $self->{insertion_mode} = IN_TABLE_BODY_IM;
+             $self->{insertion_mode} = IN_TABLE_BODY_IM;
-                 ## reprocess in the "in table body" insertion mode...
+             ## reprocess in the "in table body" insertion mode...
-               }
+           }
-               if ($self->{insertion_mode} == IN_TABLE_BODY_IM) {
+           if ($self->{insertion_mode} == IN_TABLE_BODY_IM) {
-                 unless ($token->{tag_name} eq 'tr') {
+             unless ($token->{tag_name} eq 'tr') {
-                   !!!cp ('t202');
+               !!!cp ('t202');
-                   !!!parse-error (type => 'missing start tag:tr');
+               !!!parse-error (type => 'missing start tag:tr', token => $token);
-                 }
+             }
-                 ## Clear back to table body context
+             ## Clear back to table body context
-                 while (not {
+             while (not ($self->{open_elements}->[-1]->[1]
-                   tbody => 1, tfoot => 1, thead => 1, html => 1,
+                             & TABLE_ROWS_SCOPING_EL)) {
-                 }->{$self->{open_elements}->[-1]->[1]}) {
+               !!!cp ('t203');
-                   !!!cp ('t203');
+               ## ISSUE: Can this case be reached?
-                   ## ISSUE: Can this case be reached?
+               pop @{$self->{open_elements}};
-                   pop @{$self->{open_elements}};
+             }
-                 }
                  $self->{insertion_mode} = IN_ROW_IM;
                  if ($token->{tag_name} eq 'tr') {
                    !!!cp ('t204');
-                   !!!insert-element ($token->{tag_name}, $token->{attributes});
+                   !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
+                   !!!nack ('t204');
                    !!!next-token;
-                   redo B;
+                   next B;
                  } else {
                    !!!cp ('t205');
-                   !!!insert-element ('tr');
+                   !!!insert-element ('tr',, $token);
                    ## reprocess in the "in row" insertion mode
                  }
                } else {
-Line 4345 
 sub _tree_construction_main ($) {
+Line 5511 
 sub _tree_construction_main ($) {
                }
                ## Clear back to table row context
-               while (not {
+               while (not ($self->{open_elements}->[-1]->[1]
-                 tr => 1, html => 1,
+                               & TABLE_ROW_SCOPING_EL)) {
-               }->{$self->{open_elements}->[-1]->[1]}) {
                  !!!cp ('t207');
                  pop @{$self->{open_elements}};
                }
-               !!!insert-element ($token->{tag_name}, $token->{attributes});
+               !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
                $self->{insertion_mode} = IN_CELL_IM;
                push @$active_formatting_elements, ['#marker', ''];
+               !!!nack ('t207.1');
                !!!next-token;
-               redo B;
+               next B;
              } elsif ({
                        caption => 1, col => 1, colgroup => 1,
                        tbody => 1, tfoot => 1, thead => 1,
-Line 4370 
 sub _tree_construction_main ($) {
+Line 5536 
 sub _tree_construction_main ($) {
                  my $i;
                  INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                    my $node = $self->{open_elements}->[$_];
-                   if ($node->[1] eq 'tr') {
+                   if ($node->[1] & TABLE_ROW_EL) {
                      !!!cp ('t208');
                      $i = $_;
                      last INSCOPE;
-                   } elsif ({
+                   } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                             html => 1,
-                             ## NOTE: This element does not appear here, maybe.
-                             table => 1,
-                            }->{$node->[1]}) {
                      !!!cp ('t209');
                      last INSCOPE;
                    }
                  } # INSCOPE
                  unless (defined $i) {
-                  !!!cp ('t210');
+                   !!!cp ('t210');
  ## TODO: This type is wrong.
-                  !!!parse-error (type => 'unmacthed end tag:'.$token->{tag_name});
+                   !!!parse-error (type => 'unmacthed end tag',
+                                   text => $token->{tag_name}, token => $token);
                    ## Ignore the token
+                   !!!nack ('t210.1');
                    !!!next-token;
-                   redo B;
+                   next B;
                  }
                  ## Clear back to table row context
-                 while (not {
+                 while (not ($self->{open_elements}->[-1]->[1]
-                   tr => 1, html => 1,
+                                 & TABLE_ROW_SCOPING_EL)) {
-                 }->{$self->{open_elements}->[-1]->[1]}) {
                    !!!cp ('t211');
                    ## ISSUE: Can this case be reached?
                    pop @{$self->{open_elements}};
-Line 4407 
 sub _tree_construction_main ($) {
+Line 5569 
 sub _tree_construction_main ($) {
                  if ($token->{tag_name} eq 'tr') {
                    !!!cp ('t212');
                    ## reprocess
-                   redo B;
+                   !!!ack-later;
+                   next B;
                  } else {
                    !!!cp ('t213');
                    ## reprocess in the "in table body" insertion mode...
-Line 4419 
 sub _tree_construction_main ($) {
+Line 5582 
 sub _tree_construction_main ($) {
                  my $i;
                  INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                    my $node = $self->{open_elements}->[$_];
-                   if ({
+                   if ($node->[1] & TABLE_ROW_GROUP_EL) {
-                        tbody => 1, thead => 1, tfoot => 1,
-                       }->{$node->[1]}) {
                      !!!cp ('t214');
                      $i = $_;
                      last INSCOPE;
-                   } elsif ({
+                   } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                             table => 1, html => 1,
-                            }->{$node->[1]}) {
                      !!!cp ('t215');
                      last INSCOPE;
                    }
                  } # INSCOPE
                  unless (defined $i) {
                    !!!cp ('t216');
- ## TODO: This erorr type ios wrong.
+ ## TODO: This error type is wrong.
-                   !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                   !!!parse-error (type => 'unmatched end tag',
+                                   text => $token->{tag_name}, token => $token);
                    ## Ignore the token
+                   !!!nack ('t216.1');
                    !!!next-token;
-                   redo B;
+                   next B;
                  }
                  ## Clear back to table body context
-                 while (not {
+                 while (not ($self->{open_elements}->[-1]->[1]
-                   tbody => 1, tfoot => 1, thead => 1, html => 1,
+                                 & TABLE_ROWS_SCOPING_EL)) {
-                 }->{$self->{open_elements}->[-1]->[1]}) {
                    !!!cp ('t217');
                    ## ISSUE: Can this state be reached?
                    pop @{$self->{open_elements}};
-Line 4466 
 sub _tree_construction_main ($) {
+Line 5626 
 sub _tree_construction_main ($) {
                if ($token->{tag_name} eq 'col') {
                  ## Clear back to table context
-                 while ($self->{open_elements}->[-1]->[1] ne 'table' and
+                 while (not ($self->{open_elements}->[-1]->[1]
-                        $self->{open_elements}->[-1]->[1] ne 'html') {
+                                 & TABLE_SCOPING_EL)) {
                    !!!cp ('t219');
                    ## ISSUE: Can this state be reached?
                    pop @{$self->{open_elements}};
                  }
-                 !!!insert-element ('colgroup');
+                 !!!insert-element ('colgroup',, $token);
                  $self->{insertion_mode} = IN_COLUMN_GROUP_IM;
                  ## reprocess
-                 redo B;
+                 !!!ack-later;
+                 next B;
                } elsif ({
                          caption => 1,
                          colgroup => 1,
                          tbody => 1, tfoot => 1, thead => 1,
                         }->{$token->{tag_name}}) {
                  ## Clear back to table context
-                 while ($self->{open_elements}->[-1]->[1] ne 'table' and
+                 while (not ($self->{open_elements}->[-1]->[1]
-                        $self->{open_elements}->[-1]->[1] ne 'html') {
+                                 & TABLE_SCOPING_EL)) {
                    !!!cp ('t220');
                    ## ISSUE: Can this state be reached?
                    pop @{$self->{open_elements}};
-Line 4493 
 sub _tree_construction_main ($) {
+Line 5654 
 sub _tree_construction_main ($) {
                  push @$active_formatting_elements, ['#marker', '']
                      if $token->{tag_name} eq 'caption';
-                 !!!insert-element ($token->{tag_name}, $token->{attributes});
+                 !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
                  $self->{insertion_mode} = {
                                             caption => IN_CAPTION_IM,
                                             colgroup => IN_COLUMN_GROUP_IM,
-Line 4502 
 sub _tree_construction_main ($) {
+Line 5663 
 sub _tree_construction_main ($) {
                                             thead => IN_TABLE_BODY_IM,
                                            }->{$token->{tag_name}};
                  !!!next-token;
-                 redo B;
+                 !!!nack ('t220.1');
+                 next B;
                } else {
                  die "$0: in table: <>: $token->{tag_name}";
                }
              } elsif ($token->{tag_name} eq 'table') {
-               !!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]);
+               !!!parse-error (type => 'not closed',
+                               text => $self->{open_elements}->[-1]->[0]
+                                   ->manakai_local_name,
+                               token => $token);
                ## As if </table>
                ## have a table element in table scope
                my $i;
                INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                  my $node = $self->{open_elements}->[$_];
-                 if ($node->[1] eq 'table') {
+                 if ($node->[1] & TABLE_EL) {
                    !!!cp ('t221');
                    $i = $_;
                    last INSCOPE;
-                 } elsif ({
+                 } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                           #table => 1,
-                           html => 1,
-                          }->{$node->[1]}) {
                    !!!cp ('t222');
                    last INSCOPE;
                  }
-Line 4529 
 sub _tree_construction_main ($) {
+Line 5691 
 sub _tree_construction_main ($) {
                unless (defined $i) {
                  !!!cp ('t223');
  ## TODO: The following is wrong, maybe.
-                 !!!parse-error (type => 'unmatched end tag:table');
+                 !!!parse-error (type => 'unmatched end tag', text => 'table',
+                                 token => $token);
                  ## Ignore tokens </table><table>
+                 !!!nack ('t223.1');
                  !!!next-token;
-                 redo B;
+                 next B;
                }
  ## TODO: The following steps have been removed from the latest spec.
                ## generate implied end tags
-               while ({
+               while ($self->{open_elements}->[-1]->[1] & END_TAG_OPTIONAL_EL) {
-                       dd => 1, dt => 1, li => 1, p => 1,
-                      }->{$self->{open_elements}->[-1]->[1]}) {
                  !!!cp ('t224');
                  pop @{$self->{open_elements}};
                }
-               if ($self->{open_elements}->[-1]->[1] ne 'table') {
+               unless ($self->{open_elements}->[-1]->[1] & TABLE_EL) {
                  !!!cp ('t225');
- ## ISSUE: Can this case be reached?
+                 ## NOTE: |<table><tr><table>|
-                 !!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]);
+                 !!!parse-error (type => 'not closed',
+                                 text => $self->{open_elements}->[-1]->[0]
+                                     ->manakai_local_name,
+                                 token => $token);
                } else {
                  !!!cp ('t226');
                }
-Line 4557 
 sub _tree_construction_main ($) {
+Line 5722 
 sub _tree_construction_main ($) {
                $self->_reset_insertion_mode;
-               ## reprocess
+           ## reprocess
-               redo B;
+           !!!ack-later;
+           next B;
          } elsif ($token->{tag_name} eq 'style') {
            if (not $open_tables->[-1]->[1]) { # tainted
              !!!cp ('t227.8');
              ## NOTE: This is a "as if in head" code clone.
              $parse_rcdata->(CDATA_CONTENT_MODEL);
-             redo B;
+             next B;
            } else {
              !!!cp ('t227.7');
              #
-Line 4574 
 sub _tree_construction_main ($) {
+Line 5740 
 sub _tree_construction_main ($) {
              !!!cp ('t227.6');
              ## NOTE: This is a "as if in head" code clone.
              $script_start_tag->();
-             redo B;
+             next B;
            } else {
              !!!cp ('t227.5');
              #
-Line 4585 
 sub _tree_construction_main ($) {
+Line 5751 
 sub _tree_construction_main ($) {
                my $type = lc $token->{attributes}->{type}->{value};
                if ($type eq 'hidden') {
                  !!!cp ('t227.3');
-                 !!!parse-error (type => 'in table:'.$token->{tag_name});
+                 !!!parse-error (type => 'in table',
+                                 text => $token->{tag_name}, token => $token);
-                 !!!insert-element ($token->{tag_name}, $token->{attributes});
+                 !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
                  ## TODO: form element pointer
                  pop @{$self->{open_elements}};
                  !!!next-token;
-                 redo B;
+                 !!!ack ('t227.2.1');
+                 next B;
                } else {
                  !!!cp ('t227.2');
                  #
-Line 4612 
 sub _tree_construction_main ($) {
+Line 5780 
 sub _tree_construction_main ($) {
            #
          }
-         !!!parse-error (type => 'in table:'.$token->{tag_name});
+         !!!parse-error (type => 'in table', text => $token->{tag_name},
+                         token => $token);
          $insert = $insert_to_foster;
          #
-Line 4623 
 sub _tree_construction_main ($) {
+Line 5792 
 sub _tree_construction_main ($) {
                my $i;
                INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                  my $node = $self->{open_elements}->[$_];
-                 if ($node->[1] eq $token->{tag_name}) {
+                 if ($node->[1] & TABLE_ROW_EL) {
                    !!!cp ('t228');
                    $i = $_;
                    last INSCOPE;
-                 } elsif ({
+                 } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                           table => 1, html => 1,
-                          }->{$node->[1]}) {
                    !!!cp ('t229');
                    last INSCOPE;
                  }
                } # INSCOPE
                unless (defined $i) {
                  !!!cp ('t230');
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => $token->{tag_name}, token => $token);
                  ## Ignore the token
+                 !!!nack ('t230.1');
                  !!!next-token;
-                 redo B;
+                 next B;
                } else {
                  !!!cp ('t232');
                }
                ## Clear back to table row context
-               while (not {
+               while (not ($self->{open_elements}->[-1]->[1]
-                 tr => 1, html => 1,
+                               & TABLE_ROW_SCOPING_EL)) {
-               }->{$self->{open_elements}->[-1]->[1]}) {
                  !!!cp ('t231');
  ## ISSUE: Can this state be reached?
                  pop @{$self->{open_elements}};
-Line 4656 
 sub _tree_construction_main ($) {
+Line 5824 
 sub _tree_construction_main ($) {
                pop @{$self->{open_elements}}; # tr
                $self->{insertion_mode} = IN_TABLE_BODY_IM;
                !!!next-token;
-               redo B;
+               !!!nack ('t231.1');
+               next B;
              } elsif ($token->{tag_name} eq 'table') {
                if ($self->{insertion_mode} == IN_ROW_IM) {
                  ## As if </tr>
-Line 4664 
 sub _tree_construction_main ($) {
+Line 5833 
 sub _tree_construction_main ($) {
                  my $i;
                  INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                    my $node = $self->{open_elements}->[$_];
-                   if ($node->[1] eq 'tr') {
+                   if ($node->[1] & TABLE_ROW_EL) {
                      !!!cp ('t233');
                      $i = $_;
                      last INSCOPE;
-                   } elsif ({
+                   } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                             table => 1, html => 1,
-                            }->{$node->[1]}) {
                      !!!cp ('t234');
                      last INSCOPE;
                    }
-Line 4678 
 sub _tree_construction_main ($) {
+Line 5845 
 sub _tree_construction_main ($) {
                  unless (defined $i) {
                    !!!cp ('t235');
  ## TODO: The following is wrong.
-                   !!!parse-error (type => 'unmatched end tag:'.$token->{type});
+                   !!!parse-error (type => 'unmatched end tag',
+                                   text => $token->{type}, token => $token);
                    ## Ignore the token
+                   !!!nack ('t236.1');
                    !!!next-token;
-                   redo B;
+                   next B;
                  }
                  ## Clear back to table row context
-                 while (not {
+                 while (not ($self->{open_elements}->[-1]->[1]
-                   tr => 1, html => 1,
+                                 & TABLE_ROW_SCOPING_EL)) {
-                 }->{$self->{open_elements}->[-1]->[1]}) {
                    !!!cp ('t236');
  ## ISSUE: Can this state be reached?
                    pop @{$self->{open_elements}};
-Line 4703 
 sub _tree_construction_main ($) {
+Line 5871 
 sub _tree_construction_main ($) {
                  my $i;
                  INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                    my $node = $self->{open_elements}->[$_];
-                   if ({
+                   if ($node->[1] & TABLE_ROW_GROUP_EL) {
-                        tbody => 1, thead => 1, tfoot => 1,
-                       }->{$node->[1]}) {
                      !!!cp ('t237');
                      $i = $_;
                      last INSCOPE;
-                   } elsif ({
+                   } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                             table => 1, html => 1,
-                            }->{$node->[1]}) {
                      !!!cp ('t238');
                      last INSCOPE;
                    }
                  } # INSCOPE
                  unless (defined $i) {
                    !!!cp ('t239');
-                   !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                   !!!parse-error (type => 'unmatched end tag',
+                                   text => $token->{tag_name}, token => $token);
                    ## Ignore the token
+                   !!!nack ('t239.1');
                    !!!next-token;
-                   redo B;
+                   next B;
                  }
                  ## Clear back to table body context
-                 while (not {
+                 while (not ($self->{open_elements}->[-1]->[1]
-                   tbody => 1, tfoot => 1, thead => 1, html => 1,
+                                 & TABLE_ROWS_SCOPING_EL)) {
-                 }->{$self->{open_elements}->[-1]->[1]}) {
                    !!!cp ('t240');
                    pop @{$self->{open_elements}};
                  }
-Line 4753 
 sub _tree_construction_main ($) {
+Line 5918 
 sub _tree_construction_main ($) {
                my $i;
                INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                  my $node = $self->{open_elements}->[$_];
-                 if ($node->[1] eq $token->{tag_name}) {
+                 if ($node->[1] & TABLE_EL) {
                    !!!cp ('t241');
                    $i = $_;
                    last INSCOPE;
-                 } elsif ({
+                 } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                           table => 1, html => 1,
-                          }->{$node->[1]}) {
                    !!!cp ('t242');
                    last INSCOPE;
                  }
                } # INSCOPE
                unless (defined $i) {
                  !!!cp ('t243');
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => $token->{tag_name}, token => $token);
                  ## Ignore the token
+                 !!!nack ('t243.1');
                  !!!next-token;
-                 redo B;
+                 next B;
                }
                splice @{$self->{open_elements}}, $i;
-Line 4778 
 sub _tree_construction_main ($) {
+Line 5943 
 sub _tree_construction_main ($) {
                $self->_reset_insertion_mode;
                !!!next-token;
-               redo B;
+               next B;
              } elsif ({
                        tbody => 1, tfoot => 1, thead => 1,
                       }->{$token->{tag_name}} and
-Line 4788 
 sub _tree_construction_main ($) {
+Line 5953 
 sub _tree_construction_main ($) {
                  my $i;
                  INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                    my $node = $self->{open_elements}->[$_];
-                   if ($node->[1] eq $token->{tag_name}) {
+                   if ($node->[0]->manakai_local_name eq $token->{tag_name}) {
                      !!!cp ('t247');
                      $i = $_;
                      last INSCOPE;
-                   } elsif ({
+                   } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                             table => 1, html => 1,
-                            }->{$node->[1]}) {
                      !!!cp ('t248');
                      last INSCOPE;
                    }
                  } # INSCOPE
                    unless (defined $i) {
                      !!!cp ('t249');
-                     !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                     !!!parse-error (type => 'unmatched end tag',
+                                     text => $token->{tag_name}, token => $token);
                      ## Ignore the token
+                     !!!nack ('t249.1');
                      !!!next-token;
-                     redo B;
+                     next B;
                    }
                  ## As if </tr>
-Line 4812 
 sub _tree_construction_main ($) {
+Line 5977 
 sub _tree_construction_main ($) {
                  my $i;
                  INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                    my $node = $self->{open_elements}->[$_];
-                   if ($node->[1] eq 'tr') {
+                   if ($node->[1] & TABLE_ROW_EL) {
                      !!!cp ('t250');
                      $i = $_;
                      last INSCOPE;
-                   } elsif ({
+                   } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                             table => 1, html => 1,
-                            }->{$node->[1]}) {
                      !!!cp ('t251');
                      last INSCOPE;
                    }
                  } # INSCOPE
                    unless (defined $i) {
                      !!!cp ('t252');
-                     !!!parse-error (type => 'unmatched end tag:tr');
+                     !!!parse-error (type => 'unmatched end tag',
+                                     text => 'tr', token => $token);
                      ## Ignore the token
+                     !!!nack ('t252.1');
                      !!!next-token;
-                     redo B;
+                     next B;
                    }
                  ## Clear back to table row context
-                 while (not {
+                 while (not ($self->{open_elements}->[-1]->[1]
-                   tr => 1, html => 1,
+                                 & TABLE_ROW_SCOPING_EL)) {
-                 }->{$self->{open_elements}->[-1]->[1]}) {
                    !!!cp ('t253');
  ## ISSUE: Can this case be reached?
                    pop @{$self->{open_elements}};
-Line 4849 
 sub _tree_construction_main ($) {
+Line 6013 
 sub _tree_construction_main ($) {
                my $i;
                INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
                  my $node = $self->{open_elements}->[$_];
-                 if ($node->[1] eq $token->{tag_name}) {
+                 if ($node->[0]->manakai_local_name eq $token->{tag_name}) {
                    !!!cp ('t254');
                    $i = $_;
                    last INSCOPE;
-                 } elsif ({
+                 } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                           table => 1, html => 1,
-                          }->{$node->[1]}) {
                    !!!cp ('t255');
                    last INSCOPE;
                  }
                } # INSCOPE
                unless (defined $i) {
                  !!!cp ('t256');
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => $token->{tag_name}, token => $token);
                  ## Ignore the token
+                 !!!nack ('t256.1');
                  !!!next-token;
-                 redo B;
+                 next B;
                }
                ## Clear back to table body context
-               while (not {
+               while (not ($self->{open_elements}->[-1]->[1]
-                 tbody => 1, tfoot => 1, thead => 1, html => 1,
+                               & TABLE_ROWS_SCOPING_EL)) {
-               }->{$self->{open_elements}->[-1]->[1]}) {
                  !!!cp ('t257');
  ## ISSUE: Can this case be reached?
                  pop @{$self->{open_elements}};
-Line 4879 
 sub _tree_construction_main ($) {
+Line 6042 
 sub _tree_construction_main ($) {
                pop @{$self->{open_elements}};
                $self->{insertion_mode} = IN_TABLE_IM;
+               !!!nack ('t257.1');
                !!!next-token;
-               redo B;
+               next B;
              } elsif ({
                        body => 1, caption => 1, col => 1, colgroup => 1,
                        html => 1, td => 1, th => 1,
                        tr => 1, # $self->{insertion_mode} == IN_ROW_IM
                        tbody => 1, tfoot => 1, thead => 1, # $self->{insertion_mode} == IN_TABLE_IM
                       }->{$token->{tag_name}}) {
-               !!!cp ('t258');
+           !!!cp ('t258');
-               !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+           !!!parse-error (type => 'unmatched end tag',
-               ## Ignore the token
+                           text => $token->{tag_name}, token => $token);
-               !!!next-token;
+           ## Ignore the token
-               redo B;
+           !!!nack ('t258.1');
+            !!!next-token;
+           next B;
          } else {
            !!!cp ('t259');
-           !!!parse-error (type => 'in table:/'.$token->{tag_name});
+           !!!parse-error (type => 'in table:/',
+                           text => $token->{tag_name}, token => $token);
            $insert = $insert_to_foster;
            #
          }
        } elsif ($token->{type} == END_OF_FILE_TOKEN) {
-         unless ($self->{open_elements}->[-1]->[1] eq 'html' and
+         unless ($self->{open_elements}->[-1]->[1] & HTML_EL and
                  @{$self->{open_elements}} == 1) { # redundant, maybe
-           !!!parse-error (type => 'in body:#eof');
+           !!!parse-error (type => 'in body:#eof', token => $token);
            !!!cp ('t259.1');
            #
          } else {
-Line 4922 
 sub _tree_construction_main ($) {
+Line 6089 
 sub _tree_construction_main ($) {
                unless (length $token->{data}) {
                  !!!cp ('t260');
                  !!!next-token;
-                 redo B;
+                 next B;
                }
              }
-Line 4931 
 sub _tree_construction_main ($) {
+Line 6098 
 sub _tree_construction_main ($) {
            } elsif ($token->{type} == START_TAG_TOKEN) {
              if ($token->{tag_name} eq 'col') {
                !!!cp ('t262');
-               !!!insert-element ($token->{tag_name}, $token->{attributes});
+               !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
                pop @{$self->{open_elements}};
+               !!!ack ('t262.1');
                !!!next-token;
-               redo B;
+               next B;
              } else {
                !!!cp ('t263');
                #
              }
            } elsif ($token->{type} == END_TAG_TOKEN) {
              if ($token->{tag_name} eq 'colgroup') {
-               if ($self->{open_elements}->[-1]->[1] eq 'html') {
+               if ($self->{open_elements}->[-1]->[1] & HTML_EL) {
                  !!!cp ('t264');
-                 !!!parse-error (type => 'unmatched end tag:colgroup');
+                 !!!parse-error (type => 'unmatched end tag',
+                                 text => 'colgroup', token => $token);
                  ## Ignore the token
                  !!!next-token;
-                 redo B;
+                 next B;
                } else {
                  !!!cp ('t265');
                  pop @{$self->{open_elements}}; # colgroup
                  $self->{insertion_mode} = IN_TABLE_IM;
                  !!!next-token;
-                 redo B;
+                 next B;
                }
              } elsif ($token->{tag_name} eq 'col') {
                !!!cp ('t266');
-               !!!parse-error (type => 'unmatched end tag:col');
+               !!!parse-error (type => 'unmatched end tag',
+                               text => 'col', token => $token);
                ## Ignore the token
                !!!next-token;
-               redo B;
+               next B;
              } else {
                !!!cp ('t267');
                #
              }
        } elsif ($token->{type} == END_OF_FILE_TOKEN) {
-         if ($self->{open_elements}->[-1]->[1] eq 'html' or
+         if ($self->{open_elements}->[-1]->[1] & HTML_EL and
              @{$self->{open_elements}} == 1) { # redundant, maybe
            !!!cp ('t270.2');
            ## Stop parsing.
-Line 4976 
 sub _tree_construction_main ($) {
+Line 6146 
 sub _tree_construction_main ($) {
            pop @{$self->{open_elements}}; # colgroup
            $self->{insertion_mode} = IN_TABLE_IM;
            ## Reprocess.
-           redo B;
+           next B;
          }
        } else {
          die "$0: $token->{type}: Unknown token type";
        }
            ## As if </colgroup>
-           if ($self->{open_elements}->[-1]->[1] eq 'html') {
+           if ($self->{open_elements}->[-1]->[1] & HTML_EL) {
              !!!cp ('t269');
  ## TODO: Wrong error type?
-             !!!parse-error (type => 'unmatched end tag:colgroup');
+             !!!parse-error (type => 'unmatched end tag',
+                             text => 'colgroup', token => $token);
              ## Ignore the token
+             !!!nack ('t269.1');
              !!!next-token;
-             redo B;
+             next B;
            } else {
              !!!cp ('t270');
              pop @{$self->{open_elements}}; # colgroup
              $self->{insertion_mode} = IN_TABLE_IM;
+             !!!ack-later;
              ## reprocess
-             redo B;
+             next B;
            }
      } elsif ($self->{insertion_mode} & SELECT_IMS) {
        if ($token->{type} == CHARACTER_TOKEN) {
          !!!cp ('t271');
          $self->{open_elements}->[-1]->[0]->manakai_append_text ($token->{data});
          !!!next-token;
-         redo B;
+         next B;
        } elsif ($token->{type} == START_TAG_TOKEN) {
-             if ($token->{tag_name} eq 'option') {
+         if ($token->{tag_name} eq 'option') {
-               if ($self->{open_elements}->[-1]->[1] eq 'option') {
+           if ($self->{open_elements}->[-1]->[1] & OPTION_EL) {
-                 !!!cp ('t272');
+             !!!cp ('t272');
-                 ## As if </option>
+             ## As if </option>
-                 pop @{$self->{open_elements}};
+             pop @{$self->{open_elements}};
-               } else {
+           } else {
-                 !!!cp ('t273');
+             !!!cp ('t273');
-               }
+           }
-               !!!insert-element ($token->{tag_name}, $token->{attributes});
+           !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
-               !!!next-token;
+           !!!nack ('t273.1');
-               redo B;
+           !!!next-token;
-             } elsif ($token->{tag_name} eq 'optgroup') {
+           next B;
-               if ($self->{open_elements}->[-1]->[1] eq 'option') {
+         } elsif ($token->{tag_name} eq 'optgroup') {
-                 !!!cp ('t274');
+           if ($self->{open_elements}->[-1]->[1] & OPTION_EL) {
-                 ## As if </option>
+             !!!cp ('t274');
-                 pop @{$self->{open_elements}};
+             ## As if </option>
-               } else {
+             pop @{$self->{open_elements}};
-                 !!!cp ('t275');
+           } else {
-               }
+             !!!cp ('t275');
+           }
-               if ($self->{open_elements}->[-1]->[1] eq 'optgroup') {
+           if ($self->{open_elements}->[-1]->[1] & OPTGROUP_EL) {
-                 !!!cp ('t276');
+             !!!cp ('t276');
-                 ## As if </optgroup>
+             ## As if </optgroup>
-                 pop @{$self->{open_elements}};
+             pop @{$self->{open_elements}};
-               } else {
+           } else {
-                 !!!cp ('t277');
+             !!!cp ('t277');
-               }
+           }
-               !!!insert-element ($token->{tag_name}, $token->{attributes});
+           !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
-               !!!next-token;
+           !!!nack ('t277.1');
-               redo B;
+           !!!next-token;
-         } elsif ($token->{tag_name} eq 'select' or
+           next B;
-                  $token->{tag_name} eq 'input' or
+         } elsif ({
+                    select => 1, input => 1, textarea => 1,
+                  }->{$token->{tag_name}} or
                   ($self->{insertion_mode} == IN_SELECT_IN_TABLE_IM and
                    {
                     caption => 1, table => 1,
-Line 5045 
 sub _tree_construction_main ($) {
+Line 6221 
 sub _tree_construction_main ($) {
                     tr => 1, td => 1, th => 1,
                    }->{$token->{tag_name}})) {
            ## TODO: The type below is not good - <select> is replaced by </select>
-           !!!parse-error (type => 'not closed:select');
+           !!!parse-error (type => 'not closed', text => 'select',
+                           token => $token);
            ## NOTE: As if the token were </select> (<select> case) or
            ## as if there were </select> (otherwise).
-               ## have an element in table scope
+           ## have an element in table scope
-               my $i;
+           my $i;
-               INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
+           INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
-                 my $node = $self->{open_elements}->[$_];
+             my $node = $self->{open_elements}->[$_];
-                 if ($node->[1] eq 'select') {
+             if ($node->[1] & SELECT_EL) {
-                   !!!cp ('t278');
+               !!!cp ('t278');
-                   $i = $_;
+               $i = $_;
-                   last INSCOPE;
+               last INSCOPE;
-                 } elsif ({
+             } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                           table => 1, html => 1,
+               !!!cp ('t279');
-                          }->{$node->[1]}) {
+               last INSCOPE;
-                   !!!cp ('t279');
+             }
-                   last INSCOPE;
+           } # INSCOPE
-                 }
+           unless (defined $i) {
-               } # INSCOPE
+             !!!cp ('t280');
-               unless (defined $i) {
+             !!!parse-error (type => 'unmatched end tag',
-                 !!!cp ('t280');
+                             text => 'select', token => $token);
-                 !!!parse-error (type => 'unmatched end tag:select');
+             ## Ignore the token
-                 ## Ignore the token
+             !!!nack ('t280.1');
-                 !!!next-token;
+             !!!next-token;
-                 redo B;
+             next B;
-               }
+           }
-               !!!cp ('t281');
+           !!!cp ('t281');
-               splice @{$self->{open_elements}}, $i;
+           splice @{$self->{open_elements}}, $i;
-               $self->_reset_insertion_mode;
+           $self->_reset_insertion_mode;
            if ($token->{tag_name} eq 'select') {
-             !!!cp ('t281.2');
+             !!!nack ('t281.2');
              !!!next-token;
-             redo B;
+             next B;
            } else {
              !!!cp ('t281.1');
+             !!!ack-later;
              ## Reprocess the token.
-             redo B;
+             next B;
            }
          } else {
            !!!cp ('t282');
-           !!!parse-error (type => 'in select:'.$token->{tag_name});
+           !!!parse-error (type => 'in select',
+                           text => $token->{tag_name}, token => $token);
            ## Ignore the token
+           !!!nack ('t282.1');
            !!!next-token;
-           redo B;
+           next B;
          }
        } elsif ($token->{type} == END_TAG_TOKEN) {
-             if ($token->{tag_name} eq 'optgroup') {
+         if ($token->{tag_name} eq 'optgroup') {
-               if ($self->{open_elements}->[-1]->[1] eq 'option' and
+           if ($self->{open_elements}->[-1]->[1] & OPTION_EL and
-                   $self->{open_elements}->[-2]->[1] eq 'optgroup') {
+               $self->{open_elements}->[-2]->[1] & OPTGROUP_EL) {
-                 !!!cp ('t283');
+             !!!cp ('t283');
-                 ## As if </option>
+             ## As if </option>
-                 splice @{$self->{open_elements}}, -2;
+             splice @{$self->{open_elements}}, -2;
-               } elsif ($self->{open_elements}->[-1]->[1] eq 'optgroup') {
+           } elsif ($self->{open_elements}->[-1]->[1] & OPTGROUP_EL) {
-                 !!!cp ('t284');
+             !!!cp ('t284');
-                 pop @{$self->{open_elements}};
+             pop @{$self->{open_elements}};
-               } else {
+           } else {
-                 !!!cp ('t285');
+             !!!cp ('t285');
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+             !!!parse-error (type => 'unmatched end tag',
-                 ## Ignore the token
+                             text => $token->{tag_name}, token => $token);
-               }
+             ## Ignore the token
-               !!!next-token;
+           }
-               redo B;
+           !!!nack ('t285.1');
-             } elsif ($token->{tag_name} eq 'option') {
+           !!!next-token;
-               if ($self->{open_elements}->[-1]->[1] eq 'option') {
+           next B;
-                 !!!cp ('t286');
+         } elsif ($token->{tag_name} eq 'option') {
-                 pop @{$self->{open_elements}};
+           if ($self->{open_elements}->[-1]->[1] & OPTION_EL) {
-               } else {
+             !!!cp ('t286');
-                 !!!cp ('t287');
+             pop @{$self->{open_elements}};
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+           } else {
-                 ## Ignore the token
+             !!!cp ('t287');
-               }
+             !!!parse-error (type => 'unmatched end tag',
-               !!!next-token;
+                             text => $token->{tag_name}, token => $token);
-               redo B;
+             ## Ignore the token
-             } elsif ($token->{tag_name} eq 'select') {
+           }
-               ## have an element in table scope
+           !!!nack ('t287.1');
-               my $i;
+           !!!next-token;
-               INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
+           next B;
-                 my $node = $self->{open_elements}->[$_];
+         } elsif ($token->{tag_name} eq 'select') {
-                 if ($node->[1] eq $token->{tag_name}) {
+           ## have an element in table scope
-                   !!!cp ('t288');
+           my $i;
-                   $i = $_;
+           INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
-                   last INSCOPE;
+             my $node = $self->{open_elements}->[$_];
-                 } elsif ({
+             if ($node->[1] & SELECT_EL) {
-                           table => 1, html => 1,
+               !!!cp ('t288');
-                          }->{$node->[1]}) {
+               $i = $_;
-                   !!!cp ('t289');
+               last INSCOPE;
-                   last INSCOPE;
+             } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                 }
+               !!!cp ('t289');
-               } # INSCOPE
+               last INSCOPE;
-               unless (defined $i) {
+             }
-                 !!!cp ('t290');
+           } # INSCOPE
-                 !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+           unless (defined $i) {
-                 ## Ignore the token
+             !!!cp ('t290');
-                 !!!next-token;
+             !!!parse-error (type => 'unmatched end tag',
-                 redo B;
+                             text => $token->{tag_name}, token => $token);
-               }
+             ## Ignore the token
+             !!!nack ('t290.1');
+             !!!next-token;
+             next B;
+           }
-               !!!cp ('t291');
+           !!!cp ('t291');
-               splice @{$self->{open_elements}}, $i;
+           splice @{$self->{open_elements}}, $i;
-               $self->_reset_insertion_mode;
+           $self->_reset_insertion_mode;
-               !!!next-token;
+           !!!nack ('t291.1');
-               redo B;
+           !!!next-token;
+           next B;
          } elsif ($self->{insertion_mode} == IN_SELECT_IN_TABLE_IM and
                   {
                    caption => 1, table => 1, tbody => 1,
                    tfoot => 1, thead => 1, tr => 1, td => 1, th => 1,
                   }->{$token->{tag_name}}) {
  ## TODO: The following is wrong?
-               !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+           !!!parse-error (type => 'unmatched end tag',
+                           text => $token->{tag_name}, token => $token);
-               ## have an element in table scope
+           ## have an element in table scope
-               my $i;
+           my $i;
-               INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
+           INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
-                 my $node = $self->{open_elements}->[$_];
+             my $node = $self->{open_elements}->[$_];
-                 if ($node->[1] eq $token->{tag_name}) {
+             if ($node->[0]->manakai_local_name eq $token->{tag_name}) {
-                   !!!cp ('t292');
+               !!!cp ('t292');
-                   $i = $_;
+               $i = $_;
-                   last INSCOPE;
+               last INSCOPE;
-                 } elsif ({
+             } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                           table => 1, html => 1,
+               !!!cp ('t293');
-                          }->{$node->[1]}) {
+               last INSCOPE;
-                   !!!cp ('t293');
+             }
-                   last INSCOPE;
+           } # INSCOPE
-                 }
+           unless (defined $i) {
-               } # INSCOPE
+             !!!cp ('t294');
-               unless (defined $i) {
+             ## Ignore the token
-                 !!!cp ('t294');
+             !!!nack ('t294.1');
-                 ## Ignore the token
+             !!!next-token;
-                 !!!next-token;
+             next B;
-                 redo B;
+           }
-               }
-               ## As if </select>
+           ## As if </select>
-               ## have an element in table scope
+           ## have an element in table scope
-               undef $i;
+           undef $i;
-               INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
+           INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
-                 my $node = $self->{open_elements}->[$_];
+             my $node = $self->{open_elements}->[$_];
-                 if ($node->[1] eq 'select') {
+             if ($node->[1] & SELECT_EL) {
-                   !!!cp ('t295');
+               !!!cp ('t295');
-                   $i = $_;
+               $i = $_;
-                   last INSCOPE;
+               last INSCOPE;
-                 } elsif ({
+             } elsif ($node->[1] & TABLE_SCOPING_EL) {
-                           table => 1, html => 1,
-                          }->{$node->[1]}) {
  ## ISSUE: Can this state be reached?
-                   !!!cp ('t296');
+               !!!cp ('t296');
-                   last INSCOPE;
+               last INSCOPE;
-                 }
+             }
-               } # INSCOPE
+           } # INSCOPE
-               unless (defined $i) {
+           unless (defined $i) {
-                 !!!cp ('t297');
+             !!!cp ('t297');
  ## TODO: The following error type is correct?
-                 !!!parse-error (type => 'unmatched end tag:select');
+             !!!parse-error (type => 'unmatched end tag',
-                 ## Ignore the </select> token
+                             text => 'select', token => $token);
-                 !!!next-token; ## TODO: ok?
+             ## Ignore the </select> token
-                 redo B;
+             !!!nack ('t297.1');
-               }
+             !!!next-token; ## TODO: ok?
+             next B;
+           }
-               !!!cp ('t298');
+           !!!cp ('t298');
-               splice @{$self->{open_elements}}, $i;
+           splice @{$self->{open_elements}}, $i;
-               $self->_reset_insertion_mode;
+           $self->_reset_insertion_mode;
-               ## reprocess
+           !!!ack-later;
-               redo B;
+           ## reprocess
+           next B;
          } else {
            !!!cp ('t299');
-           !!!parse-error (type => 'in select:/'.$token->{tag_name});
+           !!!parse-error (type => 'in select:/',
+                           text => $token->{tag_name}, token => $token);
            ## Ignore the token
+           !!!nack ('t299.3');
            !!!next-token;
-           redo B;
+           next B;
          }
        } elsif ($token->{type} == END_OF_FILE_TOKEN) {
-         unless ($self->{open_elements}->[-1]->[1] eq 'html' and
+         unless ($self->{open_elements}->[-1]->[1] & HTML_EL and
                  @{$self->{open_elements}} == 1) { # redundant, maybe
            !!!cp ('t299.1');
-           !!!parse-error (type => 'in body:#eof');
+           !!!parse-error (type => 'in body:#eof', token => $token);
          } else {
            !!!cp ('t299.2');
          }
-Line 5247 
 sub _tree_construction_main ($) {
+Line 6435 
 sub _tree_construction_main ($) {
            unless (length $token->{data}) {
              !!!cp ('t300');
              !!!next-token;
-             redo B;
+             next B;
            }
          }
          if ($self->{insertion_mode} == AFTER_HTML_BODY_IM) {
            !!!cp ('t301');
-           !!!parse-error (type => 'after html:#character');
+           !!!parse-error (type => 'after html:#text', token => $token);
            ## Reprocess in the "after body" insertion mode.
          } else {
-Line 5261 
 sub _tree_construction_main ($) {
+Line 6449 
 sub _tree_construction_main ($) {
          }
          ## "after body" insertion mode
-         !!!parse-error (type => 'after body:#character');
+         !!!parse-error (type => 'after body:#text', token => $token);
          $self->{insertion_mode} = IN_BODY_IM;
          ## reprocess
-         redo B;
+         next B;
        } elsif ($token->{type} == START_TAG_TOKEN) {
          if ($self->{insertion_mode} == AFTER_HTML_BODY_IM) {
            !!!cp ('t303');
-           !!!parse-error (type => 'after html:'.$token->{tag_name});
+           !!!parse-error (type => 'after html',
+                           text => $token->{tag_name}, token => $token);
            ## Reprocess in the "after body" insertion mode.
          } else {
-Line 5277 
 sub _tree_construction_main ($) {
+Line 6466 
 sub _tree_construction_main ($) {
          }
          ## "after body" insertion mode
-         !!!parse-error (type => 'after body:'.$token->{tag_name});
+         !!!parse-error (type => 'after body',
+                         text => $token->{tag_name}, token => $token);
          $self->{insertion_mode} = IN_BODY_IM;
+         !!!ack-later;
          ## reprocess
-         redo B;
+         next B;
        } elsif ($token->{type} == END_TAG_TOKEN) {
          if ($self->{insertion_mode} == AFTER_HTML_BODY_IM) {
            !!!cp ('t305');
-           !!!parse-error (type => 'after html:/'.$token->{tag_name});
+           !!!parse-error (type => 'after html:/',
+                           text => $token->{tag_name}, token => $token);
            $self->{insertion_mode} = AFTER_BODY_IM;
            ## Reprocess in the "after body" insertion mode.
-Line 5297 
 sub _tree_construction_main ($) {
+Line 6489 
 sub _tree_construction_main ($) {
          if ($token->{tag_name} eq 'html') {
            if (defined $self->{inner_html_node}) {
              !!!cp ('t307');
-             !!!parse-error (type => 'unmatched end tag:html');
+             !!!parse-error (type => 'unmatched end tag',
+                             text => 'html', token => $token);
              ## Ignore the token
              !!!next-token;
-             redo B;
+             next B;
            } else {
              !!!cp ('t308');
              $self->{insertion_mode} = AFTER_HTML_BODY_IM;
              !!!next-token;
-             redo B;
+             next B;
            }
          } else {
            !!!cp ('t309');
-           !!!parse-error (type => 'after body:/'.$token->{tag_name});
+           !!!parse-error (type => 'after body:/',
+                           text => $token->{tag_name}, token => $token);
            $self->{insertion_mode} = IN_BODY_IM;
            ## reprocess
-           redo B;
+           next B;
          }
        } elsif ($token->{type} == END_OF_FILE_TOKEN) {
          !!!cp ('t309.2');
-Line 5330 
 sub _tree_construction_main ($) {
+Line 6524 
 sub _tree_construction_main ($) {
            unless (length $token->{data}) {
              !!!cp ('t310');
              !!!next-token;
-             redo B;
+             next B;
            }
          }
          if ($token->{data} =~ s/^[^\x09\x0A\x0B\x0C\x20]+//) {
            if ($self->{insertion_mode} == IN_FRAMESET_IM) {
              !!!cp ('t311');
-             !!!parse-error (type => 'in frameset:#character');
+             !!!parse-error (type => 'in frameset:#text', token => $token);
            } elsif ($self->{insertion_mode} == AFTER_FRAMESET_IM) {
              !!!cp ('t312');
-             !!!parse-error (type => 'after frameset:#character');
+             !!!parse-error (type => 'after frameset:#text', token => $token);
-           } else { # "after html frameset"
+           } else { # "after after frameset"
              !!!cp ('t313');
-             !!!parse-error (type => 'after html:#character');
+             !!!parse-error (type => 'after html:#text', token => $token);
-             $self->{insertion_mode} = AFTER_FRAMESET_IM;
-             ## Reprocess in the "after frameset" insertion mode.
-             !!!parse-error (type => 'after frameset:#character');
            }
            ## Ignore the token.
-Line 5358 
 sub _tree_construction_main ($) {
+Line 6548 
 sub _tree_construction_main ($) {
              !!!cp ('t315');
              !!!next-token;
            }
-           redo B;
+           next B;
          }
          die qq[$0: Character "$token->{data}"];
        } elsif ($token->{type} == START_TAG_TOKEN) {
-         if ($self->{insertion_mode} == AFTER_HTML_FRAMESET_IM) {
-           !!!cp ('t316');
-           !!!parse-error (type => 'after html:'.$token->{tag_name});
-           $self->{insertion_mode} = AFTER_FRAMESET_IM;
-           ## Process in the "after frameset" insertion mode.
-         } else {
-           !!!cp ('t317');
-         }
          if ($token->{tag_name} eq 'frameset' and
              $self->{insertion_mode} == IN_FRAMESET_IM) {
            !!!cp ('t318');
-           !!!insert-element ($token->{tag_name}, $token->{attributes});
+           !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
+           !!!nack ('t318.1');
            !!!next-token;
-           redo B;
+           next B;
          } elsif ($token->{tag_name} eq 'frame' and
                   $self->{insertion_mode} == IN_FRAMESET_IM) {
            !!!cp ('t319');
-           !!!insert-element ($token->{tag_name}, $token->{attributes});
+           !!!insert-element ($token->{tag_name}, $token->{attributes}, $token);
            pop @{$self->{open_elements}};
+           !!!ack ('t319.1');
            !!!next-token;
-           redo B;
+           next B;
          } elsif ($token->{tag_name} eq 'noframes') {
            !!!cp ('t320');
-           ## NOTE: As if in body.
+           ## NOTE: As if in head.
            $parse_rcdata->(CDATA_CONTENT_MODEL);
-           redo B;
+           next B;
+           ## NOTE: |<!DOCTYPE HTML><frameset></frameset></html><noframes></noframes>|
+           ## has no parse error.
          } else {
            if ($self->{insertion_mode} == IN_FRAMESET_IM) {
              !!!cp ('t321');
-             !!!parse-error (type => 'in frameset:'.$token->{tag_name});
+             !!!parse-error (type => 'in frameset',
-           } else {
+                             text => $token->{tag_name}, token => $token);
+           } elsif ($self->{insertion_mode} == AFTER_FRAMESET_IM) {
              !!!cp ('t322');
-             !!!parse-error (type => 'after frameset:'.$token->{tag_name});
+             !!!parse-error (type => 'after frameset',
+                             text => $token->{tag_name}, token => $token);
+           } else { # "after after frameset"
+             !!!cp ('t322.2');
+             !!!parse-error (type => 'after after frameset',
+                             text => $token->{tag_name}, token => $token);
            }
            ## Ignore the token
+           !!!nack ('t322.1');
            !!!next-token;
-           redo B;
+           next B;
          }
        } elsif ($token->{type} == END_TAG_TOKEN) {
-         if ($self->{insertion_mode} == AFTER_HTML_FRAMESET_IM) {
-           !!!cp ('t323');
-           !!!parse-error (type => 'after html:/'.$token->{tag_name});
-           $self->{insertion_mode} = AFTER_FRAMESET_IM;
-           ## Process in the "after frameset" insertion mode.
-         } else {
-           !!!cp ('t324');
-         }
          if ($token->{tag_name} eq 'frameset' and
              $self->{insertion_mode} == IN_FRAMESET_IM) {
-           if ($self->{open_elements}->[-1]->[1] eq 'html' and
+           if ($self->{open_elements}->[-1]->[1] & HTML_EL and
                @{$self->{open_elements}} == 1) {
              !!!cp ('t325');
-             !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+             !!!parse-error (type => 'unmatched end tag',
+                             text => $token->{tag_name}, token => $token);
              ## Ignore the token
              !!!next-token;
            } else {
-Line 5429 
 sub _tree_construction_main ($) {
+Line 6612 
 sub _tree_construction_main ($) {
            }
            if (not defined $self->{inner_html_node} and
-               $self->{open_elements}->[-1]->[1] ne 'frameset') {
+               not ($self->{open_elements}->[-1]->[1] & FRAMESET_EL)) {
              !!!cp ('t327');
              $self->{insertion_mode} = AFTER_FRAMESET_IM;
            } else {
              !!!cp ('t328');
            }
-           redo B;
+           next B;
          } elsif ($token->{tag_name} eq 'html' and
                   $self->{insertion_mode} == AFTER_FRAMESET_IM) {
            !!!cp ('t329');
            $self->{insertion_mode} = AFTER_HTML_FRAMESET_IM;
            !!!next-token;
-           redo B;
+           next B;
          } else {
            if ($self->{insertion_mode} == IN_FRAMESET_IM) {
              !!!cp ('t330');
-             !!!parse-error (type => 'in frameset:/'.$token->{tag_name});
+             !!!parse-error (type => 'in frameset:/',
-           } else {
+                             text => $token->{tag_name}, token => $token);
+           } elsif ($self->{insertion_mode} == AFTER_FRAMESET_IM) {
+             !!!cp ('t330.1');
+             !!!parse-error (type => 'after frameset:/',
+                             text => $token->{tag_name}, token => $token);
+           } else { # "after after html"
              !!!cp ('t331');
-             !!!parse-error (type => 'after frameset:/'.$token->{tag_name});
+             !!!parse-error (type => 'after after frameset:/',
+                             text => $token->{tag_name}, token => $token);
            }
            ## Ignore the token
            !!!next-token;
-           redo B;
+           next B;
          }
        } elsif ($token->{type} == END_OF_FILE_TOKEN) {
-         unless ($self->{open_elements}->[-1]->[1] eq 'html' and
+         unless ($self->{open_elements}->[-1]->[1] & HTML_EL and
                  @{$self->{open_elements}} == 1) { # redundant, maybe
            !!!cp ('t331.1');
-           !!!parse-error (type => 'in body:#eof');
+           !!!parse-error (type => 'in body:#eof', token => $token);
          } else {
            !!!cp ('t331.2');
          }
-Line 5480 
 sub _tree_construction_main ($) {
+Line 6669 
 sub _tree_construction_main ($) {
          !!!cp ('t332');
          ## NOTE: This is an "as if in head" code clone
          $script_start_tag->();
-         redo B;
+         next B;
        } elsif ($token->{tag_name} eq 'style') {
          !!!cp ('t333');
          ## NOTE: This is an "as if in head" code clone
          $parse_rcdata->(CDATA_CONTENT_MODEL);
-         redo B;
+         next B;
        } elsif ({
                  base => 1, link => 1,
                 }->{$token->{tag_name}}) {
          !!!cp ('t334');
          ## NOTE: This is an "as if in head" code clone, only "-t" differs
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
+         !!!insert-element-t ($token->{tag_name}, $token->{attributes}, $token);
          pop @{$self->{open_elements}}; ## ISSUE: This step is missing in the spec.
+         !!!ack ('t334.1');
          !!!next-token;
-         redo B;
+         next B;
        } elsif ($token->{tag_name} eq 'meta') {
          ## NOTE: This is an "as if in head" code clone, only "-t" differs
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
+         !!!insert-element-t ($token->{tag_name}, $token->{attributes}, $token);
          my $meta_el = pop @{$self->{open_elements}}; ## ISSUE: This step is missing in the spec.
          unless ($self->{confident}) {
-           if ($token->{attributes}->{charset}) { ## TODO: And if supported
+           if ($token->{attributes}->{charset}) {
              !!!cp ('t335');
+             ## NOTE: Whether the encoding is supported or not is handled
+             ## in the {change_encoding} callback.
              $self->{change_encoding}
-                 ->($self, $token->{attributes}->{charset}->{value});
+                 ->($self, $token->{attributes}->{charset}->{value}, $token);
              $meta_el->[0]->get_attribute_node_ns (undef, 'charset')
                  ->set_user_data (manakai_has_reference =>
                                       $token->{attributes}->{charset}
                                           ->{has_reference});
            } elsif ($token->{attributes}->{content}) {
-             ## ISSUE: Algorithm name in the spec was incorrect so that not linked to the definition.
              if ($token->{attributes}->{content}->{value}
-                 =~ /\A[^;]*;[\x09-\x0D\x20]*[Cc][Hh][Aa][Rr][Ss][Ee][Tt]
+                 =~ /[Cc][Hh][Aa][Rr][Ss][Ee][Tt]
                      [\x09-\x0D\x20]*=
                      [\x09-\x0D\x20]*(?>"([^"]*)"|'([^']*)'|
-                     ([^"'\x09-\x0D\x20][^\x09-\x0D\x20]*))/x) {
+                     ([^"'\x09-\x0D\x20][^\x09-\x0D\x20\x3B]*))/x) {
                !!!cp ('t336');
+               ## NOTE: Whether the encoding is supported or not is handled
+               ## in the {change_encoding} callback.
                $self->{change_encoding}
-                   ->($self, defined $1 ? $1 : defined $2 ? $2 : $3);
+                   ->($self, defined $1 ? $1 : defined $2 ? $2 : $3, $token);
                $meta_el->[0]->get_attribute_node_ns (undef, 'content')
                    ->set_user_data (manakai_has_reference =>
                                         $token->{attributes}->{content}
-Line 5543 
 sub _tree_construction_main ($) {
+Line 6736 
 sub _tree_construction_main ($) {
            }
          }
+         !!!ack ('t338.1');
          !!!next-token;
-         redo B;
+         next B;
        } elsif ($token->{tag_name} eq 'title') {
          !!!cp ('t341');
          ## NOTE: This is an "as if in head" code clone
          $parse_rcdata->(RCDATA_CONTENT_MODEL);
-         redo B;
+         next B;
        } elsif ($token->{tag_name} eq 'body') {
-         !!!parse-error (type => 'in body:body');
+         !!!parse-error (type => 'in body', text => 'body', token => $token);
          if (@{$self->{open_elements}} == 1 or
-             $self->{open_elements}->[1]->[1] ne 'body') {
+             not ($self->{open_elements}->[1]->[1] & BODY_EL)) {
            !!!cp ('t342');
            ## Ignore the token
          } else {
-Line 5568 
 sub _tree_construction_main ($) {
+Line 6762 
 sub _tree_construction_main ($) {
              }
            }
          }
+         !!!nack ('t343.1');
          !!!next-token;
-         redo B;
+         next B;
        } elsif ({
                  address => 1, blockquote => 1, center => 1, dir => 1,
                  div => 1, dl => 1, fieldset => 1,
                  h1 => 1, h2 => 1, h3 => 1, h4 => 1, h5 => 1, h6 => 1,
                  menu => 1, ol => 1, p => 1, ul => 1,
                  pre => 1, listing => 1,
+                 form => 1,
+                 table => 1,
+                 hr => 1,
                 }->{$token->{tag_name}}) {
+         if ($token->{tag_name} eq 'form' and defined $self->{form_element}) {
+           !!!cp ('t350');
+           !!!parse-error (type => 'in form:form', token => $token);
+           ## Ignore the token
+           !!!nack ('t350.1');
+           !!!next-token;
+           next B;
+         }
          ## has a p element in scope
          INSCOPE: for (reverse @{$self->{open_elements}}) {
-           if ($_->[1] eq 'p') {
+           if ($_->[1] & P_EL) {
              !!!cp ('t344');
-             !!!back-token;
+             !!!back-token; # <form>
-             $token = {type => END_TAG_TOKEN, tag_name => 'p'};
+             $token = {type => END_TAG_TOKEN, tag_name => 'p',
-             redo B;
+                       line => $token->{line}, column => $token->{column}};
-           } elsif ({
+             next B;
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
+           } elsif ($_->[1] & SCOPING_EL) {
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$_->[1]}) {
              !!!cp ('t345');
              last INSCOPE;
            }
          } # INSCOPE
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
+         !!!insert-element-t ($token->{tag_name}, $token->{attributes}, $token);
          if ($token->{tag_name} eq 'pre' or $token->{tag_name} eq 'listing') {
+           !!!nack ('t346.1');
            !!!next-token;
            if ($token->{type} == CHARACTER_TOKEN) {
              $token->{data} =~ s/^\x0A//;
-Line 5607 
 sub _tree_construction_main ($) {
+Line 6813 
 sub _tree_construction_main ($) {
            } else {
              !!!cp ('t348');
            }
-         } else {
+         } elsif ($token->{tag_name} eq 'form') {
-           !!!cp ('t347');
+           !!!cp ('t347.1');
+           $self->{form_element} = $self->{open_elements}->[-1]->[0];
+           !!!nack ('t347.2');
            !!!next-token;
-         }
+         } elsif ($token->{tag_name} eq 'table') {
-         redo B;
+           !!!cp ('t382');
-       } elsif ($token->{tag_name} eq 'form') {
+           push @{$open_tables}, [$self->{open_elements}->[-1]->[0]];
-         if (defined $self->{form_element}) {
-           !!!cp ('t350');
+           $self->{insertion_mode} = IN_TABLE_IM;
-           !!!parse-error (type => 'in form:form');
-           ## Ignore the token
+           !!!nack ('t382.1');
+           !!!next-token;
+         } elsif ($token->{tag_name} eq 'hr') {
+           !!!cp ('t386');
+           pop @{$self->{open_elements}};
+           !!!nack ('t386.1');
            !!!next-token;
-           redo B;
          } else {
-           ## has a p element in scope
+           !!!nack ('t347.1');
-           INSCOPE: for (reverse @{$self->{open_elements}}) {
-             if ($_->[1] eq 'p') {
-               !!!cp ('t351');
-               !!!back-token;
-               $token = {type => END_TAG_TOKEN, tag_name => 'p'};
-               redo B;
-             } elsif ({
-                       applet => 1, table => 1, caption => 1, td => 1, th => 1,
-                       button => 1, marquee => 1, object => 1, html => 1,
-                      }->{$_->[1]}) {
-               !!!cp ('t352');
-               last INSCOPE;
-             }
-           } # INSCOPE
-           !!!insert-element-t ($token->{tag_name}, $token->{attributes});
-           $self->{form_element} = $self->{open_elements}->[-1]->[0];
            !!!next-token;
-           redo B;
          }
-       } elsif ($token->{tag_name} eq 'li') {
+         next B;
+       } elsif ({li => 1, dt => 1, dd => 1}->{$token->{tag_name}}) {
          ## has a p element in scope
          INSCOPE: for (reverse @{$self->{open_elements}}) {
-           if ($_->[1] eq 'p') {
+           if ($_->[1] & P_EL) {
              !!!cp ('t353');
-             !!!back-token;
+             !!!back-token; # <x>
-             $token = {type => END_TAG_TOKEN, tag_name => 'p'};
+             $token = {type => END_TAG_TOKEN, tag_name => 'p',
-             redo B;
+                       line => $token->{line}, column => $token->{column}};
-           } elsif ({
+             next B;
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
+           } elsif ($_->[1] & SCOPING_EL) {
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$_->[1]}) {
              !!!cp ('t354');
              last INSCOPE;
            }
-Line 5661 
 sub _tree_construction_main ($) {
+Line 6856 
 sub _tree_construction_main ($) {
          ## Step 1
          my $i = -1;
          my $node = $self->{open_elements}->[$i];
+         my $li_or_dtdd = {li => {li => 1},
+                           dt => {dt => 1, dd => 1},
+                           dd => {dt => 1, dd => 1}}->{$token->{tag_name}};
          LI: {
            ## Step 2
-           if ($node->[1] eq 'li') {
+           if ($li_or_dtdd->{$node->[0]->manakai_local_name}) {
              if ($i != -1) {
                !!!cp ('t355');
-               !!!parse-error (type => 'end tag missing:'.
+               !!!parse-error (type => 'not closed',
-                               $self->{open_elements}->[-1]->[1]);
+                               text => $self->{open_elements}->[-1]->[0]
+                                   ->manakai_local_name,
+                               token => $token);
              } else {
                !!!cp ('t356');
              }
-Line 5678 
 sub _tree_construction_main ($) {
+Line 6878 
 sub _tree_construction_main ($) {
            }
            ## Step 3
-           if (not $formatting_category->{$node->[1]} and
+           if (not ($node->[1] & FORMATTING_EL) and
                #not $phrasing_category->{$node->[1]} and
-               ($special_category->{$node->[1]} or
+               ($node->[1] & SPECIAL_EL or
-                $scoping_category->{$node->[1]}) and
+                $node->[1] & SCOPING_EL) and
-               $node->[1] ne 'address' and $node->[1] ne 'div') {
+               not ($node->[1] & ADDRESS_EL) and
+               not ($node->[1] & DIV_EL)) {
              !!!cp ('t358');
              last LI;
            }
-Line 5694 
 sub _tree_construction_main ($) {
+Line 6895 
 sub _tree_construction_main ($) {
            redo LI;
          } # LI
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
+         !!!insert-element-t ($token->{tag_name}, $token->{attributes}, $token);
+         !!!nack ('t359.1');
          !!!next-token;
-         redo B;
+         next B;
-       } elsif ($token->{tag_name} eq 'dd' or $token->{tag_name} eq 'dt') {
-         ## has a p element in scope
-         INSCOPE: for (reverse @{$self->{open_elements}}) {
-           if ($_->[1] eq 'p') {
-             !!!cp ('t360');
-             !!!back-token;
-             $token = {type => END_TAG_TOKEN, tag_name => 'p'};
-             redo B;
-           } elsif ({
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$_->[1]}) {
-             !!!cp ('t361');
-             last INSCOPE;
-           }
-         } # INSCOPE
-         ## Step 1
-         my $i = -1;
-         my $node = $self->{open_elements}->[$i];
-         LI: {
-           ## Step 2
-           if ($node->[1] eq 'dt' or $node->[1] eq 'dd') {
-             if ($i != -1) {
-               !!!cp ('t362');
-               !!!parse-error (type => 'end tag missing:'.
-                               $self->{open_elements}->[-1]->[1]);
-             } else {
-               !!!cp ('t363');
-             }
-             splice @{$self->{open_elements}}, $i;
-             last LI;
-           } else {
-             !!!cp ('t364');
-           }
-           ## Step 3
-           if (not $formatting_category->{$node->[1]} and
-               #not $phrasing_category->{$node->[1]} and
-               ($special_category->{$node->[1]} or
-                $scoping_category->{$node->[1]}) and
-               $node->[1] ne 'address' and $node->[1] ne 'div') {
-             !!!cp ('t365');
-             last LI;
-           }
-           !!!cp ('t366');
-           ## Step 4
-           $i--;
-           $node = $self->{open_elements}->[$i];
-           redo LI;
-         } # LI
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
-         !!!next-token;
-         redo B;
        } elsif ($token->{tag_name} eq 'plaintext') {
          ## has a p element in scope
          INSCOPE: for (reverse @{$self->{open_elements}}) {
-           if ($_->[1] eq 'p') {
+           if ($_->[1] & P_EL) {
              !!!cp ('t367');
-             !!!back-token;
+             !!!back-token; # <plaintext>
-             $token = {type => END_TAG_TOKEN, tag_name => 'p'};
+             $token = {type => END_TAG_TOKEN, tag_name => 'p',
-             redo B;
+                       line => $token->{line}, column => $token->{column}};
-           } elsif ({
+             next B;
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
+           } elsif ($_->[1] & SCOPING_EL) {
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$_->[1]}) {
              !!!cp ('t368');
              last INSCOPE;
            }
          } # INSCOPE
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
+         !!!insert-element-t ($token->{tag_name}, $token->{attributes}, $token);
          $self->{content_model} = PLAINTEXT_CONTENT_MODEL;
+         !!!nack ('t368.1');
          !!!next-token;
-         redo B;
+         next B;
        } elsif ($token->{tag_name} eq 'a') {
          AFE: for my $i (reverse 0..$#$active_formatting_elements) {
            my $node = $active_formatting_elements->[$i];
-           if ($node->[1] eq 'a') {
+           if ($node->[1] & A_EL) {
              !!!cp ('t371');
-             !!!parse-error (type => 'in a:a');
+             !!!parse-error (type => 'in a:a', token => $token);
-             !!!back-token;
+             !!!back-token; # <a>
-             $token = {type => END_TAG_TOKEN, tag_name => 'a'};
+             $token = {type => END_TAG_TOKEN, tag_name => 'a',
-             $formatting_end_tag->($token->{tag_name});
+                       line => $token->{line}, column => $token->{column}};
+             $formatting_end_tag->($token);
              AFE2: for (reverse 0..$#$active_formatting_elements) {
                if ($active_formatting_elements->[$_]->[0] eq $node->[0]) {
-Line 5810 
 sub _tree_construction_main ($) {
+Line 6956 
 sub _tree_construction_main ($) {
          $reconstruct_active_formatting_elements->($insert_to_current);
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
+         !!!insert-element-t ($token->{tag_name}, $token->{attributes}, $token);
          push @$active_formatting_elements, $self->{open_elements}->[-1];
+         !!!nack ('t374.1');
          !!!next-token;
-         redo B;
+         next B;
-       } elsif ({
-                 b => 1, big => 1, em => 1, font => 1, i => 1,
-                 s => 1, small => 1, strile => 1,
-                 strong => 1, tt => 1, u => 1,
-                }->{$token->{tag_name}}) {
-         !!!cp ('t375');
-         $reconstruct_active_formatting_elements->($insert_to_current);
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
-         push @$active_formatting_elements, $self->{open_elements}->[-1];
-         !!!next-token;
-         redo B;
        } elsif ($token->{tag_name} eq 'nobr') {
          $reconstruct_active_formatting_elements->($insert_to_current);
          ## has a |nobr| element in scope
          INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
            my $node = $self->{open_elements}->[$_];
-           if ($node->[1] eq 'nobr') {
+           if ($node->[1] & NOBR_EL) {
              !!!cp ('t376');
-             !!!parse-error (type => 'in nobr:nobr');
+             !!!parse-error (type => 'in nobr:nobr', token => $token);
-             !!!back-token;
+             !!!back-token; # <nobr>
-             $token = {type => END_TAG_TOKEN, tag_name => 'nobr'};
+             $token = {type => END_TAG_TOKEN, tag_name => 'nobr',
-             redo B;
+                       line => $token->{line}, column => $token->{column}};
-           } elsif ({
+             next B;
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
+           } elsif ($node->[1] & SCOPING_EL) {
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$node->[1]}) {
              !!!cp ('t377');
              last INSCOPE;
            }
          } # INSCOPE
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
+         !!!insert-element-t ($token->{tag_name}, $token->{attributes}, $token);
          push @$active_formatting_elements, $self->{open_elements}->[-1];
+         !!!nack ('t377.1');
          !!!next-token;
-         redo B;
+         next B;
        } elsif ($token->{tag_name} eq 'button') {
          ## has a button element in scope
          INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
            my $node = $self->{open_elements}->[$_];
-           if ($node->[1] eq 'button') {
+           if ($node->[1] & BUTTON_EL) {
              !!!cp ('t378');
-             !!!parse-error (type => 'in button:button');
+             !!!parse-error (type => 'in button:button', token => $token);
-             !!!back-token;
+             !!!back-token; # <button>
-             $token = {type => END_TAG_TOKEN, tag_name => 'button'};
+             $token = {type => END_TAG_TOKEN, tag_name => 'button',
-             redo B;
+                       line => $token->{line}, column => $token->{column}};
-           } elsif ({
+             next B;
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
+           } elsif ($node->[1] & SCOPING_EL) {
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$node->[1]}) {
              !!!cp ('t379');
              last INSCOPE;
            }
-Line 5875 
 sub _tree_construction_main ($) {
+Line 7006 
 sub _tree_construction_main ($) {
          $reconstruct_active_formatting_elements->($insert_to_current);
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
+         !!!insert-element-t ($token->{tag_name}, $token->{attributes}, $token);
          ## TODO: associate with $self->{form_element} if defined
          push @$active_formatting_elements, ['#marker', ''];
+         !!!nack ('t379.1');
          !!!next-token;
-         redo B;
+         next B;
-       } elsif ({
-                 applet => 1, marquee => 1, object => 1,
-                }->{$token->{tag_name}}) {
-         !!!cp ('t380');
-         $reconstruct_active_formatting_elements->($insert_to_current);
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
-         push @$active_formatting_elements, ['#marker', ''];
-         !!!next-token;
-         redo B;
-       } elsif ($token->{tag_name} eq 'xmp') {
-         !!!cp ('t381');
-         $reconstruct_active_formatting_elements->($insert_to_current);
-         $parse_rcdata->(CDATA_CONTENT_MODEL);
-         redo B;
-       } elsif ($token->{tag_name} eq 'table') {
-         ## has a p element in scope
-         INSCOPE: for (reverse @{$self->{open_elements}}) {
-           if ($_->[1] eq 'p') {
-             !!!cp ('t382');
-             !!!back-token;
-             $token = {type => END_TAG_TOKEN, tag_name => 'p'};
-             redo B;
-           } elsif ({
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$_->[1]}) {
-             !!!cp ('t383');
-             last INSCOPE;
-           }
-         } # INSCOPE
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
-         push @{$open_tables}, [$self->{open_elements}->[-1]->[0]];
-         $self->{insertion_mode} = IN_TABLE_IM;
-         !!!next-token;
-         redo B;
        } elsif ({
-                 area => 1, basefont => 1, bgsound => 1, br => 1,
+                 xmp => 1,
-                 embed => 1, img => 1, param => 1, spacer => 1, wbr => 1,
+                 iframe => 1,
-                 image => 1,
+                 noembed => 1,
+                 noframes => 1, ## NOTE: This is an "as if in head" code clone.
+                 noscript => 0, ## TODO: 1 if scripting is enabled
                 }->{$token->{tag_name}}) {
-         if ($token->{tag_name} eq 'image') {
+         if ($token->{tag_name} eq 'xmp') {
-           !!!cp ('t384');
+           !!!cp ('t381');
-           !!!parse-error (type => 'image');
+           $reconstruct_active_formatting_elements->($insert_to_current);
-           $token->{tag_name} = 'img';
          } else {
-           !!!cp ('t385');
+           !!!cp ('t399');
          }
+         ## NOTE: There is an "as if in body" code clone.
-         ## NOTE: There is an "as if <br>" code clone.
+         $parse_rcdata->(CDATA_CONTENT_MODEL);
-         $reconstruct_active_formatting_elements->($insert_to_current);
+         next B;
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
-         pop @{$self->{open_elements}};
-         !!!next-token;
-         redo B;
-       } elsif ($token->{tag_name} eq 'hr') {
-         ## has a p element in scope
-         INSCOPE: for (reverse @{$self->{open_elements}}) {
-           if ($_->[1] eq 'p') {
-             !!!cp ('t386');
-             !!!back-token;
-             $token = {type => END_TAG_TOKEN, tag_name => 'p'};
-             redo B;
-           } elsif ({
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$_->[1]}) {
-             !!!cp ('t387');
-             last INSCOPE;
-           }
-         } # INSCOPE
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
-         pop @{$self->{open_elements}};
-         !!!next-token;
-         redo B;
-       } elsif ($token->{tag_name} eq 'input') {
-         !!!cp ('t388');
-         $reconstruct_active_formatting_elements->($insert_to_current);
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
-         ## TODO: associate with $self->{form_element} if defined
-         pop @{$self->{open_elements}};
-         !!!next-token;
-         redo B;
        } elsif ($token->{tag_name} eq 'isindex') {
-         !!!parse-error (type => 'isindex');
+         !!!parse-error (type => 'isindex', token => $token);
          if (defined $self->{form_element}) {
            !!!cp ('t389');
            ## Ignore the token
+           !!!nack ('t389'); ## NOTE: Not acknowledged.
            !!!next-token;
-           redo B;
+           next B;
          } else {
+           !!!ack ('t391.1');
            my $at = $token->{attributes};
            my $form_attrs;
            $form_attrs->{action} = $at->{action} if $at->{action};
-Line 5994 
 sub _tree_construction_main ($) {
+Line 7052 
 sub _tree_construction_main ($) {
            delete $at->{prompt};
            my @tokens = (
                          {type => START_TAG_TOKEN, tag_name => 'form',
-                          attributes => $form_attrs},
+                          attributes => $form_attrs,
-                         {type => START_TAG_TOKEN, tag_name => 'hr'},
+                          line => $token->{line}, column => $token->{column}},
-                         {type => START_TAG_TOKEN, tag_name => 'p'},
+                         {type => START_TAG_TOKEN, tag_name => 'hr',
-                         {type => START_TAG_TOKEN, tag_name => 'label'},
+                          line => $token->{line}, column => $token->{column}},
+                         {type => START_TAG_TOKEN, tag_name => 'p',
+                          line => $token->{line}, column => $token->{column}},
+                         {type => START_TAG_TOKEN, tag_name => 'label',
+                          line => $token->{line}, column => $token->{column}},
                         );
            if ($prompt_attr) {
              !!!cp ('t390');
-             push @tokens, {type => CHARACTER_TOKEN, data => $prompt_attr->{value}};
+             push @tokens, {type => CHARACTER_TOKEN, data => $prompt_attr->{value},
+                            #line => $token->{line}, column => $token->{column},
+                           };
            } else {
              !!!cp ('t391');
              push @tokens, {type => CHARACTER_TOKEN,
-                            data => 'This is a searchable index. Insert your search keywords here: '}; # SHOULD
+                            data => 'This is a searchable index. Insert your search keywords here: ',
+                            #line => $token->{line}, column => $token->{column},
+                           }; # SHOULD
              ## TODO: make this configurable
            }
            push @tokens,
-                         {type => START_TAG_TOKEN, tag_name => 'input', attributes => $at},
+                         {type => START_TAG_TOKEN, tag_name => 'input', attributes => $at,
+                          line => $token->{line}, column => $token->{column}},
                          #{type => CHARACTER_TOKEN, data => ''}, # SHOULD
-                         {type => END_TAG_TOKEN, tag_name => 'label'},
+                         {type => END_TAG_TOKEN, tag_name => 'label',
-                         {type => END_TAG_TOKEN, tag_name => 'p'},
+                          line => $token->{line}, column => $token->{column}},
-                         {type => START_TAG_TOKEN, tag_name => 'hr'},
+                         {type => END_TAG_TOKEN, tag_name => 'p',
-                         {type => END_TAG_TOKEN, tag_name => 'form'};
+                          line => $token->{line}, column => $token->{column}},
-           $token = shift @tokens;
+                         {type => START_TAG_TOKEN, tag_name => 'hr',
+                          line => $token->{line}, column => $token->{column}},
+                         {type => END_TAG_TOKEN, tag_name => 'form',
+                          line => $token->{line}, column => $token->{column}};
            !!!back-token (@tokens);
-           redo B;
+           !!!next-token;
+           next B;
          }
        } elsif ($token->{tag_name} eq 'textarea') {
          my $tag_name = $token->{tag_name};
          my $el;
-         !!!create-element ($el, $token->{tag_name}, $token->{attributes});
+         !!!create-element ($el, $HTML_NS, $token->{tag_name}, $token->{attributes}, $token);
          ## TODO: $self->{form_element} if defined
          $self->{content_model} = RCDATA_CONTENT_MODEL;
-Line 6031 
 sub _tree_construction_main ($) {
+Line 7102 
 sub _tree_construction_main ($) {
          $insert->($el);
          my $text = '';
+         !!!nack ('t392.1');
          !!!next-token;
          if ($token->{type} == CHARACTER_TOKEN) {
            $token->{data} =~ s/^\x0A//;
-Line 6061 
 sub _tree_construction_main ($) {
+Line 7133 
 sub _tree_construction_main ($) {
            ## Ignore the token
          } else {
            !!!cp ('t398');
-           !!!parse-error (type => 'in RCDATA:#'.$token->{type});
+           !!!parse-error (type => 'in RCDATA:#eof', token => $token);
          }
          !!!next-token;
+         next B;
+       } elsif ($token->{tag_name} eq 'rt' or
+                $token->{tag_name} eq 'rp') {
+         ## has a |ruby| element in scope
+         INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
+           my $node = $self->{open_elements}->[$_];
+           if ($node->[1] & RUBY_EL) {
+             !!!cp ('t398.1');
+             ## generate implied end tags
+             while ($self->{open_elements}->[-1]->[1] & END_TAG_OPTIONAL_EL) {
+               !!!cp ('t398.2');
+               pop @{$self->{open_elements}};
+             }
+             unless ($self->{open_elements}->[-1]->[1] & RUBY_EL) {
+               !!!cp ('t398.3');
+               !!!parse-error (type => 'not closed',
+                               text => $self->{open_elements}->[-1]->[0]
+                                   ->manakai_local_name,
+                               token => $token);
+               pop @{$self->{open_elements}}
+                   while not $self->{open_elements}->[-1]->[1] & RUBY_EL;
+             }
+             last INSCOPE;
+           } elsif ($node->[1] & SCOPING_EL) {
+             !!!cp ('t398.4');
+             last INSCOPE;
+           }
+         } # INSCOPE
+         !!!insert-element-t ($token->{tag_name}, $token->{attributes}, $token);
+         !!!nack ('t398.5');
+         !!!next-token;
          redo B;
-       } elsif ({
+       } elsif ($token->{tag_name} eq 'math' or
-                 iframe => 1,
+                $token->{tag_name} eq 'svg') {
-                 noembed => 1,
-                 noframes => 1,
-                 noscript => 0, ## TODO: 1 if scripting is enabled
-                }->{$token->{tag_name}}) {
-         !!!cp ('t399');
-         ## NOTE: There is an "as if in body" code clone.
-         $parse_rcdata->(CDATA_CONTENT_MODEL);
-         redo B;
-       } elsif ($token->{tag_name} eq 'select') {
-         !!!cp ('t400');
          $reconstruct_active_formatting_elements->($insert_to_current);
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
-         ## TODO: associate with $self->{form_element} if defined
+         ## "Adjust MathML attributes" ('math' only) - done in insert-element-f
+         ## "adjust SVG attributes" ('svg' only) - done in insert-element-f
+         ## "adjust foreign attributes" - done in insert-element-f
-         if ($self->{insertion_mode} & TABLE_IMS or
+         !!!insert-element-f ($token->{tag_name} eq 'math' ? $MML_NS : $SVG_NS, $token->{tag_name}, $token->{attributes}, $token);
-             $self->{insertion_mode} & BODY_TABLE_IMS or
-             $self->{insertion_mode} == IN_COLUMN_GROUP_IM) {
+         if ($self->{self_closing}) {
-           !!!cp ('t400.1');
+           pop @{$self->{open_elements}};
-           $self->{insertion_mode} = IN_SELECT_IN_TABLE_IM;
+           !!!ack ('t398.1');
          } else {
-           !!!cp ('t400.2');
+           !!!cp ('t398.2');
-           $self->{insertion_mode} = IN_SELECT_IM;
+           $self->{insertion_mode} |= IN_FOREIGN_CONTENT_IM;
+           ## NOTE: |<body><math><mi><svg>| -> "in foreign content" insertion
+           ## mode, "in body" (not "in foreign content") secondary insertion
+           ## mode, maybe.
          }
          !!!next-token;
-         redo B;
+         next B;
        } elsif ({
                  caption => 1, col => 1, colgroup => 1, frame => 1,
                  frameset => 1, head => 1, option => 1, optgroup => 1,
-Line 6101 
 sub _tree_construction_main ($) {
+Line 7202 
 sub _tree_construction_main ($) {
                  thead => 1, tr => 1,
                 }->{$token->{tag_name}}) {
          !!!cp ('t401');
-         !!!parse-error (type => 'in body:'.$token->{tag_name});
+         !!!parse-error (type => 'in body',
+                         text => $token->{tag_name}, token => $token);
          ## Ignore the token
+         !!!nack ('t401.1'); ## NOTE: |<col/>| or |<frame/>| here is an error.
          !!!next-token;
-         redo B;
+         next B;
          ## ISSUE: An issue on HTML5 new elements in the spec.
        } else {
-         !!!cp ('t402');
+         if ($token->{tag_name} eq 'image') {
+           !!!cp ('t384');
+           !!!parse-error (type => 'image', token => $token);
+           $token->{tag_name} = 'img';
+         } else {
+           !!!cp ('t385');
+         }
+         ## NOTE: There is an "as if <br>" code clone.
          $reconstruct_active_formatting_elements->($insert_to_current);
-         !!!insert-element-t ($token->{tag_name}, $token->{attributes});
+         !!!insert-element-t ($token->{tag_name}, $token->{attributes}, $token);
+         if ({
+              applet => 1, marquee => 1, object => 1,
+             }->{$token->{tag_name}}) {
+           !!!cp ('t380');
+           push @$active_formatting_elements, ['#marker', ''];
+           !!!nack ('t380.1');
+         } elsif ({
+                   b => 1, big => 1, em => 1, font => 1, i => 1,
+                   s => 1, small => 1, strile => 1,
+                   strong => 1, tt => 1, u => 1,
+                  }->{$token->{tag_name}}) {
+           !!!cp ('t375');
+           push @$active_formatting_elements, $self->{open_elements}->[-1];
+           !!!nack ('t375.1');
+         } elsif ($token->{tag_name} eq 'input') {
+           !!!cp ('t388');
+           ## TODO: associate with $self->{form_element} if defined
+           pop @{$self->{open_elements}};
+           !!!ack ('t388.2');
+         } elsif ({
+                   area => 1, basefont => 1, bgsound => 1, br => 1,
+                   embed => 1, img => 1, param => 1, spacer => 1, wbr => 1,
+                   #image => 1,
+                  }->{$token->{tag_name}}) {
+           !!!cp ('t388.1');
+           pop @{$self->{open_elements}};
+           !!!ack ('t388.3');
+         } elsif ($token->{tag_name} eq 'select') {
+           ## TODO: associate with $self->{form_element} if defined
+           if ($self->{insertion_mode} & TABLE_IMS or
+               $self->{insertion_mode} & BODY_TABLE_IMS or
+               $self->{insertion_mode} == IN_COLUMN_GROUP_IM) {
+             !!!cp ('t400.1');
+             $self->{insertion_mode} = IN_SELECT_IN_TABLE_IM;
+           } else {
+             !!!cp ('t400.2');
+             $self->{insertion_mode} = IN_SELECT_IM;
+           }
+           !!!nack ('t400.3');
+         } else {
+           !!!nack ('t402');
+         }
          !!!next-token;
-         redo B;
+         next B;
        }
      } elsif ($token->{type} == END_TAG_TOKEN) {
        if ($token->{tag_name} eq 'body') {
-         if (@{$self->{open_elements}} > 1 and
+         ## has a |body| element in scope
-             $self->{open_elements}->[1]->[1] eq 'body') {
+         my $i;
-           for (@{$self->{open_elements}}) {
+         INSCOPE: {
-             unless ({
+           for (reverse @{$self->{open_elements}}) {
-                        dd => 1, dt => 1, li => 1, p => 1, td => 1,
+             if ($_->[1] & BODY_EL) {
-                        th => 1, tr => 1, body => 1, html => 1,
+               !!!cp ('t405');
-                      tbody => 1, tfoot => 1, thead => 1,
+               $i = $_;
-                     }->{$_->[1]}) {
+               last INSCOPE;
-               !!!cp ('t403');
+             } elsif ($_->[1] & SCOPING_EL) {
-               !!!parse-error (type => 'not closed:'.$_->[1]);
+               !!!cp ('t405.1');
-             } else {
+               last;
-               !!!cp ('t404');
              }
            }
-           $self->{insertion_mode} = AFTER_BODY_IM;
+           !!!parse-error (type => 'start tag not allowed',
-           !!!next-token;
+                           text => $token->{tag_name}, token => $token);
-           redo B;
+           ## NOTE: Ignore the token.
-         } else {
-           !!!cp ('t405');
-           !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
-           ## Ignore the token
            !!!next-token;
-           redo B;
+           next B;
+         } # INSCOPE
+         for (@{$self->{open_elements}}) {
+           unless ($_->[1] & ALL_END_TAG_OPTIONAL_EL) {
+             !!!cp ('t403');
+             !!!parse-error (type => 'not closed',
+                             text => $_->[0]->manakai_local_name,
+                             token => $token);
+             last;
+           } else {
+             !!!cp ('t404');
+           }
          }
+         $self->{insertion_mode} = AFTER_BODY_IM;
+         !!!next-token;
+         next B;
        } elsif ($token->{tag_name} eq 'html') {
-         if (@{$self->{open_elements}} > 1 and $self->{open_elements}->[1]->[1] eq 'body') {
+         ## TODO: Update this code.  It seems that the code below is not
+         ## up-to-date, though it has the same effect as specified.
+         if (@{$self->{open_elements}} > 1 and
+             $self->{open_elements}->[1]->[1] & BODY_EL) {
            ## ISSUE: There is an issue in the spec.
-           if ($self->{open_elements}->[-1]->[1] ne 'body') {
+           unless ($self->{open_elements}->[-1]->[1] & BODY_EL) {
              !!!cp ('t406');
-             !!!parse-error (type => 'not closed:'.$self->{open_elements}->[1]->[1]);
+             !!!parse-error (type => 'not closed',
+                             text => $self->{open_elements}->[1]->[0]
+                                 ->manakai_local_name,
+                             token => $token);
            } else {
              !!!cp ('t407');
            }
            $self->{insertion_mode} = AFTER_BODY_IM;
            ## reprocess
-           redo B;
+           next B;
          } else {
            !!!cp ('t408');
-           !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+           !!!parse-error (type => 'unmatched end tag',
+                           text => $token->{tag_name}, token => $token);
            ## Ignore the token
            !!!next-token;
-           redo B;
+           next B;
          }
        } elsif ({
                  address => 1, blockquote => 1, center => 1, dir => 1,
-Line 6173 
 sub _tree_construction_main ($) {
+Line 7346 
 sub _tree_construction_main ($) {
          my $i;
          INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
            my $node = $self->{open_elements}->[$_];
-           if ($node->[1] eq $token->{tag_name}) {
+           if ($node->[0]->manakai_local_name eq $token->{tag_name}) {
              !!!cp ('t410');
              $i = $_;
              last INSCOPE;
-           } elsif ({
+           } elsif ($node->[1] & SCOPING_EL) {
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$node->[1]}) {
              !!!cp ('t411');
              last INSCOPE;
            }
-Line 6188 
 sub _tree_construction_main ($) {
+Line 7358 
 sub _tree_construction_main ($) {
          unless (defined $i) { # has an element in scope
            !!!cp ('t413');
-           !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+           !!!parse-error (type => 'unmatched end tag',
+                           text => $token->{tag_name}, token => $token);
+           ## NOTE: Ignore the token.
          } else {
            ## Step 1. generate implied end tags
            while ({
+                   ## END_TAG_OPTIONAL_EL
                    dd => ($token->{tag_name} ne 'dd'),
                    dt => ($token->{tag_name} ne 'dt'),
                    li => ($token->{tag_name} ne 'li'),
                    p => 1,
-                  }->{$self->{open_elements}->[-1]->[1]}) {
+                   rt => 1,
+                   rp => 1,
+                  }->{$self->{open_elements}->[-1]->[0]->manakai_local_name}) {
              !!!cp ('t409');
              pop @{$self->{open_elements}};
            }
            ## Step 2.
-           if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) {
+           if ($self->{open_elements}->[-1]->[0]->manakai_local_name
+                   ne $token->{tag_name}) {
              !!!cp ('t412');
-             !!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]);
+             !!!parse-error (type => 'not closed',
+                             text => $self->{open_elements}->[-1]->[0]
+                                 ->manakai_local_name,
+                             token => $token);
            } else {
              !!!cp ('t414');
            }
-Line 6219 
 sub _tree_construction_main ($) {
+Line 7398 
 sub _tree_construction_main ($) {
                }->{$token->{tag_name}};
          }
          !!!next-token;
-         redo B;
+         next B;
        } elsif ($token->{tag_name} eq 'form') {
          undef $self->{form_element};
-Line 6227 
 sub _tree_construction_main ($) {
+Line 7406 
 sub _tree_construction_main ($) {
          my $i;
          INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
            my $node = $self->{open_elements}->[$_];
-           if ($node->[1] eq $token->{tag_name}) {
+           if ($node->[1] & FORM_EL) {
              !!!cp ('t418');
              $i = $_;
              last INSCOPE;
-           } elsif ({
+           } elsif ($node->[1] & SCOPING_EL) {
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$node->[1]}) {
              !!!cp ('t419');
              last INSCOPE;
            }
-Line 6242 
 sub _tree_construction_main ($) {
+Line 7418 
 sub _tree_construction_main ($) {
          unless (defined $i) { # has an element in scope
            !!!cp ('t421');
-           !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+           !!!parse-error (type => 'unmatched end tag',
+                           text => $token->{tag_name}, token => $token);
+           ## NOTE: Ignore the token.
          } else {
            ## Step 1. generate implied end tags
-           while ({
+           while ($self->{open_elements}->[-1]->[1] & END_TAG_OPTIONAL_EL) {
-                   dd => 1, dt => 1, li => 1, p => 1,
-                  }->{$self->{open_elements}->[-1]->[1]}) {
              !!!cp ('t417');
              pop @{$self->{open_elements}};
            }
            ## Step 2.
-           if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) {
+           if ($self->{open_elements}->[-1]->[0]->manakai_local_name
+                   ne $token->{tag_name}) {
              !!!cp ('t417.1');
-             !!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]);
+             !!!parse-error (type => 'not closed',
+                             text => $self->{open_elements}->[-1]->[0]
+                                 ->manakai_local_name,
+                             token => $token);
            } else {
              !!!cp ('t420');
            }
-Line 6265 
 sub _tree_construction_main ($) {
+Line 7445 
 sub _tree_construction_main ($) {
          }
          !!!next-token;
-         redo B;
+         next B;
        } elsif ({
                  h1 => 1, h2 => 1, h3 => 1, h4 => 1, h5 => 1, h6 => 1,
                 }->{$token->{tag_name}}) {
-Line 6273 
 sub _tree_construction_main ($) {
+Line 7453 
 sub _tree_construction_main ($) {
          my $i;
          INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
            my $node = $self->{open_elements}->[$_];
-           if ({
+           if ($node->[1] & HEADING_EL) {
-                h1 => 1, h2 => 1, h3 => 1, h4 => 1, h5 => 1, h6 => 1,
-               }->{$node->[1]}) {
              !!!cp ('t423');
              $i = $_;
              last INSCOPE;
-           } elsif ({
+           } elsif ($node->[1] & SCOPING_EL) {
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$node->[1]}) {
              !!!cp ('t424');
              last INSCOPE;
            }
-Line 6290 
 sub _tree_construction_main ($) {
+Line 7465 
 sub _tree_construction_main ($) {
          unless (defined $i) { # has an element in scope
            !!!cp ('t425.1');
-           !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+           !!!parse-error (type => 'unmatched end tag',
+                           text => $token->{tag_name}, token => $token);
+           ## NOTE: Ignore the token.
          } else {
            ## Step 1. generate implied end tags
-           while ({
+           while ($self->{open_elements}->[-1]->[1] & END_TAG_OPTIONAL_EL) {
-                   dd => 1, dt => 1, li => 1, p => 1,
-                  }->{$self->{open_elements}->[-1]->[1]}) {
              !!!cp ('t422');
              pop @{$self->{open_elements}};
            }
            ## Step 2.
-           if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) {
+           if ($self->{open_elements}->[-1]->[0]->manakai_local_name
+                   ne $token->{tag_name}) {
              !!!cp ('t425');
-             !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+             !!!parse-error (type => 'unmatched end tag',
+                             text => $token->{tag_name}, token => $token);
            } else {
              !!!cp ('t426');
            }
-Line 6313 
 sub _tree_construction_main ($) {
+Line 7490 
 sub _tree_construction_main ($) {
          }
          !!!next-token;
-         redo B;
+         next B;
        } elsif ($token->{tag_name} eq 'p') {
          ## has an element in scope
          my $i;
          INSCOPE: for (reverse 0..$#{$self->{open_elements}}) {
            my $node = $self->{open_elements}->[$_];
-           if ($node->[1] eq $token->{tag_name}) {
+           if ($node->[1] & P_EL) {
              !!!cp ('t410.1');
              $i = $_;
              last INSCOPE;
-           } elsif ({
+           } elsif ($node->[1] & SCOPING_EL) {
-                     applet => 1, table => 1, caption => 1, td => 1, th => 1,
-                     button => 1, marquee => 1, object => 1, html => 1,
-                    }->{$node->[1]}) {
              !!!cp ('t411.1');
              last INSCOPE;
            }
          } # INSCOPE
          if (defined $i) {
-           if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) {
+           if ($self->{open_elements}->[-1]->[0]->manakai_local_name
+                   ne $token->{tag_name}) {
              !!!cp ('t412.1');
-             !!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]);
+             !!!parse-error (type => 'not closed',
+                             text => $self->{open_elements}->[-1]->[0]
+                                 ->manakai_local_name,
+                             token => $token);
            } else {
              !!!cp ('t414.1');
            }
-Line 6343 
 sub _tree_construction_main ($) {
+Line 7521 
 sub _tree_construction_main ($) {
            splice @{$self->{open_elements}}, $i;
          } else {
            !!!cp ('t413.1');
-           !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+           !!!parse-error (type => 'unmatched end tag',
+                           text => $token->{tag_name}, token => $token);
            !!!cp ('t415.1');
            ## As if <p>, then reprocess the current token
            my $el;
-           !!!create-element ($el, 'p');
+           !!!create-element ($el, $HTML_NS, 'p',, $token);
            $insert->($el);
            ## NOTE: Not inserted into |$self->{open_elements}|.
          }
          !!!next-token;
-         redo B;
+         next B;
        } elsif ({
                  a => 1,
                  b => 1, big => 1, em => 1, font => 1, i => 1,
-Line 6362 
 sub _tree_construction_main ($) {
+Line 7541 
 sub _tree_construction_main ($) {
                  strong => 1, tt => 1, u => 1,
                 }->{$token->{tag_name}}) {
          !!!cp ('t427');
-         $formatting_end_tag->($token->{tag_name});
+         $formatting_end_tag->($token);
-         redo B;
+         next B;
        } elsif ($token->{tag_name} eq 'br') {
          !!!cp ('t428');
-         !!!parse-error (type => 'unmatched end tag:br');
+         !!!parse-error (type => 'unmatched end tag',
+                         text => 'br', token => $token);
          ## As if <br>
          $reconstruct_active_formatting_elements->($insert_to_current);
          my $el;
-         !!!create-element ($el, 'br');
+         !!!create-element ($el, $HTML_NS, 'br',, $token);
          $insert->($el);
          ## Ignore the token.
          !!!next-token;
-         redo B;
+         next B;
        } elsif ({
                  caption => 1, col => 1, colgroup => 1, frame => 1,
                  frameset => 1, head => 1, option => 1, optgroup => 1,
-Line 6391 
 sub _tree_construction_main ($) {
+Line 7571 
 sub _tree_construction_main ($) {
                  noscript => 0, ## TODO: if scripting is enabled
                 }->{$token->{tag_name}}) {
          !!!cp ('t429');
-         !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+         !!!parse-error (type => 'unmatched end tag',
+                         text => $token->{tag_name}, token => $token);
          ## Ignore the token
          !!!next-token;
-         redo B;
+         next B;
          ## ISSUE: Issue on HTML5 new elements in spec
-Line 6405 
 sub _tree_construction_main ($) {
+Line 7586 
 sub _tree_construction_main ($) {
          ## Step 2
          S2: {
-           if ($node->[1] eq $token->{tag_name}) {
+           if ($node->[0]->manakai_local_name eq $token->{tag_name}) {
              ## Step 1
              ## generate implied end tags
-             while ({
+             while ($self->{open_elements}->[-1]->[1] & END_TAG_OPTIONAL_EL) {
-                     dd => 1, dt => 1, li => 1, p => 1,
-                    }->{$self->{open_elements}->[-1]->[1]}) {
                !!!cp ('t430');
-               ## ISSUE: Can this case be reached?
+               ## NOTE: |<ruby><rt></ruby>|.
+               ## ISSUE: <ruby><rt></rt> will also take this code path,
+               ## which seems wrong.
                pop @{$self->{open_elements}};
+               $node_i++;
              }
              ## Step 2
-             if ($token->{tag_name} ne $self->{open_elements}->[-1]->[1]) {
+             if ($self->{open_elements}->[-1]->[0]->manakai_local_name
+                     ne $token->{tag_name}) {
                !!!cp ('t431');
                ## NOTE: <x><y></x>
-               !!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]);
+               !!!parse-error (type => 'not closed',
+                               text => $self->{open_elements}->[-1]->[0]
+                                   ->manakai_local_name,
+                               token => $token);
              } else {
                !!!cp ('t432');
              }
              ## Step 3
-             splice @{$self->{open_elements}}, $node_i;
+             splice @{$self->{open_elements}}, $node_i if $node_i < 0;
              !!!next-token;
              last S2;
            } else {
              ## Step 3
-             if (not $formatting_category->{$node->[1]} and
+             if (not ($node->[1] & FORMATTING_EL) and
                  #not $phrasing_category->{$node->[1]} and
-                 ($special_category->{$node->[1]} or
+                 ($node->[1] & SPECIAL_EL or
-                  $scoping_category->{$node->[1]})) {
+                  $node->[1] & SCOPING_EL)) {
                !!!cp ('t433');
-               !!!parse-error (type => 'unmatched end tag:'.$token->{tag_name});
+               !!!parse-error (type => 'unmatched end tag',
+                               text => $token->{tag_name}, token => $token);
                ## Ignore the token
                !!!next-token;
                last S2;
-Line 6453 
 sub _tree_construction_main ($) {
+Line 7640 
 sub _tree_construction_main ($) {
            ## Step 5;
            redo S2;
          } # S2
-         redo B;
+         next B;
        }
      }
-     redo B;
+     next B;
+   } continue { # B
+     if ($self->{insertion_mode} & IN_FOREIGN_CONTENT_IM) {
+       ## NOTE: The code below is executed in cases where it does not have
+       ## to be, but it is harmless even in those cases.
+       ## has an element in scope
+       INSCOPE: {
+         for (reverse 0..$#{$self->{open_elements}}) {
+           my $node = $self->{open_elements}->[$_];
+           if ($node->[1] & FOREIGN_EL) {
+             last INSCOPE;
+           } elsif ($node->[1] & SCOPING_EL) {
+             last;
+           }
+         }
+         ## NOTE: No foreign element in scope.
+         $self->{insertion_mode} &= ~ IN_FOREIGN_CONTENT_IM;
+       } # INSCOPE
+     }
    } # B
    ## Stop parsing # MUST
-Line 6464 
 sub _tree_construction_main ($) {
+Line 7670 
 sub _tree_construction_main ($) {
    ## TODO: script stuffs
  } # _tree_construction_main
- sub set_inner_html ($$$) {
+ sub set_inner_html ($$$;$) {
    my $class = shift;
    my $node = shift;
    my $s = \$_[0];
    my $onerror = $_[1];
+   my $get_wrapper = $_[2] || sub ($) { return $_[0] };
    ## ISSUE: Should {confident} be true?
-Line 6487 
 sub set_inner_html ($$$) {
+Line 7694 
 sub set_inner_html ($$$) {
      }
      ## Step 3, 4, 5 # MUST
-     $class->parse_string ($$s => $node, $onerror);
+     $class->parse_char_string ($$s => $node, $onerror, $get_wrapper);
    } elsif ($nt == 1) {
      ## TODO: If non-html element
      ## NOTE: Most of this code is copied from |parse_string|
+ ## TODO: Support for $get_wrapper
      ## Step 1 # MUST
      my $this_doc = $node->owner_document;
      my $doc = $this_doc->implementation->create_document;
-Line 6502 
 sub set_inner_html ($$$) {
+Line 7711 
 sub set_inner_html ($$$) {
      ## Step 8 # MUST
      my $i = 0;
-     my $line = 1;
+     $p->{line_prev} = $p->{line} = 1;
-     my $column = 0;
+     $p->{column_prev} = $p->{column} = 0;
      $p->{set_next_char} = sub {
        my $self = shift;
-Line 6512 
 sub set_inner_html ($$$) {
+Line 7721 
 sub set_inner_html ($$$) {
        $self->{next_char} = -1 and return if $i >= length $$s;
        $self->{next_char} = ord substr $$s, $i++, 1;
-       $column++;
+       ($p->{line_prev}, $p->{column_prev}) = ($p->{line}, $p->{column});
+       $p->{column}++;
        if ($self->{next_char} == 0x000A) { # LF
-         $line++;
+         $p->{line}++;
-         $column = 0;
+         $p->{column} = 0;
          !!!cp ('i1');
        } elsif ($self->{next_char} == 0x000D) { # CR
          $i++ if substr ($$s, $i, 1) eq "\x0A";
          $self->{next_char} = 0x000A; # LF # MUST
-         $line++;
+         $p->{line}++;
-         $column = 0;
+         $p->{column} = 0;
          !!!cp ('i2');
        } elsif ($self->{next_char} > 0x10FFFF) {
          $self->{next_char} = 0xFFFD; # REPLACEMENT CHARACTER # MUST
-Line 6531 
 sub set_inner_html ($$$) {
+Line 7742 
 sub set_inner_html ($$$) {
          !!!cp ('i4');
          !!!parse-error (type => 'NULL');
          $self->{next_char} = 0xFFFD; # REPLACEMENT CHARACTER # MUST
+       } elsif ($self->{next_char} <= 0x0008 or
+                (0x000E <= $self->{next_char} and
+                 $self->{next_char} <= 0x001F) or
+                (0x007F <= $self->{next_char} and
+                 $self->{next_char} <= 0x009F) or
+                (0xD800 <= $self->{next_char} and
+                 $self->{next_char} <= 0xDFFF) or
+                (0xFDD0 <= $self->{next_char} and
+                 $self->{next_char} <= 0xFDDF) or
+                {
+                 0xFFFE => 1, 0xFFFF => 1, 0x1FFFE => 1, 0x1FFFF => 1,
+                 0x2FFFE => 1, 0x2FFFF => 1, 0x3FFFE => 1, 0x3FFFF => 1,
+                 0x4FFFE => 1, 0x4FFFF => 1, 0x5FFFE => 1, 0x5FFFF => 1,
+                 0x6FFFE => 1, 0x6FFFF => 1, 0x7FFFE => 1, 0x7FFFF => 1,
+                 0x8FFFE => 1, 0x8FFFF => 1, 0x9FFFE => 1, 0x9FFFF => 1,
+                 0xAFFFE => 1, 0xAFFFF => 1, 0xBFFFE => 1, 0xBFFFF => 1,
+                 0xCFFFE => 1, 0xCFFFF => 1, 0xDFFFE => 1, 0xDFFFF => 1,
+                 0xEFFFE => 1, 0xEFFFF => 1, 0xFFFFE => 1, 0xFFFFF => 1,
+                 0x10FFFE => 1, 0x10FFFF => 1,
+                }->{$self->{next_char}}) {
+         !!!cp ('i4.1');
+         if ($self->{next_char} < 0x10000) {
+           !!!parse-error (type => 'control char',
+                           text => (sprintf 'U+%04X', $self->{next_char}));
+         } else {
+           !!!parse-error (type => 'control char',
+                           text => (sprintf 'U-%08X', $self->{next_char}));
+         }
        }
      };
      $p->{prev_char} = [-1, -1, -1];
-Line 6538 
 sub set_inner_html ($$$) {
+Line 7777 
 sub set_inner_html ($$$) {
      my $ponerror = $onerror || sub {
        my (%opt) = @_;
-       warn "Parse error ($opt{type}) at line $opt{line} column $opt{column}\n";
+       my $line = $opt{line};
+       my $column = $opt{column};
+       if (defined $opt{token} and defined $opt{token}->{line}) {
+         $line = $opt{token}->{line};
+         $column = $opt{token}->{column};
+       }
+       warn "Parse error ($opt{type}) at line $line column $column\n";
      };
      $p->{parse_error} = sub {
-       $ponerror->(@_, line => $line, column => $column);
+       $ponerror->(line => $p->{line}, column => $p->{column}, @_);
      };
      $p->_initialize_tokenizer;
-Line 6565 
 sub set_inner_html ($$$) {
+Line 7810 
 sub set_inner_html ($$$) {
          unless defined $p->{content_model};
          ## ISSUE: What is "the name of the element"? local name?
-     $p->{inner_html_node} = [$node, $node_ln];
+     $p->{inner_html_node} = [$node, $el_category->{$node_ln}];
+       ## TODO: Foreign element OK?
      ## Step 3
      my $root = $doc->create_element_ns
-Line 6575 
 sub set_inner_html ($$$) {
+Line 7821 
 sub set_inner_html ($$$) {
      $doc->append_child ($root);
      ## Step 5 # MUST
-     push @{$p->{open_elements}}, [$root, 'html'];
+     push @{$p->{open_elements}}, [$root, $el_category->{html}];
      undef $p->{head_element};
-Line 6621 
 sub set_inner_html ($$$) {
+Line 7867 
 sub set_inner_html ($$$) {
      ## ISSUE: mutation events?
      $p->_terminate_tree_constructor;
+     delete $p->{parse_error}; # delete loop
    } else {
      die "$0: |set_inner_html| is not defined for node of type $nt";
    }

 Legend:



Removed from v.1.106
 


changed lines


 
Added in v.1.170
 Legend:



Removed from v.1.106
 


changed lines


 
Added in v.1.170
-Removed from v.1.106
+Added in v.1.170

admin@suikawiki.org	ViewVC Help
Powered by ViewVC 1.1.24