| 303 |
sub ROW_IMS () { 0b10000000 } |
sub ROW_IMS () { 0b10000000 } |
| 304 |
sub BODY_AFTER_IMS () { 0b100000000 } |
sub BODY_AFTER_IMS () { 0b100000000 } |
| 305 |
sub FRAME_IMS () { 0b1000000000 } |
sub FRAME_IMS () { 0b1000000000 } |
| 306 |
|
sub SELECT_IMS () { 0b10000000000 } |
| 307 |
|
|
| 308 |
## NOTE: "initial" and "before html" insertion modes have no constants. |
## NOTE: "initial" and "before html" insertion modes have no constants. |
| 309 |
|
|
| 326 |
sub AFTER_BODY_IM () { BODY_AFTER_IMS } |
sub AFTER_BODY_IM () { BODY_AFTER_IMS } |
| 327 |
sub IN_FRAMESET_IM () { FRAME_IMS | 0b01 } |
sub IN_FRAMESET_IM () { FRAME_IMS | 0b01 } |
| 328 |
sub AFTER_FRAMESET_IM () { FRAME_IMS | 0b10 } |
sub AFTER_FRAMESET_IM () { FRAME_IMS | 0b10 } |
| 329 |
sub IN_SELECT_IM () { 0b01 } |
sub IN_SELECT_IM () { SELECT_IMS | 0b01 } |
| 330 |
|
sub IN_SELECT_IN_TABLE_IM () { SELECT_IMS | 0b10 } |
| 331 |
sub IN_COLUMN_GROUP_IM () { 0b10 } |
sub IN_COLUMN_GROUP_IM () { 0b10 } |
| 332 |
|
|
| 333 |
## Implementations MUST act as if state machine in the spec |
## Implementations MUST act as if state machine in the spec |
| 2745 |
|
|
| 2746 |
## Step 3 |
## Step 3 |
| 2747 |
S3: { |
S3: { |
|
## ISSUE: Oops! "If node is the first node in the stack of open |
|
|
## elements, then set last to true. If the context element of the |
|
|
## HTML fragment parsing algorithm is neither a td element nor a |
|
|
## th element, then set node to the context element. (fragment case)": |
|
|
## The second "if" is in the scope of the first "if"!? |
|
| 2748 |
if ($self->{open_elements}->[0]->[0] eq $node->[0]) { |
if ($self->{open_elements}->[0]->[0] eq $node->[0]) { |
| 2749 |
$last = 1; |
$last = 1; |
| 2750 |
if (defined $self->{inner_html_node}) { |
if (defined $self->{inner_html_node}) { |
| 2905 |
!!!cp ('t39'); |
!!!cp ('t39'); |
| 2906 |
}; # $clear_up_to_marker |
}; # $clear_up_to_marker |
| 2907 |
|
|
| 2908 |
my $parse_rcdata = sub ($$) { |
my $insert; |
| 2909 |
my ($content_model_flag, $insert) = @_; |
|
| 2910 |
|
my $parse_rcdata = sub ($) { |
| 2911 |
|
my ($content_model_flag) = @_; |
| 2912 |
|
|
| 2913 |
## Step 1 |
## Step 1 |
| 2914 |
my $start_tag_name = $token->{tag_name}; |
my $start_tag_name = $token->{tag_name}; |
| 2916 |
!!!create-element ($el, $start_tag_name, $token->{attributes}); |
!!!create-element ($el, $start_tag_name, $token->{attributes}); |
| 2917 |
|
|
| 2918 |
## Step 2 |
## Step 2 |
| 2919 |
$insert->($el); # /context node/->append_child ($el) |
$insert->($el); |
| 2920 |
|
|
| 2921 |
## Step 3 |
## Step 3 |
| 2922 |
$self->{content_model} = $content_model_flag; # CDATA or RCDATA |
$self->{content_model} = $content_model_flag; # CDATA or RCDATA |
| 2946 |
$token->{tag_name} eq $start_tag_name) { |
$token->{tag_name} eq $start_tag_name) { |
| 2947 |
!!!cp ('t42'); |
!!!cp ('t42'); |
| 2948 |
## Ignore the token |
## Ignore the token |
|
} elsif ($content_model_flag == CDATA_CONTENT_MODEL) { |
|
|
!!!cp ('t43'); |
|
|
!!!parse-error (type => 'in CDATA:#'.$token->{type}); |
|
|
} elsif ($content_model_flag == RCDATA_CONTENT_MODEL) { |
|
|
!!!cp ('t44'); |
|
|
!!!parse-error (type => 'in RCDATA:#'.$token->{type}); |
|
| 2949 |
} else { |
} else { |
| 2950 |
die "$0: $content_model_flag in parse_rcdata"; |
## NOTE: An end-of-file token. |
| 2951 |
|
if ($content_model_flag == CDATA_CONTENT_MODEL) { |
| 2952 |
|
!!!cp ('t43'); |
| 2953 |
|
!!!parse-error (type => 'in CDATA:#'.$token->{type}); |
| 2954 |
|
} elsif ($content_model_flag == RCDATA_CONTENT_MODEL) { |
| 2955 |
|
!!!cp ('t44'); |
| 2956 |
|
!!!parse-error (type => 'in RCDATA:#'.$token->{type}); |
| 2957 |
|
} else { |
| 2958 |
|
die "$0: $content_model_flag in parse_rcdata"; |
| 2959 |
|
} |
| 2960 |
} |
} |
| 2961 |
!!!next-token; |
!!!next-token; |
| 2962 |
}; # $parse_rcdata |
}; # $parse_rcdata |
| 2963 |
|
|
| 2964 |
my $script_start_tag = sub ($) { |
my $script_start_tag = sub () { |
|
my $insert = $_[0]; |
|
| 2965 |
my $script_el; |
my $script_el; |
| 2966 |
!!!create-element ($script_el, 'script', $token->{attributes}); |
!!!create-element ($script_el, 'script', $token->{attributes}); |
| 2967 |
## TODO: mark as "parser-inserted" |
## TODO: mark as "parser-inserted" |
| 3012 |
!!!next-token; |
!!!next-token; |
| 3013 |
}; # $script_start_tag |
}; # $script_start_tag |
| 3014 |
|
|
| 3015 |
|
## NOTE: $open_tables->[-1]->[0] is the "current table" element node. |
| 3016 |
|
## NOTE: $open_tables->[-1]->[1] is the "tainted" flag. |
| 3017 |
|
my $open_tables = [[$self->{open_elements}->[0]->[0]]]; |
| 3018 |
|
|
| 3019 |
my $formatting_end_tag = sub { |
my $formatting_end_tag = sub { |
| 3020 |
my $tag_name = shift; |
my $tag_name = shift; |
| 3021 |
|
|
| 3022 |
|
## NOTE: The adoptioon agency algorithm (AAA). |
| 3023 |
|
|
| 3024 |
FET: { |
FET: { |
| 3025 |
## Step 1 |
## Step 1 |
| 3026 |
my $formatting_element; |
my $formatting_element; |
| 3174 |
} # S7 |
} # S7 |
| 3175 |
|
|
| 3176 |
## Step 8 |
## Step 8 |
| 3177 |
$common_ancestor_node->[0]->append_child ($last_node->[0]); |
if ({ |
| 3178 |
|
table => 1, tbody => 1, tfoot => 1, thead => 1, tr => 1, |
| 3179 |
|
}->{$common_ancestor_node->[1]}) { |
| 3180 |
|
my $foster_parent_element; |
| 3181 |
|
my $next_sibling; |
| 3182 |
|
OE: for (reverse 0..$#{$self->{open_elements}}) { |
| 3183 |
|
if ($self->{open_elements}->[$_]->[1] eq 'table') { |
| 3184 |
|
my $parent = $self->{open_elements}->[$_]->[0]->parent_node; |
| 3185 |
|
if (defined $parent and $parent->node_type == 1) { |
| 3186 |
|
!!!cp ('t65.1'); |
| 3187 |
|
$foster_parent_element = $parent; |
| 3188 |
|
$next_sibling = $self->{open_elements}->[$_]->[0]; |
| 3189 |
|
} else { |
| 3190 |
|
!!!cp ('t65.2'); |
| 3191 |
|
$foster_parent_element |
| 3192 |
|
= $self->{open_elements}->[$_ - 1]->[0]; |
| 3193 |
|
} |
| 3194 |
|
last OE; |
| 3195 |
|
} |
| 3196 |
|
} # OE |
| 3197 |
|
$foster_parent_element = $self->{open_elements}->[0]->[0] |
| 3198 |
|
unless defined $foster_parent_element; |
| 3199 |
|
$foster_parent_element->insert_before ($last_node->[0], $next_sibling); |
| 3200 |
|
$open_tables->[-1]->[1] = 1; # tainted |
| 3201 |
|
} else { |
| 3202 |
|
!!!cp ('t65.3'); |
| 3203 |
|
$common_ancestor_node->[0]->append_child ($last_node->[0]); |
| 3204 |
|
} |
| 3205 |
|
|
| 3206 |
## Step 9 |
## Step 9 |
| 3207 |
my $clone = [$formatting_element->[0]->clone_node (0), |
my $clone = [$formatting_element->[0]->clone_node (0), |
| 3247 |
} # FET |
} # FET |
| 3248 |
}; # $formatting_end_tag |
}; # $formatting_end_tag |
| 3249 |
|
|
| 3250 |
my $insert_to_current = sub { |
$insert = my $insert_to_current = sub { |
| 3251 |
$self->{open_elements}->[-1]->[0]->append_child ($_[0]); |
$self->{open_elements}->[-1]->[0]->append_child ($_[0]); |
| 3252 |
}; # $insert_to_current |
}; # $insert_to_current |
| 3253 |
|
|
| 3254 |
my $insert_to_foster = sub { |
my $insert_to_foster = sub { |
| 3255 |
my $child = shift; |
my $child = shift; |
| 3256 |
if ({ |
if ({ |
| 3257 |
table => 1, tbody => 1, tfoot => 1, |
table => 1, tbody => 1, tfoot => 1, thead => 1, tr => 1, |
| 3258 |
thead => 1, tr => 1, |
}->{$self->{open_elements}->[-1]->[1]}) { |
| 3259 |
}->{$self->{open_elements}->[-1]->[1]}) { |
# MUST |
| 3260 |
# MUST |
my $foster_parent_element; |
| 3261 |
my $foster_parent_element; |
my $next_sibling; |
|
my $next_sibling; |
|
| 3262 |
OE: for (reverse 0..$#{$self->{open_elements}}) { |
OE: for (reverse 0..$#{$self->{open_elements}}) { |
| 3263 |
if ($self->{open_elements}->[$_]->[1] eq 'table') { |
if ($self->{open_elements}->[$_]->[1] eq 'table') { |
| 3264 |
my $parent = $self->{open_elements}->[$_]->[0]->parent_node; |
my $parent = $self->{open_elements}->[$_]->[0]->parent_node; |
| 3278 |
unless defined $foster_parent_element; |
unless defined $foster_parent_element; |
| 3279 |
$foster_parent_element->insert_before |
$foster_parent_element->insert_before |
| 3280 |
($child, $next_sibling); |
($child, $next_sibling); |
| 3281 |
} else { |
$open_tables->[-1]->[1] = 1; # tainted |
| 3282 |
!!!cp ('t72'); |
} else { |
| 3283 |
$self->{open_elements}->[-1]->[0]->append_child ($child); |
!!!cp ('t72'); |
| 3284 |
} |
$self->{open_elements}->[-1]->[0]->append_child ($child); |
| 3285 |
|
} |
| 3286 |
}; # $insert_to_foster |
}; # $insert_to_foster |
| 3287 |
|
|
|
my $insert; |
|
|
|
|
| 3288 |
B: { |
B: { |
| 3289 |
if ($token->{type} == DOCTYPE_TOKEN) { |
if ($token->{type} == DOCTYPE_TOKEN) { |
| 3290 |
!!!cp ('t73'); |
!!!cp ('t73'); |
| 3299 |
# |
# |
| 3300 |
} else { |
} else { |
| 3301 |
## Generate implied end tags |
## Generate implied end tags |
| 3302 |
if ({ |
while ({ |
| 3303 |
dd => 1, dt => 1, li => 1, p => 1, td => 1, th => 1, tr => 1, |
dd => 1, dt => 1, li => 1, p => 1, |
| 3304 |
tbody => 1, tfoot=> 1, thead => 1, |
}->{$self->{open_elements}->[-1]->[1]}) { |
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
| 3305 |
!!!cp ('t75'); |
!!!cp ('t75'); |
| 3306 |
!!!back-token; |
pop @{$self->{open_elements}}; |
|
$token = {type => END_TAG_TOKEN, tag_name => $self->{open_elements}->[-1]->[1]}; |
|
|
redo B; |
|
| 3307 |
} |
} |
| 3308 |
|
|
| 3309 |
if (@{$self->{open_elements}} > 2 or |
if (@{$self->{open_elements}} > 2 or |
| 3369 |
} elsif ($self->{insertion_mode} & HEAD_IMS) { |
} elsif ($self->{insertion_mode} & HEAD_IMS) { |
| 3370 |
if ($token->{type} == CHARACTER_TOKEN) { |
if ($token->{type} == CHARACTER_TOKEN) { |
| 3371 |
if ($token->{data} =~ s/^([\x09\x0A\x0B\x0C\x20]+)//) { |
if ($token->{data} =~ s/^([\x09\x0A\x0B\x0C\x20]+)//) { |
| 3372 |
$self->{open_elements}->[-1]->[0]->manakai_append_text ($1); |
unless ($self->{insertion_mode} == BEFORE_HEAD_IM) { |
| 3373 |
|
!!!cp ('t88.2'); |
| 3374 |
|
$self->{open_elements}->[-1]->[0]->manakai_append_text ($1); |
| 3375 |
|
} else { |
| 3376 |
|
!!!cp ('t88.1'); |
| 3377 |
|
## Ignore the token. |
| 3378 |
|
!!!next-token; |
| 3379 |
|
redo B; |
| 3380 |
|
} |
| 3381 |
unless (length $token->{data}) { |
unless (length $token->{data}) { |
| 3382 |
!!!cp ('t88'); |
!!!cp ('t88'); |
| 3383 |
!!!next-token; |
!!!next-token; |
| 3478 |
} |
} |
| 3479 |
!!!insert-element ($token->{tag_name}, $token->{attributes}); |
!!!insert-element ($token->{tag_name}, $token->{attributes}); |
| 3480 |
pop @{$self->{open_elements}}; ## ISSUE: This step is missing in the spec. |
pop @{$self->{open_elements}}; ## ISSUE: This step is missing in the spec. |
| 3481 |
pop @{$self->{open_elements}} |
pop @{$self->{open_elements}} # <head> |
| 3482 |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
| 3483 |
!!!next-token; |
!!!next-token; |
| 3484 |
redo B; |
redo B; |
| 3493 |
} |
} |
| 3494 |
!!!insert-element ($token->{tag_name}, $token->{attributes}); |
!!!insert-element ($token->{tag_name}, $token->{attributes}); |
| 3495 |
pop @{$self->{open_elements}}; ## ISSUE: This step is missing in the spec. |
pop @{$self->{open_elements}}; ## ISSUE: This step is missing in the spec. |
| 3496 |
pop @{$self->{open_elements}} |
pop @{$self->{open_elements}} # <head> |
| 3497 |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
| 3498 |
!!!next-token; |
!!!next-token; |
| 3499 |
redo B; |
redo B; |
| 3554 |
} |
} |
| 3555 |
} |
} |
| 3556 |
|
|
| 3557 |
pop @{$self->{open_elements}} |
pop @{$self->{open_elements}} # <head> |
| 3558 |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
| 3559 |
!!!next-token; |
!!!next-token; |
| 3560 |
redo B; |
redo B; |
| 3578 |
## NOTE: There is a "as if in head" code clone. |
## NOTE: There is a "as if in head" code clone. |
| 3579 |
my $parent = defined $self->{head_element} ? $self->{head_element} |
my $parent = defined $self->{head_element} ? $self->{head_element} |
| 3580 |
: $self->{open_elements}->[-1]->[0]; |
: $self->{open_elements}->[-1]->[0]; |
| 3581 |
$parse_rcdata->(RCDATA_CONTENT_MODEL, |
$parse_rcdata->(RCDATA_CONTENT_MODEL); |
| 3582 |
sub { $parent->append_child ($_[0]) }); |
pop @{$self->{open_elements}} # <head> |
|
pop @{$self->{open_elements}} |
|
| 3583 |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
| 3584 |
redo B; |
redo B; |
| 3585 |
} elsif ($token->{tag_name} eq 'style') { |
} elsif ($token->{tag_name} eq 'style') { |
| 3593 |
} else { |
} else { |
| 3594 |
!!!cp ('t115'); |
!!!cp ('t115'); |
| 3595 |
} |
} |
| 3596 |
$parse_rcdata->(CDATA_CONTENT_MODEL, $insert_to_current); |
$parse_rcdata->(CDATA_CONTENT_MODEL); |
| 3597 |
pop @{$self->{open_elements}} |
pop @{$self->{open_elements}} # <head> |
| 3598 |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
| 3599 |
redo B; |
redo B; |
| 3600 |
} elsif ($token->{tag_name} eq 'noscript') { |
} elsif ($token->{tag_name} eq 'noscript') { |
| 3633 |
} |
} |
| 3634 |
|
|
| 3635 |
## NOTE: There is a "as if in head" code clone. |
## NOTE: There is a "as if in head" code clone. |
| 3636 |
$script_start_tag->($insert_to_current); |
$script_start_tag->(); |
| 3637 |
pop @{$self->{open_elements}} |
pop @{$self->{open_elements}} # <head> |
| 3638 |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
if $self->{insertion_mode} == AFTER_HEAD_IM; |
| 3639 |
redo B; |
redo B; |
| 3640 |
} elsif ($token->{tag_name} eq 'body' or |
} elsif ($token->{tag_name} eq 'body' or |
| 3922 |
} |
} |
| 3923 |
|
|
| 3924 |
## generate implied end tags |
## generate implied end tags |
| 3925 |
if ({ |
while ({ |
| 3926 |
dd => 1, dt => 1, li => 1, p => 1, |
dd => 1, dt => 1, li => 1, p => 1, |
| 3927 |
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
## NOTE: Maybe the following elements never appear here. |
|
|
td => 1, th => 1, tr => 1, |
|
|
tbody => 1, tfoot => 1, thead => 1, |
|
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
| 3928 |
!!!cp ('t158'); |
!!!cp ('t158'); |
| 3929 |
!!!back-token; # <?> |
pop @{$self->{open_elements}}; |
|
$token = {type => END_TAG_TOKEN, tag_name => 'caption'}; |
|
|
!!!back-token; |
|
|
$token = {type => END_TAG_TOKEN, |
|
|
tag_name => $self->{open_elements}->[-1]->[1]}; # MUST |
|
|
redo B; |
|
| 3930 |
} |
} |
| 3931 |
|
|
| 3932 |
if ($self->{open_elements}->[-1]->[1] ne 'caption') { |
if ($self->{open_elements}->[-1]->[1] ne 'caption') { |
| 3979 |
} |
} |
| 3980 |
|
|
| 3981 |
## generate implied end tags |
## generate implied end tags |
| 3982 |
if ({ |
while ({ |
| 3983 |
dd => 1, dt => 1, li => 1, p => 1, |
dd => 1, dt => 1, li => 1, p => 1, |
| 3984 |
td => ($token->{tag_name} eq 'th'), |
}->{$self->{open_elements}->[-1]->[1]}) { |
|
th => ($token->{tag_name} eq 'td'), |
|
|
|
|
|
## NOTE: Maybe the following elements never appear here. |
|
|
tr => 1, |
|
|
tbody => 1, tfoot => 1, thead => 1, |
|
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
| 3985 |
!!!cp ('t166'); |
!!!cp ('t166'); |
| 3986 |
!!!back-token; |
pop @{$self->{open_elements}}; |
|
$token = {type => END_TAG_TOKEN, |
|
|
tag_name => $self->{open_elements}->[-1]->[1]}; # MUST |
|
|
redo B; |
|
| 3987 |
} |
} |
| 3988 |
|
|
| 3989 |
if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) { |
if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) { |
| 3990 |
!!!cp ('t167'); |
!!!cp ('t167'); |
| 3991 |
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
| 4037 |
} |
} |
| 4038 |
|
|
| 4039 |
## generate implied end tags |
## generate implied end tags |
| 4040 |
if ({ |
while ({ |
| 4041 |
dd => 1, dt => 1, li => 1, p => 1, |
dd => 1, dt => 1, li => 1, p => 1, |
| 4042 |
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
## NOTE: The following elements never appear here, maybe. |
|
|
td => 1, th => 1, tr => 1, |
|
|
tbody => 1, tfoot => 1, thead => 1, |
|
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
| 4043 |
!!!cp ('t174'); |
!!!cp ('t174'); |
| 4044 |
!!!back-token; |
pop @{$self->{open_elements}}; |
|
$token = {type => END_TAG_TOKEN, |
|
|
tag_name => $self->{open_elements}->[-1]->[1]}; # MUST |
|
|
redo B; |
|
| 4045 |
} |
} |
| 4046 |
|
|
| 4047 |
if ($self->{open_elements}->[-1]->[1] ne 'caption') { |
if ($self->{open_elements}->[-1]->[1] ne 'caption') { |
| 4138 |
} |
} |
| 4139 |
|
|
| 4140 |
## generate implied end tags |
## generate implied end tags |
| 4141 |
if ({ |
while ({ |
| 4142 |
dd => 1, dt => 1, li => 1, p => 1, |
dd => 1, dt => 1, li => 1, p => 1, |
| 4143 |
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
## NOTE: The following elements never appear, maybe. |
|
|
td => 1, th => 1, tr => 1, |
|
|
tbody => 1, tfoot => 1, thead => 1, |
|
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
| 4144 |
!!!cp ('t187'); |
!!!cp ('t187'); |
| 4145 |
!!!back-token; # </table> |
pop @{$self->{open_elements}}; |
|
$token = {type => END_TAG_TOKEN, tag_name => 'caption'}; |
|
|
!!!back-token; |
|
|
$token = {type => END_TAG_TOKEN, |
|
|
tag_name => $self->{open_elements}->[-1]->[1]}; # MUST |
|
|
redo B; |
|
| 4146 |
} |
} |
| 4147 |
|
|
| 4148 |
if ($self->{open_elements}->[-1]->[1] ne 'caption') { |
if ($self->{open_elements}->[-1]->[1] ne 'caption') { |
| 4195 |
# |
# |
| 4196 |
} elsif ($self->{insertion_mode} & TABLE_IMS) { |
} elsif ($self->{insertion_mode} & TABLE_IMS) { |
| 4197 |
if ($token->{type} == CHARACTER_TOKEN) { |
if ($token->{type} == CHARACTER_TOKEN) { |
| 4198 |
if ($token->{data} =~ s/^([\x09\x0A\x0B\x0C\x20]+)//) { |
if (not $open_tables->[-1]->[1] and # tainted |
| 4199 |
$self->{open_elements}->[-1]->[0]->manakai_append_text ($1); |
$token->{data} =~ s/^([\x09\x0A\x0B\x0C\x20]+)//) { |
| 4200 |
|
$self->{open_elements}->[-1]->[0]->manakai_append_text ($1); |
| 4201 |
|
|
| 4202 |
unless (length $token->{data}) { |
unless (length $token->{data}) { |
| 4203 |
!!!cp ('t194'); |
!!!cp ('t194'); |
| 4204 |
!!!next-token; |
!!!next-token; |
| 4205 |
redo B; |
redo B; |
| 4206 |
} else { |
} else { |
| 4207 |
!!!cp ('t195'); |
!!!cp ('t195'); |
| 4208 |
} |
} |
| 4209 |
} |
} |
| 4210 |
|
|
| 4211 |
!!!parse-error (type => 'in table:#character'); |
!!!parse-error (type => 'in table:#character'); |
| 4212 |
|
|
| 4253 |
($self->{document}->create_text_node ($token->{data}), |
($self->{document}->create_text_node ($token->{data}), |
| 4254 |
$next_sibling); |
$next_sibling); |
| 4255 |
} |
} |
| 4256 |
} else { |
$open_tables->[-1]->[1] = 1; # tainted |
| 4257 |
!!!cp ('t200'); |
} else { |
| 4258 |
$self->{open_elements}->[-1]->[0]->manakai_append_text ($token->{data}); |
!!!cp ('t200'); |
| 4259 |
} |
$self->{open_elements}->[-1]->[0]->manakai_append_text ($token->{data}); |
| 4260 |
|
} |
| 4261 |
|
|
| 4262 |
!!!next-token; |
!!!next-token; |
| 4263 |
redo B; |
redo B; |
| 4264 |
} elsif ($token->{type} == START_TAG_TOKEN) { |
} elsif ($token->{type} == START_TAG_TOKEN) { |
| 4265 |
if ({ |
if ({ |
| 4266 |
tr => ($self->{insertion_mode} != IN_ROW_IM), |
tr => ($self->{insertion_mode} != IN_ROW_IM), |
| 4271 |
while ($self->{open_elements}->[-1]->[1] ne 'table' and |
while ($self->{open_elements}->[-1]->[1] ne 'table' and |
| 4272 |
$self->{open_elements}->[-1]->[1] ne 'html') { |
$self->{open_elements}->[-1]->[1] ne 'html') { |
| 4273 |
!!!cp ('t201'); |
!!!cp ('t201'); |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4274 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4275 |
} |
} |
| 4276 |
|
|
| 4291 |
}->{$self->{open_elements}->[-1]->[1]}) { |
}->{$self->{open_elements}->[-1]->[1]}) { |
| 4292 |
!!!cp ('t203'); |
!!!cp ('t203'); |
| 4293 |
## ISSUE: Can this case be reached? |
## ISSUE: Can this case be reached? |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4294 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4295 |
} |
} |
| 4296 |
|
|
| 4314 |
tr => 1, html => 1, |
tr => 1, html => 1, |
| 4315 |
}->{$self->{open_elements}->[-1]->[1]}) { |
}->{$self->{open_elements}->[-1]->[1]}) { |
| 4316 |
!!!cp ('t207'); |
!!!cp ('t207'); |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4317 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4318 |
} |
} |
| 4319 |
|
|
| 4364 |
}->{$self->{open_elements}->[-1]->[1]}) { |
}->{$self->{open_elements}->[-1]->[1]}) { |
| 4365 |
!!!cp ('t211'); |
!!!cp ('t211'); |
| 4366 |
## ISSUE: Can this case be reached? |
## ISSUE: Can this case be reached? |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4367 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4368 |
} |
} |
| 4369 |
|
|
| 4412 |
}->{$self->{open_elements}->[-1]->[1]}) { |
}->{$self->{open_elements}->[-1]->[1]}) { |
| 4413 |
!!!cp ('t217'); |
!!!cp ('t217'); |
| 4414 |
## ISSUE: Can this state be reached? |
## ISSUE: Can this state be reached? |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4415 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4416 |
} |
} |
| 4417 |
|
|
| 4435 |
$self->{open_elements}->[-1]->[1] ne 'html') { |
$self->{open_elements}->[-1]->[1] ne 'html') { |
| 4436 |
!!!cp ('t219'); |
!!!cp ('t219'); |
| 4437 |
## ISSUE: Can this state be reached? |
## ISSUE: Can this state be reached? |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4438 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4439 |
} |
} |
| 4440 |
|
|
| 4452 |
$self->{open_elements}->[-1]->[1] ne 'html') { |
$self->{open_elements}->[-1]->[1] ne 'html') { |
| 4453 |
!!!cp ('t220'); |
!!!cp ('t220'); |
| 4454 |
## ISSUE: Can this state be reached? |
## ISSUE: Can this state be reached? |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4455 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4456 |
} |
} |
| 4457 |
|
|
| 4501 |
} |
} |
| 4502 |
|
|
| 4503 |
## generate implied end tags |
## generate implied end tags |
| 4504 |
if ({ |
while ({ |
| 4505 |
dd => 1, dt => 1, li => 1, p => 1, |
dd => 1, dt => 1, li => 1, p => 1, |
| 4506 |
td => 1, th => 1, tr => 1, |
}->{$self->{open_elements}->[-1]->[1]}) { |
|
tbody => 1, tfoot=> 1, thead => 1, |
|
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
| 4507 |
!!!cp ('t224'); |
!!!cp ('t224'); |
| 4508 |
!!!back-token; # <table> |
pop @{$self->{open_elements}}; |
|
$token = {type => END_TAG_TOKEN, tag_name => 'table'}; |
|
|
!!!back-token; |
|
|
$token = {type => END_TAG_TOKEN, |
|
|
tag_name => $self->{open_elements}->[-1]->[1]}; # MUST |
|
|
redo B; |
|
| 4509 |
} |
} |
| 4510 |
|
|
| 4511 |
if ($self->{open_elements}->[-1]->[1] ne 'table') { |
if ($self->{open_elements}->[-1]->[1] ne 'table') { |
| 4517 |
} |
} |
| 4518 |
|
|
| 4519 |
splice @{$self->{open_elements}}, $i; |
splice @{$self->{open_elements}}, $i; |
| 4520 |
|
pop @{$open_tables}; |
| 4521 |
|
|
| 4522 |
$self->_reset_insertion_mode; |
$self->_reset_insertion_mode; |
| 4523 |
|
|
| 4524 |
## reprocess |
## reprocess |
| 4525 |
redo B; |
redo B; |
| 4526 |
|
} elsif ($token->{tag_name} eq 'style') { |
| 4527 |
|
if (not $open_tables->[-1]->[1]) { # tainted |
| 4528 |
|
!!!cp ('t227.8'); |
| 4529 |
|
## NOTE: This is a "as if in head" code clone. |
| 4530 |
|
$parse_rcdata->(CDATA_CONTENT_MODEL); |
| 4531 |
|
redo B; |
| 4532 |
|
} else { |
| 4533 |
|
!!!cp ('t227.7'); |
| 4534 |
|
# |
| 4535 |
|
} |
| 4536 |
|
} elsif ($token->{tag_name} eq 'script') { |
| 4537 |
|
if (not $open_tables->[-1]->[1]) { # tainted |
| 4538 |
|
!!!cp ('t227.6'); |
| 4539 |
|
## NOTE: This is a "as if in head" code clone. |
| 4540 |
|
$script_start_tag->(); |
| 4541 |
|
redo B; |
| 4542 |
|
} else { |
| 4543 |
|
!!!cp ('t227.5'); |
| 4544 |
|
# |
| 4545 |
|
} |
| 4546 |
|
} elsif ($token->{tag_name} eq 'input') { |
| 4547 |
|
if (not $open_tables->[-1]->[1]) { # tainted |
| 4548 |
|
if ($token->{attributes}->{type}) { ## TODO: case |
| 4549 |
|
my $type = lc $token->{attributes}->{type}->{value}; |
| 4550 |
|
if ($type eq 'hidden') { |
| 4551 |
|
!!!cp ('t227.3'); |
| 4552 |
|
!!!parse-error (type => 'in table:'.$token->{tag_name}); |
| 4553 |
|
|
| 4554 |
|
!!!insert-element ($token->{tag_name}, $token->{attributes}); |
| 4555 |
|
|
| 4556 |
|
## TODO: form element pointer |
| 4557 |
|
|
| 4558 |
|
pop @{$self->{open_elements}}; |
| 4559 |
|
|
| 4560 |
|
!!!next-token; |
| 4561 |
|
redo B; |
| 4562 |
|
} else { |
| 4563 |
|
!!!cp ('t227.2'); |
| 4564 |
|
# |
| 4565 |
|
} |
| 4566 |
|
} else { |
| 4567 |
|
!!!cp ('t227.1'); |
| 4568 |
|
# |
| 4569 |
|
} |
| 4570 |
|
} else { |
| 4571 |
|
!!!cp ('t227.4'); |
| 4572 |
|
# |
| 4573 |
|
} |
| 4574 |
} else { |
} else { |
| 4575 |
!!!cp ('t227'); |
!!!cp ('t227'); |
|
!!!parse-error (type => 'in table:'.$token->{tag_name}); |
|
|
|
|
|
$insert = $insert_to_foster; |
|
| 4576 |
# |
# |
| 4577 |
} |
} |
| 4578 |
|
|
| 4579 |
|
!!!parse-error (type => 'in table:'.$token->{tag_name}); |
| 4580 |
|
|
| 4581 |
|
$insert = $insert_to_foster; |
| 4582 |
|
# |
| 4583 |
} elsif ($token->{type} == END_TAG_TOKEN) { |
} elsif ($token->{type} == END_TAG_TOKEN) { |
| 4584 |
if ($token->{tag_name} eq 'tr' and |
if ($token->{tag_name} eq 'tr' and |
| 4585 |
$self->{insertion_mode} == IN_ROW_IM) { |
$self->{insertion_mode} == IN_ROW_IM) { |
| 4614 |
}->{$self->{open_elements}->[-1]->[1]}) { |
}->{$self->{open_elements}->[-1]->[1]}) { |
| 4615 |
!!!cp ('t231'); |
!!!cp ('t231'); |
| 4616 |
## ISSUE: Can this state be reached? |
## ISSUE: Can this state be reached? |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4617 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4618 |
} |
} |
| 4619 |
|
|
| 4654 |
}->{$self->{open_elements}->[-1]->[1]}) { |
}->{$self->{open_elements}->[-1]->[1]}) { |
| 4655 |
!!!cp ('t236'); |
!!!cp ('t236'); |
| 4656 |
## ISSUE: Can this state be reached? |
## ISSUE: Can this state be reached? |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4657 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4658 |
} |
} |
| 4659 |
|
|
| 4693 |
tbody => 1, tfoot => 1, thead => 1, html => 1, |
tbody => 1, tfoot => 1, thead => 1, html => 1, |
| 4694 |
}->{$self->{open_elements}->[-1]->[1]}) { |
}->{$self->{open_elements}->[-1]->[1]}) { |
| 4695 |
!!!cp ('t240'); |
!!!cp ('t240'); |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4696 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4697 |
} |
} |
| 4698 |
|
|
| 4708 |
## reprocess in the "in table" insertion mode... |
## reprocess in the "in table" insertion mode... |
| 4709 |
} |
} |
| 4710 |
|
|
| 4711 |
|
## NOTE: </table> in the "in table" insertion mode. |
| 4712 |
|
## When you edit the code fragment below, please ensure that |
| 4713 |
|
## the code for <table> in the "in table" insertion mode |
| 4714 |
|
## is synced with it. |
| 4715 |
|
|
| 4716 |
## have a table element in table scope |
## have a table element in table scope |
| 4717 |
my $i; |
my $i; |
| 4718 |
INSCOPE: for (reverse 0..$#{$self->{open_elements}}) { |
INSCOPE: for (reverse 0..$#{$self->{open_elements}}) { |
| 4735 |
!!!next-token; |
!!!next-token; |
| 4736 |
redo B; |
redo B; |
| 4737 |
} |
} |
|
|
|
|
## generate implied end tags |
|
|
if ({ |
|
|
dd => 1, dt => 1, li => 1, p => 1, |
|
|
td => 1, th => 1, tr => 1, |
|
|
tbody => 1, tfoot=> 1, thead => 1, |
|
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
|
!!!cp ('t244'); |
|
|
## ISSUE: Can this case be reached? |
|
|
!!!back-token; |
|
|
$token = {type => END_TAG_TOKEN, |
|
|
tag_name => $self->{open_elements}->[-1]->[1]}; # MUST |
|
|
redo B; |
|
|
} |
|
|
|
|
|
if ($self->{open_elements}->[-1]->[1] ne 'table') { |
|
|
!!!cp ('t245'); |
|
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
|
} else { |
|
|
!!!cp ('t246'); |
|
|
} |
|
| 4738 |
|
|
| 4739 |
splice @{$self->{open_elements}}, $i; |
splice @{$self->{open_elements}}, $i; |
| 4740 |
|
pop @{$open_tables}; |
| 4741 |
|
|
| 4742 |
$self->_reset_insertion_mode; |
$self->_reset_insertion_mode; |
| 4743 |
|
|
| 4801 |
}->{$self->{open_elements}->[-1]->[1]}) { |
}->{$self->{open_elements}->[-1]->[1]}) { |
| 4802 |
!!!cp ('t253'); |
!!!cp ('t253'); |
| 4803 |
## ISSUE: Can this case be reached? |
## ISSUE: Can this case be reached? |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4804 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4805 |
} |
} |
| 4806 |
|
|
| 4838 |
}->{$self->{open_elements}->[-1]->[1]}) { |
}->{$self->{open_elements}->[-1]->[1]}) { |
| 4839 |
!!!cp ('t257'); |
!!!cp ('t257'); |
| 4840 |
## ISSUE: Can this case be reached? |
## ISSUE: Can this case be reached? |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
|
| 4841 |
pop @{$self->{open_elements}}; |
pop @{$self->{open_elements}}; |
| 4842 |
} |
} |
| 4843 |
|
|
| 4933 |
## reprocess |
## reprocess |
| 4934 |
redo B; |
redo B; |
| 4935 |
} |
} |
| 4936 |
} elsif ($self->{insertion_mode} == IN_SELECT_IM) { |
} elsif ($self->{insertion_mode} & SELECT_IMS) { |
| 4937 |
if ($token->{type} == CHARACTER_TOKEN) { |
if ($token->{type} == CHARACTER_TOKEN) { |
| 4938 |
!!!cp ('t271'); |
!!!cp ('t271'); |
| 4939 |
$self->{open_elements}->[-1]->[0]->manakai_append_text ($token->{data}); |
$self->{open_elements}->[-1]->[0]->manakai_append_text ($token->{data}); |
| 4972 |
!!!insert-element ($token->{tag_name}, $token->{attributes}); |
!!!insert-element ($token->{tag_name}, $token->{attributes}); |
| 4973 |
!!!next-token; |
!!!next-token; |
| 4974 |
redo B; |
redo B; |
| 4975 |
} elsif ($token->{tag_name} eq 'select') { |
} elsif ($token->{tag_name} eq 'select' or |
| 4976 |
## TODO: The type below is not good - <select> is replaced by </select> |
$token->{tag_name} eq 'input' or |
| 4977 |
!!!parse-error (type => 'not closed:select'); |
($self->{insertion_mode} == IN_SELECT_IN_TABLE_IM and |
| 4978 |
## As if </select> instead |
{ |
| 4979 |
|
caption => 1, table => 1, |
| 4980 |
|
tbody => 1, tfoot => 1, thead => 1, |
| 4981 |
|
tr => 1, td => 1, th => 1, |
| 4982 |
|
}->{$token->{tag_name}})) { |
| 4983 |
|
## TODO: The type below is not good - <select> is replaced by </select> |
| 4984 |
|
!!!parse-error (type => 'not closed:select'); |
| 4985 |
|
## NOTE: As if the token were </select> (<select> case) or |
| 4986 |
|
## as if there were </select> (otherwise). |
| 4987 |
## have an element in table scope |
## have an element in table scope |
| 4988 |
my $i; |
my $i; |
| 4989 |
INSCOPE: for (reverse 0..$#{$self->{open_elements}}) { |
INSCOPE: for (reverse 0..$#{$self->{open_elements}}) { |
| 4990 |
my $node = $self->{open_elements}->[$_]; |
my $node = $self->{open_elements}->[$_]; |
| 4991 |
if ($node->[1] eq $token->{tag_name}) { |
if ($node->[1] eq 'select') { |
| 4992 |
!!!cp ('t278'); |
!!!cp ('t278'); |
| 4993 |
$i = $_; |
$i = $_; |
| 4994 |
last INSCOPE; |
last INSCOPE; |
| 5012 |
|
|
| 5013 |
$self->_reset_insertion_mode; |
$self->_reset_insertion_mode; |
| 5014 |
|
|
| 5015 |
!!!next-token; |
if ($token->{tag_name} eq 'select') { |
| 5016 |
redo B; |
!!!cp ('t281.2'); |
| 5017 |
|
!!!next-token; |
| 5018 |
|
redo B; |
| 5019 |
|
} else { |
| 5020 |
|
!!!cp ('t281.1'); |
| 5021 |
|
## Reprocess the token. |
| 5022 |
|
redo B; |
| 5023 |
|
} |
| 5024 |
} else { |
} else { |
| 5025 |
!!!cp ('t282'); |
!!!cp ('t282'); |
| 5026 |
!!!parse-error (type => 'in select:'.$token->{tag_name}); |
!!!parse-error (type => 'in select:'.$token->{tag_name}); |
| 5087 |
|
|
| 5088 |
!!!next-token; |
!!!next-token; |
| 5089 |
redo B; |
redo B; |
| 5090 |
} elsif ({ |
} elsif ($self->{insertion_mode} == IN_SELECT_IN_TABLE_IM and |
| 5091 |
caption => 1, table => 1, tbody => 1, |
{ |
| 5092 |
tfoot => 1, thead => 1, tr => 1, td => 1, th => 1, |
caption => 1, table => 1, tbody => 1, |
| 5093 |
}->{$token->{tag_name}}) { |
tfoot => 1, thead => 1, tr => 1, td => 1, th => 1, |
| 5094 |
|
}->{$token->{tag_name}}) { |
| 5095 |
## TODO: The following is wrong? |
## TODO: The following is wrong? |
| 5096 |
!!!parse-error (type => 'unmatched end tag:'.$token->{tag_name}); |
!!!parse-error (type => 'unmatched end tag:'.$token->{tag_name}); |
| 5097 |
|
|
| 5310 |
} elsif ($token->{tag_name} eq 'noframes') { |
} elsif ($token->{tag_name} eq 'noframes') { |
| 5311 |
!!!cp ('t320'); |
!!!cp ('t320'); |
| 5312 |
## NOTE: As if in body. |
## NOTE: As if in body. |
| 5313 |
$parse_rcdata->(CDATA_CONTENT_MODEL, $insert_to_current); |
$parse_rcdata->(CDATA_CONTENT_MODEL); |
| 5314 |
redo B; |
redo B; |
| 5315 |
} else { |
} else { |
| 5316 |
if ($self->{insertion_mode} == IN_FRAMESET_IM) { |
if ($self->{insertion_mode} == IN_FRAMESET_IM) { |
| 5389 |
if ($token->{tag_name} eq 'script') { |
if ($token->{tag_name} eq 'script') { |
| 5390 |
!!!cp ('t332'); |
!!!cp ('t332'); |
| 5391 |
## NOTE: This is an "as if in head" code clone |
## NOTE: This is an "as if in head" code clone |
| 5392 |
$script_start_tag->($insert); |
$script_start_tag->(); |
| 5393 |
redo B; |
redo B; |
| 5394 |
} elsif ($token->{tag_name} eq 'style') { |
} elsif ($token->{tag_name} eq 'style') { |
| 5395 |
!!!cp ('t333'); |
!!!cp ('t333'); |
| 5396 |
## NOTE: This is an "as if in head" code clone |
## NOTE: This is an "as if in head" code clone |
| 5397 |
$parse_rcdata->(CDATA_CONTENT_MODEL, $insert); |
$parse_rcdata->(CDATA_CONTENT_MODEL); |
| 5398 |
redo B; |
redo B; |
| 5399 |
} elsif ({ |
} elsif ({ |
| 5400 |
base => 1, link => 1, |
base => 1, link => 1, |
| 5457 |
redo B; |
redo B; |
| 5458 |
} elsif ($token->{tag_name} eq 'title') { |
} elsif ($token->{tag_name} eq 'title') { |
| 5459 |
!!!cp ('t341'); |
!!!cp ('t341'); |
|
!!!parse-error (type => 'in body:title'); |
|
| 5460 |
## NOTE: This is an "as if in head" code clone |
## NOTE: This is an "as if in head" code clone |
| 5461 |
$parse_rcdata->(RCDATA_CONTENT_MODEL, sub { |
$parse_rcdata->(RCDATA_CONTENT_MODEL); |
|
if (defined $self->{head_element}) { |
|
|
!!!cp ('t339'); |
|
|
$self->{head_element}->append_child ($_[0]); |
|
|
} else { |
|
|
!!!cp ('t340'); |
|
|
$insert->($_[0]); |
|
|
} |
|
|
}); |
|
| 5462 |
redo B; |
redo B; |
| 5463 |
} elsif ($token->{tag_name} eq 'body') { |
} elsif ($token->{tag_name} eq 'body') { |
| 5464 |
!!!parse-error (type => 'in body:body'); |
!!!parse-error (type => 'in body:body'); |
| 5482 |
redo B; |
redo B; |
| 5483 |
} elsif ({ |
} elsif ({ |
| 5484 |
address => 1, blockquote => 1, center => 1, dir => 1, |
address => 1, blockquote => 1, center => 1, dir => 1, |
| 5485 |
div => 1, dl => 1, fieldset => 1, listing => 1, |
div => 1, dl => 1, fieldset => 1, |
| 5486 |
|
h1 => 1, h2 => 1, h3 => 1, h4 => 1, h5 => 1, h6 => 1, |
| 5487 |
menu => 1, ol => 1, p => 1, ul => 1, |
menu => 1, ol => 1, p => 1, ul => 1, |
| 5488 |
pre => 1, |
pre => 1, listing => 1, |
| 5489 |
}->{$token->{tag_name}}) { |
}->{$token->{tag_name}}) { |
| 5490 |
## has a p element in scope |
## has a p element in scope |
| 5491 |
INSCOPE: for (reverse @{$self->{open_elements}}) { |
INSCOPE: for (reverse @{$self->{open_elements}}) { |
| 5504 |
} # INSCOPE |
} # INSCOPE |
| 5505 |
|
|
| 5506 |
!!!insert-element-t ($token->{tag_name}, $token->{attributes}); |
!!!insert-element-t ($token->{tag_name}, $token->{attributes}); |
| 5507 |
if ($token->{tag_name} eq 'pre') { |
if ($token->{tag_name} eq 'pre' or $token->{tag_name} eq 'listing') { |
| 5508 |
!!!next-token; |
!!!next-token; |
| 5509 |
if ($token->{type} == CHARACTER_TOKEN) { |
if ($token->{type} == CHARACTER_TOKEN) { |
| 5510 |
$token->{data} =~ s/^\x0A//; |
$token->{data} =~ s/^\x0A//; |
| 5686 |
|
|
| 5687 |
!!!next-token; |
!!!next-token; |
| 5688 |
redo B; |
redo B; |
|
} elsif ({ |
|
|
h1 => 1, h2 => 1, h3 => 1, h4 => 1, h5 => 1, h6 => 1, |
|
|
}->{$token->{tag_name}}) { |
|
|
## has a p element in scope |
|
|
INSCOPE: for (reverse 0..$#{$self->{open_elements}}) { |
|
|
my $node = $self->{open_elements}->[$_]; |
|
|
if ($node->[1] eq 'p') { |
|
|
!!!cp ('t369'); |
|
|
!!!back-token; |
|
|
$token = {type => END_TAG_TOKEN, tag_name => 'p'}; |
|
|
redo B; |
|
|
} elsif ({ |
|
|
table => 1, caption => 1, td => 1, th => 1, |
|
|
button => 1, marquee => 1, object => 1, html => 1, |
|
|
}->{$node->[1]}) { |
|
|
!!!cp ('t370'); |
|
|
last INSCOPE; |
|
|
} |
|
|
} # INSCOPE |
|
|
|
|
|
## NOTE: See <http://html5.org/tools/web-apps-tracker?from=925&to=926> |
|
|
## has an element in scope |
|
|
#my $i; |
|
|
#INSCOPE: for (reverse 0..$#{$self->{open_elements}}) { |
|
|
# my $node = $self->{open_elements}->[$_]; |
|
|
# if ({ |
|
|
# h1 => 1, h2 => 1, h3 => 1, h4 => 1, h5 => 1, h6 => 1, |
|
|
# }->{$node->[1]}) { |
|
|
# $i = $_; |
|
|
# last INSCOPE; |
|
|
# } elsif ({ |
|
|
# table => 1, caption => 1, td => 1, th => 1, |
|
|
# button => 1, marquee => 1, object => 1, html => 1, |
|
|
# }->{$node->[1]}) { |
|
|
# last INSCOPE; |
|
|
# } |
|
|
#} # INSCOPE |
|
|
# |
|
|
#if (defined $i) { |
|
|
# !!! parse-error (type => 'in hn:hn'); |
|
|
# splice @{$self->{open_elements}}, $i; |
|
|
#} |
|
|
|
|
|
!!!insert-element-t ($token->{tag_name}, $token->{attributes}); |
|
|
|
|
|
!!!next-token; |
|
|
redo B; |
|
| 5689 |
} elsif ($token->{tag_name} eq 'a') { |
} elsif ($token->{tag_name} eq 'a') { |
| 5690 |
AFE: for my $i (reverse 0..$#$active_formatting_elements) { |
AFE: for my $i (reverse 0..$#$active_formatting_elements) { |
| 5691 |
my $node = $active_formatting_elements->[$i]; |
my $node = $active_formatting_elements->[$i]; |
| 5786 |
$reconstruct_active_formatting_elements->($insert_to_current); |
$reconstruct_active_formatting_elements->($insert_to_current); |
| 5787 |
|
|
| 5788 |
!!!insert-element-t ($token->{tag_name}, $token->{attributes}); |
!!!insert-element-t ($token->{tag_name}, $token->{attributes}); |
| 5789 |
|
|
| 5790 |
|
## TODO: associate with $self->{form_element} if defined |
| 5791 |
|
|
| 5792 |
push @$active_formatting_elements, ['#marker', '']; |
push @$active_formatting_elements, ['#marker', '']; |
| 5793 |
|
|
| 5794 |
!!!next-token; |
!!!next-token; |
| 5806 |
} elsif ($token->{tag_name} eq 'xmp') { |
} elsif ($token->{tag_name} eq 'xmp') { |
| 5807 |
!!!cp ('t381'); |
!!!cp ('t381'); |
| 5808 |
$reconstruct_active_formatting_elements->($insert_to_current); |
$reconstruct_active_formatting_elements->($insert_to_current); |
| 5809 |
$parse_rcdata->(CDATA_CONTENT_MODEL, $insert); |
$parse_rcdata->(CDATA_CONTENT_MODEL); |
| 5810 |
redo B; |
redo B; |
| 5811 |
} elsif ($token->{tag_name} eq 'table') { |
} elsif ($token->{tag_name} eq 'table') { |
| 5812 |
## has a p element in scope |
## has a p element in scope |
| 5826 |
} # INSCOPE |
} # INSCOPE |
| 5827 |
|
|
| 5828 |
!!!insert-element-t ($token->{tag_name}, $token->{attributes}); |
!!!insert-element-t ($token->{tag_name}, $token->{attributes}); |
| 5829 |
|
push @{$open_tables}, [$self->{open_elements}->[-1]->[0]]; |
| 5830 |
|
|
| 5831 |
$self->{insertion_mode} = IN_TABLE_IM; |
$self->{insertion_mode} = IN_TABLE_IM; |
| 5832 |
|
|
| 5833 |
!!!next-token; |
!!!next-token; |
| 5982 |
}->{$token->{tag_name}}) { |
}->{$token->{tag_name}}) { |
| 5983 |
!!!cp ('t399'); |
!!!cp ('t399'); |
| 5984 |
## NOTE: There is an "as if in body" code clone. |
## NOTE: There is an "as if in body" code clone. |
| 5985 |
$parse_rcdata->(CDATA_CONTENT_MODEL, $insert); |
$parse_rcdata->(CDATA_CONTENT_MODEL); |
| 5986 |
redo B; |
redo B; |
| 5987 |
} elsif ($token->{tag_name} eq 'select') { |
} elsif ($token->{tag_name} eq 'select') { |
| 5988 |
!!!cp ('t400'); |
!!!cp ('t400'); |
| 5989 |
$reconstruct_active_formatting_elements->($insert_to_current); |
$reconstruct_active_formatting_elements->($insert_to_current); |
| 5990 |
|
|
| 5991 |
!!!insert-element-t ($token->{tag_name}, $token->{attributes}); |
!!!insert-element-t ($token->{tag_name}, $token->{attributes}); |
| 5992 |
|
|
| 5993 |
|
## TODO: associate with $self->{form_element} if defined |
| 5994 |
|
|
| 5995 |
$self->{insertion_mode} = IN_SELECT_IM; |
if ($self->{insertion_mode} & TABLE_IMS or |
| 5996 |
|
$self->{insertion_mode} & BODY_TABLE_IMS or |
| 5997 |
|
$self->{insertion_mode} == IN_COLUMN_GROUP_IM) { |
| 5998 |
|
!!!cp ('t400.1'); |
| 5999 |
|
$self->{insertion_mode} = IN_SELECT_IN_TABLE_IM; |
| 6000 |
|
} else { |
| 6001 |
|
!!!cp ('t400.2'); |
| 6002 |
|
$self->{insertion_mode} = IN_SELECT_IM; |
| 6003 |
|
} |
| 6004 |
!!!next-token; |
!!!next-token; |
| 6005 |
redo B; |
redo B; |
| 6006 |
} elsif ({ |
} elsif ({ |
| 6075 |
address => 1, blockquote => 1, center => 1, dir => 1, |
address => 1, blockquote => 1, center => 1, dir => 1, |
| 6076 |
div => 1, dl => 1, fieldset => 1, listing => 1, |
div => 1, dl => 1, fieldset => 1, listing => 1, |
| 6077 |
menu => 1, ol => 1, pre => 1, ul => 1, |
menu => 1, ol => 1, pre => 1, ul => 1, |
|
p => 1, |
|
| 6078 |
dd => 1, dt => 1, li => 1, |
dd => 1, dt => 1, li => 1, |
| 6079 |
button => 1, marquee => 1, object => 1, |
button => 1, marquee => 1, object => 1, |
| 6080 |
}->{$token->{tag_name}}) { |
}->{$token->{tag_name}}) { |
| 6083 |
INSCOPE: for (reverse 0..$#{$self->{open_elements}}) { |
INSCOPE: for (reverse 0..$#{$self->{open_elements}}) { |
| 6084 |
my $node = $self->{open_elements}->[$_]; |
my $node = $self->{open_elements}->[$_]; |
| 6085 |
if ($node->[1] eq $token->{tag_name}) { |
if ($node->[1] eq $token->{tag_name}) { |
|
## generate implied end tags |
|
|
if ({ |
|
|
dd => ($token->{tag_name} ne 'dd'), |
|
|
dt => ($token->{tag_name} ne 'dt'), |
|
|
li => ($token->{tag_name} ne 'li'), |
|
|
p => ($token->{tag_name} ne 'p'), |
|
|
td => 1, th => 1, tr => 1, |
|
|
tbody => 1, tfoot=> 1, thead => 1, |
|
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
|
!!!cp ('t409'); |
|
|
!!!back-token; |
|
|
$token = {type => END_TAG_TOKEN, |
|
|
tag_name => $self->{open_elements}->[-1]->[1]}; # MUST |
|
|
redo B; |
|
|
} |
|
|
|
|
| 6086 |
!!!cp ('t410'); |
!!!cp ('t410'); |
| 6087 |
$i = $_; |
$i = $_; |
| 6088 |
last INSCOPE unless $token->{tag_name} eq 'p'; |
last INSCOPE; |
| 6089 |
} elsif ({ |
} elsif ({ |
| 6090 |
table => 1, caption => 1, td => 1, th => 1, |
table => 1, caption => 1, td => 1, th => 1, |
| 6091 |
button => 1, marquee => 1, object => 1, html => 1, |
button => 1, marquee => 1, object => 1, html => 1, |
| 6094 |
last INSCOPE; |
last INSCOPE; |
| 6095 |
} |
} |
| 6096 |
} # INSCOPE |
} # INSCOPE |
| 6097 |
|
|
| 6098 |
if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) { |
unless (defined $i) { # has an element in scope |
| 6099 |
if (defined $i) { |
!!!cp ('t413'); |
| 6100 |
|
!!!parse-error (type => 'unmatched end tag:'.$token->{tag_name}); |
| 6101 |
|
} else { |
| 6102 |
|
## Step 1. generate implied end tags |
| 6103 |
|
while ({ |
| 6104 |
|
dd => ($token->{tag_name} ne 'dd'), |
| 6105 |
|
dt => ($token->{tag_name} ne 'dt'), |
| 6106 |
|
li => ($token->{tag_name} ne 'li'), |
| 6107 |
|
p => 1, |
| 6108 |
|
}->{$self->{open_elements}->[-1]->[1]}) { |
| 6109 |
|
!!!cp ('t409'); |
| 6110 |
|
pop @{$self->{open_elements}}; |
| 6111 |
|
} |
| 6112 |
|
|
| 6113 |
|
## Step 2. |
| 6114 |
|
if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) { |
| 6115 |
!!!cp ('t412'); |
!!!cp ('t412'); |
| 6116 |
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
| 6117 |
} else { |
} else { |
| 6118 |
!!!cp ('t413'); |
!!!cp ('t414'); |
|
!!!parse-error (type => 'unmatched end tag:'.$token->{tag_name}); |
|
| 6119 |
} |
} |
| 6120 |
} |
|
| 6121 |
|
## Step 3. |
|
if (defined $i) { |
|
|
!!!cp ('t414'); |
|
| 6122 |
splice @{$self->{open_elements}}, $i; |
splice @{$self->{open_elements}}, $i; |
| 6123 |
} elsif ($token->{tag_name} eq 'p') { |
|
| 6124 |
!!!cp ('t415'); |
## Step 4. |
| 6125 |
## As if <p>, then reprocess the current token |
$clear_up_to_marker->() |
| 6126 |
my $el; |
if { |
| 6127 |
!!!create-element ($el, 'p'); |
button => 1, marquee => 1, object => 1, |
| 6128 |
$insert->($el); |
}->{$token->{tag_name}}; |
|
} else { |
|
|
!!!cp ('t416'); |
|
| 6129 |
} |
} |
|
$clear_up_to_marker->() |
|
|
if { |
|
|
button => 1, marquee => 1, object => 1, |
|
|
}->{$token->{tag_name}}; |
|
| 6130 |
!!!next-token; |
!!!next-token; |
| 6131 |
redo B; |
redo B; |
| 6132 |
} elsif ($token->{tag_name} eq 'form') { |
} elsif ($token->{tag_name} eq 'form') { |
| 6133 |
|
undef $self->{form_element}; |
| 6134 |
|
|
| 6135 |
## has an element in scope |
## has an element in scope |
| 6136 |
|
my $i; |
| 6137 |
INSCOPE: for (reverse 0..$#{$self->{open_elements}}) { |
INSCOPE: for (reverse 0..$#{$self->{open_elements}}) { |
| 6138 |
my $node = $self->{open_elements}->[$_]; |
my $node = $self->{open_elements}->[$_]; |
| 6139 |
if ($node->[1] eq $token->{tag_name}) { |
if ($node->[1] eq $token->{tag_name}) { |
|
## generate implied end tags |
|
|
if ({ |
|
|
dd => 1, dt => 1, li => 1, p => 1, |
|
|
|
|
|
## NOTE: The following elements never appear here, maybe. |
|
|
td => 1, th => 1, tr => 1, |
|
|
tbody => 1, tfoot => 1, thead => 1, |
|
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
|
!!!cp ('t417'); |
|
|
!!!back-token; |
|
|
$token = {type => END_TAG_TOKEN, |
|
|
tag_name => $self->{open_elements}->[-1]->[1]}; # MUST |
|
|
redo B; |
|
|
} |
|
|
|
|
| 6140 |
!!!cp ('t418'); |
!!!cp ('t418'); |
| 6141 |
|
$i = $_; |
| 6142 |
last INSCOPE; |
last INSCOPE; |
| 6143 |
} elsif ({ |
} elsif ({ |
| 6144 |
table => 1, caption => 1, td => 1, th => 1, |
table => 1, caption => 1, td => 1, th => 1, |
| 6148 |
last INSCOPE; |
last INSCOPE; |
| 6149 |
} |
} |
| 6150 |
} # INSCOPE |
} # INSCOPE |
| 6151 |
|
|
| 6152 |
if ($self->{open_elements}->[-1]->[1] eq $token->{tag_name}) { |
unless (defined $i) { # has an element in scope |
|
!!!cp ('t420'); |
|
|
pop @{$self->{open_elements}}; |
|
|
} else { |
|
| 6153 |
!!!cp ('t421'); |
!!!cp ('t421'); |
| 6154 |
!!!parse-error (type => 'unmatched end tag:'.$token->{tag_name}); |
!!!parse-error (type => 'unmatched end tag:'.$token->{tag_name}); |
| 6155 |
|
} else { |
| 6156 |
|
## Step 1. generate implied end tags |
| 6157 |
|
while ({ |
| 6158 |
|
dd => 1, dt => 1, li => 1, p => 1, |
| 6159 |
|
}->{$self->{open_elements}->[-1]->[1]}) { |
| 6160 |
|
!!!cp ('t417'); |
| 6161 |
|
pop @{$self->{open_elements}}; |
| 6162 |
|
} |
| 6163 |
|
|
| 6164 |
|
## Step 2. |
| 6165 |
|
if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) { |
| 6166 |
|
!!!cp ('t417.1'); |
| 6167 |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
| 6168 |
|
} else { |
| 6169 |
|
!!!cp ('t420'); |
| 6170 |
|
} |
| 6171 |
|
|
| 6172 |
|
## Step 3. |
| 6173 |
|
splice @{$self->{open_elements}}, $i; |
| 6174 |
} |
} |
| 6175 |
|
|
|
undef $self->{form_element}; |
|
| 6176 |
!!!next-token; |
!!!next-token; |
| 6177 |
redo B; |
redo B; |
| 6178 |
} elsif ({ |
} elsif ({ |
| 6185 |
if ({ |
if ({ |
| 6186 |
h1 => 1, h2 => 1, h3 => 1, h4 => 1, h5 => 1, h6 => 1, |
h1 => 1, h2 => 1, h3 => 1, h4 => 1, h5 => 1, h6 => 1, |
| 6187 |
}->{$node->[1]}) { |
}->{$node->[1]}) { |
|
## generate implied end tags |
|
|
if ({ |
|
|
dd => 1, dt => 1, li => 1, p => 1, |
|
|
td => 1, th => 1, tr => 1, |
|
|
tbody => 1, tfoot=> 1, thead => 1, |
|
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
|
!!!cp ('t422'); |
|
|
!!!back-token; |
|
|
$token = {type => END_TAG_TOKEN, |
|
|
tag_name => $self->{open_elements}->[-1]->[1]}; # MUST |
|
|
redo B; |
|
|
} |
|
|
|
|
| 6188 |
!!!cp ('t423'); |
!!!cp ('t423'); |
| 6189 |
$i = $_; |
$i = $_; |
| 6190 |
last INSCOPE; |
last INSCOPE; |
| 6196 |
last INSCOPE; |
last INSCOPE; |
| 6197 |
} |
} |
| 6198 |
} # INSCOPE |
} # INSCOPE |
| 6199 |
|
|
| 6200 |
if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) { |
unless (defined $i) { # has an element in scope |
| 6201 |
!!!cp ('t425'); |
!!!cp ('t425.1'); |
| 6202 |
!!!parse-error (type => 'unmatched end tag:'.$token->{tag_name}); |
!!!parse-error (type => 'unmatched end tag:'.$token->{tag_name}); |
| 6203 |
} else { |
} else { |
| 6204 |
!!!cp ('t426'); |
## Step 1. generate implied end tags |
| 6205 |
|
while ({ |
| 6206 |
|
dd => 1, dt => 1, li => 1, p => 1, |
| 6207 |
|
}->{$self->{open_elements}->[-1]->[1]}) { |
| 6208 |
|
!!!cp ('t422'); |
| 6209 |
|
pop @{$self->{open_elements}}; |
| 6210 |
|
} |
| 6211 |
|
|
| 6212 |
|
## Step 2. |
| 6213 |
|
if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) { |
| 6214 |
|
!!!cp ('t425'); |
| 6215 |
|
!!!parse-error (type => 'unmatched end tag:'.$token->{tag_name}); |
| 6216 |
|
} else { |
| 6217 |
|
!!!cp ('t426'); |
| 6218 |
|
} |
| 6219 |
|
|
| 6220 |
|
## Step 3. |
| 6221 |
|
splice @{$self->{open_elements}}, $i; |
| 6222 |
} |
} |
| 6223 |
|
|
| 6224 |
splice @{$self->{open_elements}}, $i if defined $i; |
!!!next-token; |
| 6225 |
|
redo B; |
| 6226 |
|
} elsif ($token->{tag_name} eq 'p') { |
| 6227 |
|
## has an element in scope |
| 6228 |
|
my $i; |
| 6229 |
|
INSCOPE: for (reverse 0..$#{$self->{open_elements}}) { |
| 6230 |
|
my $node = $self->{open_elements}->[$_]; |
| 6231 |
|
if ($node->[1] eq $token->{tag_name}) { |
| 6232 |
|
!!!cp ('t410.1'); |
| 6233 |
|
$i = $_; |
| 6234 |
|
last INSCOPE; |
| 6235 |
|
} elsif ({ |
| 6236 |
|
table => 1, caption => 1, td => 1, th => 1, |
| 6237 |
|
button => 1, marquee => 1, object => 1, html => 1, |
| 6238 |
|
}->{$node->[1]}) { |
| 6239 |
|
!!!cp ('t411.1'); |
| 6240 |
|
last INSCOPE; |
| 6241 |
|
} |
| 6242 |
|
} # INSCOPE |
| 6243 |
|
|
| 6244 |
|
if (defined $i) { |
| 6245 |
|
if ($self->{open_elements}->[-1]->[1] ne $token->{tag_name}) { |
| 6246 |
|
!!!cp ('t412.1'); |
| 6247 |
|
!!!parse-error (type => 'not closed:'.$self->{open_elements}->[-1]->[1]); |
| 6248 |
|
} else { |
| 6249 |
|
!!!cp ('t414.1'); |
| 6250 |
|
} |
| 6251 |
|
|
| 6252 |
|
splice @{$self->{open_elements}}, $i; |
| 6253 |
|
} else { |
| 6254 |
|
!!!cp ('t413.1'); |
| 6255 |
|
!!!parse-error (type => 'unmatched end tag:'.$token->{tag_name}); |
| 6256 |
|
|
| 6257 |
|
!!!cp ('t415.1'); |
| 6258 |
|
## As if <p>, then reprocess the current token |
| 6259 |
|
my $el; |
| 6260 |
|
!!!create-element ($el, 'p'); |
| 6261 |
|
$insert->($el); |
| 6262 |
|
## NOTE: Not inserted into |$self->{open_elements}|. |
| 6263 |
|
} |
| 6264 |
|
|
| 6265 |
!!!next-token; |
!!!next-token; |
| 6266 |
redo B; |
redo B; |
| 6267 |
} elsif ({ |
} elsif ({ |
| 6317 |
if ($node->[1] eq $token->{tag_name}) { |
if ($node->[1] eq $token->{tag_name}) { |
| 6318 |
## Step 1 |
## Step 1 |
| 6319 |
## generate implied end tags |
## generate implied end tags |
| 6320 |
if ({ |
while ({ |
| 6321 |
dd => 1, dt => 1, li => 1, p => 1, |
dd => 1, dt => 1, li => 1, p => 1, |
| 6322 |
td => 1, th => 1, tr => 1, |
}->{$self->{open_elements}->[-1]->[1]}) { |
|
tbody => 1, tfoot => 1, thead => 1, |
|
|
}->{$self->{open_elements}->[-1]->[1]}) { |
|
| 6323 |
!!!cp ('t430'); |
!!!cp ('t430'); |
| 6324 |
## ISSUE: Can this case be reached? |
## ISSUE: Can this case be reached? |
| 6325 |
!!!back-token; |
pop @{$self->{open_elements}}; |
|
$token = {type => END_TAG_TOKEN, |
|
|
tag_name => $self->{open_elements}->[-1]->[1]}; # MUST |
|
|
redo B; |
|
| 6326 |
} |
} |
| 6327 |
|
|
| 6328 |
## Step 2 |
## Step 2 |