/[suikacvs]/markup/html/whatpm/Whatpm/CSS/Tokenizer.pm

Diff of /markup/html/whatpm/Whatpm/CSS/Tokenizer.pm

Parent Directory | Revision Log | View Patch Patch

-revision 1.13 by wakaba,
Sat Sep  8 17:43:41 2007 UTC
+revision 1.17 by wakaba,
Sun Jan 20 04:02:25 2008 UTC
 Line 1
  package Whatpm::CSS::Tokenizer;
  use strict;
+ our $VERSION=do{my @r=(q$Revision$=~/\d+/g);sprintf "%d."."%02d" x $#r,@r};
+ require Exporter;
+ push our @ISA, 'Exporter';
  sub BEFORE_TOKEN_STATE () { 0 }
  sub BEFORE_NMSTART_STATE () { 1 }
-Line 76 
 our @TokenName = qw(
+Line 80 
 our @TokenName = qw(
    COMMENT_INVALID EOF MINUS STAR VBAR DOT COLON MATCH EXCLAMATION
  );
+ our @EXPORT_OK = qw(
+   IDENT_TOKEN ATKEYWORD_TOKEN HASH_TOKEN FUNCTION_TOKEN URI_TOKEN
+   URI_INVALID_TOKEN URI_PREFIX_TOKEN URI_PREFIX_INVALID_TOKEN
+   STRING_TOKEN INVALID_TOKEN NUMBER_TOKEN DIMENSION_TOKEN PERCENTAGE_TOKEN
+   UNICODE_RANGE_TOKEN DELIM_TOKEN PLUS_TOKEN GREATER_TOKEN COMMA_TOKEN
+   TILDE_TOKEN DASHMATCH_TOKEN PREFIXMATCH_TOKEN SUFFIXMATCH_TOKEN
+   SUBSTRINGMATCH_TOKEN INCLUDES_TOKEN SEMICOLON_TOKEN LBRACE_TOKEN
+   RBRACE_TOKEN LPAREN_TOKEN RPAREN_TOKEN LBRACKET_TOKEN RBRACKET_TOKEN
+   S_TOKEN CDO_TOKEN CDC_TOKEN COMMENT_TOKEN COMMENT_INVALID_TOKEN EOF_TOKEN
+   MINUS_TOKEN STAR_TOKEN VBAR_TOKEN DOT_TOKEN COLON_TOKEN MATCH_TOKEN
+   EXCLAMATION_TOKEN
+ );
  ## NOTE: |@EXPORT_OK| above lists the token type constant names that a
  ## caller may import on request (nothing is exported by default here).
  ## The |:token| tag below is a copy of that list, so importing |:token|
  ## brings in every one of those names at once.
+ our %EXPORT_TAGS = ('token' => [@EXPORT_OK]);
  ## Constructor.  Blesses a new hash into the invocant's class (taken
  ## from the first argument via |shift|) and returns it.  The hash starts
  ## with an empty |token| array reference and a default |get_char|
  ## callback that always returns -1.
  ## NOTE: As of the added line below, no default |onerror| callback is
  ## installed any more; the removed lines show the former default.
  sub new ($) {
-   my $self = bless {token => [], get_char => sub { -1 },
+   my $self = bless {token => [], get_char => sub { -1 }}, shift;
-                     onerror => sub { }}, shift;
    return $self;
  } # new
-Line 309 
 sub get_next_token ($) {
+Line 327 
 sub get_next_token ($) {
 x005B => LBRACKET_TOKEN, # [
 x005D => RBRACKET_TOKEN, # ]
                 }->{$self->{c}}) {
+         my ($l, $c) = ($self->{line}, $self->{column});
          # stay in the state
-         $self->{c} = $self->{get_char}->();
+         $self->{c} = $self->{get_char}->($self);
-         return {type => $t};
+         return {type => $t, line => $l, column => $c};
          # redo A;
        } elsif ({
 x0020 => 1, # SP
-Line 836 
 sub get_next_token ($) {
+Line 855 
 sub get_next_token ($) {
            redo A;
          } else {
            ## Note: In |nl| in ... in |string| or |ident|.
-           $self->{t}->{value} .= chr $self->{c};
            $self->{state} = STRING_STATE;
            $self->{c} = $self->{get_char}->();
            redo A;
-Line 852 
 sub get_next_token ($) {
+Line 870 
 sub get_next_token ($) {
                URI_PREFIX_TOKEN, URI_PREFIX_INVALID_TOKEN,
                URI_PREFIX_INVALID_TOKEN, URI_PREFIX_INVALID_TOKEN,
            }->{$self->{t}->{type}};
-           $self->{t}->{value} .= "\x0D";
            $self->{state} = ESCAPE_BEFORE_LF_STATE;
            $self->{c} = $self->{get_char}->();
            redo A;
          } else {
            ## Note: In |nl| in ... in |string| or |ident|.
-           $self->{t}->{value} .= "\x0D";
            $self->{state} = ESCAPE_BEFORE_LF_STATE;
            $self->{c} = $self->{get_char}->();
            redo A;
-Line 996 
 sub get_next_token ($) {
+Line 1012 
 sub get_next_token ($) {
          redo A;
        }
      } elsif ($self->{state} == ESCAPE_BEFORE_LF_STATE) {
-       ## NOTE: |\n| in |\r\n| in |unicode| in |escape|.
+       ## NOTE: |\n| in |\r\n| in |nl| in |escape|.
        if ($self->{c} == 0x000A) { # \n
-         $self->{t}->{value} .= chr $self->{c};
          $self->{state} = $q == 0 ? NAME_STATE :
              $q == 1 ? URI_UNQUOTED_STATE : STRING_STATE;
          $self->{c} = $self->{get_char}->();
-Line 1118 
 sub get_next_token ($) {
+Line 1133 
 sub get_next_token ($) {
    } # A
  } # get_next_token
+ ## Returns a short textual representation of a token.
+ ##
+ ## Arguments: the invocant (ignored) and a token hash reference.  The
+ ## token's |type| is compared numerically against the |*_TOKEN|
+ ## constants; depending on the type, its |value| and/or |number| member
+ ## is embedded in the result.
+ ##
+ ## Returns: a string.  Token types with fixed spelling yield that
+ ## spelling; a comment token always yields |/**/| (its content is not
+ ## included); an EOF token yields |{EOF}|; any type not listed below
+ ## yields the raw type value wrapped in braces.
+ sub serialize_token ($$) {
+   shift;
+   my $t = shift;
+   ## NOTE: This function is not intended for roundtrip-able serialization.
+   if ($t->{type} == IDENT_TOKEN) {
+     return $t->{value};
+   } elsif ($t->{type} == ATKEYWORD_TOKEN) {
+     return '@' . $t->{value};
+   } elsif ($t->{type} == HASH_TOKEN) {
+     return '#' . $t->{value};
+   } elsif ($t->{type} == FUNCTION_TOKEN) {
+     return $t->{value} . '(';
+   } elsif ($t->{type} == URI_TOKEN) {
+     return 'url(' . $t->{value} . ')';
+   } elsif ($t->{type} == URI_INVALID_TOKEN) {
+     return 'url(' . $t->{value};
+   } elsif ($t->{type} == URI_PREFIX_TOKEN) {
+     return 'url-prefix(' . $t->{value} . ')';
+   } elsif ($t->{type} == URI_PREFIX_INVALID_TOKEN) {
+     return 'url-prefix(' . $t->{value};
+   } elsif ($t->{type} == STRING_TOKEN) {
+     return '"' . $t->{value} . '"';
+   } elsif ($t->{type} == INVALID_TOKEN) {
+     return '"' . $t->{value};
+   } elsif ($t->{type} == NUMBER_TOKEN) {
+     return $t->{number};
+   } elsif ($t->{type} == DIMENSION_TOKEN) {
+     return $t->{number} . $t->{value};
+   } elsif ($t->{type} == PERCENTAGE_TOKEN) {
+     return $t->{number} . '%';
+   } elsif ($t->{type} == UNICODE_RANGE_TOKEN) {
+     return 'U+' . $t->{value};
+   } elsif ($t->{type} == DELIM_TOKEN) {
+     return $t->{value};
+   } elsif ($t->{type} == PLUS_TOKEN) {
+     return '+';
+   } elsif ($t->{type} == GREATER_TOKEN) {
+     return '>';
+   } elsif ($t->{type} == COMMA_TOKEN) {
+     return ',';
+   } elsif ($t->{type} == TILDE_TOKEN) {
+     return '~';
+   } elsif ($t->{type} == DASHMATCH_TOKEN) {
+     return '|=';
+   } elsif ($t->{type} == PREFIXMATCH_TOKEN) {
+     return '^=';
+   } elsif ($t->{type} == SUFFIXMATCH_TOKEN) {
+     return '$=';
+   } elsif ($t->{type} == SUBSTRINGMATCH_TOKEN) {
+     return '*=';
+   } elsif ($t->{type} == INCLUDES_TOKEN) {
+     return '~=';
+   } elsif ($t->{type} == SEMICOLON_TOKEN) {
+     return ';';
+   } elsif ($t->{type} == LBRACE_TOKEN) {
+     return '{';
+   } elsif ($t->{type} == RBRACE_TOKEN) {
+     return '}';
+   } elsif ($t->{type} == LPAREN_TOKEN) {
+     return '(';
+   } elsif ($t->{type} == RPAREN_TOKEN) {
+     return ')';
+   } elsif ($t->{type} == LBRACKET_TOKEN) {
+     return '[';
+   } elsif ($t->{type} == RBRACKET_TOKEN) {
+     return ']';
+   } elsif ($t->{type} == S_TOKEN) {
+     return ' ';
+   } elsif ($t->{type} == CDO_TOKEN) {
+     return '<!--';
+   } elsif ($t->{type} == CDC_TOKEN) {
+     return '-->';
+   } elsif ($t->{type} == COMMENT_TOKEN) {
+     return '/**/';
+   } elsif ($t->{type} == COMMENT_INVALID_TOKEN) {
+     return '/*';
+   } elsif ($t->{type} == EOF_TOKEN) {
+     return '{EOF}';
+   } elsif ($t->{type} == MINUS_TOKEN) {
+     return '-';
+   } elsif ($t->{type} == STAR_TOKEN) {
+     return '*';
+   } elsif ($t->{type} == VBAR_TOKEN) {
+     return '|';
+   } elsif ($t->{type} == DOT_TOKEN) {
+     ## DOT_TOKEN is exported alongside the other delimiter tokens, so it
+     ## must serialize to its literal spelling rather than fall through
+     ## to the unknown-type fallback.
+     return '.';
+   } elsif ($t->{type} == COLON_TOKEN) {
+     return ':';
+   } elsif ($t->{type} == MATCH_TOKEN) {
+     return '=';
+   } elsif ($t->{type} == EXCLAMATION_TOKEN) {
+     return '!';
+   } else {
+     ## Unknown token type: expose the raw type value for debugging.
+     return '{'.$t->{type}.'}';
+   }
+ } # serialize_token
+ =head1 LICENSE
+ Copyright 2007 Wakaba <w@suika.fam.cx>
+ This library is free software; you can redistribute it
+ and/or modify it under the same terms as Perl itself.
+ =cut
 ;
  # $Date$

 Legend:
-Removed from v.1.13
 changed lines
+Added in v.1.17

admin@suikawiki.org	ViewVC Help
Powered by ViewVC 1.1.24