60 lines
2.9 KiB
Erlang
60 lines
2.9 KiB
Erlang
Definitions.
|
|
|
|
ESCAPED = \\[:.]
|
|
IDENTIFIER = [-A-Za-z0-9_]+(({ESCAPED})?[-A-Za-z0-9_]+)*
|
|
QUOTED = (\"[^"]*\"|\'[^']*\')
|
|
PARENTESIS = \([^)]*\)
|
|
INT = [0-9]+
|
|
NOT = (n|N)(o|O)(t|T)
|
|
ODD = (o|O)(d|D)(d|D)
|
|
EVEN = (e|E)(v|V)(e|E)(n|N)
|
|
PSEUDO_PATT = (\+|-)?({INT})?(n|N)((\+|-){INT})?
|
|
SYMBOL = [\[\]*]
|
|
ATTRIBUTE_IDENTIFIER = \s[is]\]
|
|
W = [\s\t\r\n\f]
|
|
|
|
Rules.
|
|
|
|
{IDENTIFIER} : {token, {identifier, TokenLine, TokenChars}}.
|
|
{QUOTED} : {token, {quoted, TokenLine, remove_wrapper(TokenChars)}}.
|
|
{ATTRIBUTE_IDENTIFIER} : {token, {attribute_identifier, TokenLine, TokenChars}}.
|
|
{SYMBOL} : {token, {TokenChars, TokenLine}}.
|
|
#{IDENTIFIER} : {token, {hash, TokenLine, unescape_inside_id_name(tail(TokenChars))}}.
|
|
\.{IDENTIFIER} : {token, {class, TokenLine, unescape_inside_class_name(tail(TokenChars))}}.
|
|
\:{NOT}\( : {token, {pseudo_not, TokenLine}}.
|
|
\:{IDENTIFIER} : {token, {pseudo, TokenLine, tail(TokenChars)}}.
|
|
\({INT}\) : {token, {pseudo_class_int, TokenLine, list_to_integer(remove_wrapper(TokenChars))}}.
|
|
\({ODD}\) : {token, {pseudo_class_odd, TokenLine}}.
|
|
\({EVEN}\) : {token, {pseudo_class_even, TokenLine}}.
|
|
\({PSEUDO_PATT}\) : {token, {pseudo_class_pattern, TokenLine, remove_wrapper(TokenChars)}}.
|
|
\({QUOTED}\) : {token, {pseudo_class_quoted, TokenLine, remove_wrapper(remove_wrapper(TokenChars))}}.
|
|
{W}*\) : {token, {close_parentesis, TokenLine}}.
|
|
~= : {token, {includes, TokenLine}}.
|
|
\|= : {token, {dash_match, TokenLine}}.
|
|
\^= : {token, {prefix_match, TokenLine}}.
|
|
\$= : {token, {suffix_match, TokenLine}}.
|
|
\*= : {token, {substring_match, TokenLine}}.
|
|
= : {token, {equal, TokenLine}}.
|
|
{W}*,{W}* : {token, {comma, TokenLine}}.
|
|
{W}*>{W}* : {token, {greater, TokenLine}}.
|
|
{W}*\+{W}* : {token, {plus, TokenLine}}.
|
|
{W}*~{W}* : {token, {tilde, TokenLine}}.
|
|
{W}*\|{W}* : {token, {namespace_pipe, TokenLine}}.
|
|
{W}+ : {token, {space, TokenLine}}.
|
|
. : {token, {unknown, TokenLine, TokenChars}}.
|
|
|
|
Erlang code.
|
|
|
|
remove_wrapper(Chars) ->
|
|
Len = string:len(Chars),
|
|
string:substr(Chars, 2, Len - 2).
|
|
|
|
tail([_|T]) ->
|
|
T.
|
|
|
|
unescape_inside_class_name(Chars) ->
|
|
lists:flatten(string:replace(Chars, "\\:", ":", all)).
|
|
|
|
unescape_inside_id_name(Chars) ->
|
|
lists:flatten(string:replace(Chars, "\\.", ".", all)).
|