You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
101 lines
4.1 KiB
101 lines
4.1 KiB
<?php |
|
|
|
/* |
|
* This file is part of the Symfony package. |
|
* |
|
* (c) Fabien Potencier <fabien@symfony.com> |
|
* |
|
* For the full copyright and license information, please view the LICENSE |
|
* file that was distributed with this source code. |
|
*/ |
|
|
|
namespace Symfony\Component\ExpressionLanguage; |
|
|
|
/** |
|
* Lexes an expression. |
|
* |
|
* @author Fabien Potencier <fabien@symfony.com> |
|
*/ |
|
class Lexer |
|
{ |
|
/** |
|
* Tokenizes an expression. |
|
* |
|
* @return TokenStream |
|
* |
|
* @throws SyntaxError |
|
*/ |
|
public function tokenize(string $expression) |
|
{ |
|
$expression = str_replace(["\r", "\n", "\t", "\v", "\f"], ' ', $expression); |
|
$cursor = 0; |
|
$tokens = []; |
|
$brackets = []; |
|
$end = \strlen($expression); |
|
|
|
while ($cursor < $end) { |
|
if (' ' == $expression[$cursor]) { |
|
++$cursor; |
|
|
|
continue; |
|
} |
|
|
|
if (preg_match('/[0-9]+(?:\.[0-9]+)?([Ee][\+\-][0-9]+)?/A', $expression, $match, 0, $cursor)) { |
|
// numbers |
|
$number = (float) $match[0]; // floats |
|
if (preg_match('/^[0-9]+$/', $match[0]) && $number <= \PHP_INT_MAX) { |
|
$number = (int) $match[0]; // integers lower than the maximum |
|
} |
|
$tokens[] = new Token(Token::NUMBER_TYPE, $number, $cursor + 1); |
|
$cursor += \strlen($match[0]); |
|
} elseif (false !== strpos('([{', $expression[$cursor])) { |
|
// opening bracket |
|
$brackets[] = [$expression[$cursor], $cursor]; |
|
|
|
$tokens[] = new Token(Token::PUNCTUATION_TYPE, $expression[$cursor], $cursor + 1); |
|
++$cursor; |
|
} elseif (false !== strpos(')]}', $expression[$cursor])) { |
|
// closing bracket |
|
if (empty($brackets)) { |
|
throw new SyntaxError(sprintf('Unexpected "%s".', $expression[$cursor]), $cursor, $expression); |
|
} |
|
|
|
[$expect, $cur] = array_pop($brackets); |
|
if ($expression[$cursor] != strtr($expect, '([{', ')]}')) { |
|
throw new SyntaxError(sprintf('Unclosed "%s".', $expect), $cur, $expression); |
|
} |
|
|
|
$tokens[] = new Token(Token::PUNCTUATION_TYPE, $expression[$cursor], $cursor + 1); |
|
++$cursor; |
|
} elseif (preg_match('/"([^"\\\\]*(?:\\\\.[^"\\\\]*)*)"|\'([^\'\\\\]*(?:\\\\.[^\'\\\\]*)*)\'/As', $expression, $match, 0, $cursor)) { |
|
// strings |
|
$tokens[] = new Token(Token::STRING_TYPE, stripcslashes(substr($match[0], 1, -1)), $cursor + 1); |
|
$cursor += \strlen($match[0]); |
|
} elseif (preg_match('/(?<=^|[\s(])not in(?=[\s(])|\!\=\=|(?<=^|[\s(])not(?=[\s(])|(?<=^|[\s(])and(?=[\s(])|\=\=\=|\>\=|(?<=^|[\s(])or(?=[\s(])|\<\=|\*\*|\.\.|(?<=^|[\s(])in(?=[\s(])|&&|\|\||(?<=^|[\s(])matches|\=\=|\!\=|\*|~|%|\/|\>|\||\!|\^|&|\+|\<|\-/A', $expression, $match, 0, $cursor)) { |
|
// operators |
|
$tokens[] = new Token(Token::OPERATOR_TYPE, $match[0], $cursor + 1); |
|
$cursor += \strlen($match[0]); |
|
} elseif (false !== strpos('.,?:', $expression[$cursor])) { |
|
// punctuation |
|
$tokens[] = new Token(Token::PUNCTUATION_TYPE, $expression[$cursor], $cursor + 1); |
|
++$cursor; |
|
} elseif (preg_match('/[a-zA-Z_\x7f-\xff][a-zA-Z0-9_\x7f-\xff]*/A', $expression, $match, 0, $cursor)) { |
|
// names |
|
$tokens[] = new Token(Token::NAME_TYPE, $match[0], $cursor + 1); |
|
$cursor += \strlen($match[0]); |
|
} else { |
|
// unlexable |
|
throw new SyntaxError(sprintf('Unexpected character "%s".', $expression[$cursor]), $cursor, $expression); |
|
} |
|
} |
|
|
|
$tokens[] = new Token(Token::EOF_TYPE, null, $cursor + 1); |
|
|
|
if (!empty($brackets)) { |
|
[$expect, $cur] = array_pop($brackets); |
|
throw new SyntaxError(sprintf('Unclosed "%s".', $expect), $cur, $expression); |
|
} |
|
|
|
return new TokenStream($tokens, $expression); |
|
} |
|
}
|
|
|