123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380 |
- <?php
- /*
- * This file is part of the Symfony package.
- *
- * (c) Fabien Potencier <fabien@symfony.com>
- *
- * For the full copyright and license information, please view the LICENSE
- * file that was distributed with this source code.
- */
- namespace Symfony\Component\ExpressionLanguage;
/**
 * Parses a token stream.
 *
 * This parser implements a "Precedence climbing" algorithm.
 *
 * @see http://www.engr.mun.ca/~theo/Misc/exp_parsing.htm
 * @see http://en.wikipedia.org/wiki/Operator-precedence_parser
 *
 * @author Fabien Potencier <fabien@symfony.com>
 */
class Parser
{
    const OPERATOR_LEFT = 1;
    const OPERATOR_RIGHT = 2;

    private $stream;
    private $unaryOperators;
    private $binaryOperators;
    private $functions;
    private $names;

    /**
     * Stores the known functions and builds the operator tables.
     *
     * @param array $functions Known functions, keyed by the name that can be called in an expression
     */
    public function __construct(array $functions)
    {
        $this->functions = $functions;

        $this->unaryOperators = [
            'not' => ['precedence' => 50],
            '!' => ['precedence' => 50],
            '-' => ['precedence' => 500],
            '+' => ['precedence' => 500],
        ];

        // A higher precedence binds tighter; "**" is the only right-associative operator.
        $this->binaryOperators = [
            'or' => ['precedence' => 10, 'associativity' => self::OPERATOR_LEFT],
            '||' => ['precedence' => 10, 'associativity' => self::OPERATOR_LEFT],
            'and' => ['precedence' => 15, 'associativity' => self::OPERATOR_LEFT],
            '&&' => ['precedence' => 15, 'associativity' => self::OPERATOR_LEFT],
            '|' => ['precedence' => 16, 'associativity' => self::OPERATOR_LEFT],
            '^' => ['precedence' => 17, 'associativity' => self::OPERATOR_LEFT],
            '&' => ['precedence' => 18, 'associativity' => self::OPERATOR_LEFT],
            '==' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
            '===' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
            '!=' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
            '!==' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
            '<' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
            '>' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
            '>=' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
            '<=' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
            'not in' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
            'in' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
            'matches' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
            '..' => ['precedence' => 25, 'associativity' => self::OPERATOR_LEFT],
            '+' => ['precedence' => 30, 'associativity' => self::OPERATOR_LEFT],
            '-' => ['precedence' => 30, 'associativity' => self::OPERATOR_LEFT],
            '~' => ['precedence' => 40, 'associativity' => self::OPERATOR_LEFT],
            '*' => ['precedence' => 60, 'associativity' => self::OPERATOR_LEFT],
            '/' => ['precedence' => 60, 'associativity' => self::OPERATOR_LEFT],
            '%' => ['precedence' => 60, 'associativity' => self::OPERATOR_LEFT],
            '**' => ['precedence' => 200, 'associativity' => self::OPERATOR_RIGHT],
        ];
    }

    /**
     * Converts a token stream to a node tree.
     *
     * The valid names is an array where the values
     * are the names that the user can use in an expression.
     *
     * If the variable name in the compiled PHP code must be
     * different, define it as the key.
     *
     * For instance, ['this' => 'container'] means that the
     * variable 'container' can be used in the expression
     * but the compiled code will use 'this'.
     *
     * @param TokenStream $stream A token stream instance
     * @param array       $names  An array of valid names
     *
     * @return Node\Node A node tree
     *
     * @throws SyntaxError When tokens remain once a complete expression has been parsed
     */
    public function parse(TokenStream $stream, $names = [])
    {
        $this->stream = $stream;
        $this->names = $names;

        $node = $this->parseExpression();

        if (!$stream->isEOF()) {
            throw new SyntaxError(sprintf('Unexpected token "%s" of value "%s".', $stream->current->type, $stream->current->value), $stream->current->cursor, $stream->getExpression());
        }

        return $node;
    }

    /**
     * Parses a primary followed by any binary operators whose precedence
     * is at least $precedence.
     *
     * When called with the default precedence (0), the result is also handed
     * to parseConditionalExpression() so a trailing "?" is consumed.
     *
     * @param int $precedence Minimum precedence a binary operator needs to be consumed here
     *
     * @return Node\Node The parsed expression
     */
    public function parseExpression($precedence = 0)
    {
        $expr = $this->getPrimary();
        $token = $this->stream->current;

        while ($token->test(Token::OPERATOR_TYPE) && isset($this->binaryOperators[$token->value]) && $this->binaryOperators[$token->value]['precedence'] >= $precedence) {
            $op = $this->binaryOperators[$token->value];
            $this->stream->next();

            // Left-associative operators require a strictly higher precedence on
            // their right-hand side; right-associative ones accept the same level.
            $expr1 = $this->parseExpression(self::OPERATOR_LEFT === $op['associativity'] ? $op['precedence'] + 1 : $op['precedence']);
            $expr = new Node\BinaryNode($token->value, $expr, $expr1);

            $token = $this->stream->current;
        }

        if (0 === $precedence) {
            return $this->parseConditionalExpression($expr);
        }

        return $expr;
    }

    /**
     * Parses the operand at the current position: a unary operation,
     * a parenthesized expression, or a primary expression.
     *
     * @return Node\Node The parsed operand
     */
    protected function getPrimary()
    {
        $token = $this->stream->current;

        if ($token->test(Token::OPERATOR_TYPE) && isset($this->unaryOperators[$token->value])) {
            $operator = $this->unaryOperators[$token->value];
            $this->stream->next();
            $expr = $this->parseExpression($operator['precedence']);

            return $this->parsePostfixExpression(new Node\UnaryNode($token->value, $expr));
        }

        if ($token->test(Token::PUNCTUATION_TYPE, '(')) {
            $this->stream->next();
            $expr = $this->parseExpression();
            $this->stream->expect(Token::PUNCTUATION_TYPE, ')', 'An opened parenthesis is not properly closed');

            return $this->parsePostfixExpression($expr);
        }

        return $this->parsePrimaryExpression();
    }

    /**
     * Wraps $expr in conditional nodes for as long as the current token is "?".
     *
     * Three forms are handled:
     *  * "a ? b : c"
     *  * "a ? b"  (the else branch becomes a null constant)
     *  * "a ?: c" (the condition itself is reused as the "then" branch)
     *
     * @param Node\Node $expr The already parsed condition
     *
     * @return Node\Node $expr itself when no "?" follows, a ConditionalNode otherwise
     */
    protected function parseConditionalExpression($expr)
    {
        while ($this->stream->current->test(Token::PUNCTUATION_TYPE, '?')) {
            $this->stream->next();

            if (!$this->stream->current->test(Token::PUNCTUATION_TYPE, ':')) {
                $expr2 = $this->parseExpression();

                if ($this->stream->current->test(Token::PUNCTUATION_TYPE, ':')) {
                    $this->stream->next();
                    $expr3 = $this->parseExpression();
                } else {
                    $expr3 = new Node\ConstantNode(null);
                }
            } else {
                $this->stream->next();
                $expr2 = $expr;
                $expr3 = $this->parseExpression();
            }

            $expr = new Node\ConditionalNode($expr, $expr2, $expr3);
        }

        return $expr;
    }

    /**
     * Parses a primary expression: a constant keyword, a function call,
     * a variable name, a number, a string, an array or a hash.
     *
     * Constants (true/false/null, numbers, strings) are returned as-is; the
     * other forms are passed through parsePostfixExpression().
     *
     * @return Node\Node The parsed node
     *
     * @throws SyntaxError When the function or variable is unknown, or the token cannot start an expression
     */
    public function parsePrimaryExpression()
    {
        $token = $this->stream->current;

        switch ($token->type) {
            case Token::NAME_TYPE:
                $this->stream->next();

                switch ($token->value) {
                    case 'true':
                    case 'TRUE':
                        return new Node\ConstantNode(true);

                    case 'false':
                    case 'FALSE':
                        return new Node\ConstantNode(false);

                    case 'null':
                    case 'NULL':
                        return new Node\ConstantNode(null);

                    default:
                        // Only an opening-parenthesis *punctuation* token starts a call;
                        // a string token whose value is "(" must not be mistaken for one.
                        if ($this->stream->current->test(Token::PUNCTUATION_TYPE, '(')) {
                            if (false === isset($this->functions[$token->value])) {
                                throw new SyntaxError(sprintf('The function "%s" does not exist.', $token->value), $token->cursor, $this->stream->getExpression(), $token->value, array_keys($this->functions));
                            }

                            $node = new Node\FunctionNode($token->value, $this->parseArguments());
                        } else {
                            if (!\in_array($token->value, $this->names, true)) {
                                throw new SyntaxError(sprintf('Variable "%s" is not valid.', $token->value), $token->cursor, $this->stream->getExpression(), $token->value, $this->names);
                            }

                            // is the name used in the compiled code different
                            // from the name used in the expression?
                            //
                            // The lookup is strict so that it resolves the very entry the
                            // strict in_array() check above accepted, never a loosely-equal one.
                            if (\is_int($name = array_search($token->value, $this->names, true))) {
                                $name = $token->value;
                            }

                            $node = new Node\NameNode($name);
                        }
                }
                break;

            case Token::NUMBER_TYPE:
            case Token::STRING_TYPE:
                $this->stream->next();

                return new Node\ConstantNode($token->value);

            default:
                if ($token->test(Token::PUNCTUATION_TYPE, '[')) {
                    $node = $this->parseArrayExpression();
                } elseif ($token->test(Token::PUNCTUATION_TYPE, '{')) {
                    $node = $this->parseHashExpression();
                } else {
                    throw new SyntaxError(sprintf('Unexpected token "%s" of value "%s".', $token->type, $token->value), $token->cursor, $this->stream->getExpression());
                }
        }

        return $this->parsePostfixExpression($node);
    }

    /**
     * Parses an array literal: "[" expr ("," expr)* ","? "]".
     *
     * @return Node\ArrayNode The array node holding every parsed element
     */
    public function parseArrayExpression()
    {
        $this->stream->expect(Token::PUNCTUATION_TYPE, '[', 'An array element was expected');

        $node = new Node\ArrayNode();
        $first = true;
        while (!$this->stream->current->test(Token::PUNCTUATION_TYPE, ']')) {
            if (!$first) {
                $this->stream->expect(Token::PUNCTUATION_TYPE, ',', 'An array element must be followed by a comma');

                // trailing ,?
                if ($this->stream->current->test(Token::PUNCTUATION_TYPE, ']')) {
                    break;
                }
            }
            $first = false;

            $node->addElement($this->parseExpression());
        }
        $this->stream->expect(Token::PUNCTUATION_TYPE, ']', 'An opened array is not properly closed');

        return $node;
    }

    /**
     * Parses a hash literal: "{" key ":" expr ("," key ":" expr)* ","? "}".
     *
     * @return Node\ArrayNode The array node holding every parsed key/value pair
     *
     * @throws SyntaxError When a key is neither a string, a name, a number nor a parenthesized expression
     */
    public function parseHashExpression()
    {
        $this->stream->expect(Token::PUNCTUATION_TYPE, '{', 'A hash element was expected');

        $node = new Node\ArrayNode();
        $first = true;
        while (!$this->stream->current->test(Token::PUNCTUATION_TYPE, '}')) {
            if (!$first) {
                $this->stream->expect(Token::PUNCTUATION_TYPE, ',', 'A hash value must be followed by a comma');

                // trailing ,?
                if ($this->stream->current->test(Token::PUNCTUATION_TYPE, '}')) {
                    break;
                }
            }
            $first = false;

            // a hash key can be:
            //
            //  * a number -- 12
            //  * a string -- 'a'
            //  * a name, which is equivalent to a string -- a
            //  * an expression, which must be enclosed in parentheses -- (1 + 2)
            if ($this->stream->current->test(Token::STRING_TYPE) || $this->stream->current->test(Token::NAME_TYPE) || $this->stream->current->test(Token::NUMBER_TYPE)) {
                $key = new Node\ConstantNode($this->stream->current->value);
                $this->stream->next();
            } elseif ($this->stream->current->test(Token::PUNCTUATION_TYPE, '(')) {
                $key = $this->parseExpression();
            } else {
                $current = $this->stream->current;

                throw new SyntaxError(sprintf('A hash key must be a quoted string, a number, a name, or an expression enclosed in parentheses (unexpected token "%s" of value "%s".', $current->type, $current->value), $current->cursor, $this->stream->getExpression());
            }

            $this->stream->expect(Token::PUNCTUATION_TYPE, ':', 'A hash key must be followed by a colon (:)');
            $value = $this->parseExpression();

            $node->addElement($value, $key);
        }
        $this->stream->expect(Token::PUNCTUATION_TYPE, '}', 'An opened hash is not properly closed');

        return $node;
    }

    /**
     * Consumes any chain of ".name", ".name(args)" and "[expr]" accessors
     * following $node and wraps $node in the matching GetAttrNode each time.
     *
     * @param Node\Node $node The node the accessors apply to
     *
     * @return Node\Node $node itself when no accessor follows, the outermost GetAttrNode otherwise
     *
     * @throws SyntaxError When "." is not followed by a valid property or method name
     */
    public function parsePostfixExpression($node)
    {
        $token = $this->stream->current;
        while (Token::PUNCTUATION_TYPE === $token->type) {
            if ('.' === $token->value) {
                $this->stream->next();
                $token = $this->stream->current;
                $this->stream->next();

                if (
                    Token::NAME_TYPE !== $token->type
                    &&
                    // Operators like "not" and "matches" are valid method or property names.
                    //
                    // The lexer recognizes operators before names, so "not" in "foo.not()" or
                    // "matches" in "foo.matches" arrives here as an OPERATOR_TYPE token even
                    // though it must be read as a property or method name.
                    //
                    // This only works if the operator consists *entirely* of characters that
                    // are valid in a property or method name, hence the pattern is anchored
                    // at both ends: a multi-word operator such as "not in" is rejected
                    // instead of being accepted because of its "not" prefix.
                    //
                    // Other types, such as STRING_TYPE and NUMBER_TYPE, can't be parsed as
                    // property nor method names.
                    (Token::OPERATOR_TYPE !== $token->type || !preg_match('/[a-zA-Z_\x7f-\xff][a-zA-Z0-9_\x7f-\xff]*\z/A', $token->value))
                ) {
                    throw new SyntaxError('Expected name.', $token->cursor, $this->stream->getExpression());
                }

                $arg = new Node\ConstantNode($token->value, true);

                $arguments = new Node\ArgumentsNode();
                if ($this->stream->current->test(Token::PUNCTUATION_TYPE, '(')) {
                    $type = Node\GetAttrNode::METHOD_CALL;
                    foreach ($this->parseArguments()->nodes as $n) {
                        $arguments->addElement($n);
                    }
                } else {
                    $type = Node\GetAttrNode::PROPERTY_CALL;
                }

                $node = new Node\GetAttrNode($node, $arg, $arguments, $type);
            } elseif ('[' === $token->value) {
                $this->stream->next();
                $arg = $this->parseExpression();
                $this->stream->expect(Token::PUNCTUATION_TYPE, ']');

                $node = new Node\GetAttrNode($node, $arg, new Node\ArgumentsNode(), Node\GetAttrNode::ARRAY_CALL);
            } else {
                break;
            }

            $token = $this->stream->current;
        }

        return $node;
    }

    /**
     * Parses arguments.
     *
     * Reads "(" expr ("," expr)* ")" from the stream.
     *
     * @return Node\Node A node whose children are the parsed argument expressions, in order
     */
    public function parseArguments()
    {
        $args = [];
        $this->stream->expect(Token::PUNCTUATION_TYPE, '(', 'A list of arguments must begin with an opening parenthesis');
        while (!$this->stream->current->test(Token::PUNCTUATION_TYPE, ')')) {
            // Every argument but the first must be preceded by a comma.
            if (!empty($args)) {
                $this->stream->expect(Token::PUNCTUATION_TYPE, ',', 'Arguments must be separated by a comma');
            }

            $args[] = $this->parseExpression();
        }
        $this->stream->expect(Token::PUNCTUATION_TYPE, ')', 'A list of arguments must be closed by a parenthesis');

        return new Node\Node($args);
    }
}
|