410 lines
		
	
	
		
			16 KiB
		
	
	
	
		
			PHP
		
	
	
			
		
		
	
	
			410 lines
		
	
	
		
			16 KiB
		
	
	
	
		
			PHP
		
	
	
<?php
 | 
						|
 | 
						|
/*
 | 
						|
 * This file is part of the Symfony package.
 | 
						|
 *
 | 
						|
 * (c) Fabien Potencier <fabien@symfony.com>
 | 
						|
 *
 | 
						|
 * For the full copyright and license information, please view the LICENSE
 | 
						|
 * file that was distributed with this source code.
 | 
						|
 */
 | 
						|
 | 
						|
namespace Symfony\Component\ExpressionLanguage;
 | 
						|
 | 
						|
/**
 | 
						|
 * Parsers a token stream.
 | 
						|
 *
 | 
						|
 * This parser implements a "Precedence climbing" algorithm.
 | 
						|
 *
 | 
						|
 * @see http://www.engr.mun.ca/~theo/Misc/exp_parsing.htm
 | 
						|
 * @see http://en.wikipedia.org/wiki/Operator-precedence_parser
 | 
						|
 *
 | 
						|
 * @author Fabien Potencier <fabien@symfony.com>
 | 
						|
 */
 | 
						|
class Parser
 | 
						|
{
 | 
						|
    public const OPERATOR_LEFT = 1;
 | 
						|
    public const OPERATOR_RIGHT = 2;
 | 
						|
 | 
						|
    private $stream;
 | 
						|
    private $unaryOperators;
 | 
						|
    private $binaryOperators;
 | 
						|
    private $functions;
 | 
						|
    private $names;
 | 
						|
    private $lint;
 | 
						|
 | 
						|
    public function __construct(array $functions)
 | 
						|
    {
 | 
						|
        $this->functions = $functions;
 | 
						|
 | 
						|
        $this->unaryOperators = [
 | 
						|
            'not' => ['precedence' => 50],
 | 
						|
            '!' => ['precedence' => 50],
 | 
						|
            '-' => ['precedence' => 500],
 | 
						|
            '+' => ['precedence' => 500],
 | 
						|
        ];
 | 
						|
        $this->binaryOperators = [
 | 
						|
            'or' => ['precedence' => 10, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '||' => ['precedence' => 10, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            'and' => ['precedence' => 15, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '&&' => ['precedence' => 15, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '|' => ['precedence' => 16, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '^' => ['precedence' => 17, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '&' => ['precedence' => 18, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '==' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '===' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '!=' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '!==' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '<' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '>' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '>=' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '<=' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            'not in' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            'in' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            'matches' => ['precedence' => 20, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '..' => ['precedence' => 25, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '+' => ['precedence' => 30, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '-' => ['precedence' => 30, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '~' => ['precedence' => 40, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '*' => ['precedence' => 60, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '/' => ['precedence' => 60, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '%' => ['precedence' => 60, 'associativity' => self::OPERATOR_LEFT],
 | 
						|
            '**' => ['precedence' => 200, 'associativity' => self::OPERATOR_RIGHT],
 | 
						|
        ];
 | 
						|
    }
 | 
						|
 | 
						|
    /**
 | 
						|
     * Converts a token stream to a node tree.
 | 
						|
     *
 | 
						|
     * The valid names is an array where the values
 | 
						|
     * are the names that the user can use in an expression.
 | 
						|
     *
 | 
						|
     * If the variable name in the compiled PHP code must be
 | 
						|
     * different, define it as the key.
 | 
						|
     *
 | 
						|
     * For instance, ['this' => 'container'] means that the
 | 
						|
     * variable 'container' can be used in the expression
 | 
						|
     * but the compiled code will use 'this'.
 | 
						|
     *
 | 
						|
     * @return Node\Node A node tree
 | 
						|
     *
 | 
						|
     * @throws SyntaxError
 | 
						|
     */
 | 
						|
    public function parse(TokenStream $stream, array $names = [])
 | 
						|
    {
 | 
						|
        $this->lint = false;
 | 
						|
 | 
						|
        return $this->doParse($stream, $names);
 | 
						|
    }
 | 
						|
 | 
						|
    /**
 | 
						|
     * Validates the syntax of an expression.
 | 
						|
     *
 | 
						|
     * The syntax of the passed expression will be checked, but not parsed.
 | 
						|
     * If you want to skip checking dynamic variable names, pass `null` instead of the array.
 | 
						|
     *
 | 
						|
     * @throws SyntaxError When the passed expression is invalid
 | 
						|
     */
 | 
						|
    public function lint(TokenStream $stream, ?array $names = []): void
 | 
						|
    {
 | 
						|
        $this->lint = true;
 | 
						|
        $this->doParse($stream, $names);
 | 
						|
    }
 | 
						|
 | 
						|
    /**
 | 
						|
     * @throws SyntaxError
 | 
						|
     */
 | 
						|
    private function doParse(TokenStream $stream, ?array $names = []): Node\Node
 | 
						|
    {
 | 
						|
        $this->stream = $stream;
 | 
						|
        $this->names = $names;
 | 
						|
 | 
						|
        $node = $this->parseExpression();
 | 
						|
        if (!$stream->isEOF()) {
 | 
						|
            throw new SyntaxError(sprintf('Unexpected token "%s" of value "%s".', $stream->current->type, $stream->current->value), $stream->current->cursor, $stream->getExpression());
 | 
						|
        }
 | 
						|
 | 
						|
        $this->stream = null;
 | 
						|
        $this->names = null;
 | 
						|
 | 
						|
        return $node;
 | 
						|
    }
 | 
						|
 | 
						|
    public function parseExpression(int $precedence = 0)
 | 
						|
    {
 | 
						|
        $expr = $this->getPrimary();
 | 
						|
        $token = $this->stream->current;
 | 
						|
        while ($token->test(Token::OPERATOR_TYPE) && isset($this->binaryOperators[$token->value]) && $this->binaryOperators[$token->value]['precedence'] >= $precedence) {
 | 
						|
            $op = $this->binaryOperators[$token->value];
 | 
						|
            $this->stream->next();
 | 
						|
 | 
						|
            $expr1 = $this->parseExpression(self::OPERATOR_LEFT === $op['associativity'] ? $op['precedence'] + 1 : $op['precedence']);
 | 
						|
            $expr = new Node\BinaryNode($token->value, $expr, $expr1);
 | 
						|
 | 
						|
            $token = $this->stream->current;
 | 
						|
        }
 | 
						|
 | 
						|
        if (0 === $precedence) {
 | 
						|
            return $this->parseConditionalExpression($expr);
 | 
						|
        }
 | 
						|
 | 
						|
        return $expr;
 | 
						|
    }
 | 
						|
 | 
						|
    protected function getPrimary()
 | 
						|
    {
 | 
						|
        $token = $this->stream->current;
 | 
						|
 | 
						|
        if ($token->test(Token::OPERATOR_TYPE) && isset($this->unaryOperators[$token->value])) {
 | 
						|
            $operator = $this->unaryOperators[$token->value];
 | 
						|
            $this->stream->next();
 | 
						|
            $expr = $this->parseExpression($operator['precedence']);
 | 
						|
 | 
						|
            return $this->parsePostfixExpression(new Node\UnaryNode($token->value, $expr));
 | 
						|
        }
 | 
						|
 | 
						|
        if ($token->test(Token::PUNCTUATION_TYPE, '(')) {
 | 
						|
            $this->stream->next();
 | 
						|
            $expr = $this->parseExpression();
 | 
						|
            $this->stream->expect(Token::PUNCTUATION_TYPE, ')', 'An opened parenthesis is not properly closed');
 | 
						|
 | 
						|
            return $this->parsePostfixExpression($expr);
 | 
						|
        }
 | 
						|
 | 
						|
        return $this->parsePrimaryExpression();
 | 
						|
    }
 | 
						|
 | 
						|
    protected function parseConditionalExpression(Node\Node $expr)
 | 
						|
    {
 | 
						|
        while ($this->stream->current->test(Token::PUNCTUATION_TYPE, '?')) {
 | 
						|
            $this->stream->next();
 | 
						|
            if (!$this->stream->current->test(Token::PUNCTUATION_TYPE, ':')) {
 | 
						|
                $expr2 = $this->parseExpression();
 | 
						|
                if ($this->stream->current->test(Token::PUNCTUATION_TYPE, ':')) {
 | 
						|
                    $this->stream->next();
 | 
						|
                    $expr3 = $this->parseExpression();
 | 
						|
                } else {
 | 
						|
                    $expr3 = new Node\ConstantNode(null);
 | 
						|
                }
 | 
						|
            } else {
 | 
						|
                $this->stream->next();
 | 
						|
                $expr2 = $expr;
 | 
						|
                $expr3 = $this->parseExpression();
 | 
						|
            }
 | 
						|
 | 
						|
            $expr = new Node\ConditionalNode($expr, $expr2, $expr3);
 | 
						|
        }
 | 
						|
 | 
						|
        return $expr;
 | 
						|
    }
 | 
						|
 | 
						|
    public function parsePrimaryExpression()
 | 
						|
    {
 | 
						|
        $token = $this->stream->current;
 | 
						|
        switch ($token->type) {
 | 
						|
            case Token::NAME_TYPE:
 | 
						|
                $this->stream->next();
 | 
						|
                switch ($token->value) {
 | 
						|
                    case 'true':
 | 
						|
                    case 'TRUE':
 | 
						|
                        return new Node\ConstantNode(true);
 | 
						|
 | 
						|
                    case 'false':
 | 
						|
                    case 'FALSE':
 | 
						|
                        return new Node\ConstantNode(false);
 | 
						|
 | 
						|
                    case 'null':
 | 
						|
                    case 'NULL':
 | 
						|
                        return new Node\ConstantNode(null);
 | 
						|
 | 
						|
                    default:
 | 
						|
                        if ('(' === $this->stream->current->value) {
 | 
						|
                            if (false === isset($this->functions[$token->value])) {
 | 
						|
                                throw new SyntaxError(sprintf('The function "%s" does not exist.', $token->value), $token->cursor, $this->stream->getExpression(), $token->value, array_keys($this->functions));
 | 
						|
                            }
 | 
						|
 | 
						|
                            $node = new Node\FunctionNode($token->value, $this->parseArguments());
 | 
						|
                        } else {
 | 
						|
                            if (!$this->lint || \is_array($this->names)) {
 | 
						|
                                if (!\in_array($token->value, $this->names, true)) {
 | 
						|
                                    throw new SyntaxError(sprintf('Variable "%s" is not valid.', $token->value), $token->cursor, $this->stream->getExpression(), $token->value, $this->names);
 | 
						|
                                }
 | 
						|
 | 
						|
                                // is the name used in the compiled code different
 | 
						|
                                // from the name used in the expression?
 | 
						|
                                if (\is_int($name = array_search($token->value, $this->names))) {
 | 
						|
                                    $name = $token->value;
 | 
						|
                                }
 | 
						|
                            } else {
 | 
						|
                                $name = $token->value;
 | 
						|
                            }
 | 
						|
 | 
						|
                            $node = new Node\NameNode($name);
 | 
						|
                        }
 | 
						|
                }
 | 
						|
                break;
 | 
						|
 | 
						|
            case Token::NUMBER_TYPE:
 | 
						|
            case Token::STRING_TYPE:
 | 
						|
                $this->stream->next();
 | 
						|
 | 
						|
                return new Node\ConstantNode($token->value);
 | 
						|
 | 
						|
            default:
 | 
						|
                if ($token->test(Token::PUNCTUATION_TYPE, '[')) {
 | 
						|
                    $node = $this->parseArrayExpression();
 | 
						|
                } elseif ($token->test(Token::PUNCTUATION_TYPE, '{')) {
 | 
						|
                    $node = $this->parseHashExpression();
 | 
						|
                } else {
 | 
						|
                    throw new SyntaxError(sprintf('Unexpected token "%s" of value "%s".', $token->type, $token->value), $token->cursor, $this->stream->getExpression());
 | 
						|
                }
 | 
						|
        }
 | 
						|
 | 
						|
        return $this->parsePostfixExpression($node);
 | 
						|
    }
 | 
						|
 | 
						|
    public function parseArrayExpression()
 | 
						|
    {
 | 
						|
        $this->stream->expect(Token::PUNCTUATION_TYPE, '[', 'An array element was expected');
 | 
						|
 | 
						|
        $node = new Node\ArrayNode();
 | 
						|
        $first = true;
 | 
						|
        while (!$this->stream->current->test(Token::PUNCTUATION_TYPE, ']')) {
 | 
						|
            if (!$first) {
 | 
						|
                $this->stream->expect(Token::PUNCTUATION_TYPE, ',', 'An array element must be followed by a comma');
 | 
						|
 | 
						|
                // trailing ,?
 | 
						|
                if ($this->stream->current->test(Token::PUNCTUATION_TYPE, ']')) {
 | 
						|
                    break;
 | 
						|
                }
 | 
						|
            }
 | 
						|
            $first = false;
 | 
						|
 | 
						|
            $node->addElement($this->parseExpression());
 | 
						|
        }
 | 
						|
        $this->stream->expect(Token::PUNCTUATION_TYPE, ']', 'An opened array is not properly closed');
 | 
						|
 | 
						|
        return $node;
 | 
						|
    }
 | 
						|
 | 
						|
    public function parseHashExpression()
 | 
						|
    {
 | 
						|
        $this->stream->expect(Token::PUNCTUATION_TYPE, '{', 'A hash element was expected');
 | 
						|
 | 
						|
        $node = new Node\ArrayNode();
 | 
						|
        $first = true;
 | 
						|
        while (!$this->stream->current->test(Token::PUNCTUATION_TYPE, '}')) {
 | 
						|
            if (!$first) {
 | 
						|
                $this->stream->expect(Token::PUNCTUATION_TYPE, ',', 'A hash value must be followed by a comma');
 | 
						|
 | 
						|
                // trailing ,?
 | 
						|
                if ($this->stream->current->test(Token::PUNCTUATION_TYPE, '}')) {
 | 
						|
                    break;
 | 
						|
                }
 | 
						|
            }
 | 
						|
            $first = false;
 | 
						|
 | 
						|
            // a hash key can be:
 | 
						|
            //
 | 
						|
            //  * a number -- 12
 | 
						|
            //  * a string -- 'a'
 | 
						|
            //  * a name, which is equivalent to a string -- a
 | 
						|
            //  * an expression, which must be enclosed in parentheses -- (1 + 2)
 | 
						|
            if ($this->stream->current->test(Token::STRING_TYPE) || $this->stream->current->test(Token::NAME_TYPE) || $this->stream->current->test(Token::NUMBER_TYPE)) {
 | 
						|
                $key = new Node\ConstantNode($this->stream->current->value);
 | 
						|
                $this->stream->next();
 | 
						|
            } elseif ($this->stream->current->test(Token::PUNCTUATION_TYPE, '(')) {
 | 
						|
                $key = $this->parseExpression();
 | 
						|
            } else {
 | 
						|
                $current = $this->stream->current;
 | 
						|
 | 
						|
                throw new SyntaxError(sprintf('A hash key must be a quoted string, a number, a name, or an expression enclosed in parentheses (unexpected token "%s" of value "%s".', $current->type, $current->value), $current->cursor, $this->stream->getExpression());
 | 
						|
            }
 | 
						|
 | 
						|
            $this->stream->expect(Token::PUNCTUATION_TYPE, ':', 'A hash key must be followed by a colon (:)');
 | 
						|
            $value = $this->parseExpression();
 | 
						|
 | 
						|
            $node->addElement($value, $key);
 | 
						|
        }
 | 
						|
        $this->stream->expect(Token::PUNCTUATION_TYPE, '}', 'An opened hash is not properly closed');
 | 
						|
 | 
						|
        return $node;
 | 
						|
    }
 | 
						|
 | 
						|
    public function parsePostfixExpression(Node\Node $node)
 | 
						|
    {
 | 
						|
        $token = $this->stream->current;
 | 
						|
        while (Token::PUNCTUATION_TYPE == $token->type) {
 | 
						|
            if ('.' === $token->value) {
 | 
						|
                $this->stream->next();
 | 
						|
                $token = $this->stream->current;
 | 
						|
                $this->stream->next();
 | 
						|
 | 
						|
                if (
 | 
						|
                    Token::NAME_TYPE !== $token->type
 | 
						|
                    &&
 | 
						|
                    // Operators like "not" and "matches" are valid method or property names,
 | 
						|
                    //
 | 
						|
                    // In other words, besides NAME_TYPE, OPERATOR_TYPE could also be parsed as a property or method.
 | 
						|
                    // This is because operators are processed by the lexer prior to names. So "not" in "foo.not()" or "matches" in "foo.matches" will be recognized as an operator first.
 | 
						|
                    // But in fact, "not" and "matches" in such expressions shall be parsed as method or property names.
 | 
						|
                    //
 | 
						|
                    // And this ONLY works if the operator consists of valid characters for a property or method name.
 | 
						|
                    //
 | 
						|
                    // Other types, such as STRING_TYPE and NUMBER_TYPE, can't be parsed as property nor method names.
 | 
						|
                    //
 | 
						|
                    // As a result, if $token is NOT an operator OR $token->value is NOT a valid property or method name, an exception shall be thrown.
 | 
						|
                    (Token::OPERATOR_TYPE !== $token->type || !preg_match('/[a-zA-Z_\x7f-\xff][a-zA-Z0-9_\x7f-\xff]*/A', $token->value))
 | 
						|
                ) {
 | 
						|
                    throw new SyntaxError('Expected name.', $token->cursor, $this->stream->getExpression());
 | 
						|
                }
 | 
						|
 | 
						|
                $arg = new Node\ConstantNode($token->value, true);
 | 
						|
 | 
						|
                $arguments = new Node\ArgumentsNode();
 | 
						|
                if ($this->stream->current->test(Token::PUNCTUATION_TYPE, '(')) {
 | 
						|
                    $type = Node\GetAttrNode::METHOD_CALL;
 | 
						|
                    foreach ($this->parseArguments()->nodes as $n) {
 | 
						|
                        $arguments->addElement($n);
 | 
						|
                    }
 | 
						|
                } else {
 | 
						|
                    $type = Node\GetAttrNode::PROPERTY_CALL;
 | 
						|
                }
 | 
						|
 | 
						|
                $node = new Node\GetAttrNode($node, $arg, $arguments, $type);
 | 
						|
            } elseif ('[' === $token->value) {
 | 
						|
                $this->stream->next();
 | 
						|
                $arg = $this->parseExpression();
 | 
						|
                $this->stream->expect(Token::PUNCTUATION_TYPE, ']');
 | 
						|
 | 
						|
                $node = new Node\GetAttrNode($node, $arg, new Node\ArgumentsNode(), Node\GetAttrNode::ARRAY_CALL);
 | 
						|
            } else {
 | 
						|
                break;
 | 
						|
            }
 | 
						|
 | 
						|
            $token = $this->stream->current;
 | 
						|
        }
 | 
						|
 | 
						|
        return $node;
 | 
						|
    }
 | 
						|
 | 
						|
    /**
 | 
						|
     * Parses arguments.
 | 
						|
     */
 | 
						|
    public function parseArguments()
 | 
						|
    {
 | 
						|
        $args = [];
 | 
						|
        $this->stream->expect(Token::PUNCTUATION_TYPE, '(', 'A list of arguments must begin with an opening parenthesis');
 | 
						|
        while (!$this->stream->current->test(Token::PUNCTUATION_TYPE, ')')) {
 | 
						|
            if (!empty($args)) {
 | 
						|
                $this->stream->expect(Token::PUNCTUATION_TYPE, ',', 'Arguments must be separated by a comma');
 | 
						|
            }
 | 
						|
 | 
						|
            $args[] = $this->parseExpression();
 | 
						|
        }
 | 
						|
        $this->stream->expect(Token::PUNCTUATION_TYPE, ')', 'A list of arguments must be closed by a parenthesis');
 | 
						|
 | 
						|
        return new Node\Node($args);
 | 
						|
    }
 | 
						|
}
 |