123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401 |
- <?php
- /*
- * This file is part of the Symfony package.
- *
- * (c) Fabien Potencier <fabien@symfony.com>
- *
- * For the full copyright and license information, please view the LICENSE
- * file that was distributed with this source code.
- */
- namespace Symfony\Component\CssSelector\Parser;
- use Symfony\Component\CssSelector\Exception\SyntaxErrorException;
- use Symfony\Component\CssSelector\Node;
- use Symfony\Component\CssSelector\Parser\Tokenizer\Tokenizer;
- /**
- * CSS selector parser.
- *
- * This component is a port of the Python cssselect library,
- * which is copyright Ian Bicking, @see https://github.com/SimonSapin/cssselect.
- *
- * @author Jean-François Simon <jeanfrancois.simon@sensiolabs.com>
- *
- * @internal
- */
- class Parser implements ParserInterface
- {
/**
 * Tokenizer used by parse() to turn a selector source into a token stream.
 *
 * @var Tokenizer
 */
private $tokenizer;

/**
 * Creates the parser.
 *
 * @param null|Tokenizer $tokenizer Tokenizer to use; a fresh Tokenizer is created when none is given
 */
public function __construct(Tokenizer $tokenizer = null)
{
    if (!$tokenizer) {
        $tokenizer = new Tokenizer();
    }

    $this->tokenizer = $tokenizer;
}
/**
 * {@inheritdoc}
 */
public function parse($source)
{
    // Wrap the source in a reader, tokenize it, then parse the resulting
    // stream as a selector list.
    return $this->parseSelectorList(
        $this->tokenizer->tokenize(new Reader($source))
    );
}
/**
 * Parses the arguments for ":nth-child()" and friends.
 *
 * The token values are concatenated, trimmed and read as an "an+b"
 * expression. "odd" gives (2, 1), "even" gives (2, 0), "n" gives (1, 0)
 * and an expression without "n" gives (0, b).
 *
 * @param Token[] $tokens
 *
 * @throws SyntaxErrorException When a token is a string, or when a part of
 *                              the expression is not numeric
 *
 * @return array Two integers: the step "a" followed by the offset "b"
 */
public static function parseSeries(array $tokens)
{
    // Single pass: reject string tokens and build the joined expression.
    $joined = '';
    foreach ($tokens as $token) {
        if ($token->isString()) {
            throw SyntaxErrorException::stringAsFunctionArgument();
        }
        $joined .= $token->getValue();
    }
    $joined = trim($joined);

    $int = function ($string) {
        if (!is_numeric($string)) {
            throw SyntaxErrorException::stringAsFunctionArgument();
        }

        return (int) $string;
    };

    switch (true) {
        case 'odd' === $joined:
            return array(2, 1);
        case 'even' === $joined:
            return array(2, 0);
        case 'n' === $joined:
            return array(1, 0);
        case false === strpos($joined, 'n'):
            return array(0, $int($joined));
    }

    // Split on the first "n" only: anything after a second "n" stays in the
    // offset part and is rejected by $int() instead of being silently dropped.
    list($step, $offset) = explode('n', $joined, 2);

    // Compare against '' explicitly: the string '0' is falsy in PHP, and
    // "0n+3" must yield a step of 0, not the default step of 1.
    if ('' === $step) {
        $a = 1;
    } elseif ('-' === $step || '+' === $step) {
        // A bare sign means a step of -1 or +1.
        $a = $int($step.'1');
    } else {
        $a = $int($step);
    }

    return array($a, '' === $offset ? 0 : $int($offset));
}
/**
 * Parses a comma-separated list of selectors.
 *
 * @param TokenStream $stream
 *
 * @return array One entry per selector, each produced by parserSelectorNode()
 */
private function parseSelectorList(TokenStream $stream)
{
    $stream->skipWhitespace();
    $nodes = array();

    do {
        $nodes[] = $this->parserSelectorNode($stream);

        $hasMore = $stream->getPeek()->isDelimiter(array(','));
        if ($hasMore) {
            // Consume the comma and the whitespace before the next selector.
            $stream->getNext();
            $stream->skipWhitespace();
        }
    } while ($hasMore);

    return $nodes;
}
/**
 * Parses one selector: a simple selector optionally followed by further
 * simple selectors joined by combinators ("+", ">", "~" or whitespace).
 *
 * @param TokenStream $stream
 *
 * @throws SyntaxErrorException When a pseudo-element is followed by more selector parts
 *
 * @return Node\SelectorNode
 */
private function parserSelectorNode(TokenStream $stream)
{
    $parsed = $this->parseSimpleSelector($stream);
    $tree = $parsed[0];
    $pseudoElement = $parsed[1];

    for (;;) {
        $stream->skipWhitespace();
        $upcoming = $stream->getPeek();

        // End of input or a comma terminates the current selector.
        if ($upcoming->isFileEnd()) {
            break;
        }
        if ($upcoming->isDelimiter(array(','))) {
            break;
        }

        // Anything else after a pseudo-element is an error.
        if (null !== $pseudoElement) {
            throw SyntaxErrorException::pseudoElementFound($pseudoElement, 'not at the end of a selector');
        }

        // Without an explicit combinator the parts are joined by ' '.
        $combinator = ' ';
        if ($upcoming->isDelimiter(array('+', '>', '~'))) {
            $combinator = $stream->getNext()->getValue();
            $stream->skipWhitespace();
        }

        list($rightHand, $pseudoElement) = $this->parseSimpleSelector($stream);
        $tree = new Node\CombinedSelectorNode($tree, $combinator, $rightHand);
    }

    return new Node\SelectorNode($tree, $pseudoElement);
}
/**
 * Parses the next simple selector: an optional element followed by any
 * number of hash, class, attribute, pseudo-class, function or negation parts.
 *
 * @param TokenStream $stream
 * @param bool        $insideNegation Whether parsing happens inside ":not(...)"; a ")" then ends the selector
 *
 * @throws SyntaxErrorException On an unexpected token, a nested ":not()", a pseudo-element
 *                              that is not last, or when no token was consumed at all
 *
 * @return array The parsed node followed by the pseudo-element name (or null)
 */
private function parseSimpleSelector(TokenStream $stream, $insideNegation = false)
{
    $stream->skipWhitespace();

    // Remember how many tokens were consumed so an empty selector can be detected.
    $usedBefore = count($stream->getUsed());
    $node = $this->parseElementNode($stream);
    $pseudoElement = null;

    for (;;) {
        $upcoming = $stream->getPeek();

        $atBoundary = $upcoming->isWhitespace()
            || $upcoming->isFileEnd()
            || $upcoming->isDelimiter(array(',', '+', '>', '~'))
            || ($insideNegation && $upcoming->isDelimiter(array(')')));
        if ($atBoundary) {
            break;
        }

        // Nothing may follow a pseudo-element within the same simple selector.
        if (null !== $pseudoElement) {
            throw SyntaxErrorException::pseudoElementFound($pseudoElement, 'not at the end of a selector');
        }

        if ($upcoming->isHash()) {
            $node = new Node\HashNode($node, $stream->getNext()->getValue());
            continue;
        }

        if ($upcoming->isDelimiter(array('.'))) {
            $stream->getNext();
            $node = new Node\ClassNode($node, $stream->getNextIdentifier());
            continue;
        }

        if ($upcoming->isDelimiter(array('['))) {
            $stream->getNext();
            $node = $this->parseAttributeNode($node, $stream);
            continue;
        }

        if (!$upcoming->isDelimiter(array(':'))) {
            throw SyntaxErrorException::unexpectedToken('selector', $upcoming);
        }

        // From here on the part starts with ':'.
        $stream->getNext();

        if ($stream->getPeek()->isDelimiter(array(':'))) {
            // "::name" is a pseudo-element.
            $stream->getNext();
            $pseudoElement = $stream->getNextIdentifier();
            continue;
        }

        $name = $stream->getNextIdentifier();
        $lowerName = strtolower($name);

        if (in_array($lowerName, array('first-line', 'first-letter', 'before', 'after'))) {
            // Special case: CSS 2.1 pseudo-elements can have a single ':'.
            // Any new pseudo-element must have two.
            $pseudoElement = $name;
            continue;
        }

        if (!$stream->getPeek()->isDelimiter(array('('))) {
            // No argument list: plain pseudo-class.
            $node = new Node\PseudoNode($node, $name);
            continue;
        }

        // Consume "(" and any whitespace before the arguments.
        $stream->getNext();
        $stream->skipWhitespace();

        if ('not' === $lowerName) {
            if ($insideNegation) {
                throw SyntaxErrorException::nestedNot();
            }

            list($negated, $negatedPseudoElement) = $this->parseSimpleSelector($stream, true);
            $closing = $stream->getNext();

            if (null !== $negatedPseudoElement) {
                throw SyntaxErrorException::pseudoElementFound($negatedPseudoElement, 'inside ::not()');
            }
            if (!$closing->isDelimiter(array(')'))) {
                throw SyntaxErrorException::unexpectedToken('")"', $closing);
            }

            $node = new Node\NegationNode($node, $negated);
            continue;
        }

        // Generic function: collect argument tokens up to the closing ")".
        $arguments = array();
        $argument = null;
        for (;;) {
            $stream->skipWhitespace();
            $argument = $stream->getNext();

            $isArgument = $argument->isIdentifier()
                || $argument->isString()
                || $argument->isNumber()
                || $argument->isDelimiter(array('+', '-'));
            if ($isArgument) {
                $arguments[] = $argument;
                continue;
            }

            if ($argument->isDelimiter(array(')'))) {
                break;
            }

            throw SyntaxErrorException::unexpectedToken('an argument', $argument);
        }

        if (0 === count($arguments)) {
            throw SyntaxErrorException::unexpectedToken('at least one argument', $argument);
        }

        $node = new Node\FunctionNode($node, $name, $arguments);
    }

    // No token was consumed at all: there is no selector here.
    if (count($stream->getUsed()) === $usedBefore) {
        throw SyntaxErrorException::unexpectedToken('selector', $stream->getPeek());
    }

    return array($node, $pseudoElement);
}
/**
 * Parses the optional element part of a simple selector, including an
 * optional "namespace|" prefix.
 *
 * When the stream does not start with an identifier or "*", nothing is
 * consumed and an element node with null namespace and element is returned.
 *
 * @param TokenStream $stream
 *
 * @return Node\ElementNode
 */
private function parseElementNode(TokenStream $stream)
{
    $first = $stream->getPeek();
    $isName = $first->isIdentifier();

    if (!$isName && !$first->isDelimiter(array('*'))) {
        return new Node\ElementNode(null, null);
    }

    // Consume the identifier or "*"; "*" is represented as null.
    $consumed = $stream->getNext();
    $name = $isName ? $consumed->getValue() : null;

    if (!$stream->getPeek()->isDelimiter(array('|'))) {
        // No namespace separator: what was read is the element itself.
        return new Node\ElementNode(null, $name);
    }

    // What was read is the namespace; the element follows the "|".
    $stream->getNext();

    return new Node\ElementNode($name, $stream->getNextIdentifierOrStar());
}
/**
 * Parses an attribute selector; the opening "[" has already been consumed
 * by the caller.
 *
 * @param Node\NodeInterface $selector Node the attribute condition applies to
 * @param TokenStream        $stream
 *
 * @throws SyntaxErrorException On a missing "|", an unknown operator, an invalid value or a missing "]"
 *
 * @return Node\AttributeNode
 */
private function parseAttributeNode(Node\NodeInterface $selector, TokenStream $stream)
{
    $stream->skipWhitespace();
    $attribute = $stream->getNextIdentifierOrStar();
    $namespace = null;
    $operator = null;

    if (null === $attribute && !$stream->getPeek()->isDelimiter(array('|'))) {
        throw SyntaxErrorException::unexpectedToken('"|"', $stream->getPeek());
    }

    if ($stream->getPeek()->isDelimiter(array('|'))) {
        $stream->getNext();

        if ($stream->getPeek()->isDelimiter(array('='))) {
            // "|=" right after the name is the operator, not a namespace separator.
            $stream->getNext();
            $operator = '|=';
        } else {
            // What was read so far is the namespace; the attribute name follows.
            $namespace = $attribute;
            $attribute = $stream->getNextIdentifier();
        }
    }

    if (null === $operator) {
        $stream->skipWhitespace();
        $token = $stream->getNext();

        if ($token->isDelimiter(array(']'))) {
            // No operator and no value: plain existence test.
            return new Node\AttributeNode($selector, $namespace, $attribute, 'exists', null);
        }

        if ($token->isDelimiter(array('='))) {
            $operator = '=';
        } elseif ($token->isDelimiter(array('^', '$', '*', '~', '|', '!'))
            && $stream->getPeek()->isDelimiter(array('='))
        ) {
            // Two-character operator such as "^=" or "~=".
            $operator = $token->getValue().'=';
            $stream->getNext();
        } else {
            throw SyntaxErrorException::unexpectedToken('operator', $token);
        }
    }

    $stream->skipWhitespace();
    $value = $stream->getNext();

    if ($value->isNumber()) {
        // A numeric value is converted into a string token.
        $value = new Token(Token::TYPE_STRING, (string) $value->getValue(), $value->getPosition());
    }

    if (!$value->isIdentifier() && !$value->isString()) {
        throw SyntaxErrorException::unexpectedToken('string or identifier', $value);
    }

    $stream->skipWhitespace();
    $closing = $stream->getNext();

    if (!$closing->isDelimiter(array(']'))) {
        throw SyntaxErrorException::unexpectedToken('"]"', $closing);
    }

    return new Node\AttributeNode($selector, $namespace, $attribute, $operator, $value->getValue());
}
- }
|