popsu-d7/sites/all/modules/feeds_xpathparser/FeedsXPathParserQueryParser.inc
Bachir Soussi Chiadmi 1bc61b12ad first import
2015-04-08 11:40:19 +02:00

121 lines
2.8 KiB
PHP

<?php
/**
* @file
* Pseudo-parser of XPath queries. When an XML document has a default
* namespace this gets called so that adding the __default__ namepace where
* appropriate. Aren't we nice?
*
* @todo
* Cleanup.
* @param $query
* An XPath query string.
* @return string
* An XPath query string with the __default__ namespace added.
*/
class FeedsXPathParserQueryParser {
function __construct($query) {
$this->query = preg_replace('/\s+\(\s*/', '(', $query);
$this->word_boundaries = array(
'[', ']', '=', '(', ')', '.', '<', '>', '*', '!', '|', '/', ',', ' ', ':',
);
$this->in_quotes = FALSE;
$this->quote_char = '';
$this->word = '';
$this->output = '';
$this->prev_boundary = '';
$this->axis = '';
$this->skip_next_word = FALSE;
$this->start();
}
function start() {
for ($i=0; $i < drupal_strlen($this->query); $i++) {
$this->i = $i;
$c = $this->query[$i];
if ($c == '"' || $c == "'") {
$this->handle_quote($c);
continue;
}
if ($this->in_quotes) {
$this->word .= $c;
continue;
}
if (in_array($c, $this->word_boundaries)) {
$this->handle_word_boundary($c);
}
else {
$this->word .= $c;
}
}
$this->handle_word();
}
function handle_quote($c) {
if ($this->in_quotes && $c == $this->quote_char) {
$this->in_quotes = FALSE;
$this->word .= $c;
$this->output .= $this->word;
$this->word = '';
}
elseif (!$this->in_quotes) {
$this->in_quotes = TRUE;
$this->handle_word();
$this->word = $c;
$this->quote_char = $c;
}
else {
$this->word .= $c;
}
}
function handle_word_boundary($c) {
if (in_array($this->word, array('div', 'or', 'and', 'mod')) &&
$this->prev_boundary == ' ' && $c == ' ') {
$this->output .= $this->word;
}
else {
$this->handle_word($c);
}
$this->output .= $c;
$this->word = '';
$this->prev_boundary = $c;
}
function handle_word($c='') {
if ($this->word == '') {
return;
}
if ($c == ':' && $this->query[$this->i + 1] == ':') {
$this->axis = $this->word;
}
if ($c == ':' && $this->query[$this->i - 1] != ':' &&
$this->query[$this->i + 1] != ':') {
$this->output .= $this->word;
$this->skip_next_word = TRUE;
return;
}
if ($this->skip_next_word) {
$this->skip_next_word = FALSE;
$this->output .= $this->word;
return;
}
if (is_numeric($this->word) ||
$this->axis == 'attribute' ||
strpos($this->word, '@') === 0 ||
$c == '(' ||
$c == ':') {
$this->output .= $this->word;
return;
}
$this->output .= '__default__:' . $this->word;
}
function getQuery() {
return $this->output;
}
}