<?php
/**
 * @package dompdf
 * @link    http://dompdf.github.com/
 * @author  Benj Carson <benjcarson@digitaljunkies.ca>
 * @author  Helmut Tischer <htischer@weihenstephan.org>
 * @author  Fabien Ménager <fabien.menager@gmail.com>
 * @license http://www.gnu.org/copyleft/lesser.html GNU Lesser General Public License
 */

/**
 * The location of the default built-in CSS file.
 *
 * Defined as a global constant first because the path is built from an
 * expression, and is then re-exposed as
 * {@link Stylesheet::DEFAULT_STYLESHEET}.
 */
define('__DEFAULT_STYLESHEET', DOMPDF_LIB_DIR . DIRECTORY_SEPARATOR . "res" . DIRECTORY_SEPARATOR . "html.css");

/**
 * The master stylesheet class
 *
 * The Stylesheet class is responsible for parsing stylesheets and style
 * tags/attributes.  It also acts as a registry of the individual Style
 * objects generated by the current set of loaded CSS files and style
 * elements.
 *
 * @see Style
 * @package dompdf
 */
class Stylesheet {

  /**
   * The location of the default built-in CSS file.
*/
  const DEFAULT_STYLESHEET = __DEFAULT_STYLESHEET;

  /**
   * Origin identifier: user agent stylesheet
   *
   * @var int
   */
  const ORIG_UA = 1;

  /**
   * Origin identifier: user normal stylesheet
   *
   * @var int
   */
  const ORIG_USER = 2;

  /**
   * Origin identifier: author normal stylesheet
   *
   * @var int
   */
  const ORIG_AUTHOR = 3;

  /**
   * Offset added to a selector's specificity, keyed by stylesheet origin.
   *
   * @var int[]
   */
  private static $_stylesheet_origins = array(
    self::ORIG_UA =>     -0x0FFFFFFF, // user agent style sheets
    self::ORIG_USER =>   -0x0000FFFF, // user normal style sheets
    self::ORIG_AUTHOR =>  0x00000000, // author normal style sheets
  );

  /**
   * The dompdf instance this stylesheet belongs to
   *
   * @var DOMPDF
   */
  private $_dompdf;

  /**
   * Registry of the currently defined styles, keyed by selector
   *
   * @var Style[]
   */
  private $_styles;

  /**
   * Base protocol of the document being parsed.
   * Used to resolve relative urls.
   *
   * @var string
   */
  private $_protocol;

  /**
   * Base hostname of the document being parsed.
   * Used to resolve relative urls.
   *
   * @var string
   */
  private $_base_host;

  /**
   * Base path of the document being parsed.
   * Used to resolve relative urls.
   *
   * @var string
   */
  private $_base_path;

  /**
   * The styles defined by @page rules
   *
   * @var array<Style>
   */
  private $_page_styles;

  /**
   * Files that have already been loaded; consulted to prevent recursion
   *
   * @var array
   */
  private $_loaded_files;

  /**
   * Origin assigned to styles that are currently being created or added
   *
   * @var int
   */
  private $_current_origin = self::ORIG_UA;

  /**
   * Accepted CSS media types
   * List of types and parsing rules for future extensions:
   * http://www.w3.org/TR/REC-html40/types.html
   *   screen, tty, tv, projection, handheld, print, braille, aural, all
   * The following are non standard extensions for undocumented specific environments.
   *   static, visual, bitmap, paged, dompdf
   * Note, even though the generated pdf file is intended for print output,
   * the desired content might be different (e.g. screen or projection view of html file).
   * Therefore allow specification of content by dompdf setting DOMPDF_DEFAULT_MEDIA_TYPE.
   * If given, replace media "print" by DOMPDF_DEFAULT_MEDIA_TYPE.
   * (Previous version $ACCEPTED_MEDIA_TYPES = $ACCEPTED_GENERIC_MEDIA_TYPES + $ACCEPTED_DEFAULT_MEDIA_TYPE)
   */
  public static $ACCEPTED_DEFAULT_MEDIA_TYPE = "print";
  public static $ACCEPTED_GENERIC_MEDIA_TYPES = array("all", "static", "visual", "bitmap", "paged", "dompdf");

  /**
   * The class constructor.
   *
   * Starts with empty style and loaded-file registries and a single, unset
   * "base" page style.  The base protocol, host & path are initialized to
   * those of the current script.
   *
   * @param DOMPDF $dompdf
   */
  public function __construct(DOMPDF $dompdf) {
    $this->_dompdf       = $dompdf;
    $this->_styles       = array();
    $this->_loaded_files = array();

    list($this->_protocol, $this->_base_host, $this->_base_path) = explode_url($_SERVER["SCRIPT_FILENAME"]);

    $this->_page_styles = array("base" => null);
  }

  /**
   * Class destructor
   */
  public function __destruct() {
    clear_object($this);
  }

  /**
   * Set the base protocol
   *
   * @param string $protocol
   */
  public function set_protocol($protocol) {
    $this->_protocol = $protocol;
  }

  /**
   * Set the base host
   *
   * @param string $host
   */
  public function set_host($host) {
    $this->_base_host = $host;
  }

  /**
   * Set the base path
   *
   * @param string $path
   */
  public function set_base_path($path) {
    $this->_base_path = $path;
  }

  /**
   * Return the DOMPDF object
   *
   * @return DOMPDF
   */
  public function get_dompdf() {
    return $this->_dompdf;
  }

  /**
   * Return the base protocol for this stylesheet
   *
   * @return string
   */
  public function get_protocol() {
    return $this->_protocol;
  }

  /**
   * Return the base host for this stylesheet
   *
   * @return string
   */
  public function get_host() {
    return $this->_base_host;
  }

  /**
   * Return the base path for this stylesheet
   *
   * @return string
   */
  public function get_base_path() {
    return $this->_base_path;
  }

  /**
   * Return the array of page styles
   *
   * @return Style[]
   */
  public function get_page_styles() {
    return $this->_page_styles;
  }

  /**
   * Add a new Style object to the stylesheet
   *
add_style() adds a new Style object to the current stylesheet, or
   * merges a new Style with an existing one.  In both cases the stored
   * style is stamped with the stylesheet's current origin.
   *
   * @param string $key    the Style's selector
   * @param Style  $style  the Style to be added
   *
   * @throws DOMPDF_Exception if $key is not a string
   */
  function add_style($key, Style $style) {
    if ( !is_string($key) ) {
      throw new DOMPDF_Exception("CSS rule must be keyed by a string.");
    }

    if ( isset($this->_styles[$key]) ) {
      $this->_styles[$key]->merge($style);
    }
    else {
      // Store a copy so later changes to the caller's object do not leak in
      $this->_styles[$key] = clone $style;
    }

    $this->_styles[$key]->set_origin( $this->_current_origin );
  }

  /**
   * lookup a specific Style object
   *
   * lookup() returns the Style specified by $key, or null if the Style is
   * not found.
   *
   * @param string $key   the selector of the requested Style
   * @return Style|null
   */
  function lookup($key) {
    if ( !isset($this->_styles[$key]) ) {
      return null;
    }

    return $this->_styles[$key];
  }

  /**
   * create a new Style object associated with this stylesheet
   *
   * The new Style receives the stylesheet's current origin.
   *
   * @param Style $parent The style of this style's parent in the DOM tree
   *                      (accepted for API compatibility; not used here)
   * @return Style
   */
  function create_style(Style $parent = null) {
    return new Style($this, $this->_current_origin);
  }

  /**
   * load and parse a CSS string
   *
   * @param string $css  the CSS source (taken by reference)
   */
  function load_css(&$css) { $this->_parse_css($css); }

  /**
   * load and parse a CSS file
   *
   * The file may be a "data:" URI, a local path or a URL.  Loading a file
   * also makes it the base (protocol, host, path) for relative urls and,
   * when $origin is truthy, sets the current stylesheet origin.  A file
   * that was already loaded is silently skipped.  If the content cannot be
   * fetched, is empty, or (outside quirks mode) is served with a
   * Content-Type other than text/css, a warning is recorded and nothing is
   * parsed.
   *
   * @param string $file
   * @param int    $origin  one of the ORIG_* constants
   */
  function load_css_file($file, $origin = self::ORIG_AUTHOR) {
    if ( $origin ) {
      $this->_current_origin = $origin;
    }

    // Prevent circular references
    if ( isset($this->_loaded_files[$file]) ) {
      return;
    }

    $this->_loaded_files[$file] = true;

    if ( strpos($file, "data:") === 0) {
      $parsed = parse_data_uri($file);
      $css = $parsed["data"];
    }
    else {
      $parsed_url = explode_url($file);

      list($this->_protocol, $this->_base_host, $this->_base_path, $filename) = $parsed_url;

      // Fix submitted by Nick Oostveen for aliased directory support:
      if ( $this->_protocol == "" ) {
        $file = $this->_base_path . $filename;
      }
      else {
        $file = build_url($this->_protocol, $this->_base_host, $this->_base_path, $filename);
      }

      // Route warnings raised while fetching into dompdf's warning log.
      // The second argument is $use_include_path (a bool); pass false
      // explicitly, since passing null is deprecated on current PHP.
      set_error_handler("record_warnings");
      $css = file_get_contents($file, false, $this->_dompdf->get_http_context());
      restore_error_handler();

      $good_mime_type = true;

      // $http_response_header is populated by PHP's HTTP stream wrapper.
      // See http://the-stickman.com/web-development/php/getting-http-response-headers-when-using-file_get_contents/
      if ( isset($http_response_header) && !$this->_dompdf->get_quirksmode() ) {
        foreach($http_response_header as $_header) {
          if ( preg_match("@Content-Type:\s*([\w/]+)@i", $_header, $matches) &&
              ($matches[1] !== "text/css") ) {
            $good_mime_type = false;
          }
        }
      }

      if ( !$good_mime_type || $css == "" ) {
        record_warnings(E_USER_WARNING, "Unable to load css file $file", __FILE__, __LINE__);
        return;
      }
    }

    $this->_parse_css($css);
  }

  /**
   * Compute the sort weight (specificity plus origin offset) of a selector.
   *
   * The four specificity components are packed into one integer as
   * (a << 24) | (b << 16) | (c << 8) | d, with b, c and d capped at 255:
   *    - a: 1 for the pseudo selector "!attr" (inline style attribute)
   *    - b: number of "#" (ids)
   *    - c: number of "." and "[" (classes and attribute selectors)
   *    - d: number of " ", ">" and "+" (element steps)
   * The origin offset from self::$_stylesheet_origins is then added, so
   * that user agent and user rules sort below author rules.
   *
   * @link http://www.w3.org/TR/CSS21/cascade.html#specificity
   *
   * @param string $selector
   * @param int    $origin    one of ORIG_UA, ORIG_USER, ORIG_AUTHOR
   *
   * @return int
   */
  private function _specificity($selector, $origin = self::ORIG_AUTHOR) {
    // http://www.w3.org/TR/CSS21/cascade.html#specificity
    // ignoring the ":" pseudoclass modifyers
    // also ignored in _css_selector_to_xpath

    $a = ($selector === "!attr") ? 1 : 0;

    $b = min(mb_substr_count($selector, "#"), 255);

    $c = min(mb_substr_count($selector, ".") +
             mb_substr_count($selector, "["), 255);

    $d = min(mb_substr_count($selector, " ") +
             mb_substr_count($selector, ">") +
             mb_substr_count($selector, "+"), 255);

    //If a normal element name is at the begining of the string,
    //a leading whitespace might have been removed on whitespace collapsing and removal
    //therefore there might be one whitespace less as selected element names
    //this can lead to a too small specificity
    //see _css_selector_to_xpath

    if ( !in_array($selector[0], array(" ", ">", ".", "#", "+", ":", "["))/* && $selector !== "*"*/) {
      $d++;
    }

    $specificity = ($a << 24) | ($b << 16) | ($c << 8) | ($d);

    if (DEBUGCSS) {
      /*DEBUGCSS*/  print "<pre>\n";
      /*DEBUGCSS*/  printf("_specificity(): 0x%08x \"%s\"\n", $specificity, $selector);
      /*DEBUGCSS*/  print "</pre>";
    }

    // "+" binds tighter than "|": the packed value must be built first and
    // the origin offset added afterwards, otherwise a negative offset is
    // OR-ed into the b/c/d fields and corrupts the ordering.
    return self::$_stylesheet_origins[$origin] + $specificity;
  }

  /**
   * Converts a CSS selector to an XPath query.
*
   * The selector is scanned one delimiter at a time (" ", ">", ".", "#",
   * "+", ":", "[", "("); each delimiter together with the token following
   * it is appended to the query as an XPath step or predicate.
   *
   * @param string $selector
   * @param bool   $first_pass  when true, :before/:after are collected in
   *                            "pseudo_elements" instead of being added to
   *                            the query
   *
   * @throws DOMPDF_Exception on a malformed attribute selector
   * @return array  array("query" => string, "pseudo_elements" => array)
   */
  private function _css_selector_to_xpath($selector, $first_pass = false) {

    // Initial query (non-absolute)
    $query = "//";

    // Will contain :before and :after if they must be created
    $pseudo_elements = array();

    // Parse the selector
    $delimiters = array(" ", ">", ".", "#", "+", ":", "[", "(");

    // Add an implicit * at the beginning of the selector
    // if it begins with an attribute selector
    if ( $selector[0] === "[" ) {
      $selector = "*$selector";
    }

    // Add an implicit space at the beginning of the selector if there is no
    // delimiter there already.
    if ( !in_array($selector[0], $delimiters) ) {
      $selector = " $selector";
    }

    $tok = "";
    // The selector is indexed byte-wise below ($selector[$i]), so the bound
    // must be the byte length; a character count would cut off selectors
    // that contain multibyte characters.  All delimiters are ASCII, which
    // keeps byte-wise scanning safe for UTF-8.
    $len = strlen($selector);
    $i = 0;

    while ( $i < $len ) {

      $s = $selector[$i];
      $i++;

      // Eat characters up to the next delimiter
      $tok = "";
      $in_attr = false;

      while ($i < $len) {
        $c = $selector[$i];
        $c_prev = $selector[$i-1];

        if ( !$in_attr && in_array($c, $delimiters) ) {
          break;
        }

        // Inside [...] delimiters are part of the token
        if ( $c_prev === "[" ) {
          $in_attr = true;
        }

        $tok .= $selector[$i++];

        if ( $in_attr && $c === "]" ) {
          $in_attr = false;
          break;
        }
      }

      switch ($s) {

      case " ":
      case ">":
        // All elements matching the next token that are direct children of
        // the current token
        $expr = $s === " " ? "descendant" : "child";

        if ( mb_substr($query, -1, 1) !== "/" ) {
          $query .= "/";
        }

        // Tag names are case-insensitive
        $tok = strtolower($tok);

        if ( !$tok ) {
          $tok = "*";
        }

        $query .= "$expr::$tok";
        $tok = "";
        break;

      case ".":
      case "#":
        // All elements matching the current token with a class/id equal to
        // the _next_ token.

        $attr = $s === "." ? "class" : "id";

        // empty class/id == *
        if ( mb_substr($query, -1, 1) === "/" ) {
          $query .= "*";
        }

        // Match multiple classes: $tok contains the current selected
        // class.  A regex match is not possible because libxml only
        // supports XPath 1.0, so compare against the space-padded value.
        // Query improvement by Michael Sheakoski <michael@mjsdigital.com>:
        $query .= "[contains(concat(' ', @$attr, ' '), concat(' ', '$tok', ' '))]";
        $tok = "";
        break;

      case "+":
        // All sibling elements that folow the current token
        if ( mb_substr($query, -1, 1) !== "/" ) {
          $query .= "/";
        }

        $query .= "following-sibling::$tok";
        $tok = "";
        break;

      case ":":
        $i2 = $i-strlen($tok)-2; // the char before ":"
        if ( !isset($selector[$i2]) || in_array($selector[$i2], $delimiters) ) {
          $query .= "*";
        }

        $last = false;

        // Pseudo-classes
        switch ($tok) {

        case "first-child":
          $query .= "[1]";
          $tok = "";
          break;

        case "last-child":
          $query .= "[not(following-sibling::*)]";
          $tok = "";
          break;

        case "first-of-type":
          $query .= "[position() = 1]";
          $tok = "";
          break;

        case "last-of-type":
          $query .= "[position() = last()]";
          $tok = "";
          break;

        // an+b, n, odd, and even
        case "nth-last-of-type":
        case "nth-last-child":
          $last = true;
          // intentional fall-through: same handling, counted from the end

        case "nth-of-type":
        case "nth-child":
          // Extract the argument between "(" and ")"; offsets are byte
          // offsets (strpos), so use the byte-wise substr() with them.
          $p = $i+1;
          $nth = trim(substr($selector, $p, strpos($selector, ")", $i)-$p));

          // 1
          if ( preg_match("/^\d+$/", $nth) ) {
            $condition = "position() = $nth";
          }

          // odd
          elseif ( $nth === "odd" ) {
            $condition = "(position() mod 2) = 1";
          }

          // even
          elseif ( $nth === "even" ) {
            $condition = "(position() mod 2) = 0";
          }

          // an+b
          else {
            $condition = $this->_selector_an_plus_b($nth, $last);
          }

          $query .= "[$condition]";
          $tok = "";
          break;

        case "link":
          $query .= "[@href]";
          $tok = "";
          break;

        case "first-line": // TODO
        case "first-letter": // TODO

        // N/A
        case "active":
        case "hover":
        case "visited":
          $query .= "[false()]";
          $tok = "";
          break;

        /* Pseudo-elements */
        case "before":
        case "after":
          if ( $first_pass ) {
            $pseudo_elements[$tok] = $tok;
          }
          else {
            $query .= "/*[@$tok]";
          }

          $tok = "";
          break;

        case "empty":
          $query .= "[not(*) and not(normalize-space())]";
          $tok = "";
          break;

        case "disabled":
        case "checked":
          $query .= "[@$tok]";
          $tok = "";
          break;

        case "enabled":
          $query .= "[not(@disabled)]";
          $tok = "";
          break;
        }

        break;

      case "[":
        // Attribute selectors.  All with an attribute matching the following token(s)
        $attr_delimiters = array("=", "]", "~", "|", "$", "^", "*");
        $tok_len = strlen($tok); // byte length: $tok is indexed byte-wise
        $j = 0;

        $attr = "";
        $op = "";
        $value = "";

        // Read the attribute name
        while ( $j < $tok_len ) {
          if ( in_array($tok[$j], $attr_delimiters) ) {
            break;
          }
          $attr .= $tok[$j++];
        }

        // Read the operator, if any
        switch ( $tok[$j] ) {

        case "~":
        case "|":
        case "$":
        case "^":
        case "*":
          $op .= $tok[$j++];

          if ( $tok[$j] !== "=" ) {
            throw new DOMPDF_Exception("Invalid CSS selector syntax: invalid attribute selector: $selector");
          }

          $op .= $tok[$j];
          break;

        case "=":
          $op = "=";
          break;

        }

        // Read the attribute value, if required
        if ( $op != "" ) {
          $j++;
          while ( $j < $tok_len ) {
            if ( $tok[$j] === "]" ) {
              break;
            }
            $value .= $tok[$j++];
          }
        }

        if ( $attr == "" ) {
          throw new DOMPDF_Exception("Invalid CSS selector syntax: missing attribute name");
        }

        $value = trim($value, "\"'");

        switch ( $op ) {

        case "":
          $query .=  "[@$attr]";
          break;

        case "=":
          $query .= "[@$attr=\"$value\"]";
          break;

        case "~=":
          // FIXME: this will break if $value contains quoted strings
          // (e.g. [type~="a b c" "d e f"])
          $values = explode(" ", $value);
          $query .=  "[";

          foreach ( $values as $val ) {
            $query .= "@$attr=\"$val\" or ";
          }

          // Drop the trailing " or " left by the loop
          $query = rtrim($query, " or ") . "]";
          break;

        case "|=":
          $values = explode("-", $value);
          $query .= "[";

          foreach ( $values as $val ) {
            $query .= "starts-with(@$attr, \"$val\") or ";
          }

          // Drop the trailing " or " left by the loop
          $query = rtrim($query, " or ") . "]";
          break;

        case "$=":
          $query .= "[substring(@$attr, string-length(@$attr)-".(strlen($value) - 1).")=\"$value\"]";
          break;

        case "^=":
          $query .= "[starts-with(@$attr,\"$value\")]";
          break;

        case "*=":
          $query .= "[contains(@$attr,\"$value\")]";
          break;
        }

        break;
      }
    }

    // Trim the trailing '/' from the query
    if ( mb_strlen($query) > 2 ) {
      $query = rtrim($query, "/");
    }

    return array("query" => $query, "pseudo_elements" => $pseudo_elements);
  }

  /**
   * Translate the "an+b" argument of an :nth-* pseudo-class into an XPath
   * condition on the element position.
   *
   * Approach taken from
   * https://github.com/tenderlove/nokogiri/blob/master/lib/nokogiri/css/xpath_visitor.rb
   *
   * @param string $expr  the argument, e.g. "2n+1", "-n+3", "n"
   * @param bool   $last  count positions from the end (:nth-last-*)
   *
   * @return string  XPath boolean expression; "false()" when $expr is not
   *                 a valid an+b formula or can never match
   */
  protected function _selector_an_plus_b($expr, $last = false) {
    $expr = preg_replace("/\s/", "", $expr);
    if ( !preg_match("/^(?P<a>-?[0-9]*)?n(?P<b>[-+]?[0-9]+)?$/", $expr, $matches)) {
      return "false()";
    }

    // A missing coefficient means 1 and a bare "-" means -1; intval("-")
    // would yield 0 and turn "-n+3" into a modulo-by-zero that never matches.
    $a_str = isset($matches["a"]) ? $matches["a"] : "";
    if ( $a_str === "" ) {
      $a = 1;
    }
    elseif ( $a_str === "-" ) {
      $a = -1;
    }
    else {
      $a = intval($a_str);
    }

    $b = ((isset($matches["b"]) && $matches["b"] !== "") ? intval($matches["b"]) : 0);

    $position = ($last ? "(last()-position()+1)" : "position()");

    // "0n+b" selects exactly position b (positions start at 1)
    if ( $a === 0 ) {
      return ($b > 0) ? "$position = $b" : "false()";
    }

    if ( $b == 0 ) {
      // a*n with negative a never reaches a positive position
      if ( $a < 0 ) {
        return "false()";
      }

      return "($position mod $a) = 0";
    }

    // Positions lie on one side of b (depending on the sign of a) and at a
    // distance from b that is a multiple of |a|.
    $compare = (($a < 0) ? "<=" : ">=");
    $b2 = -$b;
    if ( $b2 >= 0 ) {
      $b2 = "+$b2";
    }

    return "($position $compare $b) and ((($position $b2) mod ".abs($a).") = 0)";
  }

  /**
   * applies all current styles to a particular document tree
   *
   * apply_styles() applies all currently loaded styles to the provided
   * {@link Frame_Tree}.  Aside from parsing CSS, this is the main purpose
   * of this class.
   *
   * @param Frame_Tree $tree
   */
  function apply_styles(Frame_Tree $tree) {
    // Use XPath to select nodes.  This would be easier if we could attach
    // Frame objects directly to DOMNodes using the setUserData() method, but
    // we can't do that just yet.  Instead, we set a _node attribute_ in
    // Frame->set_id() and use that as a handle on the Frame object via
    // Frame_Tree::$_registry.

    // We create a scratch array of styles indexed by frame id.  Once all
    // styles have been assigned, we order the cached styles by specificity
    // and create a final style object to assign to the frame.

    // FIXME: this is not particularly robust...
$styles = array();
    $xp = new DOMXPath($tree->get_dom());

    // Add generated content
    foreach ($this->_styles as $selector => $style) {
      if ( strpos($selector, ":before") === false && strpos($selector, ":after") === false ) {
        continue;
      }

      $query = $this->_css_selector_to_xpath($selector, true);

      // Retrieve the nodes
      $nodes = @$xp->query($query["query"]);
      if ( $nodes == null ) {
        record_warnings(E_USER_WARNING, "The CSS selector '$selector' is not valid", __FILE__, __LINE__);
        continue;
      }

      foreach ($nodes as $node) {
        foreach ($query["pseudo_elements"] as $pos) {
          // Do not add a new pseudo element if another one already matched
          if ( $node->hasAttribute("dompdf_{$pos}_frame_id") ) {
            continue;
          }

          // Generated content that is an image gets its own element type
          if (($src = $this->_image($style->content)) !== "none") {
            $new_node = $node->ownerDocument->createElement("img_generated");
            $new_node->setAttribute("src", $src);
          }
          else {
            $new_node = $node->ownerDocument->createElement("dompdf_generated");
          }

          $new_node->setAttribute($pos, $pos);

          $new_frame_id = $tree->insert_node($node, $new_node, $pos);
          $node->setAttribute("dompdf_{$pos}_frame_id", $new_frame_id);
        }
      }
    }

    // Apply all styles in stylesheet
    foreach ($this->_styles as $selector => $style) {
      $query = $this->_css_selector_to_xpath($selector);

      // Retrieve the nodes
      $nodes = @$xp->query($query["query"]);
      if ( $nodes == null ) {
        record_warnings(E_USER_WARNING, "The CSS selector '$selector' is not valid", __FILE__, __LINE__);
        continue;
      }

      foreach ($nodes as $node) {
        // Retrieve the node id
        // Only DOMElements get styles
        if ( $node->nodeType != XML_ELEMENT_NODE ) {
          continue;
        }

        $id = $node->getAttribute("frame_id");

        // Assign the current style to the scratch array
        $spec = $this->_specificity($selector);
        $styles[$id][$spec][] = $style;
      }
    }

    // Now create the styles and assign them to the appropriate frames.  (We
    // iterate over the tree using an implicit Frame_Tree iterator.)
    $root_flg = false;
    foreach ($tree->get_frames() as $frame) {
      // pre_r($frame->get_node()->nodeName . ":");
      // The first frame starts from the base @page style, if one was defined
      if ( !$root_flg && $this->_page_styles["base"] ) {
        $style = $this->_page_styles["base"];
        $root_flg = true;
      }
      else {
        $style = $this->create_style();
      }

      // Find nearest DOMElement parent
      $p = $frame;
      while ( $p = $p->get_parent() ) {
        if ( $p->get_node()->nodeType == XML_ELEMENT_NODE ) {
          break;
        }
      }

      // Styles can only be applied directly to DOMElements; anonymous
      // frames inherit from their parent
      if ( $frame->get_node()->nodeType != XML_ELEMENT_NODE ) {
        if ( $p ) {
          $style->inherit($p->get_style());
        }

        $frame->set_style($style);
        continue;
      }

      $id = $frame->get_id();

      // Handle HTML 4.0 attributes
      Attribute_Translator::translate_attributes($frame);
      if ( ($str = $frame->get_node()->getAttribute(Attribute_Translator::$_style_attr)) !== "" ) {
        // Lowest specificity
        $styles[$id][1][] = $this->_parse_properties($str);
      }

      // Locate any additional style attributes
      if ( ($str = $frame->get_node()->getAttribute("style")) !== "" ) {
        // Destroy CSS comments
        $str = preg_replace("'/\*.*?\*/'si", "", $str);

        $spec = $this->_specificity("!attr");
        $styles[$id][$spec][] = $this->_parse_properties($str);
      }

      // Grab the applicable styles
      if ( isset($styles[$id]) ) {

        $applied_styles = $styles[ $frame->get_id() ];

        // Sort by specificity
        ksort($applied_styles);

        if (DEBUGCSS) {
          $debug_nodename = $frame->get_node()->nodeName;
          print "<pre>\n[$debug_nodename\n";
          foreach ($applied_styles as $spec => $arr) {
            printf("specificity: 0x%08x\n",$spec);
            foreach ($arr as $s) {
              print "[\n";
              $s->debug_print();
              print "]\n";
            }
          }
        }

        // Merge the new styles with the inherited styles
        foreach ($applied_styles as $arr) {
          foreach ($arr as $s) {
            $style->merge($s);
          }
        }
      }

      // Inherit parent's styles if required
      if ( $p ) {

        if (DEBUGCSS) {
          print "inherit:\n";
          print "[\n";
          $p->get_style()->debug_print();
          print "]\n";
        }

        $style->inherit( $p->get_style() );
      }

      if (DEBUGCSS) {
        print "DomElementStyle:\n";
        print "[\n";
        $style->debug_print();
        print "]\n";
        print "/$debug_nodename]\n</pre>";
      }

      /*DEBUGCSS print: see below different print debugging method
      pre_r($frame->get_node()->nodeName . ":");
      echo "<pre>";
      echo $style;
      echo "</pre>";*/
      $frame->set_style($style);

    }

    // We're done!  Clean out the registry of all styles since we
    // won't be needing this later.
    foreach ( array_keys($this->_styles) as $key ) {
      $this->_styles[$key] = null;
      unset($this->_styles[$key]);
    }

  }

  /**
   * parse a CSS string using a regex parser
   *
   * Called by {@link Stylesheet::load_css()} and
   * {@link Stylesheet::load_css_file()}.  Comments are stripped, then the
   * text is split into @rules (import, media, page, font-face; any other
   * @rule is ignored) and plain rulesets, which are handed to the
   * dedicated parsing methods.
   *
   * @param string $str
   *
   * @throws DOMPDF_Exception if the regular expression engine fails
   */
  private function _parse_css($str) {

    $str = trim($str);

    // Destroy comments and remove HTML comments
    $css = preg_replace(array(
      "'/\*.*?\*/'si",
      "/^<!--/",
      "/-->$/"
    ), "", $str);

    // FIXME: handle '{' within strings, e.g. [attr="string {}"]

    // Something more legible:
    $re =
      "/\s*                                   # Skip leading whitespace                             \n".
      "( @([^\s]+)\s+([^{;]*) (?:;|({)) )?    # Match @rules followed by ';' or '{'                 \n".
      "(?(1)                                  # Only parse sub-sections if we're in an @rule...     \n".
      "  (?(4)                                # ...and if there was a leading '{'                   \n".
      "    \s*( (?:(?>[^{}]+) ({)?            # Parse rulesets and individual @page rules           \n".
      "            (?(6) (?>[^}]*) }) \s*)+?  \n".
      "       )                               \n".
      "   })                                  # Balancing '}'                                \n".
      "|                                      # Branch to match regular rules (not preceeded by '@')\n".
      "([^{]*{[^}]*}))                        # Parse normal rulesets\n".
      "/xs";

    if ( preg_match_all($re, $css, $matches, PREG_SET_ORDER) === false ) {
      // An error occured
      throw new DOMPDF_Exception("Error parsing css file: preg_match_all() failed.");
    }

    // After matching, the array indicies are set as follows:
    //
    // [0] => complete text of match
    // [1] => contains '@import ...;' or '@media {' if applicable
    // [2] => text following @ for cases where [1] is set
    // [3] => media types or full text following '@import ...;'
    // [4] => '{', if present
    // [5] => rulesets within media rules
    // [6] => '{', within media rules
    // [7] => individual rules, outside of media rules
    //
    //pre_r($matches);
    foreach ( $matches as $match ) {
      $match[2] = trim($match[2]);

      if ( $match[2] !== "" ) {
        // Handle @rules
        switch ($match[2]) {

        case "import":
          $this->_parse_import($match[3]);
          break;

        case "media":
          $acceptedmedia = self::$ACCEPTED_GENERIC_MEDIA_TYPES;
          $acceptedmedia[] = $this->_dompdf->get_option("default_media_type");

          $media = preg_split("/\s*,\s*/", mb_strtolower(trim($match[3])));

          // Only parse the section if at least one media type is accepted
          if ( count(array_intersect($acceptedmedia, $media)) ) {
            $this->_parse_sections($match[5]);
          }
          break;

        case "page":
          //This handles @page to be applied to page oriented media
          //Note: This has a reduced syntax:
          //@page { margin:1cm; color:blue; }
          //Not a sequence of styles like a full.css, but only the properties
          //of a single style, which is applied to the very first "root" frame before
          //processing other styles of the frame.
          //Working properties:
          // margin (for margin around edge of paper)
          // font-family (default font of pages)
          // color (default text color of pages)
          //Non working properties:
          // border
          // padding
          // background-color
          //Todo:Reason is unknown
          //Other properties (like further font or border attributes) not tested.
          //If a border or background color around each paper sheet is desired,
          //assign it to the <body> tag, possibly only for the css of the correct media type.

          // If the page has a name, skip the style.
          $page_selector = trim($match[3]);

          $key = null;
          switch($page_selector) {
            case "":
              $key = "base";
              break;

            case ":left":
            case ":right":
            case ":odd":
            case ":even":
            case ":first":
              $key = $page_selector;
              break;

            default:
              // Named page: leave both switches so nothing is stored.  A
              // bare "continue" here would only leave the inner switch and
              // the style would be stored under a null key.
              break 2;
          }

          // Store the style for later...
          if ( empty($this->_page_styles[$key]) ) {
            $this->_page_styles[$key] = $this->_parse_properties($match[5]);
          }
          else {
            $this->_page_styles[$key]->merge($this->_parse_properties($match[5]));
          }
          break;

        case "font-face":
          $this->_parse_font_face($match[5]);
          break;

        default:
          // ignore everything else
          break;
        }

        continue;
      }

      if ( $match[7] !== "" ) {
        $this->_parse_sections($match[7]);
      }

    }
  }

  /* See also style.cls Style::_image(), refactoring?, works also for imported css files */
  protected function _image($val) {
    $DEBUGCSS=DEBUGCSS;
    $parsed_url = "none";

    if ( mb_strpos($val, "url") === false ) {
      $path = "none"; //Don't resolve no image -> otherwise would prefix path and no longer recognize as none
    }
    else {
      $val = preg_replace("/url\(['\"]?([^'\")]+)['\"]?\)/","\\1", trim($val));

      // Resolve the url now in the context of the current stylesheet
      $parsed_url = explode_url($val);
      if ( $parsed_url["protocol"] == "" && $this->get_protocol() == "" ) {
        if ($parsed_url["path"][0] === '/' || $parsed_url["path"][0] === '\\' ) {
          $path = $_SERVER["DOCUMENT_ROOT"].'/';
        }
        else {
          $path = $this->get_base_path();
        }

        $path .= $parsed_url["path"] . $parsed_url["file"];
        $path = realpath($path);
        // If realpath returns FALSE then specifically state that there is no background image
        // FIXME: Is this causing problems for imported CSS files? There are some './none' references when running the test cases.
if (!$path) { $path = 'none'; }      }      else {        $path = build_url($this->get_protocol(),                          $this->get_host(),                          $this->get_base_path(),                          $val);      }    }        if ($DEBUGCSS) {      print "<pre>[_image\n";      print_r($parsed_url);      print $this->get_protocol()."\n".$this->get_base_path()."\n".$path."\n";      print "_image]</pre>";;    }        return $path;  }  /**   * parse @import{} sections   *   * @param string $url  the url of the imported CSS file   */  private function _parse_import($url) {    $arr = preg_split("/[\s\n,]/", $url,-1, PREG_SPLIT_NO_EMPTY);    $url = array_shift($arr);    $accept = false;    if ( count($arr) > 0 ) {      $acceptedmedia = self::$ACCEPTED_GENERIC_MEDIA_TYPES;      $acceptedmedia[] = $this->_dompdf->get_option("default_media_type");                    // @import url media_type [media_type...]      foreach ( $arr as $type ) {        if ( in_array(mb_strtolower(trim($type)), $acceptedmedia) ) {          $accept = true;          break;        }      }    }    else {      // unconditional import      $accept = true;    }    if ( $accept ) {      // Store our current base url properties in case the new url is elsewhere      $protocol = $this->_protocol;      $host = $this->_base_host;      $path = $this->_base_path;            // $url = str_replace(array('"',"url", "(", ")"), "", $url);      // If the protocol is php, assume that we will import using file://      // $url = build_url($protocol == "php://" ? "file://" : $protocol, $host, $path, $url);      // Above does not work for subfolders and absolute urls.      // Todo: As above, do we need to replace php or file to an empty protocol for local files?            
$url = $this->_image($url);            $this->load_css_file($url);      // Restore the current base url      $this->_protocol = $protocol;      $this->_base_host = $host;      $this->_base_path = $path;    }  }    /**   * parse @font-face{} sections   * http://www.w3.org/TR/css3-fonts/#the-font-face-rule   *    * @param string $str CSS @font-face rules   * @return Style   */  private function _parse_font_face($str) {    $descriptors = $this->_parse_properties($str);        preg_match_all("/(url|local)\s*\([\"\']?([^\"\'\)]+)[\"\']?\)\s*(format\s*\([\"\']?([^\"\'\)]+)[\"\']?\))?/i", $descriptors->src, $src);        $sources = array();    $valid_sources = array();        foreach($src[0] as $i => $value) {      $source = array(        "local"  => strtolower($src[1][$i]) === "local",        "uri"    => $src[2][$i],        "format" => $src[4][$i],        "path"   => build_url($this->_protocol, $this->_base_host, $this->_base_path, $src[2][$i]),      );            if ( !$source["local"] && in_array($source["format"], array("", "woff", "opentype", "truetype")) ) {        $valid_sources[] = $source;      }            $sources[] = $source;    }        // No valid sources    if ( empty($valid_sources) ) {      return;    }        $style = array(      "family" => $descriptors->get_font_family_raw(),      "weight" => $descriptors->font_weight,      "style"  => $descriptors->font_style,    );        Font_Metrics::register_font($style, $valid_sources[0]["path"]);  }  /**   * parse regular CSS blocks   *   * _parse_properties() creates a new Style object based on the provided   * CSS rules.   
*   * @param string $str  CSS rules   * @return Style   */  private function _parse_properties($str) {    $properties = preg_split("/;(?=(?:[^\(]*\([^\)]*\))*(?![^\)]*\)))/", $str);    if (DEBUGCSS) print '[_parse_properties';    // Create the style    $style = new Style($this);        foreach ($properties as $prop) {      // If the $prop contains an url, the regex may be wrong      // @todo: fix the regex so that it works everytime      /*if (strpos($prop, "url(") === false) {        if (preg_match("/([a-z-]+)\s*:\s*[^:]+$/i", $prop, $m))          $prop = $m[0];      }*/      //A css property can have " ! important" appended (whitespace optional)      //strip this off to decode core of the property correctly.      //Pass on in the style to allow proper handling:      //!important properties can only be overridden by other !important ones.      //$style->$prop_name = is a shortcut of $style->__set($prop_name,$value);.      //If no specific set function available, set _props["prop_name"]      //style is always copied completely, or $_props handled separately      //Therefore set a _important_props["prop_name"]=true to indicate the modifier      /* Instead of short code, prefer the typical case with fast code    $important = preg_match("/(.*?)!\s*important/",$prop,$match);      if ( $important ) {        $prop = $match[1];      }      $prop = trim($prop);      */      if (DEBUGCSS) print '(';            $important = false;      $prop = trim($prop);            if ( substr($prop, -9) === 'important' ) {        $prop_tmp = rtrim(substr($prop, 0, -9));                if ( substr($prop_tmp, -1) === '!' 
) {          $prop = rtrim(substr($prop_tmp, 0, -1));          $important = true;        }      }      if ( $prop === "" ) {        if (DEBUGCSS) print 'empty)';        continue;      }      $i = mb_strpos($prop, ":");      if ( $i === false ) {        if (DEBUGCSS) print 'novalue'.$prop.')';        continue;      }      $prop_name = rtrim(mb_strtolower(mb_substr($prop, 0, $i)));      $value = ltrim(mb_substr($prop, $i+1));      if (DEBUGCSS) print $prop_name.':='.$value.($important?'!IMPORTANT':'').')';      //New style, anyway empty      //if ($important || !$style->important_get($prop_name) ) {      //$style->$prop_name = array($value,$important);      //assignment might be replaced by overloading through __set,      //and overloaded functions might check _important_props,      //therefore set _important_props first.      if ($important) {        $style->important_set($prop_name);      }      //For easier debugging, don't use overloading of assignments with __set      $style->$prop_name = $value;      //$style->props_set($prop_name, $value);    }    if (DEBUGCSS) print '_parse_properties]';    return $style;  }  /**   * parse selector + rulesets   *   * @param string $str  CSS selectors and rulesets   */  private function _parse_sections($str) {    // Pre-process: collapse all whitespace and strip whitespace around '>',    // '.', ':', '+', '#'    $patterns = array("/[\\s\n]+/", "/\\s+([>.:+#])\\s+/");    $replacements = array(" ", "\\1");    $str = preg_replace($patterns, $replacements, $str);    $sections = explode("}", $str);    if (DEBUGCSS) print '[_parse_sections';    foreach ($sections as $sect) {      $i = mb_strpos($sect, "{");      $selectors = explode(",", mb_substr($sect, 0, $i));      if (DEBUGCSS) print '[section';      $style = $this->_parse_properties(trim(mb_substr($sect, $i+1)));            // Assign it to the selected elements      foreach ($selectors as $selector) {        $selector = trim($selector);        if ($selector == "") {          if 
(DEBUGCSS) print '#empty#';          continue;        }        if (DEBUGCSS) print '#'.$selector.'#';        //if (DEBUGCSS) { if (strpos($selector,'p') !== false) print '!!!p!!!#'; }        $this->add_style($selector, $style);      }            if (DEBUGCSS) print 'section]';    }        if (DEBUGCSS) print '_parse_sections]';  }  /**   * dumps the entire stylesheet as a string   *   * Generates a string of each selector and associated style in the   * Stylesheet.  Useful for debugging.   *   * @return string   */  function __toString() {    $str = "";    foreach ($this->_styles as $selector => $style) {      $str .= "$selector => " . $style->__toString() . "\n";    }    return $str;  }}
 |