12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418 |
- <?php
- /**
- * @package dompdf
- * @link http://dompdf.github.com/
- * @author Benj Carson <benjcarson@digitaljunkies.ca>
- * @author Helmut Tischer <htischer@weihenstephan.org>
- * @author Fabien Ménager <fabien.menager@gmail.com>
- * @license http://www.gnu.org/copyleft/lesser.html GNU Lesser General Public License
- */
-
- /**
- * The location of the default built-in CSS file.
- * {@link Stylesheet::DEFAULT_STYLESHEET}
- *
- * The path is assembled from the DOMPDF_LIB_DIR constant (not defined in this
- * file) followed by "res/html.css", using the platform directory separator.
- * The same value is exposed as the Stylesheet::DEFAULT_STYLESHEET class constant.
- */
- define('__DEFAULT_STYLESHEET', DOMPDF_LIB_DIR . DIRECTORY_SEPARATOR . "res" . DIRECTORY_SEPARATOR . "html.css");
-
- /**
- * The master stylesheet class
- *
- * The Stylesheet class is responsible for parsing stylesheets and style
- * tags/attributes. It also acts as a registry of the individual Style
- * objects generated by the current set of loaded CSS files and style
- * elements.
- *
- * @see Style
- * @package dompdf
- */
- class Stylesheet {
-
- /**
- * The location of the default built-in CSS file.
- */
- const DEFAULT_STYLESHEET = __DEFAULT_STYLESHEET;
-
- /**
- * User agent stylesheet origin
- *
- * @var int
- */
- const ORIG_UA = 1;
-
- /**
- * User normal stylesheet origin
- *
- * @var int
- */
- const ORIG_USER = 2;
-
- /**
- * Author normal stylesheet origin
- *
- * @var int
- */
- const ORIG_AUTHOR = 3;
-
- /**
- * Specificity offset for each stylesheet origin, keyed by the ORIG_* constants.
- * _specificity() combines the offset of the requested origin with the
- * specificity computed from the selector itself.
- *
- * @var array
- */
- private static $_stylesheet_origins = array(
- self::ORIG_UA => -0x0FFFFFFF, // user agent style sheets
- self::ORIG_USER => -0x0000FFFF, // user normal style sheets
- self::ORIG_AUTHOR => 0x00000000, // author normal style sheets
- );
-
- /**
- * Current dompdf instance
- *
- * @var DOMPDF
- */
- private $_dompdf;
-
- /**
- * Array of currently defined styles
- *
- * @var Style[]
- */
- private $_styles;
-
- /**
- * Base protocol of the document being parsed
- * Used to handle relative urls.
- *
- * @var string
- */
- private $_protocol;
-
- /**
- * Base hostname of the document being parsed
- * Used to handle relative urls.
- *
- * @var string
- */
- private $_base_host;
-
- /**
- * Base path of the document being parsed
- * Used to handle relative urls.
- *
- * @var string
- */
- private $_base_path;
-
- /**
- * The styles defined by @page rules
- *
- * @var array<Style>
- */
- private $_page_styles;
-
- /**
- * List of loaded files, used to prevent recursion
- *
- * @var array
- */
- private $_loaded_files;
-
- /**
- * Current stylesheet origin
- *
- * @var int
- */
- private $_current_origin = self::ORIG_UA;
-
- /**
- * Accepted CSS media types
- * List of types and parsing rules for future extensions:
- * http://www.w3.org/TR/REC-html40/types.html
- * screen, tty, tv, projection, handheld, print, braille, aural, all
- * The following are non standard extensions for undocumented specific environments.
- * static, visual, bitmap, paged, dompdf
- * Note, even though the generated pdf file is intended for print output,
- * the desired content might be different (e.g. screen or projection view of html file).
- * Therefore allow specification of content by dompdf setting DOMPDF_DEFAULT_MEDIA_TYPE.
- * If given, replace media "print" by DOMPDF_DEFAULT_MEDIA_TYPE.
- * (Previous version $ACCEPTED_MEDIA_TYPES = $ACCEPTED_GENERIC_MEDIA_TYPES + $ACCEPTED_DEFAULT_MEDIA_TYPE)
- */
- // Built-in default media type.
- // NOTE(review): the @media and @import handling visible in this file reads the
- // "default_media_type" dompdf option rather than this property - confirm it is still used.
- static $ACCEPTED_DEFAULT_MEDIA_TYPE = "print";
- // Media types that the @media and @import handling always accepts, in addition
- // to the configured default media type.
- static $ACCEPTED_GENERIC_MEDIA_TYPES = array("all", "static", "visual", "bitmap", "paged", "dompdf");
-
/**
 * Create an empty stylesheet attached to a DOMPDF instance.
 *
 * The style registry and the list of loaded files start out empty, and the
 * only page style slot ("base") is unset. The base protocol, host and path
 * are taken from the URL parts of the currently running script
 * ($_SERVER["SCRIPT_FILENAME"]).
 *
 * @param DOMPDF $dompdf the owning DOMPDF instance
 */
public function __construct(DOMPDF $dompdf) {
  $this->_dompdf = $dompdf;
  $this->_styles = array();
  $this->_loaded_files = array();

  $script_url = explode_url($_SERVER["SCRIPT_FILENAME"]);
  list($this->_protocol, $this->_base_host, $this->_base_path) = $script_url;

  $this->_page_styles = array("base" => null);
}
-
/**
 * Class destructor.
 *
 * Passes this instance to clear_object(), a helper defined outside this file.
 */
public function __destruct() {
  clear_object($this);
}
-
/**
 * Replace the base protocol used when resolving relative URLs.
 *
 * @param string $protocol
 */
public function set_protocol($protocol) {
  $this->_protocol = $protocol;
}
-
/**
 * Replace the base host used when resolving relative URLs.
 *
 * @param string $host
 */
public function set_host($host) {
  $this->_base_host = $host;
}
-
/**
 * Replace the base path used when resolving relative URLs.
 *
 * @param string $path
 */
public function set_base_path($path) {
  $this->_base_path = $path;
}
-
/**
 * Return the DOMPDF instance this stylesheet was created for.
 *
 * @return DOMPDF
 */
public function get_dompdf() {
  return $this->_dompdf;
}
-
/**
 * Return the base protocol currently used to resolve relative URLs.
 *
 * @return string
 */
public function get_protocol() {
  return $this->_protocol;
}
-
/**
 * Return the base host currently used to resolve relative URLs.
 *
 * @return string
 */
public function get_host() {
  return $this->_base_host;
}
-
/**
 * Return the base path currently used to resolve relative URLs.
 *
 * @return string
 */
public function get_base_path() {
  return $this->_base_path;
}
-
/**
 * Return the styles collected from @page rules, keyed by page selector
 * ("base" for an unqualified @page rule).
 *
 * @return Style[]
 */
public function get_page_styles() {
  return $this->_page_styles;
}
-
/**
 * Register a Style under a selector.
 *
 * When the selector is new, a clone of $style is stored; when a Style is
 * already registered for it, $style is merged into the existing one. In both
 * cases the stored Style is then tagged with the current stylesheet origin.
 *
 * @param string $key the Style's selector
 * @param Style $style the Style to be added
 *
 * @throws DOMPDF_Exception when $key is not a string
 */
public function add_style($key, Style $style) {
  if ( !is_string($key) ) {
    throw new DOMPDF_Exception("CSS rule must be keyed by a string.");
  }

  if ( !isset($this->_styles[$key]) ) {
    $this->_styles[$key] = clone $style;
  }
  else {
    $this->_styles[$key]->merge($style);
  }

  $registered = $this->_styles[$key];
  $registered->set_origin( $this->_current_origin );
}
-
/**
 * Look up a specific Style object.
 *
 * @param string $key the selector of the requested Style
 * @return Style the Style registered under $key, or null when there is none
 */
public function lookup($key) {
  return isset($this->_styles[$key]) ? $this->_styles[$key] : null;
}
-
/**
 * Create a new Style object associated with this stylesheet and tagged with
 * the current stylesheet origin.
 *
 * @param Style $parent accepted for interface compatibility; this method
 *                      does not read it
 * @return Style
 */
public function create_style(Style $parent = null) {
  $style = new Style($this, $this->_current_origin);

  return $style;
}
-
/**
 * Load and parse a CSS string.
 *
 * The string is taken by reference and handed straight to the CSS parser.
 *
 * @param string $css
 */
public function load_css(&$css) {
  $this->_parse_css($css);
}
-
-
/**
 * Load and parse a CSS file.
 *
 * The file may be a local path, a URL or a "data:" URI. Each distinct $file
 * value is loaded at most once per stylesheet, which also protects against
 * circular @import chains. For non-data sources the base protocol, host and
 * path of this stylesheet are replaced by those of the loaded file so that
 * relative URLs inside it resolve against its own location.
 *
 * Unless the document is in quirks mode, a response served over HTTP is only
 * accepted when its Content-Type is text/css. When redirects were followed,
 * PHP exposes the headers of every response in the chain; the Content-Type
 * of the last response is the one that decides.
 *
 * @param string $file
 * @param int $origin one of the ORIG_* constants; a falsy value keeps the
 *                    current origin
 */
function load_css_file($file, $origin = self::ORIG_AUTHOR) {
  if ( $origin ) {
    $this->_current_origin = $origin;
  }

  // Prevent circular references
  if ( isset($this->_loaded_files[$file]) ) {
    return;
  }

  $this->_loaded_files[$file] = true;

  if ( strpos($file, "data:") === 0 ) {
    $parsed = parse_data_uri($file);

    // Nothing usable came back from the data URI parser: report it instead
    // of reading an offset from a non-array value
    if ( !is_array($parsed) || !isset($parsed["data"]) ) {
      record_warnings(E_USER_WARNING, "Unable to load css file $file", __FILE__, __LINE__);
      return;
    }

    $css = $parsed["data"];
  }
  else {
    $parsed_url = explode_url($file);

    list($this->_protocol, $this->_base_host, $this->_base_path, $filename) = $parsed_url;

    // Fix submitted by Nick Oostveen for aliased directory support:
    if ( $this->_protocol == "" ) {
      $file = $this->_base_path . $filename;
    }
    else {
      $file = build_url($this->_protocol, $this->_base_host, $this->_base_path, $filename);
    }

    // Route read warnings to record_warnings() while the file is fetched.
    // The second argument ($use_include_path) is a bool; passing null is
    // deprecated since PHP 8.1.
    set_error_handler("record_warnings");
    $css = file_get_contents($file, false, $this->_dompdf->get_http_context());
    restore_error_handler();

    $good_mime_type = true;

    // See http://the-stickman.com/web-development/php/getting-http-response-headers-when-using-file_get_contents/
    if ( isset($http_response_header) && !$this->_dompdf->get_quirksmode() ) {
      foreach ($http_response_header as $_header) {
        // Every Content-Type header overrides the verdict of the previous
        // one, so an intermediate redirect response (typically text/html)
        // no longer rejects a stylesheet that is finally served as text/css.
        // MIME types are case-insensitive.
        if ( preg_match("@^Content-Type:\s*([\w/]+)@i", $_header, $matches) ) {
          $good_mime_type = (strtolower($matches[1]) === "text/css");
        }
      }
    }

    if ( !$good_mime_type || $css == "" ) {
      record_warnings(E_USER_WARNING, "Unable to load css file $file", __FILE__, __LINE__);
      return;
    }
  }

  $this->_parse_css($css);
}
-
/**
 * Compute the sort key (origin offset + specificity) of a selector.
 *
 * The specificity is packed into one integer as four 8-bit fields
 * (a << 24 | b << 16 | c << 8 | d):
 *  - a: 1 for the pseudo selector "!attr" (inline style attribute), else 0
 *  - b: number of "#" (ids)
 *  - c: number of "." and "[" (classes and attribute selectors)
 *  - d: number of element names, estimated from the combinators " ", ">", "+"
 * The ":" pseudo-class modifiers are ignored, as in _css_selector_to_xpath().
 * Each field is clamped to 255 so it cannot spill into its neighbour.
 *
 * @link http://www.w3.org/TR/CSS21/cascade.html#specificity
 *
 * @param string $selector
 * @param int $origin one of the ORIG_* constants; selects the offset that is
 *                    added to the packed specificity
 *
 * @return int
 */
private function _specificity($selector, $origin = self::ORIG_AUTHOR) {
  $a = ($selector === "!attr") ? 1 : 0;

  $b = min(mb_substr_count($selector, "#"), 255);

  $c = min(mb_substr_count($selector, ".") +
           mb_substr_count($selector, "["), 255);

  $d = mb_substr_count($selector, " ") +
       mb_substr_count($selector, ">") +
       mb_substr_count($selector, "+");

  // If a normal element name is at the beginning of the string, its leading
  // whitespace was removed by whitespace collapsing, so there is one
  // combinator less than there are element names: count that element here.
  // The emptiness check avoids reading offset 0 of an empty string.
  if ( $selector !== "" && !in_array($selector[0], array(" ", ">", ".", "#", "+", ":", "["), true) ) {
    $d++;
  }

  // Clamp after the adjustment above so that d never exceeds its 8 bits
  $d = min($d, 255);

  $specificity = ($a << 24) | ($b << 16) | ($c << 8) | $d;

  if (DEBUGCSS) {
    /*DEBUGCSS*/ print "<pre>\n";
    /*DEBUGCSS*/ printf("_specificity(): 0x%08x \"%s\"\n", $specificity, $selector);
    /*DEBUGCSS*/ print "</pre>";
  }

  // "+" binds tighter than "|": the packed value must be built first and
  // then offset by the origin, otherwise a non-zero origin offset is OR-ed
  // with the selector bits and corrupts the ordering.
  return self::$_stylesheet_origins[$origin] + $specificity;
}
-
/**
 * Converts a CSS selector to an XPath query.
 *
 * The selector is scanned byte by byte. Each step reads one delimiter
 * (" ", ">", ".", "#", "+", ":", "[" or "(") followed by the token that runs
 * up to the next delimiter, and appends the matching XPath fragment to the
 * query. Inside an attribute selector, delimiters are treated as ordinary
 * characters up to the closing "]".
 *
 * @param string $selector
 * @param bool $first_pass when true, :before and :after are only recorded in
 *                         the "pseudo_elements" entry of the result; when
 *                         false they are translated into the query itself
 *
 * @throws DOMPDF_Exception on a malformed attribute selector
 * @return array array("query" => string, "pseudo_elements" => array)
 */
private function _css_selector_to_xpath($selector, $first_pass = false) {

  // Initial query (non-absolute)
  $query = "//";

  // Will contain :before and :after if they must be created
  $pseudo_elements = array();

  $delimiters = array(" ", ">", ".", "#", "+", ":", "[", "(");

  // Guarded read so that an empty selector does not access a missing offset
  $first = isset($selector[0]) ? $selector[0] : "";

  // Add an implicit * at the beginning of the selector
  // if it begins with an attribute selector
  if ( $first === "[" ) {
    $selector = "*$selector";
    $first = "*";
  }

  // Add an implicit space at the beginning of the selector if there is no
  // delimiter there already.
  if ( !in_array($first, $delimiters) ) {
    $selector = " $selector";
  }

  // The selector is indexed by byte offset below, so its length has to be
  // measured in bytes too (a character count would cut multibyte selectors
  // short).
  $len = strlen($selector);
  $i = 0;

  while ( $i < $len ) {

    $s = $selector[$i];
    $i++;

    // Eat characters up to the next delimiter
    $tok = "";
    $in_attr = false;

    while ( $i < $len ) {
      $c = $selector[$i];
      $c_prev = $selector[$i-1];

      if ( !$in_attr && in_array($c, $delimiters) ) {
        break;
      }

      if ( $c_prev === "[" ) {
        $in_attr = true;
      }

      $tok .= $selector[$i++];

      if ( $in_attr && $c === "]" ) {
        $in_attr = false;
        break;
      }
    }

    switch ($s) {

    case " ":
    case ">":
      // " ": all descendants matching the token; ">": direct children only
      $expr = $s === " " ? "descendant" : "child";

      if ( substr($query, -1) !== "/" ) {
        $query .= "/";
      }

      // Tag names are case-insensitive
      $tok = strtolower($tok);

      if ( !$tok ) {
        $tok = "*";
      }

      $query .= "$expr::$tok";
      $tok = "";
      break;

    case ".":
    case "#":
      // All elements matching the current token with a class/id equal to
      // the _next_ token.

      $attr = $s === "." ? "class" : "id";

      // empty class/id == *
      if ( substr($query, -1) === "/" ) {
        $query .= "*";
      }

      // Match multiple classes: $tok contains the current selected
      // class. libxml only supports XPath 1.0 (no matches()), so the
      // attribute is padded with spaces and searched for " $tok ".
      // Query improvement by Michael Sheakoski <michael@mjsdigital.com>:
      $query .= "[contains(concat(' ', @$attr, ' '), concat(' ', '$tok', ' '))]";
      $tok = "";
      break;

    case "+":
      // All sibling elements that follow the current token
      if ( substr($query, -1) !== "/" ) {
        $query .= "/";
      }

      $query .= "following-sibling::$tok";
      $tok = "";
      break;

    case ":":
      // Offset of the char before ":". It is negative when the selector
      // starts with ":"; since PHP 7.1 a negative string offset counts from
      // the end of the string, so that case must be tested explicitly.
      $i2 = $i - strlen($tok) - 2;
      if ( $i2 < 0 || !isset($selector[$i2]) || in_array($selector[$i2], $delimiters) ) {
        $query .= "*";
      }

      $last = false;

      // Pseudo-classes
      switch ($tok) {

      case "first-child":
        $query .= "[1]";
        $tok = "";
        break;

      case "last-child":
        $query .= "[not(following-sibling::*)]";
        $tok = "";
        break;

      case "first-of-type":
        $query .= "[position() = 1]";
        $tok = "";
        break;

      case "last-of-type":
        $query .= "[position() = last()]";
        $tok = "";
        break;

      // an+b, n, odd, and even
      case "nth-last-of-type":
      case "nth-last-child":
        $last = true;
        // intentional fall-through

      case "nth-of-type":
      case "nth-child":
        // $i points at the "(" that ended the token
        $close = strpos($selector, ")", $i);

        if ( !isset($selector[$i]) || $selector[$i] !== "(" || $close === false ) {
          // Missing or unterminated argument list: match nothing
          $condition = "false()";
        }
        else {
          $nth = trim(substr($selector, $i + 1, $close - $i - 1));

          // Continue scanning after the ")" so the argument is not
          // tokenised again (the "+" of "2n+1" would otherwise be read as
          // an adjacent-sibling combinator)
          $i = $close + 1;

          // The nth-last-* variants count from the end
          $position = $last ? "(last()-position()+1)" : "position()";

          // 1
          if ( preg_match("/^\d+$/", $nth) ) {
            $condition = "$position = $nth";
          }

          // odd
          elseif ( $nth === "odd" ) {
            $condition = "($position mod 2) = 1";
          }

          // even
          elseif ( $nth === "even" ) {
            $condition = "($position mod 2) = 0";
          }

          // an+b
          else {
            $condition = $this->_selector_an_plus_b($nth, $last);
          }
        }

        $query .= "[$condition]";
        $tok = "";
        break;

      case "link":
        $query .= "[@href]";
        $tok = "";
        break;

      case "first-line": // TODO
      case "first-letter": // TODO

      // N/A
      case "active":
      case "hover":
      case "visited":
        $query .= "[false()]";
        $tok = "";
        break;

      /* Pseudo-elements */
      case "before":
      case "after":
        if ( $first_pass ) {
          $pseudo_elements[$tok] = $tok;
        }
        else {
          $query .= "/*[@$tok]";
        }

        $tok = "";
        break;

      case "empty":
        $query .= "[not(*) and not(normalize-space())]";
        $tok = "";
        break;

      case "disabled":
      case "checked":
        $query .= "[@$tok]";
        $tok = "";
        break;

      case "enabled":
        $query .= "[not(@disabled)]";
        $tok = "";
        break;
      }

      break;

    case "[":
      // Attribute selectors. All with an attribute matching the following token(s)
      $attr_delimiters = array("=", "]", "~", "|", "$", "^", "*");
      $tok_len = strlen($tok);
      $j = 0;

      $attr = "";
      $op = "";
      $value = "";

      while ( $j < $tok_len ) {
        if ( in_array($tok[$j], $attr_delimiters) ) {
          break;
        }
        $attr .= $tok[$j++];
      }

      // $j may be past the end when the closing "]" is missing
      switch ( isset($tok[$j]) ? $tok[$j] : "" ) {

      case "~":
      case "|":
      case "$":
      case "^":
      case "*":
        $op .= $tok[$j++];

        if ( !isset($tok[$j]) || $tok[$j] !== "=" ) {
          throw new DOMPDF_Exception("Invalid CSS selector syntax: invalid attribute selector: $selector");
        }

        $op .= $tok[$j];
        break;

      case "=":
        $op = "=";
        break;

      }

      // Read the attribute value, if required
      if ( $op != "" ) {
        $j++;
        while ( $j < $tok_len ) {
          if ( $tok[$j] === "]" ) {
            break;
          }
          $value .= $tok[$j++];
        }
      }

      if ( $attr == "" ) {
        throw new DOMPDF_Exception("Invalid CSS selector syntax: missing attribute name");
      }

      $value = trim($value, "\"'");

      switch ( $op ) {

      case "":
        $query .= "[@$attr]";
        break;

      case "=":
        $query .= "[@$attr=\"$value\"]";
        break;

      case "~=":
        // CSS 2.1: matches when the attribute is a whitespace-separated
        // list of words, one of which is exactly $value. An empty value or
        // one containing whitespace never matches.
        if ( $value === "" || preg_match("/\s/", $value) ) {
          $query .= "[false()]";
        }
        else {
          $query .= "[contains(concat(' ', normalize-space(@$attr), ' '), \" $value \")]";
        }
        break;

      case "|=":
        // CSS 2.1: matches when the attribute is exactly $value or starts
        // with $value immediately followed by "-"
        $query .= "[@$attr=\"$value\" or starts-with(@$attr, \"$value-\")]";
        break;

      case "$=":
        // Lengths are computed by XPath itself so they are counted the same
        // way on both sides, whatever the encoding of $value
        $query .= "[substring(@$attr, string-length(@$attr) - string-length(\"$value\") + 1)=\"$value\"]";
        break;

      case "^=":
        $query .= "[starts-with(@$attr,\"$value\")]";
        break;

      case "*=":
        $query .= "[contains(@$attr,\"$value\")]";
        break;
      }

      break;
    }
  }

  // Trim the trailing '/' from the query
  if ( mb_strlen($query) > 2 ) {
    $query = rtrim($query, "/");
  }

  return array("query" => $query, "pseudo_elements" => $pseudo_elements);
}
-
/**
 * Translate the "an+b" argument of an :nth-*() pseudo-class into an XPath
 * 1.0 condition on the node position.
 *
 * Accepted forms are "an+b", "an-b", "an", "n", "-n+b" and "+n+b" (white
 * space is ignored). Anything else yields "false()", which matches nothing.
 *
 * Approach taken from
 * https://github.com/tenderlove/nokogiri/blob/master/lib/nokogiri/css/xpath_visitor.rb
 *
 * @param string $expr the expression between the parentheses
 * @param bool $last when true, positions are counted from the last sibling
 *
 * @return string an XPath boolean expression
 */
protected function _selector_an_plus_b($expr, $last = false) {
  $expr = preg_replace("/\s/", "", $expr);
  if ( !preg_match("/^(?P<a>[-+]?[0-9]*)?n(?P<b>[-+]?[0-9]+)?$/", $expr, $matches) ) {
    return "false()";
  }

  // A missing coefficient means 1 and a bare sign means +1/-1; intval("-")
  // would be 0 and produce a "mod 0" condition that never matches.
  $a_text = isset($matches["a"]) ? $matches["a"] : "";
  if ( $a_text === "" || $a_text === "+" ) {
    $a = 1;
  }
  elseif ( $a_text === "-" ) {
    $a = -1;
  }
  else {
    $a = intval($a_text);
  }

  $b = ((isset($matches["b"]) && $matches["b"] !== "") ? intval($matches["b"]) : 0);

  $position = ($last ? "(last()-position()+1)" : "position()");

  // 0n+b selects exactly the b-th element (nothing when b is not positive)
  if ( $a === 0 ) {
    return "$position = $b";
  }

  if ( $b == 0 ) {
    // A negative step without offset only yields positions <= 0
    if ( $a < 0 ) {
      return "false()";
    }

    return "($position mod $a) = 0";
  }

  // With an offset: the position must lie on the correct side of b and be
  // a whole number of steps away from it
  $compare = (($a < 0) ? "<=" : ">=");
  $b2 = -$b;
  if ( $b2 >= 0 ) {
    $b2 = "+$b2";
  }

  return "($position $compare $b) and ((($position $b2) mod ".abs($a).") = 0)";
}
-
/**
 * Applies all current styles to a particular document tree.
 *
 * apply_styles() applies all currently loaded styles to the provided
 * {@link Frame_Tree}. Aside from parsing CSS, this is the main purpose
 * of this class. The work is done in three passes:
 *
 *  1. For every selector containing :before or :after, a generated node is
 *     inserted next to each matching element (once per element and position).
 *  2. Every selector is converted to XPath and run against the DOM; the
 *     matching Style is filed under the frame id and specificity of each
 *     matched element.
 *  3. Every frame receives a fresh Style (the first frame receives the "base"
 *     @page style when there is one) into which the filed styles are merged
 *     in ascending specificity order, followed by inheritance from the
 *     nearest element ancestor.
 *
 * The style registry is emptied when the method returns.
 *
 * @param Frame_Tree $tree
 */
function apply_styles(Frame_Tree $tree) {
  // Use XPath to select nodes. This would be easier if we could attach
  // Frame objects directly to DOMNodes using the setUserData() method, but
  // we can't do that just yet. Instead, we set a _node attribute_ in
  // Frame->set_id() and use that as a handle on the Frame object via
  // Frame_Tree::$_registry.

  // We create a scratch array of styles indexed by frame id. Once all
  // styles have been assigned, we order the cached styles by specificity
  // and create a final style object to assign to the frame.

  // FIXME: this is not particularly robust...

  $styles = array();
  $xp = new DOMXPath($tree->get_dom());

  // Add generated content
  foreach ($this->_styles as $selector => $style) {
    if ( strpos($selector, ":before") === false && strpos($selector, ":after") === false ) {
      continue;
    }

    $query = $this->_css_selector_to_xpath($selector, true);

    // Retrieve the nodes, limit to body for generated content
    $nodes = @$xp->query( '.'.$query["query"] );
    if ( $nodes == null ) {
      record_warnings(E_USER_WARNING, "The CSS selector '$selector' is not valid", __FILE__, __LINE__);
      continue;
    }

    foreach ($nodes as $node) {
      foreach ($query["pseudo_elements"] as $pos) {
        // Do not add a new pseudo element if another one already matched
        if ( $node->hasAttribute("dompdf_{$pos}_frame_id") ) {
          continue;
        }

        // Generated content that is an image gets its own node type
        if (($src = $this->_image($style->content)) !== "none") {
          $new_node = $node->ownerDocument->createElement("img_generated");
          $new_node->setAttribute("src", $src);
        }
        else {
          $new_node = $node->ownerDocument->createElement("dompdf_generated");
        }

        $new_node->setAttribute($pos, $pos);
        $new_frame_id = $tree->insert_node($node, $new_node, $pos);
        $node->setAttribute("dompdf_{$pos}_frame_id", $new_frame_id);
      }
    }
  }

  // Apply all styles in stylesheet
  foreach ($this->_styles as $selector => $style) {
    $query = $this->_css_selector_to_xpath($selector);

    // Retrieve the nodes
    $nodes = @$xp->query($query["query"]);
    if ( $nodes == null ) {
      record_warnings(E_USER_WARNING, "The CSS selector '$selector' is not valid", __FILE__, __LINE__);
      continue;
    }

    // The specificity depends on the selector only, not on the matched node
    $spec = $this->_specificity($selector);

    foreach ($nodes as $node) {
      // Only DOMElements get styles
      if ( $node->nodeType != XML_ELEMENT_NODE ) {
        continue;
      }

      // Retrieve the node id
      $id = $node->getAttribute("frame_id");

      // Assign the current style to the scratch array
      $styles[$id][$spec][] = $style;
    }
  }

  // Now create the styles and assign them to the appropriate frames. (We
  // iterate over the tree using an implicit Frame_Tree iterator.)
  $root_flg = false;
  foreach ($tree->get_frames() as $frame) {
    if ( !$root_flg && $this->_page_styles["base"] ) {
      $style = $this->_page_styles["base"];
      $root_flg = true;
    }
    else {
      $style = $this->create_style();
    }

    // Find nearest DOMElement parent
    $p = $frame;
    while ( $p = $p->get_parent() ) {
      if ( $p->get_node()->nodeType == XML_ELEMENT_NODE ) {
        break;
      }
    }

    // Styles can only be applied directly to DOMElements; anonymous
    // frames inherit from their parent
    if ( $frame->get_node()->nodeType != XML_ELEMENT_NODE ) {
      if ( $p ) {
        $style->inherit($p->get_style());
      }

      $frame->set_style($style);
      continue;
    }

    $id = $frame->get_id();

    // Handle HTML 4.0 attributes
    Attribute_Translator::translate_attributes($frame);
    if ( ($str = $frame->get_node()->getAttribute(Attribute_Translator::$_style_attr)) !== "" ) {
      // Lowest specificity
      $styles[$id][1][] = $this->_parse_properties($str);
    }

    // Locate any additional style attributes
    if ( ($str = $frame->get_node()->getAttribute("style")) !== "" ) {
      // Destroy CSS comments
      $str = preg_replace("'/\*.*?\*/'si", "", $str);

      $spec = $this->_specificity("!attr");
      $styles[$id][$spec][] = $this->_parse_properties($str);
    }

    // The debug block is opened here, outside the "has styles" branch, so
    // that the node name is defined and the <pre> element is balanced for
    // frames without any matching style as well.
    if (DEBUGCSS) {
      $debug_nodename = $frame->get_node()->nodeName;
      print "<pre>\n[$debug_nodename\n";
    }

    // Grab the applicable styles
    if ( isset($styles[$id]) ) {

      $applied_styles = $styles[$id];

      // Sort by specificity
      ksort($applied_styles);

      if (DEBUGCSS) {
        foreach ($applied_styles as $spec => $arr) {
          printf("specificity: 0x%08x\n",$spec);
          foreach ($arr as $s) {
            print "[\n";
            $s->debug_print();
            print "]\n";
          }
        }
      }

      // Merge the new styles with the inherited styles
      foreach ($applied_styles as $arr) {
        foreach ($arr as $s) {
          $style->merge($s);
        }
      }
    }

    // Inherit parent's styles if required
    if ( $p ) {

      if (DEBUGCSS) {
        print "inherit:\n";
        print "[\n";
        $p->get_style()->debug_print();
        print "]\n";
      }

      $style->inherit( $p->get_style() );
    }

    if (DEBUGCSS) {
      print "DomElementStyle:\n";
      print "[\n";
      $style->debug_print();
      print "]\n";
      print "/$debug_nodename]\n</pre>";
    }

    $frame->set_style($style);

  }

  // We're done! Clean out the registry of all styles since we
  // won't be needing this later.
  $this->_styles = array();

}
-
/**
 * Parse a CSS string using a regex parser.
 *
 * Comments and a leading/trailing HTML comment marker are stripped, then the
 * text is split into @rules and ordinary rulesets:
 *  - @import is handed to _parse_import()
 *  - @media blocks are parsed when one of their media types is accepted
 *  - @page rules without a selector, or with :left, :right, :odd, :even or
 *    :first, are stored in the page styles; named pages are skipped
 *  - @font-face is handed to _parse_font_face()
 *  - every other @rule is ignored
 *  - ordinary rulesets are handed to _parse_sections()
 *
 * @param string $str
 *
 * @throws DOMPDF_Exception when the regular expression engine fails
 */
private function _parse_css($str) {

  $str = trim($str);

  // Destroy comments and remove HTML comments
  $css = preg_replace(array(
    "'/\*.*?\*/'si",
    "/^<!--/",
    "/-->$/"
  ), "", $str);

  // FIXME: handle '{' within strings, e.g. [attr="string {}"]

  // Something more legible:
  $re =
    "/\s* # Skip leading whitespace \n".
    "( @([^\s{]+)\s*([^{;]*) (?:;|({)) )? # Match @rules followed by ';' or '{' \n".
    "(?(1) # Only parse sub-sections if we're in an @rule... \n".
    " (?(4) # ...and if there was a leading '{' \n".
    " \s*( (?:(?>[^{}]+) ({)? # Parse rulesets and individual @page rules \n".
    " (?(6) (?>[^}]*) }) \s*)+? \n".
    " ) \n".
    " }) # Balancing '}' \n".
    "| # Branch to match regular rules (not preceeded by '@')\n".
    "([^{]*{[^}]*})) # Parse normal rulesets\n".
    "/xs";

  if ( preg_match_all($re, $css, $matches, PREG_SET_ORDER) === false ) {
    // An error occurred
    throw new DOMPDF_Exception("Error parsing css file: preg_match_all() failed.");
  }

  // After matching, the array indices are set as follows:
  //
  // [0] => complete text of match
  // [1] => contains '@import ...;' or '@media {' if applicable
  // [2] => text following @ for cases where [1] is set
  // [3] => media types or full text following '@import ...;'
  // [4] => '{', if present
  // [5] => rulesets within media rules
  // [6] => '{', within media rules
  // [7] => individual rules, outside of media rules
  //
  // Trailing groups that did not take part in a match are absent from the
  // array, hence the isset() guards below.
  foreach ( $matches as $match ) {
    $match[2] = trim($match[2]);

    if ( $match[2] !== "" ) {
      // Body of a block @rule; absent for the "@rule ...;" form
      $block = isset($match[5]) ? $match[5] : "";

      // Handle @rules
      switch ($match[2]) {

      case "import":
        $this->_parse_import($match[3]);
        break;

      case "media":
        $acceptedmedia = self::$ACCEPTED_GENERIC_MEDIA_TYPES;
        $acceptedmedia[] = $this->_dompdf->get_option("default_media_type");

        $media = preg_split("/\s*,\s*/", mb_strtolower(trim($match[3])));

        if ( count(array_intersect($acceptedmedia, $media)) ) {
          $this->_parse_sections($block);
        }
        break;

      case "page":
        // This handles @page to be applied to page oriented media.
        // Note: This has a reduced syntax:
        //   @page { margin:1cm; color:blue; }
        // Not a sequence of styles like a full .css, but only the properties
        // of a single style, which is applied to the very first "root" frame
        // before processing other styles of the frame.
        // Working properties:
        //   margin (for margin around edge of paper)
        //   font-family (default font of pages)
        //   color (default text color of pages)
        // Non working properties (reason unknown):
        //   border
        //   padding
        //   background-color
        // Other properties (like further font or border attributes) not tested.
        // If a border or background color around each paper sheet is desired,
        // assign it to the <body> tag, possibly only for the css of the
        // correct media type.

        $page_selector = trim($match[3]);

        if ( $page_selector === "" ) {
          $key = "base";
        }
        elseif ( in_array($page_selector, array(":left", ":right", ":odd", ":even", ":first"), true) ) {
          $key = $page_selector;
        }
        else {
          // If the page has a name, skip the style. (A "continue" inside a
          // nested switch only leaves that switch, which let named pages
          // fall through and be stored under an empty key.)
          break;
        }

        // Store the style for later...
        if ( empty($this->_page_styles[$key]) ) {
          $this->_page_styles[$key] = $this->_parse_properties($block);
        }
        else {
          $this->_page_styles[$key]->merge($this->_parse_properties($block));
        }
        break;

      case "font-face":
        $this->_parse_font_face($block);
        break;

      default:
        // ignore everything else
        break;
      }

      continue;
    }

    if ( isset($match[7]) && $match[7] !== "" ) {
      $this->_parse_sections($match[7]);
    }

  }
}
-
/**
 * Resolve a CSS url(...) value to a path or URL in the context of this
 * stylesheet.
 *
 * See also style.cls Style::_image() (refactoring candidate); this variant
 * also works for imported css files.
 *
 * @param string $val the CSS value, e.g. 'url("img/logo.png")'
 *
 * @return string "none" when $val contains no url or the local file cannot
 *                be resolved by realpath(); otherwise the resolved local path
 *                or the URL built from the stylesheet's base protocol, host
 *                and path
 */
protected function _image($val) {
  $DEBUGCSS=DEBUGCSS;
  $parsed_url = "none";

  if ( mb_strpos($val, "url") === false ) {
    $path = "none"; //Don't resolve no image -> otherwise would prefix path and no longer recognize as none
  }
  else {
    $val = preg_replace("/url\(['\"]?([^'\")]+)['\"]?\)/","\\1", trim($val));

    // Resolve the url now in the context of the current stylesheet
    $parsed_url = explode_url($val);
    if ( $parsed_url["protocol"] == "" && $this->get_protocol() == "" ) {
      // Guarded read: the path component may be an empty string
      $first = isset($parsed_url["path"][0]) ? $parsed_url["path"][0] : "";

      if ( $first === '/' || $first === '\\' ) {
        // DOCUMENT_ROOT is not set in every environment (e.g. CLI)
        $document_root = isset($_SERVER["DOCUMENT_ROOT"]) ? $_SERVER["DOCUMENT_ROOT"] : "";
        $path = $document_root.'/';
      }
      else {
        $path = $this->get_base_path();
      }

      $path .= $parsed_url["path"] . $parsed_url["file"];
      $path = realpath($path);
      // If realpath returns FALSE then specifically state that there is no background image
      // FIXME: Is this causing problems for imported CSS files? There are some './none' references when running the test cases.
      if (!$path) { $path = 'none'; }
    }
    else {
      $path = build_url($this->get_protocol(),
                        $this->get_host(),
                        $this->get_base_path(),
                        $val);
    }
  }

  if ($DEBUGCSS) {
    print "<pre>[_image\n";
    print_r($parsed_url);
    print $this->get_protocol()."\n".$this->get_base_path()."\n".$path."\n";
    print "_image]</pre>";
  }

  return $path;
}
-
/**
 * parse @import{} sections
 *
 * The imported stylesheet is loaded when the rule is unconditional or when
 * at least one of the listed media types is accepted. The base url
 * properties of this stylesheet are saved before and restored after the
 * import, because loading a file from elsewhere may change them.
 *
 * @param string $url the url of the imported CSS file, optionally followed
 *                    by a whitespace or comma separated list of media types
 */
private function _parse_import($url) {
  $arr = preg_split("/[\s\n,]/", $url, -1, PREG_SPLIT_NO_EMPTY);

  // Empty or whitespace-only rule: there is no target to import
  if ( empty($arr) ) {
    return;
  }

  // First token is the target, the remaining tokens are media types
  $url = array_shift($arr);
  $accept = false;

  if ( count($arr) > 0 ) {
    $acceptedmedia = self::$ACCEPTED_GENERIC_MEDIA_TYPES;
    $acceptedmedia[] = $this->_dompdf->get_option("default_media_type");

    // @import url media_type [media_type...]
    foreach ( $arr as $type ) {
      if ( in_array(mb_strtolower(trim($type)), $acceptedmedia) ) {
        $accept = true;
        break;
      }
    }
  }
  else {
    // unconditional import
    $accept = true;
  }

  if ( !$accept ) {
    return;
  }

  // Store our current base url properties in case the new url is elsewhere
  $protocol = $this->_protocol;
  $host = $this->_base_host;
  $path = $this->_base_path;

  // Todo: do we need to replace php or file with an empty protocol for local files?

  // CSS allows both `@import url(foo.css)` and `@import "foo.css"`.
  // _image() only resolves the url() notation, so normalize the string form.
  if ( !preg_match("/^url\(/i", $url) ) {
    $url = "url(" . trim($url, "\"'") . ")";
  }

  $url = $this->_image($url);

  // _image() reports an unresolvable target as "none"; nothing to load then
  if ( $url !== "none" ) {
    $this->load_css_file($url);
  }

  // Restore the current base url
  $this->_protocol = $protocol;
  $this->_base_host = $host;
  $this->_base_path = $path;
}
-
/**
 * parse @font-face{} sections
 * http://www.w3.org/TR/css3-fonts/#the-font-face-rule
 *
 * Collects the url() sources of the rule whose format hint is either
 * missing or "truetype" and registers the first of them with Font_Metrics.
 * local() sources and other formats are ignored; if no usable source is
 * left, nothing is registered.
 *
 * @param string $str CSS @font-face rules
 * @return void
 */
private function _parse_font_face($str) {
  $descriptors = $this->_parse_properties($str);

  // $src[1]: "url" or "local", $src[2]: the target, $src[4]: optional format hint
  preg_match_all("/(url|local)\s*\([\"\']?([^\"\'\)]+)[\"\']?\)\s*(format\s*\([\"\']?([^\"\'\)]+)[\"\']?\))?/i", $descriptors->src, $src);

  $valid_sources = array();

  foreach($src[0] as $i => $value) {
    $source = array(
      "local"  => strtolower($src[1][$i]) === "local",
      "uri"    => $src[2][$i],
      "format" => $src[4][$i],
      "path"   => build_url($this->_protocol, $this->_base_host, $this->_base_path, $src[2][$i]),
    );

    // Only non-local sources without a format hint or with "truetype" are kept
    if ( !$source["local"] && in_array($source["format"], array("", "truetype")) ) {
      $valid_sources[] = $source;
    }
  }

  // No valid sources
  if ( empty($valid_sources) ) {
    return;
  }

  $style = array(
    "family" => $descriptors->get_font_family_raw(),
    "weight" => $descriptors->font_weight,
    "style"  => $descriptors->font_style,
  );

  // Only the first usable source is registered
  Font_Metrics::register_font($style, $valid_sources[0]["path"], $this->_dompdf->get_http_context());
}
-
/**
 * parse regular CSS blocks
 *
 * _parse_properties() creates a new Style object based on the provided
 * CSS rules. Declarations that are empty, have no ':' separator or have no
 * property name are skipped.
 *
 * @param string $str CSS rules
 * @return Style
 */
private function _parse_properties($str) {
  // Split into declarations on ';'. The lookahead is intended to leave a ';'
  // inside parentheses (e.g. within url(...)) untouched.
  // @todo: the regex may still be wrong for some values containing an url
  $properties = preg_split("/;(?=(?:[^\(]*\([^\)]*\))*(?![^\)]*\)))/", $str);

  if (DEBUGCSS) print '[_parse_properties';

  // Create the style
  $style = new Style($this);

  foreach ($properties as $prop) {
    // A css property can have " ! important" appended (whitespace optional).
    // Strip this off to decode the core of the property correctly, and pass
    // it on in the style to allow proper handling: !important properties
    // can only be overridden by other !important ones.
    // Plain string functions are used instead of a regex because the
    // typical declaration carries no modifier.
    if (DEBUGCSS) print '(';

    $important = false;
    $prop = trim($prop);

    // CSS keywords are case-insensitive, so "!IMPORTANT" must match too
    if ( strtolower(substr($prop, -9)) === 'important' ) {
      $prop_tmp = rtrim(substr($prop, 0, -9));

      if ( substr($prop_tmp, -1) === '!' ) {
        $prop = rtrim(substr($prop_tmp, 0, -1));
        $important = true;
      }
    }

    if ( $prop === "" ) {
      if (DEBUGCSS) print 'empty)';
      continue;
    }

    $i = mb_strpos($prop, ":");
    if ( $i === false ) {
      if (DEBUGCSS) print 'novalue'.$prop.')';
      continue;
    }

    $prop_name = rtrim(mb_strtolower(mb_substr($prop, 0, $i)));
    $value = ltrim(mb_substr($prop, $i+1));

    // A declaration such as ": red" has no property to assign to
    if ( $prop_name === "" ) {
      if (DEBUGCSS) print 'noname'.$prop.')';
      continue;
    }

    if (DEBUGCSS) print $prop_name.':='.$value.($important?'!IMPORTANT':'').')';

    // The assignment below may be overloaded through __set, and overloaded
    // setters might check _important_props, therefore flag the property as
    // important first.
    if ($important) {
      $style->important_set($prop_name);
    }

    // $style->$prop_name = ... is a shortcut of $style->__set($prop_name, $value)
    $style->$prop_name = $value;
  }
  if (DEBUGCSS) print '_parse_properties]';

  return $style;
}
-
/**
 * parse selector + rulesets
 *
 * Splits the text into "selectors { declarations }" sections, parses the
 * declarations of each section into a Style and adds that style for every
 * non-empty, comma separated selector of the section.
 *
 * @param string $str CSS selectors and rulesets
 */
private function _parse_sections($str) {
  // Pre-process: collapse all whitespace and strip whitespace around '>',
  // '.', ':', '+', '#'
  $patterns = array("/[\\s\n]+/", "/\\s+([>.:+#])\\s+/");
  $replacements = array(" ", "\\1");
  $str = preg_replace($patterns, $replacements, $str);

  $sections = explode("}", $str);
  if (DEBUGCSS) print '[_parse_sections';
  foreach ($sections as $sect) {
    $i = mb_strpos($sect, "{");

    // Without a '{' there are no selectors to assign a style to, e.g. for
    // the remainder after the last '}'. Skip it instead of using the false
    // result as a string offset.
    if ( $i === false ) {
      continue;
    }

    $selectors = explode(",", mb_substr($sect, 0, $i));
    if (DEBUGCSS) print '[section';
    $style = $this->_parse_properties(trim(mb_substr($sect, $i+1)));

    // Assign it to the selected elements
    foreach ($selectors as $selector) {
      $selector = trim($selector);

      if ($selector == "") {
        if (DEBUGCSS) print '#empty#';
        continue;
      }
      if (DEBUGCSS) print '#'.$selector.'#';

      $this->add_style($selector, $style);
    }

    if (DEBUGCSS) print 'section]';
  }

  if (DEBUGCSS) print '_parse_sections]';
}
-
/**
 * renders the whole stylesheet as text
 *
 * Produces one "selector => style" line for every entry of the
 * Stylesheet, in stored order. Intended as a debugging aid.
 *
 * @return string
 */
function __toString() {
  $lines = array();

  foreach ($this->_styles as $name => $rules) {
    // Each entry is terminated by its own newline
    $lines[] = $name . " => " . $rules->__toString() . "\n";
  }

  return implode("", $lines);
}
- }
|