ok
Direktori : /home2/selectio/www/bharath/3idiotsgadgetstore.in/vendor/dompdf/dompdf/src/Css/ |
Current File : /home2/selectio/www/bharath/3idiotsgadgetstore.in/vendor/dompdf/dompdf/src/Css/Stylesheet.php |
<?php /** * @package dompdf * @link https://github.com/dompdf/dompdf * @license http://www.gnu.org/copyleft/lesser.html GNU Lesser General Public License */ namespace Dompdf\Css; use DOMElement; use DOMXPath; use Dompdf\Dompdf; use Dompdf\Helpers; use Dompdf\Exception; use Dompdf\FontMetrics; use Dompdf\Frame\FrameTree; /** * The master stylesheet class * * The Stylesheet class is responsible for parsing stylesheets and style * tags/attributes. It also acts as a registry of the individual Style * objects generated by the current set of loaded CSS files and style * elements. * * @see Style * @package dompdf */ class Stylesheet { /** * The location of the default built-in CSS file. */ const DEFAULT_STYLESHEET = "/lib/res/html.css"; /** * User agent stylesheet origin * * @var int */ const ORIG_UA = 1; /** * User normal stylesheet origin * * @var int */ const ORIG_USER = 2; /** * Author normal stylesheet origin * * @var int */ const ORIG_AUTHOR = 3; /* * The highest possible specificity is 0x01000000 (and that is only for author * stylesheets, as it is for inline styles). Origin precedence can be achieved by * adding multiples of 0x10000000 to the actual specificity. Important * declarations are handled in Style; though technically they should be handled * here so that user important declarations can be made to take precedence over * user important declarations, this doesn't matter in practice as Dompdf does * not support user stylesheets, and user agent stylesheets can not include * important declarations. */ private static $_stylesheet_origins = [ self::ORIG_UA => 0x00000000, // user agent declarations self::ORIG_USER => 0x10000000, // user normal declarations self::ORIG_AUTHOR => 0x30000000, // author normal declarations ]; /** * Non-CSS presentational hints (i.e. HTML 4 attributes) are handled as if added * to the beginning of an author stylesheet, i.e. anything in author stylesheets * should override them. */ const SPEC_NON_CSS = 0x20000000; /** * Current dompdf instance * * @var Dompdf */ private $_dompdf; /** * Array of currently defined styles * * @var Style[][] */ private $_styles; /** * Base protocol of the document being parsed * Used to handle relative urls. * * @var string */ private $_protocol = ""; /** * Base hostname of the document being parsed * Used to handle relative urls. * * @var string */ private $_base_host = ""; /** * Base path of the document being parsed * Used to handle relative urls. * * @var string */ private $_base_path = ""; /** * The styles defined by @page rules * * @var array<Style> */ private $_page_styles; /** * List of loaded files, used to prevent recursion * * @var array */ private $_loaded_files; /** * Current stylesheet origin * * @var int */ private $_current_origin = self::ORIG_UA; /** * Accepted CSS media types * List of types and parsing rules for future extensions: * http://www.w3.org/TR/REC-html40/types.html * screen, tty, tv, projection, handheld, print, braille, aural, all * The following are non standard extensions for undocumented specific environments. * static, visual, bitmap, paged, dompdf * Note, even though the generated pdf file is intended for print output, * the desired content might be different (e.g. screen or projection view of html file). * Therefore allow specification of content by dompdf setting Options::defaultMediaType. * If given, replace media "print" by Options::defaultMediaType. * (Previous version $ACCEPTED_MEDIA_TYPES = $ACCEPTED_GENERIC_MEDIA_TYPES + $ACCEPTED_DEFAULT_MEDIA_TYPE) */ static $ACCEPTED_DEFAULT_MEDIA_TYPE = "print"; static $ACCEPTED_GENERIC_MEDIA_TYPES = ["all", "static", "visual", "bitmap", "paged", "dompdf"]; static $VALID_MEDIA_TYPES = ["all", "aural", "bitmap", "braille", "dompdf", "embossed", "handheld", "paged", "print", "projection", "screen", "speech", "static", "tty", "tv", "visual"]; /** * @var FontMetrics */ private $fontMetrics; /** * The class constructor. * * The base protocol, host & path are initialized to those of * the current script. */ function __construct(Dompdf $dompdf) { $this->_dompdf = $dompdf; $this->setFontMetrics($dompdf->getFontMetrics()); $this->_styles = []; $this->_loaded_files = []; $script = __FILE__; if (isset($_SERVER["SCRIPT_FILENAME"])) { $script = $_SERVER["SCRIPT_FILENAME"]; } list($this->_protocol, $this->_base_host, $this->_base_path) = Helpers::explode_url($script); $this->_page_styles = ["base" => new Style($this)]; } /** * Set the base protocol * * @param string $protocol */ function set_protocol(string $protocol) { $this->_protocol = $protocol; } /** * Set the base host * * @param string $host */ function set_host(string $host) { $this->_base_host = $host; } /** * Set the base path * * @param string $path */ function set_base_path(string $path) { $this->_base_path = $path; } /** * Return the Dompdf object * * @return Dompdf */ function get_dompdf() { return $this->_dompdf; } /** * Return the base protocol for this stylesheet * * @return string */ function get_protocol() { return $this->_protocol; } /** * Return the base host for this stylesheet * * @return string */ function get_host() { return $this->_base_host; } /** * Return the base path for this stylesheet * * @return string */ function get_base_path() { return $this->_base_path; } /** * Return the array of page styles * * @return Style[] */ function get_page_styles() { return $this->_page_styles; } /** * Create a new Style object associated with this stylesheet * * @return Style */ function create_style(): Style { return new Style($this, $this->_current_origin); } /** * Add a new Style object to the stylesheet * * The style's origin is changed to the current origin of the stylesheet. * * @param string $key the Style's selector * @param Style $style the Style to be added */ function add_style(string $key, Style $style): void { if (!isset($this->_styles[$key])) { $this->_styles[$key] = []; } $style->set_origin($this->_current_origin); $this->_styles[$key][] = $style; } /** * load and parse a CSS string * * @param string $css * @param int $origin */ function load_css(&$css, $origin = self::ORIG_AUTHOR) { if ($origin) { $this->_current_origin = $origin; } $this->_parse_css($css); } /** * load and parse a CSS file * * @param string $file * @param int $origin */ function load_css_file($file, $origin = self::ORIG_AUTHOR) { if ($origin) { $this->_current_origin = $origin; } // Prevent circular references if (isset($this->_loaded_files[$file])) { return; } $this->_loaded_files[$file] = true; if (strpos($file, "data:") === 0) { $parsed = Helpers::parse_data_uri($file); $css = $parsed["data"]; } else { $options = $this->_dompdf->getOptions(); $parsed_url = Helpers::explode_url($file); $protocol = $parsed_url["protocol"]; if ($file !== $this->getDefaultStylesheet()) { $allowed_protocols = $options->getAllowedProtocols(); if (!array_key_exists($protocol, $allowed_protocols)) { Helpers::record_warnings(E_USER_WARNING, "Permission denied on $file. The communication protocol is not supported.", __FILE__, __LINE__); return; } foreach ($allowed_protocols[$protocol]["rules"] as $rule) { [$result, $message] = $rule($file); if (!$result) { Helpers::record_warnings(E_USER_WARNING, "Error loading $file: $message", __FILE__, __LINE__); return; } } } [$css, $http_response_header] = Helpers::getFileContent($file, $this->_dompdf->getHttpContext()); $good_mime_type = true; // See http://the-stickman.com/web-development/php/getting-http-response-headers-when-using-file_get_contents/ if (isset($http_response_header) && !$this->_dompdf->getQuirksmode()) { foreach ($http_response_header as $_header) { if (preg_match("@Content-Type:\s*([\w/]+)@i", $_header, $matches) && ($matches[1] !== "text/css") ) { $good_mime_type = false; } } } if (!$good_mime_type || $css === null) { Helpers::record_warnings(E_USER_WARNING, "Unable to load css file $file", __FILE__, __LINE__); return; } [$this->_protocol, $this->_base_host, $this->_base_path] = $parsed_url; } $this->_parse_css($css); } /** * @link https://www.w3.org/TR/CSS21/cascade.html#specificity * * @param string $selector * @param int $origin * - Stylesheet::ORIG_UA: user agent style sheet * - Stylesheet::ORIG_USER: user style sheet * - Stylesheet::ORIG_AUTHOR: author style sheet * * @return int */ protected function specificity(string $selector, int $origin = self::ORIG_AUTHOR): int { $a = ($selector === "!attr") ? 1 : 0; $b = min(mb_substr_count($selector, "#"), 255); $c = min(mb_substr_count($selector, ".") + mb_substr_count($selector, "[") + mb_substr_count($selector, ":") - 2 * mb_substr_count($selector, "::"), 255); $d = min(mb_substr_count($selector, " ") + mb_substr_count($selector, ">") + mb_substr_count($selector, "+") + mb_substr_count($selector, "~") - mb_substr_count($selector, "~=") + mb_substr_count($selector, "::"), 255); //If a normal element name is at the beginning of the string, //a leading whitespace might have been removed on whitespace collapsing and removal //therefore there might be one whitespace less as selected element names //this can lead to a too small specificity //see selectorToXpath if (!in_array($selector[0], [" ", ">", ".", "#", "+", "~", ":", "["], true) && $selector !== "*") { $d++; } if ($this->_dompdf->getOptions()->getDebugCss()) { /*DEBUGCSS*/ print "<pre>\n"; /*DEBUGCSS*/ printf("specificity(): 0x%08x \"%s\"\n", self::$_stylesheet_origins[$origin] + (($a << 24) | ($b << 16) | ($c << 8) | ($d)), $selector); /*DEBUGCSS*/ print "</pre>"; } return self::$_stylesheet_origins[$origin] + (($a << 24) | ($b << 16) | ($c << 8) | ($d)); } /** * Converts a CSS selector to an XPath query. * * @param string $selector * @param bool $firstPass * * @return array|null */ protected function selectorToXpath(string $selector, bool $firstPass = false): ?array { // Collapse white space and strip whitespace around delimiters //$search = array("/\\s+/", "/\\s+([.>#+:])\\s+/"); //$replace = array(" ", "\\1"); //$selector = preg_replace($search, $replace, trim($selector)); // Initial query, always expanded to // below (non-absolute) $query = "/"; // Will contain :before and :after $pseudo_elements = []; // Parse the selector //$s = preg_split("/([ :>.#+])/", $selector, -1, PREG_SPLIT_DELIM_CAPTURE); $delimiters = [" ", ">", ".", "#", "+", "~", ":", "[", "("]; // Add an implicit space at the beginning of the selector if there is no // delimiter there already. if (!in_array($selector[0], $delimiters, true)) { $selector = " $selector"; } $name = "*"; $len = mb_strlen($selector); $i = 0; while ($i < $len) { $s = $selector[$i]; $i++; // Eat characters up to the next delimiter $tok = ""; $in_attr = false; $in_func = false; while ($i < $len) { $c = $selector[$i]; $c_prev = $selector[$i - 1]; if (!$in_func && !$in_attr && in_array($c, $delimiters, true) && !($c === $c_prev && $c === ":")) { break; } if ($c_prev === "[") { $in_attr = true; } if ($c_prev === "(") { $in_func = true; } $tok .= $selector[$i++]; if ($in_attr && $c === "]") { $in_attr = false; break; } if ($in_func && $c === ")") { $in_func = false; break; } } switch ($s) { case " ": case ">": // All elements matching the next token that are descendants // or children of the current token // https://www.w3.org/TR/selectors-3/#descendant-combinators // https://www.w3.org/TR/selectors-3/#child-combinators $expr = $s === " " ? "descendant" : "child"; // Tag names are case-insensitive $name = $tok === "" ? "*" : strtolower($tok); $query .= "/$expr::$name"; break; case "+": // Next-sibling combinator // https://www.w3.org/TR/selectors-3/#sibling-combinators // Tag names are case-insensitive $name = $tok === "" ? "*" : strtolower($tok); $query .= "/following-sibling::*[1]"; if ($name !== "*") { $query .= "[name() = '$name']"; } break; case "~": // Subsequent-sibling combinator // https://www.w3.org/TR/selectors-3/#sibling-combinators // Tag names are case-insensitive $name = $tok === "" ? "*" : strtolower($tok); $query .= "/following-sibling::$name"; break; case "#": // All elements matching the current token with id equal // to the _next_ token // https://www.w3.org/TR/selectors-3/#id-selectors if ($query === "/") { $query .= "/*"; } $query .= "[@id=\"$tok\"]"; break; case ".": // All elements matching the current token with a class // equal to the _next_ token // https://www.w3.org/TR/selectors-3/#class-html if ($query === "/") { $query .= "/*"; } // Match multiple classes: $tok contains the current selected // class. Search for class attributes with class="$tok", // class=".* $tok .*" and class=".* $tok" // This doesn't work because libxml only supports XPath 1.0... //$query .= "[matches(@$attr,\"^{$tok}\$|^{$tok}[ ]+|[ ]+{$tok}\$|[ ]+{$tok}[ ]+\")]"; $query .= "[contains(concat(' ', normalize-space(@class), ' '), concat(' ', '$tok', ' '))]"; break; case ":": if ($query === "/") { $query .= "/*"; } $last = false; // Pseudo-classes switch ($tok) { case "root": $query .= "[not(parent::*)]"; break; case "first-child": $query .= "[not(preceding-sibling::*)]"; break; case "last-child": $query .= "[not(following-sibling::*)]"; break; case "only-child": $query .= "[not(preceding-sibling::*) and not(following-sibling::*)]"; break; // https://www.w3.org/TR/selectors-3/#nth-child-pseudo /** @noinspection PhpMissingBreakStatementInspection */ case "nth-last-child": $last = true; case "nth-child": $p = $i + 1; $nth = trim(mb_substr($selector, $p, strpos($selector, ")", $i) - $p)); $position = $last ? "(count(following-sibling::*) + 1)" : "(count(preceding-sibling::*) + 1)"; $condition = $this->selectorAnPlusB($nth, $position); $query .= "[$condition]"; break; // TODO: `*:first-of-type`, `*:nth-of-type` etc. // (without fixed element name) are treated equivalent // to their `:*-child` counterparts here. They might // not be properly expressible in XPath 1.0 case "first-of-type": $query .= "[not(preceding-sibling::$name)]"; break; case "last-of-type": $query .= "[not(following-sibling::$name)]"; break; case "only-of-type": $query .= "[not(preceding-sibling::$name) and not(following-sibling::$name)]"; break; // https://www.w3.org/TR/selectors-3/#nth-of-type-pseudo /** @noinspection PhpMissingBreakStatementInspection */ case "nth-last-of-type": $last = true; case "nth-of-type": $p = $i + 1; $nth = trim(mb_substr($selector, $p, strpos($selector, ")", $i) - $p)); $position = $last ? "(count(following-sibling::$name) + 1)" : "(count(preceding-sibling::$name) + 1)"; $condition = $this->selectorAnPlusB($nth, $position); $query .= "[$condition]"; break; // https://www.w3.org/TR/selectors-4/#empty-pseudo case "empty": $query .= "[not(*) and not(normalize-space())]"; break; // TODO: bit of a hack attempt at matches support, currently only matches against elements case "matches": $p = $i + 1; $matchList = trim(mb_substr($selector, $p, strpos($selector, ")", $i) - $p)); // Tag names are case-insensitive $elements = array_map("trim", explode(",", strtolower($matchList))); foreach ($elements as &$element) { $element = "name() = '$element'"; } $query .= "[" . implode(" or ", $elements) . "]"; break; // https://www.w3.org/TR/selectors-3/#UIstates case "disabled": case "checked": $query .= "[@$tok]"; break; case "enabled": $query .= "[not(@disabled)]"; break; // https://www.w3.org/TR/selectors-3/#dynamic-pseudos // https://www.w3.org/TR/selectors-4/#the-any-link-pseudo case "link": case "any-link": $query .= "[@href]"; break; // N/A case "visited": case "hover": case "active": case "focus": case "focus-visible": case "focus-within": $query .= "[false()]"; break; // https://www.w3.org/TR/selectors-3/#first-line // https://www.w3.org/TR/selectors-3/#first-letter case "first-line": case ":first-line": case "first-letter": case ":first-letter": // TODO $el = ltrim($tok, ":"); $pseudo_elements[$el] = true; break; // https://www.w3.org/TR/selectors-3/#gen-content case "before": case ":before": case "after": case ":after": $pos = ltrim($tok, ":"); $pseudo_elements[$pos] = true; if (!$firstPass) { $query .= "/*[@$pos]"; } break; // Invalid or unsupported pseudo-class or pseudo-element default: return null; } break; case "[": // Attribute selectors. All with an attribute matching the // following token(s) // https://www.w3.org/TR/selectors-3/#attribute-selectors if ($query === "/") { $query .= "/*"; } $attr_delimiters = ["=", "]", "~", "|", "$", "^", "*"]; $tok_len = mb_strlen($tok); $j = 0; $attr = ""; $op = ""; $value = ""; while ($j < $tok_len) { if (in_array($tok[$j], $attr_delimiters, true)) { break; } $attr .= $tok[$j++]; } if ($attr === "") { // Selector invalid: Missing attribute name return null; } if (!isset($tok[$j])) { // Selector invalid: Missing ] or operator return null; } switch ($tok[$j]) { case "~": case "|": case "^": case "$": case "*": $op .= $tok[$j++]; if (!isset($tok[$j]) || $tok[$j] !== "=") { // Selector invalid: Incomplete attribute operator return null; } $op .= $tok[$j]; break; case "=": $op = "="; break; } // Read the attribute value, if required if ($op !== "") { $j++; while ($j < $tok_len) { if ($tok[$j] === "]") { break; } $value .= $tok[$j++]; } } if (!isset($tok[$j])) { // Selector invalid: Missing ] return null; } $value = trim($value, "\"'"); switch ($op) { case "": $query .= "[@$attr]"; break; case "=": $query .= "[@$attr=\"$value\"]"; break; case "~=": // FIXME: this will break if $value contains quoted strings // (e.g. [type~="a b c" "d e f"]) $query .= $value !== "" && !preg_match("/\s+/", $value) ? "[contains(concat(' ', normalize-space(@$attr), ' '), concat(' ', \"$value\", ' '))]" : "[false()]"; break; case "|=": $values = explode("-", $value); $query .= "["; foreach ($values as $val) { $query .= "starts-with(@$attr, \"$val\") or "; } $query = rtrim($query, " or ") . "]"; break; case "^=": $query .= $value !== "" ? "[starts-with(@$attr,\"$value\")]" : "[false()]"; break; case "$=": $query .= $value !== "" ? "[substring(@$attr, string-length(@$attr)-" . (strlen($value) - 1) . ")=\"$value\"]" : "[false()]"; break; case "*=": $query .= $value !== "" ? "[contains(@$attr,\"$value\")]" : "[false()]"; break; } break; } } return ["query" => $query, "pseudo_elements" => $pseudo_elements]; } /** * Parse an `nth-child` expression of the form `an+b`, `odd`, or `even`. * * @param string $expr * @param string $position * * @return string * * @link https://www.w3.org/TR/selectors-3/#nth-child-pseudo */ protected function selectorAnPlusB(string $expr, string $position): string { // odd if ($expr === "odd") { return "($position mod 2) = 1"; } // even elseif ($expr === "even") { return "($position mod 2) = 0"; } // b elseif (preg_match("/^\d+$/", $expr)) { return "$position = $expr"; } // an+b // https://github.com/tenderlove/nokogiri/blob/master/lib/nokogiri/css/xpath_visitor.rb $expr = preg_replace("/\s/", "", $expr); if (!preg_match("/^(?P<a>-?[0-9]*)?n(?P<b>[-+]?[0-9]+)?$/", $expr, $matches)) { return "false()"; } $a = (isset($matches["a"]) && $matches["a"] !== "") ? ($matches["a"] !== "-" ? intval($matches["a"]) : -1) : 1; $b = (isset($matches["b"]) && $matches["b"] !== "") ? intval($matches["b"]) : 0; if ($b === 0) { return "($position mod $a) = 0"; } else { $compare = ($a < 0) ? "<=" : ">="; $b2 = -$b; if ($b2 >= 0) { $b2 = "+$b2"; } return "($position $compare $b) and ((($position $b2) mod " . abs($a) . ") = 0)"; } } /** * applies all current styles to a particular document tree * * apply_styles() applies all currently loaded styles to the provided * {@link FrameTree}. Aside from parsing CSS, this is the main purpose * of this class. * * @param FrameTree $tree */ function apply_styles(FrameTree $tree) { // Use XPath to select nodes. This would be easier if we could attach // Frame objects directly to DOMNodes using the setUserData() method, but // we can't do that just yet. Instead, we set a _node attribute_ in // Frame->set_id() and use that as a handle on the Frame object via // FrameTree::$_registry. // We create a scratch array of styles indexed by frame id. Once all // styles have been assigned, we order the cached styles by specificity // and create a final style object to assign to the frame. // FIXME: this is not particularly robust... $styles = []; $xp = new DOMXPath($tree->get_dom()); $DEBUGCSS = $this->_dompdf->getOptions()->getDebugCss(); // Add generated content foreach ($this->_styles as $selector => $selector_styles) { if (strpos($selector, ":before") === false && strpos($selector, ":after") === false) { continue; } $query = $this->selectorToXpath($selector, true); if ($query === null) { Helpers::record_warnings(E_USER_WARNING, "The CSS selector '$selector' is not valid", __FILE__, __LINE__); continue; } // Retrieve the nodes, limit to body for generated content // TODO: If we use a context node can we remove the leading dot? $nodes = @$xp->query('.' . $query["query"]); if ($nodes === false) { Helpers::record_warnings(E_USER_WARNING, "The CSS selector '$selector' is not valid", __FILE__, __LINE__); continue; } foreach ($selector_styles as $style) { foreach ($nodes as $node) { // Only DOMElements get styles if (!($node instanceof DOMElement)) { continue; } foreach (array_keys($query["pseudo_elements"], true, true) as $pos) { // Do not add a new pseudo element if another one already matched if ($node->hasAttribute("dompdf_{$pos}_frame_id")) { continue; } $content = $style->get_specified("content"); // Do not create non-displayed before/after pseudo elements // https://www.w3.org/TR/CSS21/generate.html#content // https://www.w3.org/TR/CSS21/generate.html#undisplayed-counters if ($content === "normal" || $content === "none") { continue; } if (($src = $this->resolve_url($content)) !== "none") { $new_node = $node->ownerDocument->createElement("img_generated"); $new_node->setAttribute("src", $src); } else { $new_node = $node->ownerDocument->createElement("dompdf_generated"); } $new_node->setAttribute($pos, $pos); $new_frame_id = $tree->insert_node($node, $new_node, $pos); $node->setAttribute("dompdf_{$pos}_frame_id", $new_frame_id); } } } } // Apply all styles in stylesheet foreach ($this->_styles as $selector => $selector_styles) { $query = $this->selectorToXpath($selector); if ($query === null) { Helpers::record_warnings(E_USER_WARNING, "The CSS selector '$selector' is not valid", __FILE__, __LINE__); continue; } // Retrieve the nodes $nodes = @$xp->query($query["query"]); if ($nodes === false) { Helpers::record_warnings(E_USER_WARNING, "The CSS selector '$selector' is not valid", __FILE__, __LINE__); continue; } foreach ($selector_styles as $style) { $spec = $this->specificity($selector, $style->get_origin()); foreach ($nodes as $node) { // Only DOMElements get styles if (!($node instanceof DOMElement)) { continue; } $id = $node->getAttribute("frame_id"); // Assign the current style to the scratch array $styles[$id][$spec][] = $style; } } } // Set the page width, height, and orientation based on the canvas paper size $canvas = $this->_dompdf->getCanvas(); $paper_width = $canvas->get_width(); $paper_height = $canvas->get_height(); $paper_orientation = ($paper_width > $paper_height ? "landscape" : "portrait"); if ($this->_page_styles["base"] && is_array($this->_page_styles["base"]->size)) { $paper_width = $this->_page_styles['base']->size[0]; $paper_height = $this->_page_styles['base']->size[1]; $paper_orientation = ($paper_width > $paper_height ? "landscape" : "portrait"); } // Now create the styles and assign them to the appropriate frames. (We // iterate over the tree using an implicit FrameTree iterator.) $root_flg = false; foreach ($tree as $frame) { // Helpers::pre_r($frame->get_node()->nodeName . ":"); if (!$root_flg && $this->_page_styles["base"]) { $style = $this->_page_styles["base"]; } else { $style = $this->create_style(); } // Find nearest DOMElement parent $p = $frame; while ($p = $p->get_parent()) { if ($p->get_node()->nodeType === XML_ELEMENT_NODE) { break; } } // Styles can only be applied directly to DOMElements; anonymous // frames inherit from their parent if ($frame->get_node()->nodeType !== XML_ELEMENT_NODE) { $style->inherit($p ? $p->get_style() : null); $frame->set_style($style); continue; } $id = $frame->get_id(); // Handle HTML 4.0 attributes AttributeTranslator::translate_attributes($frame); if (($str = $frame->get_node()->getAttribute(AttributeTranslator::$_style_attr)) !== "") { $styles[$id][self::SPEC_NON_CSS][] = $this->_parse_properties($str); } // Locate any additional style attributes if (($str = $frame->get_node()->getAttribute("style")) !== "") { // Destroy CSS comments $str = preg_replace("'/\*.*?\*/'si", "", $str); $spec = $this->specificity("!attr", self::ORIG_AUTHOR); $styles[$id][$spec][] = $this->_parse_properties($str); } // Grab the applicable styles if (isset($styles[$id])) { /** @var array[][] $applied_styles */ $applied_styles = $styles[$id]; // Sort by specificity ksort($applied_styles); if ($DEBUGCSS) { $debug_nodename = $frame->get_node()->nodeName; print "<pre>\n$debug_nodename [\n"; foreach ($applied_styles as $spec => $arr) { printf(" specificity 0x%08x\n", $spec); /** @var Style $s */ foreach ($arr as $s) { print " [\n"; $s->debug_print(); print " ]\n"; } } } // Merge the new styles with the inherited styles $acceptedmedia = self::$ACCEPTED_GENERIC_MEDIA_TYPES; $acceptedmedia[] = $this->_dompdf->getOptions()->getDefaultMediaType(); foreach ($applied_styles as $arr) { /** @var Style $s */ foreach ($arr as $s) { $media_queries = $s->get_media_queries(); foreach ($media_queries as $media_query) { list($media_query_feature, $media_query_value) = $media_query; // if any of the Style's media queries fail then do not apply the style //TODO: When the media query logic is fully developed we should not apply the Style when any of the media queries fail or are bad, per https://www.w3.org/TR/css3-mediaqueries/#error-handling if (in_array($media_query_feature, self::$VALID_MEDIA_TYPES)) { if ((strlen($media_query_feature) === 0 && !in_array($media_query, $acceptedmedia)) || (in_array($media_query, $acceptedmedia) && $media_query_value == "not")) { continue (3); } } else { switch ($media_query_feature) { case "height": if ($paper_height !== (float)$style->length_in_pt($media_query_value)) { continue (3); } break; case "min-height": if ($paper_height < (float)$style->length_in_pt($media_query_value)) { continue (3); } break; case "max-height": if ($paper_height > (float)$style->length_in_pt($media_query_value)) { continue (3); } break; case "width": if ($paper_width !== (float)$style->length_in_pt($media_query_value)) { continue (3); } break; case "min-width": //if (min($paper_width, $media_query_width) === $paper_width) { if ($paper_width < (float)$style->length_in_pt($media_query_value)) { continue (3); } break; case "max-width": //if (max($paper_width, $media_query_width) === $paper_width) { if ($paper_width > (float)$style->length_in_pt($media_query_value)) { continue (3); } break; case "orientation": if ($paper_orientation !== $media_query_value) { continue (3); } break; default: Helpers::record_warnings(E_USER_WARNING, "Unknown media query: $media_query_feature", __FILE__, __LINE__); break; } } } $style->merge($s); } } } // Handle inheritance if ($p && $DEBUGCSS) { print " inherit [\n"; $p->get_style()->debug_print(); print " ]\n"; } $style->inherit($p ? $p->get_style() : null); if ($DEBUGCSS) { print " DomElementStyle [\n"; $style->debug_print(); print " ]\n"; print "]\n</pre>"; } $style->clear_important(); $frame->set_style($style); if (!$root_flg && $this->_page_styles["base"]) { $root_flg = true; // set the page width, height, and orientation based on the parsed page style if ($style->size !== "auto") { list($paper_width, $paper_height) = $style->size; } $paper_width = $paper_width - (float)$style->length_in_pt($style->margin_left) - (float)$style->length_in_pt($style->margin_right); $paper_height = $paper_height - (float)$style->length_in_pt($style->margin_top) - (float)$style->length_in_pt($style->margin_bottom); $paper_orientation = ($paper_width > $paper_height ? "landscape" : "portrait"); } } // We're done! Clean out the registry of all styles since we // won't be needing this later. foreach (array_keys($this->_styles) as $key) { $this->_styles[$key] = null; unset($this->_styles[$key]); } } /** * parse a CSS string using a regex parser * Called by {@link Stylesheet::parse_css()} * * @param string $str * * @throws Exception */ private function _parse_css($str) { $str = trim($str); // Destroy comments and remove HTML comments $css = preg_replace([ "'/\*.*?\*/'si", "/^<!--/", "/-->$/" ], "", $str); // FIXME: handle '{' within strings, e.g. [attr="string {}"] // Something more legible: $re = "/\s* # Skip leading whitespace \n" . "( @([^\s{]+)\s*([^{;]*) (?:;|({)) )? # Match @rules followed by ';' or '{' \n" . "(?(1) # Only parse sub-sections if we're in an @rule... \n" . " (?(4) # ...and if there was a leading '{' \n" . " \s*( (?:(?>[^{}]+) ({)? # Parse rulesets and individual @page rules \n" . " (?(6) (?>[^}]*) }) \s*)+? \n" . " ) \n" . " }) # Balancing '}' \n" . "| # Branch to match regular rules (not preceded by '@') \n" . "([^{]*{[^}]*})) # Parse normal rulesets \n" . "/xs"; if (preg_match_all($re, $css, $matches, PREG_SET_ORDER) === false) { // An error occurred throw new Exception("Error parsing css file: preg_match_all() failed."); } // After matching, the array indices are set as follows: // // [0] => complete text of match // [1] => contains '@import ...;' or '@media {' if applicable // [2] => text following @ for cases where [1] is set // [3] => media types or full text following '@import ...;' // [4] => '{', if present // [5] => rulesets within media rules // [6] => '{', within media rules // [7] => individual rules, outside of media rules // $media_query_regex = "/(?:((only|not)?\s*(" . implode("|", self::$VALID_MEDIA_TYPES) . "))|(\s*\(\s*((?:(min|max)-)?([\w\-]+))\s*(?:\:\s*(.*?)\s*)?\)))/isx"; //Helpers::pre_r($matches); foreach ($matches as $match) { $match[2] = trim($match[2]); if ($match[2] !== "") { // Handle @rules switch ($match[2]) { case "import": $this->_parse_import($match[3]); break; case "media": $acceptedmedia = self::$ACCEPTED_GENERIC_MEDIA_TYPES; $acceptedmedia[] = $this->_dompdf->getOptions()->getDefaultMediaType(); $media_queries = preg_split("/\s*,\s*/", mb_strtolower(trim($match[3]))); foreach ($media_queries as $media_query) { if (in_array($media_query, $acceptedmedia)) { //if we have a media type match go ahead and parse the stylesheet $this->_parse_sections($match[5]); break; } elseif (!in_array($media_query, self::$VALID_MEDIA_TYPES)) { // otherwise conditionally parse the stylesheet assuming there are parseable media queries if (preg_match_all($media_query_regex, $media_query, $media_query_matches, PREG_SET_ORDER) !== false) { $mq = []; foreach ($media_query_matches as $media_query_match) { if (empty($media_query_match[1]) === false) { $media_query_feature = strtolower($media_query_match[3]); $media_query_value = strtolower($media_query_match[2]); $mq[] = [$media_query_feature, $media_query_value]; } elseif (empty($media_query_match[4]) === false) { $media_query_feature = strtolower($media_query_match[5]); $media_query_value = (array_key_exists(8, $media_query_match) ? strtolower($media_query_match[8]) : null); $mq[] = [$media_query_feature, $media_query_value]; } } $this->_parse_sections($match[5], $mq); break; } } } break; case "page": //This handles @page to be applied to page oriented media //Note: This has a reduced syntax: //@page { margin:1cm; color:blue; } //Not a sequence of styles like a full.css, but only the properties //of a single style, which is applied to the very first "root" frame before //processing other styles of the frame. //Working properties: // margin (for margin around edge of paper) // font-family (default font of pages) // color (default text color of pages) //Non working properties: // border // padding // background-color //Todo:Reason is unknown //Other properties (like further font or border attributes) not tested. //If a border or background color around each paper sheet is desired, //assign it to the <body> tag, possibly only for the css of the correct media type. // If the page has a name, skip the style. $page_selector = trim($match[3]); $key = null; switch ($page_selector) { case "": $key = "base"; break; case ":left": case ":right": case ":odd": case ":even": /** @noinspection PhpMissingBreakStatementInspection */ case ":first": $key = $page_selector; break; default: break 2; } // Store the style for later... if (empty($this->_page_styles[$key])) { $this->_page_styles[$key] = $this->_parse_properties($match[5]); } else { $this->_page_styles[$key]->merge($this->_parse_properties($match[5])); } break; case "font-face": $this->_parse_font_face($match[5]); break; default: // ignore everything else break; } continue; } if ($match[7] !== "") { $this->_parse_sections($match[7]); } } } /** * Resolve the given `url()` declaration to an absolute URL. * * @param string|null $val The declaration to resolve in the context of the stylesheet. * @return string The resolved URL, or `none`, if the value is `none`, * invalid, or points to a non-existent local file. */ public function resolve_url($val): string { $DEBUGCSS = $this->_dompdf->getOptions()->getDebugCss(); $parsed_url = "none"; if (empty($val) || $val === "none") { $path = "none"; } elseif (mb_strpos($val, "url") === false) { $path = "none"; //Don't resolve no image -> otherwise would prefix path and no longer recognize as none } else { $val = preg_replace("/url\(\s*['\"]?([^'\")]+)['\"]?\s*\)/", "\\1", trim($val)); // Resolve the url now in the context of the current stylesheet $path = Helpers::build_url($this->_protocol, $this->_base_host, $this->_base_path, $val); if ($path === null) { $path = "none"; } } if ($DEBUGCSS) { $parsed_url = Helpers::explode_url($path); print "<pre>[_image\n"; print_r($parsed_url); print $this->_protocol . "\n" . $this->_base_path . "\n" . $path . "\n"; print "_image]</pre>"; } return $path; } /** * parse @import{} sections * * @param string $url the url of the imported CSS file */ private function _parse_import($url) { $arr = preg_split("/[\s\n,]/", $url, -1, PREG_SPLIT_NO_EMPTY); $url = array_shift($arr); $accept = false; if (count($arr) > 0) { $acceptedmedia = self::$ACCEPTED_GENERIC_MEDIA_TYPES; $acceptedmedia[] = $this->_dompdf->getOptions()->getDefaultMediaType(); // @import url media_type [media_type...] foreach ($arr as $type) { if (in_array(mb_strtolower(trim($type)), $acceptedmedia)) { $accept = true; break; } } } else { // unconditional import $accept = true; } if ($accept) { // Store our current base url properties in case the new url is elsewhere $protocol = $this->_protocol; $host = $this->_base_host; $path = $this->_base_path; // $url = str_replace(array('"',"url", "(", ")"), "", $url); // If the protocol is php, assume that we will import using file:// // $url = Helpers::build_url($protocol === "php://" ? "file://" : $protocol, $host, $path, $url); // Above does not work for subfolders and absolute urls. // Todo: As above, do we need to replace php or file to an empty protocol for local files? if (($url = $this->resolve_url($url)) !== "none") { $this->load_css_file($url); } // Restore the current base url $this->_protocol = $protocol; $this->_base_host = $host; $this->_base_path = $path; } } /** * parse @font-face{} sections * http://www.w3.org/TR/css3-fonts/#the-font-face-rule * * @param string $str CSS @font-face rules */ private function _parse_font_face($str) { $descriptors = $this->_parse_properties($str); preg_match_all("/(url|local)\s*\(\s*[\"\']?([^\"\'\)]+)[\"\']?\s*\)\s*(format\s*\(\s*[\"\']?([^\"\'\)]+)[\"\']?\s*\))?/i", $descriptors->src, $src); $valid_sources = []; foreach ($src[0] as $i => $value) { $source = [ "local" => strtolower($src[1][$i]) === "local", "uri" => $src[2][$i], "format" => strtolower($src[4][$i]), "path" => Helpers::build_url($this->_protocol, $this->_base_host, $this->_base_path, $src[2][$i]), ]; if (!$source["local"] && in_array($source["format"], ["", "truetype"]) && $source["path"] !== null) { $valid_sources[] = $source; } } // No valid sources if (empty($valid_sources)) { return; } $style = [ "family" => $descriptors->get_font_family_raw(), "weight" => $descriptors->font_weight, "style" => $descriptors->font_style, ]; $this->getFontMetrics()->registerFont($style, $valid_sources[0]["path"], $this->_dompdf->getHttpContext()); } /** * parse regular CSS blocks * * _parse_properties() creates a new Style object based on the provided * CSS rules. * * @param string $str CSS rules * @return Style */ private function _parse_properties($str) { $properties = preg_split("/;(?=(?:[^\(]*\([^\)]*\))*(?![^\)]*\)))/", $str); $DEBUGCSS = $this->_dompdf->getOptions()->getDebugCss(); if ($DEBUGCSS) { print '[_parse_properties'; } // Create the style $style = new Style($this, Stylesheet::ORIG_AUTHOR); foreach ($properties as $prop) { // If the $prop contains an url, the regex may be wrong // @todo: fix the regex so that it works every time /*if (strpos($prop, "url(") === false) { if (preg_match("/([a-z-]+)\s*:\s*[^:]+$/i", $prop, $m)) $prop = $m[0]; }*/ //A css property can have " ! important" appended (whitespace optional) //strip this off to decode core of the property correctly. /* Instead of short code, prefer the typical case with fast code $important = preg_match("/(.*?)!\s*important/",$prop,$match); if ( $important ) { $prop = $match[1]; } $prop = trim($prop); */ if ($DEBUGCSS) print '('; $important = false; $prop = trim($prop); if (substr($prop, -9) === 'important') { $prop_tmp = rtrim(substr($prop, 0, -9)); if (substr($prop_tmp, -1) === '!') { $prop = rtrim(substr($prop_tmp, 0, -1)); $important = true; } } if ($prop === "") { if ($DEBUGCSS) print 'empty)'; continue; } $i = mb_strpos($prop, ":"); if ($i === false) { if ($DEBUGCSS) print 'novalue' . $prop . ')'; continue; } $prop_name = rtrim(mb_strtolower(mb_substr($prop, 0, $i))); $value = ltrim(mb_substr($prop, $i + 1)); if ($DEBUGCSS) print $prop_name . ':=' . $value . ($important ? '!IMPORTANT' : '') . ')'; $style->set_prop($prop_name, $value, $important, false); } if ($DEBUGCSS) print '_parse_properties]'; return $style; } /** * parse selector + rulesets * * @param string $str CSS selectors and rulesets * @param array $media_queries */ private function _parse_sections($str, $media_queries = []) { // Pre-process selectors: collapse all whitespace and strip whitespace // around '>', '.', ':', '+', '~', '#' $patterns = ["/\s+/", "/\s+([>.:+~#])\s+/"]; $replacements = [" ", "\\1"]; $DEBUGCSS = $this->_dompdf->getOptions()->getDebugCss(); $sections = explode("}", $str); if ($DEBUGCSS) print '[_parse_sections'; foreach ($sections as $sect) { $i = mb_strpos($sect, "{"); if ($i === false) { continue; } if ($DEBUGCSS) print '[section'; $selector_str = preg_replace($patterns, $replacements, mb_substr($sect, 0, $i)); $selectors = preg_split("/,(?![^\(]*\))/", $selector_str, 0, PREG_SPLIT_NO_EMPTY); $style = $this->_parse_properties(trim(mb_substr($sect, $i + 1))); // Assign it to the selected elements foreach ($selectors as $selector) { $selector = trim($selector); if ($selector === "") { if ($DEBUGCSS) print '#empty#'; continue; } if ($DEBUGCSS) print '#' . $selector . '#'; //if ($DEBUGCSS) { if (strpos($selector,'p') !== false) print '!!!p!!!#'; } //FIXME: tag the selector with a hash of the media query to separate it from non-conditional styles (?), xpath comments are probably not what we want to do here if (count($media_queries) > 0) { $style->set_media_queries($media_queries); } $this->add_style($selector, $style); } if ($DEBUGCSS) { print 'section]'; } } if ($DEBUGCSS) { print "_parse_sections]\n"; } } /** * @return string */ public function getDefaultStylesheet() { $options = $this->_dompdf->getOptions(); $rootDir = realpath($options->getRootDir()); return Helpers::build_url("file://", "", $rootDir, $rootDir . self::DEFAULT_STYLESHEET); } /** * @param FontMetrics $fontMetrics * @return $this */ public function setFontMetrics(FontMetrics $fontMetrics) { $this->fontMetrics = $fontMetrics; return $this; } /** * @return FontMetrics */ public function getFontMetrics() { return $this->fontMetrics; } /** * dumps the entire stylesheet as a string * * Generates a string of each selector and associated style in the * Stylesheet. Useful for debugging. * * @return string */ function __toString() { $str = ""; foreach ($this->_styles as $selector => $selector_styles) { foreach ($selector_styles as $style) { $str .= "$selector => " . $style->__toString() . "\n"; } } return $str; } }