WeasyPrint/weasyprint/css/__init__.py

"""
    weasyprint.css
    --------------

    This module takes care of steps 3 and 4 of “CSS 2.1 processing model”:
    Retrieve stylesheets associated with a document and annotate every element
    with a value for every CSS property.

    http://www.w3.org/TR/CSS21/intro.html#processing-model

    This module does this in more than two steps. The
    :func:`get_all_computed_styles` function does everything, but it is itself
    based on other functions in this module.

    :copyright: Copyright 2011-2019 Simon Sapin and contributors, see AUTHORS.
    :license: BSD, see LICENSE for details.

"""

from collections import namedtuple
from logging import DEBUG, WARNING

import cssselect2
import tinycss2

from .. import CSS
from ..logger import LOGGER, PROGRESS_LOGGER
from ..urls import URLFetchingError, get_url_attribute, url_join
from . import computed_values, media_queries
from .properties import INHERITED, INITIAL_NOT_COMPUTED, INITIAL_VALUES
from .utils import remove_whitespace
from .validation import preprocess_declarations
from .validation.descriptors import preprocess_descriptors

# Pseudo-element names accepted in selectors (``None`` is the entry used for
# selectors without a pseudo-element). Reject anything not in here:
PSEUDO_ELEMENTS = (None, 'before', 'after', 'first-line', 'first-letter')


# Description of a kind of page, as used to key and match ``@page`` rules.
# Fields, as filled in by the page-selector code of this module:
#     side: 'left', 'right' or None
#     blank: True or False
#     first: True or False
#     index: page index or None
#     name: page name string, or the empty string
PageType = namedtuple('PageType', ['side', 'blank', 'first', 'index', 'name'])


class StyleFor:
    """Callable object returning the computed style of an element.

    All cascaded and computed styles are built once in ``__init__``; calling
    the instance with ``(element, pseudo_type)`` afterwards only looks the
    stored style up (and applies a few table-specific adjustments).

    """
    def __init__(self, html, sheets, presentational_hints, target_collector):
        """Cascade and compute the styles of every element in ``html``.

        :param html: document object; this method reads its
            ``etree_element``, ``wrapper_element`` and ``base_url``.
        :param sheets: iterable of ``(sheet, origin, sheet_specificity)``
            tuples. It is iterated several times, so it must not be a
            one-shot iterator.
        :param presentational_hints: forwarded to
            :func:`find_style_attributes`.
        :param target_collector: forwarded to :func:`computed_from_cascaded`
            through :meth:`set_computed_styles`.

        """
        # keys: (element, pseudo_element_type)
        #    element: an ElementTree Element or the '@page' string
        #    pseudo_element_type: a string such as 'first' (for @page) or
        #        'after', or None for normal elements
        # values: dicts of
        #     keys: property name as a string
        #     values: (values, weight)
        #         values: a PropertyValue-like object
        #         weight: values with a greater weight take precedence, see
        #             http://www.w3.org/TR/CSS21/cascade.html#cascading-order
        self._cascaded_styles = cascaded_styles = {}

        # keys: (element, pseudo_element_type), like cascaded_styles
        # values: style dict objects:
        #     keys: property name as a string
        #     values: a PropertyValue-like object
        self._computed_styles = computed_styles = {}

        PROGRESS_LOGGER.info('Step 3 - Applying CSS')
        # "style" attributes and presentational hints are cascaded first,
        # always with the 'author' origin.
        for specificity, attributes in find_style_attributes(
                html.etree_element, presentational_hints, html.base_url):
            element, declarations, base_url = attributes
            for name, values, importance in preprocess_declarations(
                    base_url, declarations):
                precedence = declaration_precedence('author', importance)
                weight = (precedence, specificity)
                add_declaration(cascaded_styles, name, values, weight, element)

        # First, add declarations and set computed styles for "real" elements
        # *in tree order*. Tree order is important so that parents have
        # computed styles before their children, for inheritance.

        # Iterate on all elements, even if there is no cascaded style for them.
        for element in html.wrapper_element.iter_subtree():
            for sheet, origin, sheet_specificity in sheets:
                # Add declarations for matched elements
                for selector in sheet.matcher.match(element):
                    specificity, order, pseudo_type, declarations = selector
                    # A truthy sheet-level specificity replaces the one of
                    # the selector.
                    specificity = sheet_specificity or specificity
                    for name, values, importance in declarations:
                        precedence = declaration_precedence(origin, importance)
                        weight = (precedence, specificity)
                        add_declaration(
                            cascaded_styles, name, values, weight,
                            element.etree_element, pseudo_type)
            parent = element.parent.etree_element if element.parent else None
            self.set_computed_styles(
                element.etree_element, root=html.etree_element, parent=parent,
                base_url=html.base_url, target_collector=target_collector)

        # Every 'page' value computed so far; handed to the page selectors
        # below so that they can produce the matching page types.
        page_names = {style['page'] for style in computed_styles.values()}

        for sheet, origin, sheet_specificity in sheets:
            # Add declarations for page elements
            for _rule, selector_list, declarations in sheet.page_rules:
                for selector in selector_list:
                    specificity, pseudo_type, match = selector
                    specificity = sheet_specificity or specificity
                    for page_type in match(page_names):
                        for name, values, importance in declarations:
                            precedence = declaration_precedence(
                                origin, importance)
                            weight = (precedence, specificity)
                            add_declaration(
                                cascaded_styles, name, values, weight,
                                page_type, pseudo_type)

        # Then computed styles for pseudo elements, in any order.
        # Pseudo-elements inherit from their associated element so they come
        # last. Do them in a second pass as there is no easy way to iterate
        # on the pseudo-elements for a given element with the current structure
        # of cascaded_styles. (Keys are (element, pseudo_type) tuples.)

        # Only iterate on pseudo-elements that have cascaded styles. (Others
        # might as well not exist.)
        for element, pseudo_type in cascaded_styles:
            # Page types are skipped here: only their cascaded styles are
            # stored by this constructor.
            if pseudo_type and not isinstance(element, PageType):
                self.set_computed_styles(
                    element, pseudo_type=pseudo_type,
                    # The pseudo-element inherits from the element.
                    root=html.etree_element, parent=element,
                    base_url=html.base_url, target_collector=target_collector)

    def __call__(self, element, pseudo_type=None):
        """Return the computed style stored for ``(element, pseudo_type)``.

        Return ``None`` when no style was computed for this key.

        For table-related ``display`` values, paddings or margins that do not
        apply are set to zero directly on the stored style before it is
        returned.

        """
        style = self._computed_styles.get((element, pseudo_type))

        if style:
            if 'table' in style['display']:
                if (style['display'] in ('table', 'inline-table') and
                        style['border_collapse'] == 'collapse'):
                    # Padding do not apply
                    for side in ['top', 'bottom', 'left', 'right']:
                        style['padding_' + side] = computed_values.ZERO_PIXELS
                if (style['display'].startswith('table-') and
                        style['display'] != 'table-caption'):
                    # Margins do not apply
                    for side in ['top', 'bottom', 'left', 'right']:
                        style['margin_' + side] = computed_values.ZERO_PIXELS

        return style

    def set_computed_styles(self, element, parent, root=None, pseudo_type=None,
                            base_url=None, target_collector=None):
        """Compute and store the style of ``element`` or of its pseudo-element.

        The cascaded declarations stored for ``(element, pseudo_type)`` (none
        if the key is missing) are turned into computed values by
        :func:`computed_from_cascaded` and saved under the same key.

        ``parent`` must be ``None`` for the root element itself, and an
        element whose style is already computed in every other case; the
        computed style of ``root`` must then be available too.

        """
        cascaded_styles = self.get_cascaded_styles()
        computed_styles = self.get_computed_styles()
        if element == root and pseudo_type is None:
            assert parent is None
            parent_style = None
            root_style = {
                # When specified on the font-size property of the root element,
                # the rem units refer to the property’s initial value.
                'font_size': INITIAL_VALUES['font_size'],
            }
        else:
            assert parent is not None
            # Both lookups use the styles of the plain elements (pseudo type
            # None), so they raise KeyError if those are not computed yet.
            parent_style = computed_styles[parent, None]
            root_style = computed_styles[root, None]

        cascaded = cascaded_styles.get((element, pseudo_type), {})
        computed_styles[element, pseudo_type] = computed_from_cascaded(
            element, cascaded, parent_style, pseudo_type, root_style, base_url,
            target_collector)

    def get_cascaded_styles(self):
        """Return the dict of cascaded styles (the stored object itself)."""
        return self._cascaded_styles

    def get_computed_styles(self):
        """Return the dict of computed styles (the stored object itself)."""
        return self._computed_styles


def get_child_text(element):
    """Return the text directly in the element, not descendants.

    This is the element's own leading text followed by the tail text of each
    of its direct children, joined in document order.

    """
    pieces = []
    if element.text:
        pieces.append(element.text)
    pieces.extend(child.tail for child in element if child.tail)
    return ''.join(pieces)


def find_stylesheets(wrapper_element, device_media_type, url_fetcher, base_url,
                     font_config, page_rules):
    """Yield a ``CSS`` object for each stylesheet under ``wrapper_element``.

    Both ``<style>`` elements and ``<link>`` elements are considered, as
    long as their type is ``text/css`` and their ``media`` attribute matches
    ``device_media_type``. Linked stylesheets that cannot be fetched are
    logged and skipped.

    The output order is the same as the source order.

    """
    from ..html import element_has_link_type  # Work around circular imports.

    for wrapper in wrapper_element.query_all('style', 'link'):
        node = wrapper.etree_element

        # Only keep 'type/subtype' from 'type/subtype ; param1; param2'.
        declared_type = node.get('type', 'text/css')
        if declared_type.split(';', 1)[0].strip() != 'text/css':
            continue

        media_attr = node.get('media', '').strip() or 'all'
        media = [item.strip() for item in media_attr.split(',')]
        if not media_queries.evaluate_media_query(media, device_media_type):
            continue

        if node.tag == 'style':
            # Content is text that is directly in the <style> element, not
            # its descendants. ElementTree should give us either unicode or
            # ASCII-only bytestrings, so we don't need `encoding` here.
            yield CSS(
                string=get_child_text(node), base_url=base_url,
                url_fetcher=url_fetcher, media_type=device_media_type,
                font_config=font_config, page_rules=page_rules)
            continue

        if node.tag != 'link' or not node.get('href'):
            continue
        # Keep real stylesheets only, and ignore alternate ones.
        if not element_has_link_type(node, 'stylesheet'):
            continue
        if element_has_link_type(node, 'alternate'):
            continue

        href = get_url_attribute(node, 'href', base_url)
        if href is None:
            continue
        try:
            yield CSS(
                url=href, url_fetcher=url_fetcher,
                _check_mime_type=True, media_type=device_media_type,
                font_config=font_config, page_rules=page_rules)
        except URLFetchingError as exc:
            LOGGER.error(
                'Failed to load stylesheet at %s : %s', href, exc)


def find_style_attributes(tree, presentational_hints=False, base_url=None):
    """Yield ``specificity, (element, declaration, base_url)`` rules.

    Every element of ``tree`` is visited with ``tree.iter()``.

    Rules from "style" attribute are returned with specificity
    ``(1, 0, 0)``.

    If ``presentational_hints`` is ``True``, rules from presentational hints
    (legacy HTML attributes such as ``bgcolor`` or ``cellpadding``) are
    returned with specificity ``(0, 0, 0)``. They are translated into CSS
    text and parsed like a "style" attribute.

    For a given element, rules are yielded in a fixed order; callers that
    let later rules of equal weight win rely on that order.

    """
    def check_style_attribute(element, style_attribute):
        declarations = tinycss2.parse_declaration_list(style_attribute)
        return element, declarations, base_url

    for element in tree.iter():
        specificity = (1, 0, 0)
        style_attribute = element.get('style')
        if style_attribute:
            yield specificity, check_style_attribute(element, style_attribute)
        if not presentational_hints:
            continue
        specificity = (0, 0, 0)
        if element.tag == 'body':
            # TODO: we should check the container frame element
            for part, position in (
                    ('height', 'top'), ('height', 'bottom'),
                    ('width', 'left'), ('width', 'right')):
                style_attribute = None
                # 'marginheight'/'marginwidth' take precedence over the
                # per-side 'topmargin', 'leftmargin', ... attributes.
                for prop in ('margin%s' % part, '%smargin' % position):
                    if element.get(prop):
                        style_attribute = 'margin-%s:%spx' % (
                            position, element.get(prop))
                        break
                if style_attribute:
                    yield specificity, check_style_attribute(
                        element, style_attribute)
            if element.get('background'):
                style_attribute = 'background-image:url(%s)' % (
                    element.get('background'))
                yield specificity, check_style_attribute(
                    element, style_attribute)
            if element.get('bgcolor'):
                style_attribute = 'background-color:%s' % (
                    element.get('bgcolor'))
                yield specificity, check_style_attribute(
                    element, style_attribute)
            if element.get('text'):
                style_attribute = 'color:%s' % element.get('text')
                yield specificity, check_style_attribute(
                    element, style_attribute)
            # TODO: we should support link, vlink, alink
        elif element.tag == 'center':
            yield specificity, check_style_attribute(
                element, 'text-align:center')
        elif element.tag == 'div':
            align = element.get('align', '').lower()
            if align == 'middle':
                yield specificity, check_style_attribute(
                    element, 'text-align:center')
            elif align in ('center', 'left', 'right', 'justify'):
                yield specificity, check_style_attribute(
                    element, 'text-align:%s' % align)
        elif element.tag == 'font':
            if element.get('color'):
                yield specificity, check_style_attribute(
                    element, 'color:%s' % element.get('color'))
            if element.get('face'):
                yield specificity, check_style_attribute(
                    element, 'font-family:%s' % element.get('face'))
            if element.get('size'):
                size = element.get('size').strip()
                relative_plus = size.startswith('+')
                relative_minus = size.startswith('-')
                if relative_plus or relative_minus:
                    size = size[1:].strip()
                try:
                    size = int(size)
                except ValueError:
                    LOGGER.warning('Invalid value for size: %s', size)
                else:
                    font_sizes = {
                        1: 'x-small',
                        2: 'small',
                        3: 'medium',
                        4: 'large',
                        5: 'x-large',
                        6: 'xx-large',
                        7: '48px',  # 1.5 * xx-large
                    }
                    # Relative sizes are offsets from the default size 3:
                    # "+2" means 3 + 2 and "-1" means 3 - 1.
                    if relative_plus:
                        size += 3
                    elif relative_minus:
                        size = 3 - size
                    size = max(1, min(7, size))
                    yield specificity, check_style_attribute(
                        element, 'font-size:%s' % font_sizes[size])
        elif element.tag == 'table':
            if element.get('cellspacing'):
                yield specificity, check_style_attribute(
                    element,
                    'border-spacing:%spx' % element.get('cellspacing'))
            if element.get('cellpadding'):
                cellpadding = element.get('cellpadding')
                if cellpadding.isdigit():
                    cellpadding += 'px'
                # TODO: don't match subtables cells
                for subelement in element.iter():
                    if subelement.tag in ('td', 'th'):
                        yield specificity, check_style_attribute(
                            subelement,
                            'padding-left:%s;padding-right:%s;'
                            'padding-top:%s;padding-bottom:%s;' % (
                                4 * (cellpadding,)))
            if element.get('hspace'):
                hspace = element.get('hspace')
                if hspace.isdigit():
                    hspace += 'px'
                yield specificity, check_style_attribute(
                    element,
                    'margin-left:%s;margin-right:%s' % (hspace, hspace))
            if element.get('vspace'):
                vspace = element.get('vspace')
                if vspace.isdigit():
                    vspace += 'px'
                yield specificity, check_style_attribute(
                    element,
                    'margin-top:%s;margin-bottom:%s' % (vspace, vspace))
            if element.get('width'):
                style_attribute = 'width:%s' % element.get('width')
                if element.get('width').isdigit():
                    style_attribute += 'px'
                yield specificity, check_style_attribute(
                    element, style_attribute)
            if element.get('height'):
                style_attribute = 'height:%s' % element.get('height')
                if element.get('height').isdigit():
                    style_attribute += 'px'
                yield specificity, check_style_attribute(
                    element, style_attribute)
            if element.get('background'):
                style_attribute = 'background-image:url(%s)' % (
                    element.get('background'))
                yield specificity, check_style_attribute(
                    element, style_attribute)
            if element.get('bgcolor'):
                style_attribute = 'background-color:%s' % (
                    element.get('bgcolor'))
                yield specificity, check_style_attribute(
                    element, style_attribute)
            if element.get('bordercolor'):
                style_attribute = 'border-color:%s' % (
                    element.get('bordercolor'))
                yield specificity, check_style_attribute(
                    element, style_attribute)
            if element.get('border'):
                style_attribute = 'border-width:%spx' % (
                    element.get('border'))
                yield specificity, check_style_attribute(
                    element, style_attribute)
        elif element.tag in ('tr', 'td', 'th', 'thead', 'tbody', 'tfoot'):
            align = element.get('align', '').lower()
            # TODO: we should align descendants too
            if align == 'middle':
                yield specificity, check_style_attribute(
                    element, 'text-align:center')
            elif align in ('center', 'left', 'right', 'justify'):
                yield specificity, check_style_attribute(
                    element, 'text-align:%s' % align)
            if element.get('background'):
                style_attribute = 'background-image:url(%s)' % (
                    element.get('background'))
                yield specificity, check_style_attribute(
                    element, style_attribute)
            if element.get('bgcolor'):
                style_attribute = 'background-color:%s' % (
                    element.get('bgcolor'))
                yield specificity, check_style_attribute(
                    element, style_attribute)
            if element.tag in ('tr', 'td', 'th'):
                if element.get('height'):
                    style_attribute = 'height:%s' % element.get('height')
                    if element.get('height').isdigit():
                        style_attribute += 'px'
                    yield specificity, check_style_attribute(
                        element, style_attribute)
                if element.tag in ('td', 'th'):
                    if element.get('width'):
                        style_attribute = 'width:%s' % element.get('width')
                        if element.get('width').isdigit():
                            style_attribute += 'px'
                        yield specificity, check_style_attribute(
                            element, style_attribute)
        elif element.tag == 'caption':
            align = element.get('align', '').lower()
            # TODO: we should align descendants too
            if align == 'middle':
                yield specificity, check_style_attribute(
                    element, 'text-align:center')
            elif align in ('center', 'left', 'right', 'justify'):
                yield specificity, check_style_attribute(
                    element, 'text-align:%s' % align)
        elif element.tag == 'col':
            if element.get('width'):
                style_attribute = 'width:%s' % element.get('width')
                if element.get('width').isdigit():
                    style_attribute += 'px'
                yield specificity, check_style_attribute(
                    element, style_attribute)
        elif element.tag == 'hr':
            size = 0
            size_attribute = element.get('size')
            if size_attribute:
                try:
                    size = int(size_attribute)
                except ValueError:
                    # Report the offending attribute; the size stays 0.
                    LOGGER.warning(
                        'Invalid value for size: %s', size_attribute)
            if (element.get('color'), element.get('noshade')) != (None, None):
                if size >= 1:
                    yield specificity, check_style_attribute(
                        element, 'border-width:%spx' % (size / 2))
            elif size == 1:
                yield specificity, check_style_attribute(
                    element, 'border-bottom-width:0')
            elif size > 1:
                yield specificity, check_style_attribute(
                    element, 'height:%spx' % (size - 2))
            if element.get('width'):
                style_attribute = 'width:%s' % element.get('width')
                if element.get('width').isdigit():
                    style_attribute += 'px'
                yield specificity, check_style_attribute(
                    element, style_attribute)
            if element.get('color'):
                yield specificity, check_style_attribute(
                    element, 'color:%s' % element.get('color'))
        elif element.tag in (
                'iframe', 'applet', 'embed', 'img', 'input', 'object'):
            # <input> only gets these hints when it is an image button.
            if (element.tag != 'input' or
                    element.get('type', '').lower() == 'image'):
                align = element.get('align', '').lower()
                if align in ('middle', 'center'):
                    # TODO: middle and center values are wrong
                    yield specificity, check_style_attribute(
                        element, 'vertical-align:middle')
                if element.get('hspace'):
                    hspace = element.get('hspace')
                    if hspace.isdigit():
                        hspace += 'px'
                    yield specificity, check_style_attribute(
                        element,
                        'margin-left:%s;margin-right:%s' % (hspace, hspace))
                if element.get('vspace'):
                    vspace = element.get('vspace')
                    if vspace.isdigit():
                        vspace += 'px'
                    yield specificity, check_style_attribute(
                        element,
                        'margin-top:%s;margin-bottom:%s' % (vspace, vspace))
                # TODO: img seems to be excluded for width and height, but a
                # lot of W3C tests rely on this attribute being applied to img
                if element.get('width'):
                    style_attribute = 'width:%s' % element.get('width')
                    if element.get('width').isdigit():
                        style_attribute += 'px'
                    yield specificity, check_style_attribute(
                        element, style_attribute)
                if element.get('height'):
                    style_attribute = 'height:%s' % element.get('height')
                    if element.get('height').isdigit():
                        style_attribute += 'px'
                    yield specificity, check_style_attribute(
                        element, style_attribute)
                if element.tag in ('img', 'object', 'input'):
                    if element.get('border'):
                        yield specificity, check_style_attribute(
                            element,
                            'border-width:%spx;border-style:solid' %
                            element.get('border'))
        elif element.tag == 'ol':
            # From https://www.w3.org/TR/css-lists-3/
            if element.get('start'):
                yield specificity, check_style_attribute(
                    element,
                    'counter-reset:list-item %s;'
                    'counter-increment:list-item -1' % element.get('start'))
        elif element.tag == 'ul':
            # From https://www.w3.org/TR/css-lists-3/
            # NOTE(review): HTML defines the ``value`` attribute on <li>, not
            # on <ul> -- confirm which element this hint is meant for.
            if element.get('value'):
                yield specificity, check_style_attribute(
                    element,
                    'counter-reset:list-item %s;'
                    'counter-increment:none' % element.get('value'))


def matching_page_types(page_type, names=()):
    """Yield every concrete ``PageType`` compatible with ``page_type``.

    A field of ``page_type`` left at its "unset" value (``None`` side,
    ``False`` blank or first, ``None`` index, empty name) is expanded to all
    of its candidates; any other field is kept as is. ``names`` holds the
    page names tried, followed by the empty name, when ``page_type`` has no
    name.

    Combinations where the "first" flag and the index disagree are left
    out: a first page goes with a falsy index and the other way round.

    """
    if page_type.side is None:
        sides = ['left', 'right', None]
    else:
        sides = [page_type.side]
    blanks = (True,) if page_type.blank is not False else (True, False)
    firsts = (True,) if page_type.first is not False else (True, False)
    if page_type.index is None:
        indexes = range(100)
    else:
        indexes = (page_type.index,)
    if page_type.name == '':
        candidate_names = tuple(names) + ('',)
    else:
        candidate_names = (page_type.name,)

    yield from (
        PageType(side, blank, first, index, name)
        for side in sides
        for blank in blanks
        for first in firsts
        for index in indexes
        if first != bool(index)
        for name in candidate_names)


def declaration_precedence(origin, importance):
    """Return the precedence for a declaration.

    The result is an integer between 1 and 5 that is only meaningful when
    compared to another precedence: the greater one wins.

    ``origin`` must be one of the strings ``'author'``, ``'user'`` and
    ``'user agent'``; ``importance`` is truthy for ``!important``
    declarations.

    """
    # See http://www.w3.org/TR/CSS21/cascade.html#cascading-order
    if origin == 'user agent':
        # Importance makes no difference for the user agent.
        return 1
    if not importance:
        if origin == 'user':
            return 2
        if origin == 'author':
            return 3
    elif origin == 'author':
        return 4
    # Only important user declarations are expected to get here.
    assert origin == 'user'
    return 5


def add_declaration(cascaded_styles, prop_name, prop_values, weight, element,
                    pseudo_type=None):
    """Record a declaration for ``prop_name`` on an element.

    ``cascaded_styles`` is updated in place, under the
    ``(element, pseudo_type)`` key. The new value replaces the stored one
    unless the stored one has a strictly greater weight, so with equal
    weights the last declaration wins.

    """
    key = (element, pseudo_type)
    if key not in cascaded_styles:
        cascaded_styles[key] = {}
    declarations = cascaded_styles[key]

    try:
        _stored_values, stored_weight = declarations[prop_name]
    except KeyError:
        stored_weight = None

    takes_over = stored_weight is None or stored_weight <= weight
    if takes_over:
        declarations[prop_name] = (prop_values, weight)


def computed_from_cascaded(element, cascaded, parent_style, pseudo_type=None,
                           root_style=None, base_url=None,
                           target_collector=None):
    """Get a dict of computed style mixed from parent and cascaded styles.

    ``cascaded`` maps property names to ``(value, weight)`` tuples, and
    ``parent_style`` is the computed style of the parent, or ``None`` for
    the root element. Properties missing from ``cascaded`` are inherited or
    set to their initial value.

    """
    has_parent = parent_style is not None

    if has_parent and not cascaded:
        # Fast path for anonymous boxes:
        # no cascaded style, only implicitly initial or inherited values.
        computed = dict(INITIAL_VALUES)
        computed.update({name: parent_style[name] for name in INHERITED})
        # page is not inherited but taken from the ancestor if 'auto'
        computed['page'] = parent_style['page']
        # border-*-style is none, so border-width computes to zero.
        # Other than that, properties that would need computing are
        # border-*-color, but they do not apply.
        computed.update({
            'border_%s_width' % side: 0
            for side in ('top', 'bottom', 'left', 'right')})
        computed['outline_width'] = 0
        return computed

    # Handle inheritance and initial values
    specified, computed = {}, {}
    for name, initial in INITIAL_VALUES.items():
        if name in cascaded:
            value, _weight = cascaded[name]
            keyword = value
        else:
            keyword = 'inherit' if name in INHERITED else 'initial'

        if keyword == 'inherit' and not has_parent:
            # On the root element, 'inherit' from initial values
            keyword = 'initial'

        if keyword == 'initial':
            value = initial
            if name not in INITIAL_NOT_COMPUTED:
                # The value is the same as when computed
                computed[name] = initial
        elif keyword == 'inherit':
            # Values in parent_style are already computed.
            value = computed[name] = parent_style[name]

        specified[name] = value

    if specified['page'] == 'auto':
        # The page property does not inherit. However, if the page value on
        # an element is auto, then its used value is the value specified on
        # its nearest ancestor with a non-auto value. When specified on the
        # root element, the used value for auto is the empty string.
        page = parent_style['page'] if has_parent else ''
        computed['page'] = specified['page'] = page

    return computed_values.compute(
        element, pseudo_type, specified, computed, parent_style, root_style,
        base_url, target_collector)


def parse_page_selectors(rule):
    """Parse a page selector rule.

    The selectors are read from ``rule.prelude``, after whitespace removal.

    Return a list of page data if the rule is correctly parsed, with one item
    per comma-separated selector. Page data are a dict containing:

    - 'side' ('left', 'right' or None),
    - 'blank' (True or False),
    - 'first' (True or False),
    - 'index' (value given to ``:nth()`` minus one, or None),
    - 'name' (page name string or empty string), and
    - 'specificity' (list of three numbers).

    Return ``None`` if something went wrong while parsing the rule.

    """
    # See https://drafts.csswg.org/css-page-3/#syntax-page-selector

    tokens = list(remove_whitespace(rule.prelude))
    page_data = []

    # TODO: Specificity is probably wrong, should clean and test that.
    if not tokens:
        # Bare "@page": a single selector with every field left unset.
        page_data.append({
            'side': None, 'blank': False, 'first': False, 'index': None,
            'name': '', 'specificity': [0, 0, 0]})
        return page_data

    # Each iteration of this loop parses one selector of the list.
    while tokens:
        types = {
            'side': None, 'blank': False, 'first': False, 'index': None,
            'name': '', 'specificity': [0, 0, 0]}

        # Optional page name, always first in a selector.
        if tokens[0].type == 'ident':
            token = tokens.pop(0)
            types['name'] = token.value
            types['specificity'][0] = 1

        if len(tokens) == 1:
            # What follows needs at least two tokens (':' and a pseudo-class,
            # or ',' and another selector).
            return None
        elif not tokens:
            page_data.append(types)
            return page_data

        # Pseudo-classes of the current selector, up to the next comma.
        while tokens:
            literal = tokens.pop(0)
            if literal.type != 'literal':
                return None

            if literal.value == ':':
                if not tokens:
                    return None

                if tokens[0].type == 'ident':
                    ident = tokens.pop(0)
                    pseudo_class = ident.lower_value
                    if pseudo_class in ('left', 'right'):
                        # A side can only be given once per selector.
                        if types['side']:
                            return None
                        types['side'] = pseudo_class
                        types['specificity'][2] += 1
                        continue
                    elif pseudo_class in ('blank', 'first'):
                        types[pseudo_class] = True
                        types['specificity'][1] += 1
                        continue
                elif tokens[0].type == 'function':
                    function = tokens.pop(0)
                    if function.name != 'nth':
                        return None
                    arguments = function.arguments
                    if len(arguments) != 1:
                        return None
                    number = arguments[0]
                    if number.type != 'number':
                        return None
                    # The stored index is one less than the number written
                    # in the stylesheet.
                    types['index'] = number.value - 1
                    # TODO: specificity is not specified yet
                    # https://github.com/w3c/csswg-drafts/issues/3791
                    types['specificity'][1] += 1
                    continue

                # Unknown pseudo-class, or unexpected token after ':'.
                return None
            elif literal.value == ',':
                # A comma must separate a non-empty selector from at least
                # one more token.
                if tokens and any(types['specificity']):
                    break
                else:
                    return None

        page_data.append(types)

    return page_data


def preprocess_stylesheet(device_media_type, base_url, stylesheet_rules,
                          url_fetcher, matcher, page_rules, fonts,
                          font_config, ignore_imports=False):
    """Do the work that can be done early on stylesheet, before they are
    in a document.

    Walk ``stylesheet_rules`` and register what each supported rule provides:

    - style rules: the preprocessed declarations are added to ``matcher``
      for each selector of the rule;
    - ``@import``: the target stylesheet is loaded with ``CSS``, sharing
      ``matcher`` and ``page_rules`` with the current stylesheet;
    - ``@media``: the nested rules are handled by a recursive call when the
      media query matches ``device_media_type``;
    - ``@page``: ``(rule, selector_list, declarations)`` tuples are appended
      to ``page_rules``, for the page itself and for its nested at-rules;
    - ``@font-face``: the descriptors are given to ``font_config`` and the
      value it returns, when truthy, is appended to ``fonts``.

    Rules without a content block are skipped, except ``@import``. Invalid
    rules are logged and skipped. Nothing is returned: results are stored in
    ``matcher``, ``page_rules`` and ``fonts``.

    :param device_media_type: media type the media queries are evaluated
        against, also forwarded to imported stylesheets.
    :param base_url: URL used to preprocess declarations and descriptors,
        and to resolve ``@import`` URLs.
    :param stylesheet_rules: iterable of rules parsed by tinycss2.
    :param url_fetcher: forwarded to imported stylesheets and to
        ``font_config.add_font_face``.
    :param matcher: object whose ``add_selector`` method receives each
        compiled selector with its declarations.
    :param page_rules: list extended with the ``@page`` rule tuples.
    :param fonts: list extended with the values returned for font faces.
    :param font_config: font configuration, or ``None`` to leave
        ``@font-face`` rules unregistered.
    :param ignore_imports: when true, ``@import`` rules are reported and
        skipped. It is switched on as soon as another valid rule has been
        handled, because ``@import`` is only accepted before such rules.

    """
    for rule in stylesheet_rules:
        # Skip everything that has no content block, except @import rules
        # that are not expected to have one.
        if getattr(rule, 'content', None) is None and (
                rule.type != 'at-rule' or rule.lower_at_keyword != 'import'):
            continue

        if rule.type == 'qualified-rule':
            declarations = list(preprocess_declarations(
                base_url, tinycss2.parse_declaration_list(rule.content)))
            if declarations:
                logger_level = WARNING
                try:
                    selectors = cssselect2.compile_selector_list(rule.prelude)
                    for selector in selectors:
                        # NOTE(review): the selector is registered before its
                        # pseudo-element is checked, so selectors handled
                        # before the exception is raised stay in the
                        # matcher -- confirm this is intended.
                        matcher.add_selector(selector, declarations)
                        if selector.pseudo_element not in PSEUDO_ELEMENTS:
                            if selector.pseudo_element.startswith('-'):
                                # Prefixed pseudo-elements are only worth a
                                # debug message.
                                logger_level = DEBUG
                                raise cssselect2.SelectorError(
                                    'ignored prefixed pseudo-element: %s'
                                    % selector.pseudo_element)
                            else:
                                raise cssselect2.SelectorError(
                                    'unknown pseudo-element: %s'
                                    % selector.pseudo_element)
                    ignore_imports = True
                except cssselect2.SelectorError as exc:
                    LOGGER.log(
                        logger_level,
                        "Invalid or unsupported selector '%s', %s",
                        tinycss2.serialize(rule.prelude), exc)
                    continue
            else:
                ignore_imports = True

        elif rule.type == 'at-rule' and rule.lower_at_keyword == 'import':
            if ignore_imports:
                LOGGER.warning('@import rule "%s" not at the beginning of the '
                               'stylesheet, the whole rule was ignored at '
                               '%s:%s.',
                               tinycss2.serialize(rule.prelude),
                               rule.source_line, rule.source_column)
                continue

            # The prelude is the URL (as url() or string) followed by an
            # optional media query.
            tokens = remove_whitespace(rule.prelude)
            if tokens and tokens[0].type in ('url', 'string'):
                url = tokens[0].value
            else:
                continue
            media = media_queries.parse_media_query(tokens[1:])
            if media is None:
                LOGGER.warning('Invalid media type "%s", '
                               'the whole @import rule was ignored at %s:%s.',
                               tinycss2.serialize(rule.prelude),
                               rule.source_line, rule.source_column)
                continue
            if not media_queries.evaluate_media_query(
                    media, device_media_type):
                continue
            url = url_join(
                base_url, url, allow_relative=False,
                context='@import at %s:%s',
                context_args=(rule.source_line, rule.source_column))
            if url is not None:
                try:
                    # The returned object is not kept: the imported rules
                    # are collected through the shared matcher and
                    # page_rules.
                    CSS(
                        url=url, url_fetcher=url_fetcher,
                        media_type=device_media_type, font_config=font_config,
                        matcher=matcher, page_rules=page_rules)
                except URLFetchingError as exc:
                    LOGGER.error(
                        'Failed to load stylesheet at %s : %s', url, exc)

        elif rule.type == 'at-rule' and rule.lower_at_keyword == 'media':
            media = media_queries.parse_media_query(rule.prelude)
            if media is None:
                LOGGER.warning('Invalid media type "%s", '
                               'the whole @media rule was ignored at %s:%s.',
                               tinycss2.serialize(rule.prelude),
                               rule.source_line, rule.source_column)
                continue
            ignore_imports = True
            if not media_queries.evaluate_media_query(
                    media, device_media_type):
                continue
            content_rules = tinycss2.parse_rule_list(rule.content)
            # @import rules nested in @media are always rejected.
            preprocess_stylesheet(
                device_media_type, base_url, content_rules, url_fetcher,
                matcher, page_rules, fonts, font_config, ignore_imports=True)

        elif rule.type == 'at-rule' and rule.lower_at_keyword == 'page':
            data = parse_page_selectors(rule)

            if data is None:
                LOGGER.warning(
                    'Unsupported @page selector "%s", '
                    'the whole @page rule was ignored at %s:%s.',
                    tinycss2.serialize(rule.prelude),
                    rule.source_line, rule.source_column)
                continue

            ignore_imports = True
            for page_type in data:
                # 'specificity' is not a PageType field, take it out first.
                specificity = page_type.pop('specificity')
                page_type = PageType(**page_type)
                # Use a double lambda to have a closure that holds page_types
                match = (lambda page_type: lambda page_names: list(
                    matching_page_types(page_type, names=page_names)))(
                        page_type)
                content = tinycss2.parse_declaration_list(rule.content)
                declarations = list(preprocess_declarations(base_url, content))

                if declarations:
                    selector_list = [(specificity, None, match)]
                    page_rules.append((rule, selector_list, declarations))

                # At-rules nested in @page (with a content block) are stored
                # with their '@keyword' as pseudo type.
                for margin_rule in content:
                    if margin_rule.type != 'at-rule' or (
                            margin_rule.content is None):
                        continue
                    declarations = list(preprocess_declarations(
                        base_url,
                        tinycss2.parse_declaration_list(margin_rule.content)))
                    if declarations:
                        selector_list = [(
                            specificity, '@' + margin_rule.lower_at_keyword,
                            match)]
                        page_rules.append(
                            (margin_rule, selector_list, declarations))

        elif rule.type == 'at-rule' and rule.lower_at_keyword == 'font-face':
            ignore_imports = True
            content = tinycss2.parse_declaration_list(rule.content)
            rule_descriptors = dict(preprocess_descriptors(base_url, content))
            # Both descriptors are required, report the first missing one.
            for key in ('src', 'font_family'):
                if key not in rule_descriptors:
                    LOGGER.warning(
                        "Missing %s descriptor in '@font-face' rule at %s:%s",
                        key.replace('_', '-'),
                        rule.source_line, rule.source_column)
                    break
            else:
                if font_config is not None:
                    font_filename = font_config.add_font_face(
                        rule_descriptors, url_fetcher)
                    if font_filename:
                        fonts.append(font_filename)


def get_all_computed_styles(html, user_stylesheets=None,
                            presentational_hints=False, font_config=None,
                            page_rules=None, target_collector=None):
    """Compute the styles of every element of the ``html`` document.

    Gather the user agent stylesheets, the presentational hints stylesheets
    (only when ``presentational_hints`` is true), the author stylesheets
    found in the document and the given ``user_stylesheets``, then hand them
    over to :class:`StyleFor`.

    Return the ``StyleFor`` object, used as a ``style_for`` function taking
    an element and an optional pseudo-element type.

    """
    # Entries are (stylesheet, origin, specificity) tuples. The order of the
    # entries is not important, their origin is. Presentational hints are
    # the only sheets given an explicit specificity.
    sheets = [
        (ua_sheet, 'user agent', None)
        for ua_sheet in html._ua_stylesheets() or ()]

    if presentational_hints:
        sheets.extend(
            (hints_sheet, 'author', (0, 0, 0))
            for hints_sheet in html._ph_stylesheets() or ())

    author_sheets = find_stylesheets(
        html.wrapper_element, html.media_type, html.url_fetcher,
        html.base_url, font_config, page_rules)
    sheets.extend(
        (author_sheet, 'author', None) for author_sheet in author_sheets)

    sheets.extend(
        (user_sheet, 'user', None) for user_sheet in user_stylesheets or ())

    return StyleFor(html, sheets, presentational_hints, target_collector)
-												Switch the licence to BSD and rewrite module docstrings/headers

											
										
										
											2012-03-22 02:19:27 +04:00
+								"""
 								    weasyprint.css
 								    --------------
-												Add links to the website and an AGPL licence.

											
										
										
											2011-04-28 21:15:30 +04:00
-												Switch the licence to BSD and rewrite module docstrings/headers

											
										
										
											2012-03-22 02:19:27 +04:00
+								    This module takes care of steps 3 and 4 of “CSS 2.1 processing model”:
 								    Retrieve stylesheets associated with a document and annotate every element
 								    with a value for every CSS property.
-												Add links to the website and an AGPL licence.

											
										
										
											2011-04-28 21:15:30 +04:00
-												Switch the licence to BSD and rewrite module docstrings/headers

											
										
										
											2012-03-22 02:19:27 +04:00
+								    http://www.w3.org/TR/CSS21/intro.html#processing-model
 								    This module does this in more than two steps. The
-												Remove out-dated parts of the weasyprint.css docstring.

											
										
										
											2012-10-09 19:10:45 +04:00
+								    :func:`get_all_computed_styles` function does everything, but it is itsef
 								    based on other functions in this module.
-												Switch the licence to BSD and rewrite module docstrings/headers

											
										
										
											2012-03-22 02:19:27 +04:00
-												Update copyright

											
										
										
											2019-03-04 13:04:06 +03:00
+								    :copyright: Copyright 2011-2019 Simon Sapin and contributors, see AUTHORS.
-												Switch the licence to BSD and rewrite module docstrings/headers

											
										
										
											2012-03-22 02:19:27 +04:00
+								    :license: BSD, see LICENSE for details.
-												Clean weasy/css/__init__

											
										
										
											2011-08-22 20:33:54 +04:00
-												Annotate DOM elements with a value for every property. Needs more tests.

											
										
										
											2011-05-04 13:47:04 +04:00
+								"""
-												Add support for pseudo-elements.

											
										
										
											2011-05-12 18:06:47 +04:00
-												Set the page styles lazily

											
										
										
											2017-07-18 00:40:59 +03:00
+								from collections import namedtuple
-												Add a --debug option and set debug level for prefixed CSS properties

											
										
										
											2019-01-04 03:22:49 +03:00
+								from logging import DEBUG, WARNING
-												Log ignored rule-set on invalid selectors.

											
										
										
											2011-08-16 01:22:16 +04:00
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								import cssselect2
-												Switch to tinycss2

											
										
										
											2017-03-26 12:42:50 +03:00
+								import tinycss2
-												Find stylesheets in an HTML document.

											
										
										
											2011-04-26 20:07:19 +04:00
-												Please isort again

											
										
										
											2019-03-10 21:34:16 +03:00
+								from .. import CSS
 								from ..logger import LOGGER, PROGRESS_LOGGER
 								from ..urls import URLFetchingError, get_url_attribute, url_join
-												Merge branch 'master' into media-queries

											
										
										
											2019-04-01 15:41:51 +03:00
+								from . import computed_values, media_queries
-												Fix imports for isort

											
										
										
											2019-03-01 13:38:03 +03:00
+								from .properties import INHERITED, INITIAL_NOT_COMPUTED, INITIAL_VALUES
-												Put media queries in a separate module, create a class for style_for

											
										
										
											2018-08-17 11:30:51 +03:00
+								from .utils import remove_whitespace
-												Split validation module

											
										
										
											2018-03-31 23:13:08 +03:00
+								from .validation import preprocess_declarations
 								from .validation.descriptors import preprocess_descriptors
-												Add support for pseudo-elements.

											
										
										
											2011-05-12 18:06:47 +04:00
-												Use the new cssselect.

											
										
										
											2012-04-25 21:05:42 +04:00
+								# Reject anything not in here:
 								PSEUDO_ELEMENTS = (None, 'before', 'after', 'first-line', 'first-letter')
-												Rename the weasy.css.utils module to weasy.css.values

											
										
										
											2011-08-15 15:03:09 +04:00
-												Add a stupid and broken support of nth page selector

											
										
										
											2019-04-01 19:45:59 +03:00
+								PageType = namedtuple('PageType', ['side', 'blank', 'first', 'index', 'name'])
-												Set the page styles lazily

											
										
										
											2017-07-18 00:40:59 +03:00
-												Put media queries in a separate module, create a class for style_for

											
										
										
											2018-08-17 11:30:51 +03:00
+								class StyleFor:
 								    """Convenience function to get the computed styles for an element."""
 								    def __init__(self, html, sheets, presentational_hints, target_collector):
 								        # keys: (element, pseudo_element_type)
 								        #    element: an ElementTree Element or the '@page' string
 								        #    pseudo_element_type: a string such as 'first' (for @page) or
 								        #        'after', or None for normal elements
 								        # values: dicts of
 								        #     keys: property name as a string
 								        #     values: (values, weight)
 								        #         values: a PropertyValue-like object
 								        #         weight: values with a greater weight take precedence, see
 								        #             http://www.w3.org/TR/CSS21/cascade.html#cascading-order
 								        self._cascaded_styles = cascaded_styles = {}
 								        # keys: (element, pseudo_element_type), like cascaded_styles
 								        # values: style dict objects:
 								        #     keys: property name as a string
 								        #     values: a PropertyValue-like object
 								        self._computed_styles = computed_styles = {}
-												Merge branch 'master' into media-queries

											
										
										
											2019-01-24 20:36:53 +03:00
+								        PROGRESS_LOGGER.info('Step 3 - Applying CSS')
-												Put media queries in a separate module, create a class for style_for

											
										
										
											2018-08-17 11:30:51 +03:00
+								        for specificity, attributes in find_style_attributes(
 								                html.etree_element, presentational_hints, html.base_url):
 								            element, declarations, base_url = attributes
 								            for name, values, importance in preprocess_declarations(
 								                    base_url, declarations):
 								                precedence = declaration_precedence('author', importance)
 								                weight = (precedence, specificity)
 								                add_declaration(cascaded_styles, name, values, weight, element)
 								        # First, add declarations and set computed styles for "real" elements
 								        # *in tree order*. Tree order is important so that parents have
 								        # computed styles before their children, for inheritance.
 								        # Iterate on all elements, even if there is no cascaded style for them.
 								        for element in html.wrapper_element.iter_subtree():
 								            for sheet, origin, sheet_specificity in sheets:
 								                # Add declarations for matched elements
 								                for selector in sheet.matcher.match(element):
 								                    specificity, order, pseudo_type, declarations = selector
 								                    specificity = sheet_specificity or specificity
 								                    for name, values, importance in declarations:
 								                        precedence = declaration_precedence(origin, importance)
 								                        weight = (precedence, specificity)
 								                        add_declaration(
 								                            cascaded_styles, name, values, weight,
 								                            element.etree_element, pseudo_type)
 								            parent = element.parent.etree_element if element.parent else None
-												Set set_computed_styles as a StyleFor method

											
										
										
											2019-04-01 16:24:18 +03:00
+								            self.set_computed_styles(
 								                element.etree_element, root=html.etree_element, parent=parent,
 								                base_url=html.base_url, target_collector=target_collector)
-												Put media queries in a separate module, create a class for style_for

											
										
										
											2018-08-17 11:30:51 +03:00
 								        page_names = {style['page'] for style in computed_styles.values()}
 								        for sheet, origin, sheet_specificity in sheets:
 								            # Add declarations for page elements
 								            for _rule, selector_list, declarations in sheet.page_rules:
 								                for selector in selector_list:
 								                    specificity, pseudo_type, match = selector
 								                    specificity = sheet_specificity or specificity
 								                    for page_type in match(page_names):
 								                        for name, values, importance in declarations:
 								                            precedence = declaration_precedence(
 								                                origin, importance)
 								                            weight = (precedence, specificity)
 								                            add_declaration(
 								                                cascaded_styles, name, values, weight,
 								                                page_type, pseudo_type)
 								        # Then computed styles for pseudo elements, in any order.
 								        # Pseudo-elements inherit from their associated element so they come
 								        # last. Do them in a second pass as there is no easy way to iterate
 								        # on the pseudo-elements for a given element with the current structure
 								        # of cascaded_styles. (Keys are (element, pseudo_type) tuples.)
 								        # Only iterate on pseudo-elements that have cascaded styles. (Others
 								        # might as well not exist.)
 								        for element, pseudo_type in cascaded_styles:
 								            if pseudo_type and not isinstance(element, PageType):
-												Set set_computed_styles as a StyleFor method

											
										
										
											2019-04-01 16:24:18 +03:00
+								                self.set_computed_styles(
 								                    element, pseudo_type=pseudo_type,
-												Put media queries in a separate module, create a class for style_for

											
										
										
											2018-08-17 11:30:51 +03:00
+								                    # The pseudo-element inherits from the element.
 								                    root=html.etree_element, parent=element,
 								                    base_url=html.base_url, target_collector=target_collector)
 								    def __call__(self, element, pseudo_type=None):
 								        style = self._computed_styles.get((element, pseudo_type))
 								        if style:
 								            if 'table' in style['display']:
 								                if (style['display'] in ('table', 'inline-table') and
 								                        style['border_collapse'] == 'collapse'):
 								                    # Padding do not apply
 								                    for side in ['top', 'bottom', 'left', 'right']:
 								                        style['padding_' + side] = computed_values.ZERO_PIXELS
 								                if (style['display'].startswith('table-') and
 								                        style['display'] != 'table-caption'):
 								                    # Margins do not apply
 								                    for side in ['top', 'bottom', 'left', 'right']:
 								                        style['margin_' + side] = computed_values.ZERO_PIXELS
 								        return style
-												Set set_computed_styles as a StyleFor method

											
										
										
											2019-04-01 16:24:18 +03:00
+								    def set_computed_styles(self, element, parent, root=None, pseudo_type=None,
 								                            base_url=None, target_collector=None):
 								        """Set the computed values of styles to ``element``.
 								        Take the properties left by ``apply_style_rule`` on an element or
 								        pseudo-element and assign computed values with respect to the cascade,
 								        declaration priority (ie. ``!important``) and selector specificity.
 								        """
 								        cascaded_styles = self.get_cascaded_styles()
 								        computed_styles = self.get_computed_styles()
 								        if element == root and pseudo_type is None:
 								            assert parent is None
 								            parent_style = None
 								            root_style = {
 								                # When specified on the font-size property of the root element,
 								                # the rem units refer to the property’s initial value.
 								                'font_size': INITIAL_VALUES['font_size'],
 								            }
 								        else:
 								            assert parent is not None
 								            parent_style = computed_styles[parent, None]
 								            root_style = computed_styles[root, None]
 								        cascaded = cascaded_styles.get((element, pseudo_type), {})
 								        computed_styles[element, pseudo_type] = computed_from_cascaded(
 								            element, cascaded, parent_style, pseudo_type, root_style, base_url,
 								            target_collector)
-												Put media queries in a separate module, create a class for style_for

											
										
										
											2018-08-17 11:30:51 +03:00
+								    def get_cascaded_styles(self):
 								        return self._cascaded_styles
 								    def get_computed_styles(self):
 								        return self._computed_styles
-												Add PDF metadata parsed from HTML. Fix #77.

<title> → /Title
<meta name=author> → /Author
<meta name=description> → /Subject
<meta name=keywords> → /Keywords
<meta name=generator> → /Creator
<meta name=dcterms.created> → /CreationDate
<meta name=dcterms.modified> → /ModDate
"WeasyPrint vX.Y" → /Producer

											
										
										
											2013-07-14 15:08:02 +04:00
+								def get_child_text(element):
 								    """Return the text directly in the element, not descendants."""
 								    content = [element.text] if element.text else []
 								    for child in element:
 								        if child.tail:
 								            content.append(child.tail)
 								    return ''.join(content)
-												Don't store base_url in ElementWrappers

											
										
										
											2017-07-07 12:14:07 +03:00
+								def find_stylesheets(wrapper_element, device_media_type, url_fetcher, base_url,
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                     font_config, page_rules):
-												Kill Document in css/__init__.py

											
										
										
											2012-07-12 17:21:37 +04:00
+								    """Yield the stylesheets in ``element_tree``.
-												Clean weasy/css/__init__

											
										
										
											2011-08-22 20:33:54 +04:00
-												Kill Document in css/__init__.py

											
										
										
											2012-07-12 17:21:37 +04:00
+								    The output order is the same as the source order.
-												Clean weasy/css/__init__

											
										
										
											2011-08-22 20:33:54 +04:00
-												Find stylesheets in an HTML document.

											
										
										
											2011-04-26 20:07:19 +04:00
+								    """
-												Fix parsing of <link rel>

											
										
										
											2014-04-22 04:34:47 +04:00
+								    from ..html import element_has_link_type  # Work around circular imports.
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								    for wrapper in wrapper_element.query_all('style', 'link'):
 								        element = wrapper.etree_element
-												Tests n’ fixes. Lots of them.

											
										
										
											2012-04-02 16:45:44 +04:00
+								        mime_type = element.get('type', 'text/css').split(';', 1)[0].strip()
-												Inline a function that was as long as its name and used only once.

											
										
										
											2011-05-10 17:09:55 +04:00
+								        # Only keep 'type/subtype' from 'type/subtype ; param1; param2'.
-												Tests n’ fixes. Lots of them.

											
										
										
											2012-04-02 16:45:44 +04:00
+								        if mime_type != 'text/css':
-												Find stylesheets in tree order.

											
										
										
											2011-05-10 13:41:23 +04:00
+								            continue
-												Switch from cssutils to tinycss as the CSS parser

											
										
										
											2012-03-24 16:39:31 +04:00
+								        media_attr = element.get('media', '').strip() or 'all'
 								        media = [media_type.strip() for media_type in media_attr.split(',')]
-												Put media queries in a separate module, create a class for style_for

											
										
										
											2018-08-17 11:30:51 +03:00
+								        if not media_queries.evaluate_media_query(media, device_media_type):
-												Tests n’ fixes. Lots of them.

											
										
										
											2012-04-02 16:45:44 +04:00
+								            continue
-												Find stylesheets in tree order.

											
										
										
											2011-05-10 13:41:23 +04:00
+								        if element.tag == 'style':
 								            # Content is text that is directly in the <style> element, not its
 								            # descendants
-												Add PDF metadata parsed from HTML. Fix #77.

<title> → /Title
<meta name=author> → /Author
<meta name=description> → /Subject
<meta name=keywords> → /Keywords
<meta name=generator> → /Creator
<meta name=dcterms.created> → /CreationDate
<meta name=dcterms.modified> → /ModDate
"WeasyPrint vX.Y" → /Producer

											
										
										
											2013-07-14 15:08:02 +04:00
+								            content = get_child_text(element)
-												Get rid of lxml

											
										
										
											2017-06-30 23:48:47 +03:00
+								            # ElementTree should give us either unicode or ASCII-only
 								            # bytestrings, so we don't need `encoding` here.
-												Clean the font config after rendering the document

											
										
										
											2016-10-27 12:41:34 +03:00
+								            css = CSS(
-												Don't store base_url in ElementWrappers

											
										
										
											2017-07-07 12:14:07 +03:00
+								                string=content, base_url=base_url,
-												Clean the font config after rendering the document

											
										
										
											2016-10-27 12:41:34 +03:00
+								                url_fetcher=url_fetcher, media_type=device_media_type,
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								                font_config=font_config, page_rules=page_rules)
-												Switch from cssutils to tinycss as the CSS parser

											
										
										
											2012-03-24 16:39:31 +04:00
+								            yield css
-												Tests n’ fixes. Lots of them.

											
										
										
											2012-04-02 16:45:44 +04:00
+								        elif element.tag == 'link' and element.get('href'):
-												Fix parsing of <link rel>

											
										
										
											2014-04-22 04:34:47 +04:00
+								            if not element_has_link_type(element, 'stylesheet') or \
 								                    element_has_link_type(element, 'alternate'):
-												Do not apply alternate stylesheets.

											
										
										
											2011-11-08 20:31:32 +04:00
+								                continue
-												Don't store base_url in ElementWrappers

											
										
										
											2017-07-07 12:14:07 +03:00
+								            href = get_url_attribute(element, 'href', base_url)
-												Fix relative stylesheet URL without a base URL.

Previously we passed url=None to CSS which failed with
a "zero source" exception.

											
										
										
											2012-07-17 17:23:58 +04:00
+								            if href is not None:
-												Fix #84: Mak loading an author stylesheet not fatal.

											
										
										
											2013-06-21 01:07:52 +04:00
+								                try:
-												Clean the font config after rendering the document

											
										
										
											2016-10-27 12:41:34 +03:00
+								                    yield CSS(
 								                        url=href, url_fetcher=url_fetcher,
 								                        _check_mime_type=True, media_type=device_media_type,
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								                        font_config=font_config, page_rules=page_rules)
-												Fix #84: Mak loading an author stylesheet not fatal.

											
										
										
											2013-06-21 01:07:52 +04:00
+								                except URLFetchingError as exc:
-												Clean and document the logging levels

Related to #488.

											
										
										
											2017-07-25 14:59:56 +03:00
+								                    LOGGER.error(
 								                        'Failed to load stylesheet at %s : %s', href, exc)
-												Resolve @import and @media rules.

											
										
										
											2011-04-27 19:50:12 +04:00
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								def find_style_attributes(tree, presentational_hints=False, base_url=None):
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								    """Yield ``specificity, (element, declaration, base_url)`` rules.
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								    Rules from "style" attribute are returned with specificity
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								    ``(1, 0, 0)``.
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
 								    If ``presentational_hints`` is ``True``, rules from presentational hints
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								    are returned with specificity ``(0, 0, 0)``.
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
 								    """
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								    def check_style_attribute(element, style_attribute):
 								        declarations = tinycss2.parse_declaration_list(style_attribute)
 								        return element, declarations, base_url
 								    for element in tree.iter():
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								        specificity = (1, 0, 0)
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								        style_attribute = element.get('style')
 								        if style_attribute:
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								            yield specificity, check_style_attribute(element, style_attribute)
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								        if not presentational_hints:
 								            continue
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								        specificity = (0, 0, 0)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								        if element.tag == 'body':
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+								            # TODO: we should check the container frame element
 								            for part, position in (
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                    ('height', 'top'), ('height', 'bottom'),
 								                    ('width', 'left'), ('width', 'right')):
 								                style_attribute = None
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+								                for prop in ('margin%s' % part, '%smargin' % position):
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                    if element.get(prop):
 								                        style_attribute = 'margin-%s:%spx' % (
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+								                            position, element.get(prop))
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                        break
 								                if style_attribute:
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                    yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                        element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('background'):
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+								                style_attribute = 'background-image:url(%s)' % (
-												Flake8 forever <3 <3

											
										
										
											2016-08-29 18:59:28 +03:00
+								                    element.get('background'))
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('bgcolor'):
-												Flake8 forever <3 <3

											
										
										
											2016-08-29 18:59:28 +03:00
+								                style_attribute = 'background-color:%s' % (
 								                    element.get('bgcolor'))
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('text'):
 								                style_attribute = 'color:%s' % element.get('text')
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+								            # TODO: we should support link, vlink, alink
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								        elif element.tag == 'center':
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								            yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                element, 'text-align:center')
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								        elif element.tag == 'div':
 								            align = element.get('align', '').lower()
 								            if align == 'middle':
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, 'text-align:center')
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            elif align in ('center', 'left', 'right', 'justify'):
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, 'text-align:%s' % align)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								        elif element.tag == 'font':
 								            if element.get('color'):
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, 'color:%s' % element.get('color'))
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('face'):
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, 'font-family:%s' % element.get('face'))
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('size'):
 								                size = element.get('size').strip()
 								                relative_plus = size.startswith('+')
 								                relative_minus = size.startswith('-')
 								                if relative_plus or relative_minus:
 								                    size = size[1:].strip()
 								                try:
 								                    size = int(size)
 								                except ValueError:
-												Let the logging module do the string interpolation

											
										
										
											2017-03-28 10:32:50 +03:00
+								                    LOGGER.warning('Invalid value for size: %s', size)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                else:
 								                    font_sizes = {
 : 'x-small',
 : 'small',
 : 'medium',
 : 'large',
 : 'x-large',
 : 'xx-large',
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+: '48px',  # 1.5 * xx-large
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                    }
 								                    if relative_plus:
 								                        size += 3
 								                    elif relative_minus:
 								                        size -= 3
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+								                    size = max(1, min(7, size))
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                    yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                        element, 'font-size:%s' % font_sizes[size])
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								        elif element.tag == 'table':
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+								            # TODO: we should support cellpadding
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('cellspacing'):
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element,
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                    'border-spacing:%spx' % element.get('cellspacing'))
-												Support simple table[cellpadding]

											
										
										
											2016-11-17 03:06:10 +03:00
+								            if element.get('cellpadding'):
 								                cellpadding = element.get('cellpadding')
 								                if cellpadding.isdigit():
 								                    cellpadding += 'px'
 								                # TODO: don't match subtables cells
 								                for subelement in element.iter():
 								                    if subelement.tag in ('td', 'th'):
 								                        yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                            subelement,
-												Support simple table[cellpadding]

											
										
										
											2016-11-17 03:06:10 +03:00
+								                            'padding-left:%s;padding-right:%s;'
 								                            'padding-top:%s;padding-bottom:%s;' % (
 * (cellpadding,)))
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('hspace'):
 								                hspace = element.get('hspace')
 								                if hspace.isdigit():
 								                    hspace += 'px'
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element,
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                    'margin-left:%s;margin-right:%s' % (hspace, hspace))
 								            if element.get('vspace'):
 								                vspace = element.get('vspace')
 								                if vspace.isdigit():
 								                    vspace += 'px'
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element,
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                    'margin-top:%s;margin-bottom:%s' % (vspace, vspace))
 								            if element.get('width'):
 								                style_attribute = 'width:%s' % element.get('width')
 								                if element.get('width').isdigit():
 								                    style_attribute += 'px'
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('height'):
 								                style_attribute = 'height:%s' % element.get('height')
 								                if element.get('height').isdigit():
 								                    style_attribute += 'px'
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('background'):
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+								                style_attribute = 'background-image:url(%s)' % (
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                    element.get('background'))
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('bgcolor'):
 								                style_attribute = 'background-color:%s' % (
 								                    element.get('bgcolor'))
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('bordercolor'):
 								                style_attribute = 'border-color:%s' % (
 								                    element.get('bordercolor'))
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('border'):
 								                style_attribute = 'border-width:%spx' % (
 								                    element.get('border'))
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								        elif element.tag in ('tr', 'td', 'th', 'thead', 'tbody', 'tfoot'):
 								            align = element.get('align', '').lower()
-												Handle middle and center values of align presentational hint

Fix #694.

											
										
										
											2018-09-20 16:29:27 +03:00
+								            # TODO: we should align descendants too
 								            if align == 'middle':
 								                yield specificity, check_style_attribute(
 								                    element, 'text-align:center')
 								            elif align in ('center', 'left', 'right', 'justify'):
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, 'text-align:%s' % align)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('background'):
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+								                style_attribute = 'background-image:url(%s)' % (
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                    element.get('background'))
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('bgcolor'):
 								                style_attribute = 'background-color:%s' % (
 								                    element.get('bgcolor'))
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Use a stylesheet for some presentational hints

											
										
										
											2016-08-31 23:33:26 +03:00
+								            if element.tag in ('tr', 'td', 'th'):
 								                if element.get('height'):
 								                    style_attribute = 'height:%s' % element.get('height')
 								                    if element.get('height').isdigit():
 								                        style_attribute += 'px'
 								                    yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                        element, style_attribute)
-												Use a stylesheet for some presentational hints

											
										
										
											2016-08-31 23:33:26 +03:00
+								                if element.tag in ('td', 'th'):
 								                    if element.get('width'):
 								                        style_attribute = 'width:%s' % element.get('width')
 								                        if element.get('width').isdigit():
 								                            style_attribute += 'px'
 								                        yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                            element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								        elif element.tag == 'caption':
 								            align = element.get('align', '').lower()
-												Use a stylesheet for some presentational hints

											
										
										
											2016-08-31 23:33:26 +03:00
+								            # TODO: we should align descendants too
-												Handle middle and center values of align presentational hint

Fix #694.

											
										
										
											2018-09-20 16:29:27 +03:00
+								            if align == 'middle':
 								                yield specificity, check_style_attribute(
 								                    element, 'text-align:center')
 								            elif align in ('center', 'left', 'right', 'justify'):
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, 'text-align:%s' % align)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								        elif element.tag == 'col':
 								            if element.get('width'):
 								                style_attribute = 'width:%s' % element.get('width')
 								                if element.get('width').isdigit():
 								                    style_attribute += 'px'
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								        elif element.tag == 'hr':
 								            size = 0
 								            if element.get('size'):
 								                try:
 								                    size = int(element.get('size'))
 								                except ValueError:
-												Let the logging module do the string interpolation

											
										
										
											2017-03-28 10:32:50 +03:00
+								                    LOGGER.warning('Invalid value for size: %s', size)
-												Test presentational hints

											
										
										
											2016-09-01 03:11:33 +03:00
+								            if (element.get('color'), element.get('noshade')) != (None, None):
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                if size >= 1:
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                    yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                        element, 'border-width:%spx' % (size / 2))
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            elif size == 1:
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, 'border-bottom-width:0')
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            elif size > 1:
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, 'height:%spx' % (size - 2))
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('width'):
 								                style_attribute = 'width:%s' % element.get('width')
 								                if element.get('width').isdigit():
 								                    style_attribute += 'px'
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								            if element.get('color'):
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element, 'color:%s' % element.get('color'))
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								        elif element.tag in (
 								                'iframe', 'applet', 'embed', 'img', 'input', 'object'):
 								            if (element.tag != 'input' or
 								                    element.get('type', '').lower() == 'image'):
 								                align = element.get('align', '').lower()
-												Use a stylesheet for some presentational hints

											
										
										
											2016-08-31 23:33:26 +03:00
+								                if align in ('middle', 'center'):
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                    # TODO: middle and center values are wrong
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                    yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                        element, 'vertical-align:middle')
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                if element.get('hspace'):
 								                    hspace = element.get('hspace')
 								                    if hspace.isdigit():
 								                        hspace += 'px'
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                    yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                        element,
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                        'margin-left:%s;margin-right:%s' % (hspace, hspace))
 								                if element.get('vspace'):
 								                    vspace = element.get('vspace')
 								                    if vspace.isdigit():
 								                        vspace += 'px'
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                    yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                        element,
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                        'margin-top:%s;margin-bottom:%s' % (vspace, vspace))
 								                # TODO: img seems to be excluded for width and height, but a
 								                # lot of W3C tests rely on this attribute being applied to img
 								                if element.get('width'):
 								                    style_attribute = 'width:%s' % element.get('width')
 								                    if element.get('width').isdigit():
 								                        style_attribute += 'px'
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                    yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                        element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                if element.get('height'):
 								                    style_attribute = 'height:%s' % element.get('height')
 								                    if element.get('height').isdigit():
 								                        style_attribute += 'px'
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                    yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                        element, style_attribute)
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                if element.tag in ('img', 'object', 'input'):
 								                    if element.get('border'):
-												Add an option to follow presentational hints

											
										
										
											2016-08-30 20:10:53 +03:00
+								                        yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                            element,
-												Support presentational hints

											
										
										
											2016-08-29 18:50:07 +03:00
+								                            'border-width:%spx;border-style:solid' %
 								                            element.get('border'))
-												Support ol[start] and ul[value]

											
										
										
											2016-11-17 02:37:03 +03:00
+								        elif element.tag == 'ol':
 								            # From https://www.w3.org/TR/css-lists-3/
 								            if element.get('start'):
 								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element,
-												Support ol[start] and ul[value]

											
										
										
											2016-11-17 02:37:03 +03:00
+								                    'counter-reset:list-item %s;'
 								                    'counter-increment:list-item -1' % element.get('start'))
 								        elif element.tag == 'ul':
 								            # From https://www.w3.org/TR/css-lists-3/
 								            if element.get('value'):
 								                yield specificity, check_style_attribute(
-												Use ElementTree's elements as much as possible

											
										
										
											2017-07-03 16:19:05 +03:00
+								                    element,
-												Support ol[start] and ul[value]

											
										
										
											2016-11-17 02:37:03 +03:00
+								                    'counter-reset:list-item %s;'
 								                    'counter-increment:none' % element.get('value'))
-												Sanity check: assert that dimension values are numeric.

											
										
										
											2011-06-29 13:07:48 +04:00
-												Annotate DOM elements with a value for every property. Needs more tests.

											
										
										
											2011-05-04 13:47:04 +04:00
-												Make named pages inherit from anonymous page style

											
										
										
											2017-08-07 13:21:17 +03:00
def matching_page_types(page_type, names=()):
    """Yield every ``PageType`` covered by the given ``page_type``.

    Unset fields of ``page_type`` are expanded to all their possible values:

    - a ``None`` side gives ``'left'``, ``'right'`` and ``None``,
    - a ``False`` blank or first flag gives both ``True`` and ``False``,
    - a ``None`` index gives the indexes from 0 to 99,
    - an empty name gives all the given ``names`` followed by ``''``.

    Combinations whose ``first`` flag and ``index`` disagree (``first`` set
    with a non-zero index, or ``first`` unset with index 0) are skipped.

    """
    if page_type.side is None:
        side_choices = ['left', 'right', None]
    else:
        side_choices = [page_type.side]

    both = (True, False)
    blank_choices = both if page_type.blank is False else (True,)
    first_choices = both if page_type.first is False else (True,)

    if page_type.index is None:
        index_choices = list(range(100))
    else:
        index_choices = (page_type.index,)

    if page_type.name == '':
        name_choices = tuple(names) + ('',)
    else:
        name_choices = (page_type.name,)

    for side in side_choices:
        for blank in blank_choices:
            for first in first_choices:
                for index in index_choices:
                    # ``first`` has to be set exactly when the index is 0.
                    if bool(first) == bool(index):
                        continue
                    for name in name_choices:
                        yield PageType(side, blank, first, index, name)
-												Use a custom object instead of constants for page pseudo-classes

This is a first step to lazily get the page styles and support named pages.

											
										
										
											2017-07-17 23:48:21 +03:00
-												Change weasy.css architecture to avoid rewriting stylesheets.

											
										
										
											2011-07-21 14:31:08 +04:00
def declaration_precedence(origin, importance):
    """Return the cascading precedence of a declaration.

    The returned integers only make sense when compared to each other, from
    lowest to highest: user agent (1), normal user (2), normal author (3),
    important author (4) and important user (5).

    ``origin`` must be one of the strings ``'author'``, ``'user'`` and
    ``'user agent'``. ``importance`` is only tested for truthiness.

    """
    # See http://www.w3.org/TR/CSS21/cascade.html#cascading-order
    if origin == 'user agent':
        # Same precedence whatever the importance is.
        return 1
    if origin == 'author':
        return 4 if importance else 3
    if not importance and origin == 'user':
        return 2
    # Only important user declarations are left at this point.
    assert origin == 'user'
    return 5
-												Add support for pseudo-elements.

											
										
										
											2011-05-12 18:06:47 +04:00
-												Annotate DOM elements with a value for every property. Needs more tests.

											
										
										
											2011-05-04 13:47:04 +04:00
-												Have the document set its own attributes.

											
										
										
											2011-07-21 15:47:42 +04:00
def add_declaration(cascaded_styles, prop_name, prop_values, weight, element,
                    pseudo_type=None):
    """Store a property value for an element in ``cascaded_styles``.

    ``cascaded_styles`` maps ``(element, pseudo_type)`` keys to dicts of
    ``prop_name: (prop_values, weight)`` items. The dict of the element is
    created when missing. The given value replaces the stored one unless the
    stored one has a strictly greater weight.

    """
    key = (element, pseudo_type)
    if key not in cascaded_styles:
        cascaded_styles[key] = {}
    declarations = cascaded_styles[key]

    if prop_name in declarations:
        _stored_values, stored_weight = declarations[prop_name]
    else:
        stored_weight = None

    if stored_weight is None or stored_weight <= weight:
        declarations[prop_name] = (prop_values, weight)
-												Put styles in a single Document object instead of each lxml element.

											
										
										
											2011-07-20 20:23:54 +04:00
-												Add 'rem' support

This feature is kindly provided to you by Florian Demmer!

											
										
										
											2016-02-12 01:02:53 +03:00
def computed_from_cascaded(element, cascaded, parent_style, pseudo_type=None,
                           root_style=None, base_url=None,
                           target_collector=None):
    """Build the computed style dict from cascaded and parent styles.

    ``cascaded`` maps property names to ``(value, precedence)`` pairs and
    ``parent_style`` is the already computed style of the parent, or ``None``
    on the root element. Properties missing from ``cascaded`` are inherited
    when listed in ``INHERITED``, and take their initial value otherwise.

    """
    if not cascaded and parent_style is not None:
        # Fast path for anonymous boxes: nothing is cascaded, so all the
        # values are either initial or taken from the parent.
        computed = dict(INITIAL_VALUES)
        computed.update((name, parent_style[name]) for name in INHERITED)
        # page is not inherited but taken from the ancestor if 'auto'
        computed['page'] = parent_style['page']
        # border-*-style is none, so border-width computes to zero.
        # border-*-color would need computing too, but it does not apply.
        computed.update(
            ('border_%s_width' % side, 0)
            for side in ('top', 'bottom', 'left', 'right'))
        computed['outline_width'] = 0
        return computed

    # Handle inheritance and initial values
    is_root = parent_style is None
    specified = {}
    computed = {}
    for name, initial in INITIAL_VALUES.items():
        if name in cascaded:
            value, _precedence = cascaded[name]
            keyword = value
        elif name in INHERITED:
            keyword = 'inherit'
        else:
            keyword = 'initial'

        if is_root and keyword == 'inherit':
            # On the root element, 'inherit' from initial values
            keyword = 'initial'

        if keyword == 'inherit':
            # Values in parent_style are already computed.
            value = computed[name] = parent_style[name]
        elif keyword == 'initial':
            value = initial
            if name not in INITIAL_NOT_COMPUTED:
                # The value is the same as when computed
                computed[name] = initial

        specified[name] = value

    if specified['page'] == 'auto':
        # The page property does not inherit. However, if the page value on
        # an element is auto, then its used value is the value specified on
        # its nearest ancestor with a non-auto value. When specified on the
        # root element, the used value for auto is the empty string.
        page = '' if is_root else parent_style['page']
        specified['page'] = page
        computed['page'] = page

    return computed_values.compute(
        element, pseudo_type, specified, computed, parent_style, root_style,
        base_url, target_collector)
-												Sanity check: assert that dimension values are numeric.

											
										
										
											2011-06-29 13:07:48 +04:00
-												Add support for pseudo-elements.

											
										
										
											2011-05-12 18:06:47 +04:00
-												Handle @page rule grammar correctly

Fix #562.

											
										
										
											2018-01-29 00:17:26 +03:00
def parse_page_selectors(rule):
    """Parse a page selector rule.

    Return a list of page data if the rule is correctly parsed. Page data are a
    dict containing:

    - 'side' ('left', 'right' or None),
    - 'blank' (True or False),
    - 'first' (True or False),
    - 'index' (zero-based page index given by ``:nth()``, or None),
    - 'name' (page name string or empty string), and
    - 'specificity' (list of numbers).

    Return ``None`` if something went wrong while parsing the rule.

    """
    # See https://drafts.csswg.org/css-page-3/#syntax-page-selector
    tokens = list(remove_whitespace(rule.prelude))
    page_data = []

    # TODO: Specificity is probably wrong, should clean and test that.
    if not tokens:
        # Empty prelude: a single selector with no name and no pseudo-class.
        page_data.append({
            'side': None, 'blank': False, 'first': False, 'index': None,
            'name': '', 'specificity': [0, 0, 0]})
        return page_data

    # Each iteration of this loop parses one comma-separated selector.
    while tokens:
        types = {
            'side': None, 'blank': False, 'first': False, 'index': None,
            'name': '', 'specificity': [0, 0, 0]}

        # Optional page name at the beginning of the selector.
        if tokens[0].type == 'ident':
            token = tokens.pop(0)
            types['name'] = token.value
            types['specificity'][0] = 1

        if len(tokens) == 1:
            # What follows needs at least two tokens (':' and a pseudo-class,
            # or ',' and another selector).
            return None
        elif not tokens:
            page_data.append(types)
            return page_data

        while tokens:
            literal = tokens.pop(0)
            if literal.type != 'literal':
                return None

            if literal.value == ':':
                if not tokens:
                    return None

                if tokens[0].type == 'ident':
                    ident = tokens.pop(0)
                    pseudo_class = ident.lower_value
                    if pseudo_class in ('left', 'right'):
                        if types['side']:
                            # A side has already been set for this selector.
                            return None
                        types['side'] = pseudo_class
                        types['specificity'][2] += 1
                        continue
                    elif pseudo_class in ('blank', 'first'):
                        types[pseudo_class] = True
                        types['specificity'][1] += 1
                        continue
                elif tokens[0].type == 'function':
                    function = tokens.pop(0)
                    if function.name != 'nth':
                        return None
                    arguments = function.arguments
                    if len(arguments) != 1:
                        return None
                    number = arguments[0]
                    if number.type != 'number':
                        return None
                    # Page numbers start at 1, stored indexes start at 0.
                    types['index'] = number.value - 1
                    # TODO: specificity is not specified yet
                    # https://github.com/w3c/csswg-drafts/issues/3791
                    types['specificity'][1] += 1
                    continue

                # Unknown pseudo-class, or unexpected token after ':'.
                return None
            elif literal.value == ',':
                # A comma must follow a non-empty selector and be followed by
                # another selector.
                if tokens and any(types['specificity']):
                    break
                else:
                    return None
            else:
                # Any other literal is not allowed in a page selector: reject
                # the rule instead of silently ignoring the token.
                return None

        page_data.append(types)

    return page_data
-												Split rules and descriptors in CSS

											
										
										
											2016-09-24 16:36:26 +03:00
+								def preprocess_stylesheet(device_media_type, base_url, stylesheet_rules,
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								                          url_fetcher, matcher, page_rules, fonts,
-												Ignore CSS imports after other types of declarations

											
										
										
											2017-08-17 08:47:20 +03:00
+								                          font_config, ignore_imports=False):
-												Pre-process stylesheet (do validation just after parsing)

											
										
										
											2012-03-25 03:39:41 +04:00
+								    """Do the work that can be done early on stylesheet, before they are
 								    in a document.
 								    """
-												Split rules and descriptors in CSS

											
										
										
											2016-09-24 16:36:26 +03:00
+								    for rule in stylesheet_rules:
-												Don't crash when an at-rule is empty

											
										
										
											2017-08-14 15:11:57 +03:00
+								        if getattr(rule, 'content', None) is None and (
-												Remove case-sensitivity for at-rules and properties

											
										
										
											2017-08-17 08:52:18 +03:00
+								                rule.type != 'at-rule' or rule.lower_at_keyword != 'import'):
-												Don't crash when an at-rule is empty

											
										
										
											2017-08-14 15:11:57 +03:00
+								            continue
-												Switch to tinycss2

											
										
										
											2017-03-26 12:42:50 +03:00
+								        if rule.type == 'qualified-rule':
-												Also pre-process @import and @media

											
										
										
											2012-03-25 04:41:02 +04:00
+								            declarations = list(preprocess_declarations(
-												Switch to tinycss2

											
										
										
											2017-03-26 12:42:50 +03:00
+								                base_url, tinycss2.parse_declaration_list(rule.content)))
-												Also pre-proccess @import and @media

											
										
										
											2012-03-25 04:41:02 +04:00
+								            if declarations:
-												Add a --debug option and set debug level for prefixed CSS properties

											
										
										
											2019-01-04 03:22:49 +03:00
+								                logger_level = WARNING
-												Use the new cssselect.

											
										
										
											2012-04-25 21:05:42 +04:00
+								                try:
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								                    selectors = cssselect2.compile_selector_list(rule.prelude)
 								                    for selector in selectors:
 								                        matcher.add_selector(selector, declarations)
-												Use the new cssselect.

											
										
										
											2012-04-25 21:05:42 +04:00
+								                        if selector.pseudo_element not in PSEUDO_ELEMENTS:
-												Add a --debug option and set debug level for prefixed CSS properties

											
										
										
											2019-01-04 03:22:49 +03:00
+								                            if selector.pseudo_element.startswith('-'):
 								                                logger_level = DEBUG
 								                                raise cssselect2.SelectorError(
 								                                    'ignored prefixed pseudo-element: %s'
 								                                    % selector.pseudo_element)
 								                            else:
 								                                raise cssselect2.SelectorError(
 								                                    'unknown pseudo-element: %s'
 								                                    % selector.pseudo_element)
-												Ignore CSS imports after other types of declarations

											
										
										
											2017-08-17 08:47:20 +03:00
+								                    ignore_imports = True
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								                except cssselect2.SelectorError as exc:
-												Add a --debug option and set debug level for prefixed CSS properties

											
										
										
											2019-01-04 03:22:49 +03:00
+								                    LOGGER.log(
 								                        logger_level,
 								                        "Invalid or unsupported selector '%s', %s",
 								                        tinycss2.serialize(rule.prelude), exc)
-												Use the new cssselect.

											
										
										
											2012-04-25 21:05:42 +04:00
+								                    continue
-												Ignore CSS imports after other types of declarations

											
										
										
											2017-08-17 08:47:20 +03:00
+								            else:
 								                ignore_imports = True
-												Also pre-process @import and @media

											
										
										
											2012-03-25 04:41:02 +04:00
-												Remove case-sensitivity for at-rules and properties

											
										
										
											2017-08-17 08:52:18 +03:00
+								        elif rule.type == 'at-rule' and rule.lower_at_keyword == 'import':
-												Ignore CSS imports after other types of declarations

											
										
										
											2017-08-17 08:47:20 +03:00
+								            if ignore_imports:
 								                LOGGER.warning('@import rule "%s" not at the beginning of the '
 								                               'the whole rule was ignored at %s:%s.',
 								                               tinycss2.serialize(rule.prelude),
 								                               rule.source_line, rule.source_column)
 								                continue
-												Switch to tinycss2

											
										
										
											2017-03-26 12:42:50 +03:00
+								            tokens = remove_whitespace(rule.prelude)
 								            if tokens and tokens[0].type in ('url', 'string'):
 								                url = tokens[0].value
 								            else:
 								                continue
-												Put media queries in a separate module, create a class for style_for

											
										
										
											2018-08-17 11:30:51 +03:00
+								            media = media_queries.parse_media_query(tokens[1:])
-												Switch to tinycss2

											
										
										
											2017-03-26 12:42:50 +03:00
+								            if media is None:
 								                LOGGER.warning('Invalid media type "%s" '
 								                               'the whole @import rule was ignored at %s:%s.',
 								                               tinycss2.serialize(rule.prelude),
 								                               rule.source_line, rule.source_column)
-												Ignore CSS rules with empty media queries

											
										
										
											2017-08-14 12:36:35 +03:00
+								                continue
-												Put media queries in a separate module, create a class for style_for

											
										
										
											2018-08-17 11:30:51 +03:00
+								            if not media_queries.evaluate_media_query(
 								                    media, device_media_type):
-												Also pre-process @import and @media

											
										
										
											2012-03-25 04:41:02 +04:00
+								                continue
-												Allow relative URIs in anchors

Fix #437.

Backward-incompatible change: the signature of weasyprint.urls.url_join has
changed to allow relative links without a base URI.

This feature doesn't look really safe at first sight, but I can't find
anything bad coming from these changes. If there's a bug, I take the blame.

											
										
										
											2017-03-25 20:28:41 +03:00
+								            url = url_join(
-												Switch to tinycss2

											
										
										
											2017-03-26 12:42:50 +03:00
+								                base_url, url, allow_relative=False,
-												Allow relative URIs in anchors

Fix #437.

Backward-incompatible change: the signature of weasyprint.urls.url_join has
changed to allow relative links without a base URI.

This feature doesn't look really safe at first sight, but I can't find
anything bad coming from these changes. If there's a bug, I take the blame.

											
										
										
											2017-03-25 20:28:41 +03:00
+								                context='@import at %s:%s',
-												Switch to tinycss2

											
										
										
											2017-03-26 12:42:50 +03:00
+								                context_args=(rule.source_line, rule.source_column))
-												Warn (not crash) on missing base_url for @import

											
										
										
											2012-09-25 18:01:12 +04:00
+								            if url is not None:
-												Fix #84: Make loading an author stylesheet not fatal.

											
										
										
											2013-06-21 01:07:52 +04:00
+								                try:
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								                    CSS(
-												Add font_config parameter when loading CSS in CSS

											
										
										
											2016-10-28 18:44:31 +03:00
+								                        url=url, url_fetcher=url_fetcher,
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								                        media_type=device_media_type, font_config=font_config,
 								                        matcher=matcher, page_rules=page_rules)
-												Fix #84: Make loading an author stylesheet not fatal.

											
										
										
											2013-06-21 01:07:52 +04:00
+								                except URLFetchingError as exc:
-												Clean and document the logging levels

Related to #488.

											
										
										
											2017-07-25 14:59:56 +03:00
+								                    LOGGER.error(
 								                        'Failed to load stylesheet at %s : %s', url, exc)
-												Also pre-process @import and @media

											
										
										
											2012-03-25 04:41:02 +04:00
-												Remove case-sensitivity for at-rules and properties

											
										
										
											2017-08-17 08:52:18 +03:00
+								        elif rule.type == 'at-rule' and rule.lower_at_keyword == 'media':
-												Put media queries in a separate module, create a class for style_for

											
										
										
											2018-08-17 11:30:51 +03:00
+								            media = media_queries.parse_media_query(rule.prelude)
-												Switch to tinycss2

											
										
										
											2017-03-26 12:42:50 +03:00
+								            if media is None:
 								                LOGGER.warning('Invalid media type "%s" '
 								                               'the whole @media rule was ignored at %s:%s.',
 								                               tinycss2.serialize(rule.prelude),
 								                               rule.source_line, rule.source_column)
-												Also pre-process @import and @media

											
										
										
											2012-03-25 04:41:02 +04:00
+								                continue
-												Ignore CSS imports after other types of declarations

											
										
										
											2017-08-17 08:47:20 +03:00
+								            ignore_imports = True
-												Put media queries in a separate module, create a class for style_for

											
										
										
											2018-08-17 11:30:51 +03:00
+								            if not media_queries.evaluate_media_query(
 								                    media, device_media_type):
-												Switch to tinycss2

											
										
										
											2017-03-26 12:42:50 +03:00
+								                continue
 								            content_rules = tinycss2.parse_rule_list(rule.content)
-												Split rules and descriptors in CSS

											
										
										
											2016-09-24 16:36:26 +03:00
+								            preprocess_stylesheet(
-												Use cssselect2 instead of cssselect

											
										
										
											2017-06-30 18:54:02 +03:00
+								                device_media_type, base_url, content_rules, url_fetcher,
-												Ignore CSS imports after other types of declarations

											
										
										
											2017-08-17 08:47:20 +03:00
+								                matcher, page_rules, fonts, font_config, ignore_imports=True)
-												Also pre-process @import and @media

											
										
										
											2012-03-25 04:41:02 +04:00
-												Remove case-sensitivity for at-rules and properties

											
										
										
											2017-08-17 08:52:18 +03:00
+								        elif rule.type == 'at-rule' and rule.lower_at_keyword == 'page':
-												Handle @page rule grammar correctly

Fix #562.

											
										
										
											2018-01-29 00:17:26 +03:00
+								            data = parse_page_selectors(rule)
 								            if data is None:
 								                LOGGER.warning(
 								                    'Unsupported @page selector "%s", '
 								                    'the whole @page rule was ignored at %s:%s.',
 								                    tinycss2.serialize(rule.prelude),
 								                    rule.source_line, rule.source_column)
-												Also pre-process @import and @media

											
										
										
											2012-03-25 04:41:02 +04:00
+								                continue
-												Use the new cssselect.

											
										
										
											2012-04-25 21:05:42 +04:00
-												Handle @page rule grammar correctly

Fix #562.

											
										
										
											2018-01-29 00:17:26 +03:00
+								            ignore_imports = True
 								            for page_type in data:
 								                specificity = page_type.pop('specificity')
 								                page_type = PageType(**page_type)
 								                # Use a double lambda to have a closure that holds page_types
 								                match = (lambda page_type: lambda page_names: list(
 								                    matching_page_types(page_type, names=page_names)))(
 								                        page_type)
 								                content = tinycss2.parse_declaration_list(rule.content)
 								                declarations = list(preprocess_declarations(base_url, content))
-												Also pre-process @import and @media

											
										
										
											2012-03-25 04:41:02 +04:00
 								                if declarations:
-												Handle @page rule grammar correctly

Fix #562.

											
										
										
											2018-01-29 00:17:26 +03:00
+								                    selector_list = [(specificity, None, match)]
 								                    page_rules.append((rule, selector_list, declarations))
 								                for margin_rule in content:
 								                    if margin_rule.type != 'at-rule' or (
 								                            margin_rule.content is None):
 								                        continue
 								                    declarations = list(preprocess_declarations(
 								                        base_url,
 								                        tinycss2.parse_declaration_list(margin_rule.content)))
 								                    if declarations:
 								                        selector_list = [(
 								                            specificity, '@' + margin_rule.lower_at_keyword,
 								                            match)]
 								                        page_rules.append(
 								                            (margin_rule, selector_list, declarations))
-												Pre-process stylesheet (do validation just after parsing)

											
										
										
											2012-03-25 03:39:41 +04:00
-												Remove case-sensitivity for at-rules and properties

											
										
										
											2017-08-17 08:52:18 +03:00
+								        elif rule.type == 'at-rule' and rule.lower_at_keyword == 'font-face':
-												Ignore CSS imports after other types of declarations

											
										
										
											2017-08-17 08:47:20 +03:00
+								            ignore_imports = True
-												Switch to tinycss2

											
										
										
											2017-03-26 12:42:50 +03:00
+								            content = tinycss2.parse_declaration_list(rule.content)
-												Don't go through the tree twice when applying styles

											
										
										
											2017-07-01 08:26:36 +03:00
+								            rule_descriptors = dict(preprocess_descriptors(base_url, content))
-												Parse @font-face rules

											
										
										
											2016-09-23 20:00:14 +03:00
+								            for key in ('src', 'font_family'):
-												WIP: Support @font-face

											
										
										
											2016-09-26 13:15:12 +03:00
+								                if key not in rule_descriptors:
-												Parse @font-face rules

											
										
										
											2016-09-23 20:00:14 +03:00
+								                    LOGGER.warning(
 								                        "Missing %s descriptor in '@font-face' rule at %s:%s",
-												Switch to tinycss2

											
										
										
											2017-03-26 12:42:50 +03:00
+								                        key.replace('_', '-'),
 								                        rule.source_line, rule.source_column)
-												Parse @font-face rules

											
										
										
											2016-09-23 20:00:14 +03:00
+								                    break
 								            else:
-												check for font_config

check for font_config before attempting to add_font_face
											
										
										
											2016-11-17 23:29:39 +03:00
+								                if font_config is not None:
 								                    font_filename = font_config.add_font_face(
 								                        rule_descriptors, url_fetcher)
 								                    if font_filename:
 								                        fonts.append(font_filename)
-												Pre-process stylesheet (do validation just after parsing)

											
										
										
											2012-03-25 03:39:41 +04:00
-												Add a presentational-hints option

											
										
										
											2016-08-30 19:15:30 +03:00
def get_all_computed_styles(html, user_stylesheets=None,
                            presentational_hints=False, font_config=None,
                            page_rules=None, target_collector=None):
    """Gather every stylesheet that applies to ``html`` and wrap them up.

    The user-agent sheets, the presentational-hint sheets (only when
    ``presentational_hints`` is true), the author sheets discovered by
    :func:`find_stylesheets` and finally ``user_stylesheets`` are collected
    into a single flat list, which is then handed to :class:`StyleFor`.

    Return the resulting ``StyleFor`` object, used as the ``style_for``
    callable that takes an element and an optional pseudo-element type and
    gives back a style dict object.

    """
    # Flat list of (sheet, origin, third item) tuples. The position of a
    # sheet in this list does not matter, only its 'origin' does. The third
    # item is None for every sheet except presentational hints, which carry
    # (0, 0, 0).
    ua_sheets = html._ua_stylesheets() or []
    sheets = [(ua_sheet, 'user agent', None) for ua_sheet in ua_sheets]

    if presentational_hints:
        hint_sheets = html._ph_stylesheets() or []
        sheets.extend(
            (hint_sheet, 'author', (0, 0, 0)) for hint_sheet in hint_sheets)

    author_sheets = find_stylesheets(
        html.wrapper_element, html.media_type, html.url_fetcher,
        html.base_url, font_config, page_rules)
    sheets.extend(
        (author_sheet, 'author', None) for author_sheet in author_sheets)

    sheets.extend(
        (user_sheet, 'user', None) for user_sheet in (user_stylesheets or []))

    return StyleFor(html, sheets, presentational_hints, target_collector)