1
1
mirror of https://github.com/Kozea/WeasyPrint.git synced 2024-10-05 08:27:22 +03:00
WeasyPrint/weasyprint/formatting_structure/boxes.py

707 lines
22 KiB
Python
Raw Normal View History

"""
weasyprint.formatting_structure.boxes
-------------------------------------
2011-05-17 13:29:00 +04:00
Classes for all types of boxes in the CSS formatting structure / box model.
2011-05-17 13:29:00 +04:00
See http://www.w3.org/TR/CSS21/visuren.html
Names are the same as in CSS 2.1 with the exception of ``TextBox``. In
WeasyPrint, any text is in a ``TextBox``. What CSS calls anonymous
inline boxes are text boxes but not all text boxes are anonymous
inline boxes.
See http://www.w3.org/TR/CSS21/visuren.html#anonymous
Abstract classes, should not be instantiated:
* Box
* BlockLevelBox
* InlineLevelBox
* BlockContainerBox
* ReplacedBox
* ParentBox
* AtomicInlineLevelBox
Concrete classes:
* PageBox
* BlockBox
* InlineBox
* InlineBlockBox
* BlockReplacedBox
* InlineReplacedBox
* TextBox
* LineBox
* Various table-related Box subclasses
All concrete box classes whose name contains "Inline" or "Block" have
one of the following "outside" behavior:
* Block-level (inherits from :class:`BlockLevelBox`)
* Inline-level (inherits from :class:`InlineLevelBox`)
and one of the following "inside" behavior:
* Block container (inherits from :class:`BlockContainerBox`)
* Inline content (InlineBox and :class:`TextBox`)
* Replaced content (inherits from :class:`ReplacedBox`)
... with various combinasions of both.
See respective docstrings for details.
2019-03-04 13:04:06 +03:00
:copyright: Copyright 2011-2019 Simon Sapin and contributors, see AUTHORS.
:license: BSD, see LICENSE for details.
"""
2011-05-17 13:29:00 +04:00
import itertools
2018-01-13 19:41:08 +03:00
from ..css import computed_from_cascaded
from ..css.properties import Dimension
2011-05-19 17:31:34 +04:00
class Box(object):
2011-08-24 11:41:38 +04:00
"""Abstract base class for all boxes."""
# Definitions for the rules generating anonymous table boxes
# http://www.w3.org/TR/CSS21/tables.html#anonymous-boxes
proper_table_child = False
internal_table_or_caption = False
tabular_container = False
# Keep track of removed collapsing spaces for wrap opportunities.
leading_collapsible_space = False
trailing_collapsible_space = False
# Default, may be overriden on instances.
is_table_wrapper = False
is_flex_item = False
is_for_root_element = False
is_column = False
# Other properties
transformation_matrix = None
bookmark_label = None
string_set = None
# Default, overriden on some subclasses
def all_children(self):
return ()
2017-07-01 01:28:14 +03:00
def __init__(self, element_tag, style):
self.element_tag = element_tag
2016-11-01 04:38:34 +03:00
self.style = style
2011-06-29 16:04:42 +04:00
def __repr__(self):
2017-07-01 01:28:14 +03:00
return '<%s %s>' % (type(self).__name__, self.element_tag)
@classmethod
def anonymous_from(cls, parent, *args, **kwargs):
"""Return an anonymous box that inherits from ``parent``."""
2018-01-13 19:41:08 +03:00
style = computed_from_cascaded(
cascaded={}, parent_style=parent.style, element=None)
return cls(parent.element_tag, style, *args, **kwargs)
def copy(self):
"""Return shallow copy of the box."""
cls = type(self)
# Create a new instance without calling __init__: parameters are
# different depending on the class.
new_box = cls.__new__(cls)
# Copy attributes
new_box.__dict__.update(self.__dict__)
return new_box
def translate(self, dx=0, dy=0, ignore_floats=False):
2011-08-24 11:41:38 +04:00
"""Change the boxs position.
Also update the childrens positions accordingly.
2011-08-11 14:05:40 +04:00
"""
# Overridden in ParentBox to also translate children, if any.
if dx == 0 and dy == 0:
return
2011-11-24 20:56:05 +04:00
self.position_x += dx
self.position_y += dy
for child in self.all_children():
if not (ignore_floats and child.is_floated()):
child.translate(dx, dy, ignore_floats)
2011-08-11 14:05:40 +04:00
2011-08-24 11:41:38 +04:00
# Heights and widths
2011-07-12 19:53:15 +04:00
def padding_width(self):
"""Width of the padding box."""
2011-07-12 19:53:15 +04:00
return self.width + self.padding_left + self.padding_right
2011-05-19 17:31:34 +04:00
2011-07-12 19:53:15 +04:00
def padding_height(self):
"""Height of the padding box."""
2011-07-12 19:53:15 +04:00
return self.height + self.padding_top + self.padding_bottom
2011-07-12 19:53:15 +04:00
def border_width(self):
"""Width of the border box."""
return self.padding_width() + self.border_left_width + \
self.border_right_width
2011-07-12 19:53:15 +04:00
def border_height(self):
"""Height of the border box."""
return self.padding_height() + self.border_top_width + \
self.border_bottom_width
def margin_width(self):
"""Width of the margin box (aka. outer box)."""
return self.border_width() + self.margin_left + self.margin_right
def margin_height(self):
"""Height of the margin box (aka. outer box)."""
return self.border_height() + self.margin_top + self.margin_bottom
2011-08-24 11:41:38 +04:00
# Corners positions
def content_box_x(self):
"""Absolute horizontal position of the content box."""
return self.position_x + self.margin_left + self.padding_left + \
self.border_left_width
def content_box_y(self):
"""Absolute vertical position of the content box."""
return self.position_y + self.margin_top + self.padding_top + \
self.border_top_width
def padding_box_x(self):
"""Absolute horizontal position of the padding box."""
return self.position_x + self.margin_left + self.border_left_width
def padding_box_y(self):
"""Absolute vertical position of the padding box."""
return self.position_y + self.margin_top + self.border_top_width
def border_box_x(self):
"""Absolute horizontal position of the border box."""
return self.position_x + self.margin_left
def border_box_y(self):
"""Absolute vertical position of the border box."""
return self.position_y + self.margin_top
2012-06-15 00:04:48 +04:00
def hit_area(self):
"""Return the (x, y, w, h) rectangle where the box is clickable."""
# "Border area. That's the area that hit-testing is done on."
# http://lists.w3.org/Archives/Public/www-style/2012Jun/0318.html
2013-06-06 17:58:00 +04:00
# TODO: manage the border radii, use outer_border_radii instead
2012-06-15 00:04:48 +04:00
return (self.border_box_x(), self.border_box_y(),
self.border_width(), self.border_height())
def rounded_box(self, bt, br, bb, bl):
2013-06-06 17:58:00 +04:00
"""Position, size and radii of a box inside the outer border box.
bt, br, bb, and bl are distances from the outer border box,
defining a rectangle to be rounded.
2013-06-06 17:58:00 +04:00
"""
2013-06-07 19:05:58 +04:00
tlrx, tlry = self.border_top_left_radius
trrx, trry = self.border_top_right_radius
brrx, brry = self.border_bottom_right_radius
blrx, blry = self.border_bottom_left_radius
tlrx = max(0, tlrx - bl)
tlry = max(0, tlry - bt)
trrx = max(0, trrx - br)
trry = max(0, trry - bt)
brrx = max(0, brrx - br)
brry = max(0, brry - bb)
blrx = max(0, blrx - bl)
blry = max(0, blry - bb)
x = self.border_box_x() + bl
y = self.border_box_y() + bt
width = self.border_width() - bl - br
height = self.border_height() - bt - bb
2013-06-07 19:05:58 +04:00
# Fix overlapping curves
# See http://www.w3.org/TR/css3-background/#corner-overlap
ratio = min([1] + [
extent / sum_radii
for extent, sum_radii in [
(width, tlrx + trrx),
(width, blrx + brrx),
(height, tlry + blry),
(height, trry + brry),
]
if sum_radii > 0
])
2013-06-06 17:58:00 +04:00
return (
x, y, width, height,
(tlrx * ratio, tlry * ratio),
(trrx * ratio, trry * ratio),
(brrx * ratio, brry * ratio),
(blrx * ratio, blry * ratio))
def rounded_box_ratio(self, ratio):
return self.rounded_box(
self.border_top_width * ratio,
self.border_right_width * ratio,
self.border_bottom_width * ratio,
self.border_left_width * ratio)
2013-06-06 17:58:00 +04:00
def rounded_padding_box(self):
"""Return the position, size and radii of the rounded padding box."""
return self.rounded_box(
self.border_top_width,
self.border_right_width,
self.border_bottom_width,
self.border_left_width)
2013-06-06 17:58:00 +04:00
def rounded_border_box(self):
"""Return the position, size and radii of the rounded border box."""
return self.rounded_box(0, 0, 0, 0)
def rounded_content_box(self):
"""Return the position, size and radii of the rounded content box."""
return self.rounded_box(
2013-12-10 21:29:58 +04:00
self.border_top_width + self.padding_top,
self.border_right_width + self.padding_right,
self.border_bottom_width + self.padding_bottom,
self.border_left_width + self.padding_left)
2011-08-24 11:41:38 +04:00
# Positioning schemes
def is_floated(self):
"""Return whether this box is floated."""
return self.style['float'] != 'none'
def is_absolutely_positioned(self):
"""Return whether this box is in the absolute positioning scheme."""
return self.style['position'] in ('absolute', 'fixed')
def is_in_normal_flow(self):
"""Return whether this box is in normal flow."""
return not (self.is_floated() or self.is_absolutely_positioned())
# Start and end page values for named pages
def page_values(self):
"""Return start and end page values."""
return (self.style['page'], self.style['page'])
class ParentBox(Box):
2011-08-24 11:41:38 +04:00
"""A box that has children."""
2017-07-01 01:28:14 +03:00
def __init__(self, element_tag, style, children):
super(ParentBox, self).__init__(element_tag, style)
2011-10-03 20:57:26 +04:00
self.children = tuple(children)
def all_children(self):
return self.children
def _reset_spacing(self, side):
"""Set to 0 the margin, padding and border of ``side``."""
self.style['margin_%s' % side] = Dimension(0, 'px')
self.style['padding_%s' % side] = Dimension(0, 'px')
self.style['border_%s_width' % side] = 0
if side in ('top', 'bottom'):
self.style['border_%s_left_radius' % side] = (
Dimension(0, 'px'), Dimension(0, 'px'))
self.style['border_%s_right_radius' % side] = (
Dimension(0, 'px'), Dimension(0, 'px'))
else:
self.style['border_bottom_%s_radius' % side] = (
Dimension(0, 'px'), Dimension(0, 'px'))
self.style['border_top_%s_radius' % side] = (
Dimension(0, 'px'), Dimension(0, 'px'))
setattr(self, 'margin_%s' % side, 0)
setattr(self, 'padding_%s' % side, 0)
setattr(self, 'border_%s_width' % side, 0)
def _remove_decoration(self, start, end):
if start or end:
old_style = self.style
self.style = self.style.copy()
if start:
self._reset_spacing('top')
if end:
self._reset_spacing('bottom')
if (start or end) and old_style == self.style:
# Don't copy style if there's no need to, save some memory
self.style = old_style
2016-11-01 06:31:15 +03:00
def copy_with_children(self, new_children, is_start=True, is_end=True):
2012-07-11 21:19:13 +04:00
"""Create a new equivalent box with given ``new_children``."""
2016-11-01 06:31:15 +03:00
new_box = self.copy()
2012-07-11 21:19:13 +04:00
new_box.children = tuple(new_children)
if self.style['box_decoration_break'] == 'slice':
new_box._remove_decoration(not is_start, not is_end)
2011-10-03 20:57:26 +04:00
return new_box
def descendants(self):
"""A flat generator for a box, its children and descendants."""
yield self
for child in self.children:
if hasattr(child, 'descendants'):
for grand_child in child.descendants():
yield grand_child
else:
yield child
2012-06-15 00:04:48 +04:00
def get_wrapped_table(self):
"""Get the table wrapped by the box."""
if self.is_table_wrapper:
for child in self.children:
if isinstance(child, TableBox):
return child
else: # pragma: no cover
raise ValueError('Table wrapper without a table')
def page_values(self):
start_value, end_value = super(ParentBox, self).page_values()
if self.children:
start_box, end_box = self.children[0], self.children[-1]
start_value = start_box.page_values()[0] or start_value
end_value = end_box.page_values()[1] or end_value
return start_value, end_value
class BlockLevelBox(Box):
2011-08-24 11:41:38 +04:00
"""A box that participates in an block formatting context.
An element with a ``display`` value of ``block``, ``list-item`` or
``table`` generates a block-level box.
"""
clearance = None
class BlockContainerBox(ParentBox):
2011-08-24 11:41:38 +04:00
"""A box that contains only block-level boxes or only line boxes.
A box that either contains only block-level boxes or establishes an inline
formatting context and thus contains only line boxes.
2011-08-24 11:41:38 +04:00
A non-replaced element with a ``display`` value of ``block``,
``list-item``, ``inline-block`` or 'table-cell' generates a block container
box.
"""
class BlockBox(BlockContainerBox, BlockLevelBox):
2011-08-24 11:41:38 +04:00
"""A block-level box that is also a block container.
2011-06-29 16:04:42 +04:00
2011-08-24 11:41:38 +04:00
A non-replaced element with a ``display`` value of ``block``, ``list-item``
generates a block box.
2011-08-24 11:41:38 +04:00
2011-05-23 16:31:14 +04:00
"""
2011-05-19 17:31:34 +04:00
class LineBox(ParentBox):
2011-08-24 11:41:38 +04:00
"""A box that represents a line in an inline formatting context.
Can only contain inline-level boxes.
2011-06-29 16:04:42 +04:00
2011-05-23 16:31:14 +04:00
In early stages of building the box tree a single line box contains many
2011-07-01 20:20:30 +04:00
consecutive inline boxes. Later, during layout phase, each line boxes will
be split into multiple line boxes, one for each actual line.
2011-08-24 11:41:38 +04:00
2011-05-23 16:31:14 +04:00
"""
text_overflow = 'clip'
@classmethod
def anonymous_from(cls, parent, *args, **kwargs):
box = super().anonymous_from(parent, *args, **kwargs)
if parent.style['overflow'] != 'visible':
box.text_overflow = parent.style['text_overflow']
return box
2011-05-19 17:31:34 +04:00
class InlineLevelBox(Box):
2011-08-24 11:41:38 +04:00
"""A box that participates in an inline formatting context.
An inline-level box that is not an inline box is said to be "atomic". Such
boxes are inline blocks, replaced elements and inline tables.
2011-06-29 16:04:42 +04:00
2011-08-24 11:41:38 +04:00
An element with a ``display`` value of ``inline``, ``inline-table``, or
``inline-block`` generates an inline-level box.
2011-05-23 16:31:14 +04:00
"""
def _remove_decoration(self, start, end):
if start or end:
old_style = self.style
self.style = self.style.copy()
ltr = self.style['direction'] == 'ltr'
if start:
self._reset_spacing('left' if ltr else 'right')
if end:
self._reset_spacing('right' if ltr else 'left')
if (start or end) and old_style == self.style:
# Don't copy style if there's no need to, save some memory
self.style = old_style
2011-05-19 17:31:34 +04:00
class InlineBox(InlineLevelBox, ParentBox):
2011-08-24 11:41:38 +04:00
"""An inline box with inline children.
A box that participates in an inline formatting context and whose content
also participates in that inline formatting context.
2011-06-29 16:04:42 +04:00
2011-08-24 11:41:38 +04:00
A non-replaced element with a ``display`` value of ``inline`` generates an
inline box.
2011-08-24 11:41:38 +04:00
"""
2012-06-15 00:04:48 +04:00
def hit_area(self):
"""Return the (x, y, w, h) rectangle where the box is clickable."""
# Use line-height (margin_height) rather than border_height
return (self.border_box_x(), self.position_y,
self.border_width(), self.margin_height())
class TextBox(InlineLevelBox):
2011-08-24 11:41:38 +04:00
"""A box that contains only text and has no box children.
2011-06-29 16:04:42 +04:00
Any text in the document ends up in a text box. What CSS calls "anonymous
inline boxes" are also text boxes.
2011-08-24 11:41:38 +04:00
2011-05-23 16:31:14 +04:00
"""
justification_spacing = 0
2016-08-21 01:47:13 +03:00
# http://stackoverflow.com/questions/16317534/
2018-01-14 03:48:17 +03:00
ascii_to_wide = dict((i, chr(i + 0xfee0)) for i in range(0x21, 0x7f))
2016-08-21 01:47:13 +03:00
ascii_to_wide.update({0x20: '\u3000', 0x2D: '\u2212'})
2017-07-01 01:28:14 +03:00
def __init__(self, element_tag, style, text):
assert text
2017-07-01 01:28:14 +03:00
super(TextBox, self).__init__(element_tag, style)
text_transform = style['text_transform']
2011-12-05 21:03:25 +04:00
if text_transform != 'none':
text = {
'uppercase': lambda t: t.upper(),
'lowercase': lambda t: t.lower(),
# Pythons unicode.captitalize is not the same.
'capitalize': lambda t: t.title(),
2016-08-21 01:47:13 +03:00
'full-width': lambda t: t.translate(self.ascii_to_wide),
2011-12-05 21:03:25 +04:00
}[text_transform](text)
if style['hyphens'] == 'none':
text = text.replace('\u00AD', '') # U+00AD SOFT HYPHEN (SHY)
2011-11-08 16:09:19 +04:00
self.text = text
2011-05-19 17:31:34 +04:00
2011-11-08 16:09:19 +04:00
def copy_with_text(self, text):
2011-12-26 15:47:26 +04:00
"""Return a new TextBox identical to this one except for the text."""
2011-11-08 16:09:19 +04:00
assert text
new_box = self.copy()
2011-11-08 16:09:19 +04:00
new_box.text = text
return new_box
2011-05-19 17:31:34 +04:00
class AtomicInlineLevelBox(InlineLevelBox):
2011-08-24 11:41:38 +04:00
"""An atomic box in an inline formatting context.
This inline-level box cannot be split for line breaks.
"""
class InlineBlockBox(AtomicInlineLevelBox, BlockContainerBox):
2011-08-24 11:41:38 +04:00
"""A box that is both inline-level and a block container.
It behaves as inline on the outside and as a block on the inside.
A non-replaced element with a 'display' value of 'inline-block' generates
an inline-block box.
2011-08-24 11:41:38 +04:00
"""
class ReplacedBox(Box):
2011-08-24 11:41:38 +04:00
"""A box whose content is replaced.
For example, ``<img>`` are replaced: their content is rendered externally
and is opaque from CSSs point of view.
"""
2017-07-01 01:28:14 +03:00
def __init__(self, element_tag, style, replacement):
super(ReplacedBox, self).__init__(element_tag, style)
2011-05-25 17:54:46 +04:00
self.replacement = replacement
2011-12-05 17:24:43 +04:00
class BlockReplacedBox(ReplacedBox, BlockLevelBox):
2011-08-24 11:41:38 +04:00
"""A box that is both replaced and block-level.
A replaced element with a ``display`` value of ``block``, ``liste-item`` or
``table`` generates a block-level replaced box.
"""
2011-12-05 17:24:43 +04:00
class InlineReplacedBox(ReplacedBox, AtomicInlineLevelBox):
2011-08-24 11:41:38 +04:00
"""A box that is both replaced and inline-level.
A replaced element with a ``display`` value of ``inline``,
``inline-table``, or ``inline-block`` generates an inline-level replaced
box.
"""
class TableBox(BlockLevelBox, ParentBox):
"""Box for elements with ``display: table``"""
# Definitions for the rules generating anonymous table boxes
# http://www.w3.org/TR/CSS21/tables.html#anonymous-boxes
tabular_container = True
def all_children(self):
return itertools.chain(self.children, self.column_groups)
def translate(self, dx=0, dy=0, ignore_floats=False):
if dx == 0 and dy == 0:
return
self.column_positions = [
position + dx for position in self.column_positions]
return super(TableBox, self).translate(dx, dy, ignore_floats)
def page_values(self):
return (self.style['page'], self.style['page'])
class InlineTableBox(TableBox):
"""Box for elements with ``display: inline-table``"""
class TableRowGroupBox(ParentBox):
"""Box for elements with ``display: table-row-group``"""
proper_table_child = True
internal_table_or_caption = True
tabular_container = True
proper_parents = (TableBox, InlineTableBox)
# Default values. May be overriden on instances.
is_header = False
is_footer = False
class TableRowBox(ParentBox):
"""Box for elements with ``display: table-row``"""
proper_table_child = True
internal_table_or_caption = True
tabular_container = True
proper_parents = (TableBox, InlineTableBox, TableRowGroupBox)
class TableColumnGroupBox(ParentBox):
"""Box for elements with ``display: table-column-group``"""
proper_table_child = True
internal_table_or_caption = True
proper_parents = (TableBox, InlineTableBox)
# Default value. May be overriden on instances.
span = 1
2011-11-29 15:43:42 +04:00
# Columns groups never have margins or paddings
margin_top = 0
margin_bottom = 0
margin_left = 0
margin_right = 0
padding_top = 0
padding_bottom = 0
padding_left = 0
padding_right = 0
def get_cells(self):
"""Return cells that originate in the group's columns."""
return [
cell for column in self.children for cell in column.get_cells()]
# Not really a parent box, but pretending to be removes some corner cases.
class TableColumnBox(ParentBox):
2011-12-26 15:47:26 +04:00
"""Box for elements with ``display: table-column``"""
proper_table_child = True
internal_table_or_caption = True
proper_parents = (TableBox, InlineTableBox, TableColumnGroupBox)
# Default value. May be overriden on instances.
span = 1
2011-11-29 15:43:42 +04:00
# Columns never have margins or paddings
margin_top = 0
margin_bottom = 0
margin_left = 0
margin_right = 0
padding_top = 0
padding_bottom = 0
padding_left = 0
padding_right = 0
def get_cells(self):
"""Return cells that originate in the column.
May be overriden on instances.
"""
return []
class TableCellBox(BlockContainerBox):
"""Box for elements with ``display: table-cell``"""
internal_table_or_caption = True
# Default values. May be overriden on instances.
colspan = 1
rowspan = 1
class TableCaptionBox(BlockBox):
"""Box for elements with ``display: table-caption``"""
proper_table_child = True
internal_table_or_caption = True
proper_parents = (TableBox, InlineTableBox)
class PageBox(ParentBox):
"""Box for a page.
Initially the whole document will be in the box for the root element.
During layout a new page box is created after every page break.
"""
def __init__(self, page_type, style):
self.page_type = page_type
# Page boxes are not linked to any element.
super(PageBox, self).__init__(
2017-07-01 01:28:14 +03:00
element_tag=None, style=style, children=[])
def __repr__(self):
return '<%s %s>' % (type(self).__name__, self.page_type)
class MarginBox(BlockContainerBox):
"""Box in page margins, as defined in CSS3 Paged Media"""
def __init__(self, at_keyword, style):
self.at_keyword = at_keyword
# Margin boxes are not linked to any element.
super(MarginBox, self).__init__(
2017-07-01 01:28:14 +03:00
element_tag=None, style=style, children=[])
def __repr__(self):
return '<%s %s>' % (type(self).__name__, self.at_keyword)
class FlexContainerBox(ParentBox):
"""A box that contains only flex-items."""
class FlexBox(FlexContainerBox, BlockLevelBox):
"""A box that is both block-level and a flex container.
It behaves as block on the outside and as a flex container on the inside.
"""
class InlineFlexBox(FlexContainerBox, InlineLevelBox):
"""A box that is both inline-level and a flex container.
It behaves as inline on the outside and as a flex container on the inside.
"""