docutils/docutils/writers/html4css1/__init__.py

   1 # $Id$
   2 # Author: David Goodger
   3 # Maintainer: docutils-develop@lists.sourceforge.net
   4 # Copyright: This module has been placed in the public domain.
   5
   6 """
   7 Simple HyperText Markup Language document tree Writer.
   8
   9 The output conforms to the XHTML version 1.0 Transitional DTD
  10 (*almost* strict).  The output contains a minimum of formatting
  11 information.  The cascading style sheet "html4css1.css" is required
  12 for proper viewing with a modern graphical browser.
  13 """
  14
  15 __docformat__ = 'reStructuredText'
  16
  17
  18 import sys
  19 import os
  20 import os.path
  21 import time
  22 import re
  23 import urllib
  24 try: # check for the Python Imaging Library
  25     import PIL.Image
  26 except ImportError:
  27     try:  # sometimes PIL modules are put in PYTHONPATH's root
  28         import Image
  29         class PIL(object): pass  # dummy wrapper
  30         PIL.Image = Image
  31     except ImportError:
  32         PIL = None
  33 import docutils
  34 from docutils import frontend, nodes, utils, writers, languages, io
  35 from docutils.utils.error_reporting import SafeString
  36 from docutils.transforms import writer_aux
  37 from docutils.utils.math import unichar2tex, pick_math_environment, math2html
  38 from docutils.utils.math.latex2mathml import parse_latex_math
  39
  40 class Writer(writers.Writer):
  41
  42     supported = ('html', 'html4css1', 'xhtml')
  43     """Formats this writer supports."""
  44
  45     default_stylesheets = ['html4css1.css']
  46     default_stylesheet_dirs = ['.', os.path.abspath(os.path.dirname(__file__))]
  47
  48     default_template = 'template.txt'
  49     default_template_path = os.path.join(
  50         os.path.dirname(os.path.abspath(__file__)), default_template)
  51
  52     settings_spec = (
  53         'HTML-Specific Options',
  54         None,
  55         (('Specify the template file (UTF-8 encoded).  Default is "%s".'
  56           % default_template_path,
  57           ['--template'],
  58           {'default': default_template_path, 'metavar': '<file>'}),
  59          ('Comma separated list of stylesheet URLs. '
  60           'Overrides previous --stylesheet and --stylesheet-path settings.',
  61           ['--stylesheet'],
  62           {'metavar': '<URL[,URL,...]>', 'overrides': 'stylesheet_path',
  63            'validator': frontend.validate_comma_separated_list}),
  64          ('Comma separated list of stylesheet paths. '
  65           'Relative paths are expanded if a matching file is found in '
  66           'the --stylesheet-dirs. With --link-stylesheet, '
  67           'the path is rewritten relative to the output HTML file. '
  68           'Default: "%s"' % ','.join(default_stylesheets),
  69           ['--stylesheet-path'],
  70           {'metavar': '<file[,file,...]>', 'overrides': 'stylesheet',
  71            'validator': frontend.validate_comma_separated_list,
  72            'default': default_stylesheets}),
  73          ('Embed the stylesheet(s) in the output HTML file.  The stylesheet '
  74           'files must be accessible during processing. This is the default.',
  75           ['--embed-stylesheet'],
  76           {'default': 1, 'action': 'store_true',
  77            'validator': frontend.validate_boolean}),
  78          ('Link to the stylesheet(s) in the output HTML file. '
  79           'Default: embed stylesheets.',
  80           ['--link-stylesheet'],
  81           {'dest': 'embed_stylesheet', 'action': 'store_false'}),
  82          ('Comma-separated list of directories where stylesheets are found. '
  83           'Used by --stylesheet-path when expanding relative path arguments. '
  84           'Default: "%s"' % default_stylesheet_dirs,
  85           ['--stylesheet-dirs'],
  86           {'metavar': '<dir[,dir,...]>',
  87            'validator': frontend.validate_comma_separated_list,
  88            'default': default_stylesheet_dirs}),
  89          ('Specify the initial header level.  Default is 1 for "<h1>".  '
  90           'Does not affect document title & subtitle (see --no-doc-title).',
  91           ['--initial-header-level'],
  92           {'choices': '1 2 3 4 5 6'.split(), 'default': '1',
  93            'metavar': '<level>'}),
  94          ('Specify the maximum width (in characters) for one-column field '
  95           'names.  Longer field names will span an entire row of the table '
  96           'used to render the field list.  Default is 14 characters.  '
  97           'Use 0 for "no limit".',
  98           ['--field-name-limit'],
  99           {'default': 14, 'metavar': '<level>',
 100            'validator': frontend.validate_nonnegative_int}),
 101          ('Specify the maximum width (in characters) for options in option '
 102           'lists.  Longer options will span an entire row of the table used '
 103           'to render the option list.  Default is 14 characters.  '
 104           'Use 0 for "no limit".',
 105           ['--option-limit'],
 106           {'default': 14, 'metavar': '<level>',
 107            'validator': frontend.validate_nonnegative_int}),
 108          ('Format for footnote references: one of "superscript" or '
 109           '"brackets".  Default is "brackets".',
 110           ['--footnote-references'],
 111           {'choices': ['superscript', 'brackets'], 'default': 'brackets',
 112            'metavar': '<format>',
 113            'overrides': 'trim_footnote_reference_space'}),
 114          ('Format for block quote attributions: one of "dash" (em-dash '
 115           'prefix), "parentheses"/"parens", or "none".  Default is "dash".',
 116           ['--attribution'],
 117           {'choices': ['dash', 'parentheses', 'parens', 'none'],
 118            'default': 'dash', 'metavar': '<format>'}),
 119          ('Remove extra vertical whitespace between items of "simple" bullet '
 120           'lists and enumerated lists.  Default: enabled.',
 121           ['--compact-lists'],
 122           {'default': 1, 'action': 'store_true',
 123            'validator': frontend.validate_boolean}),
 124          ('Disable compact simple bullet and enumerated lists.',
 125           ['--no-compact-lists'],
 126           {'dest': 'compact_lists', 'action': 'store_false'}),
 127          ('Remove extra vertical whitespace between items of simple field '
 128           'lists.  Default: enabled.',
 129           ['--compact-field-lists'],
 130           {'default': 1, 'action': 'store_true',
 131            'validator': frontend.validate_boolean}),
 132          ('Disable compact simple field lists.',
 133           ['--no-compact-field-lists'],
 134           {'dest': 'compact_field_lists', 'action': 'store_false'}),
 135          ('Added to standard table classes. '
 136           'Defined styles: "borderless". Default: ""',
 137           ['--table-style'],
 138           {'default': ''}),
 139          ('Math output format, one of "MathML", "HTML", "MathJax" '
 140           'or "LaTeX". Default: "HTML math.css"',
 141           ['--math-output'],
 142           {'default': 'HTML math.css'}),
 143          ('Omit the XML declaration.  Use with caution.',
 144           ['--no-xml-declaration'],
 145           {'dest': 'xml_declaration', 'default': 1, 'action': 'store_false',
 146            'validator': frontend.validate_boolean}),
 147          ('Obfuscate email addresses to confuse harvesters while still '
 148           'keeping email links usable with standards-compliant browsers.',
 149           ['--cloak-email-addresses'],
 150           {'action': 'store_true', 'validator': frontend.validate_boolean}),))
 151
 152     settings_defaults = {'output_encoding_error_handler': 'xmlcharrefreplace'}
 153
 154     config_section = 'html4css1 writer'
 155     config_section_dependencies = ('writers',)
 156
 157     visitor_attributes = (
 158         'head_prefix', 'head', 'stylesheet', 'body_prefix',
 159         'body_pre_docinfo', 'docinfo', 'body', 'body_suffix',
 160         'title', 'subtitle', 'header', 'footer', 'meta', 'fragment',
 161         'html_prolog', 'html_head', 'html_title', 'html_subtitle',
 162         'html_body')
 163
 164     def get_transforms(self):
 165         return writers.Writer.get_transforms(self) + [writer_aux.Admonitions]
 166
 167     def __init__(self):
 168         writers.Writer.__init__(self)
 169         self.translator_class = HTMLTranslator
 170
 171     def translate(self):
 172         self.visitor = visitor = self.translator_class(self.document)
 173         self.document.walkabout(visitor)
 174         for attr in self.visitor_attributes:
 175             setattr(self, attr, getattr(visitor, attr))
 176         self.output = self.apply_template()
 177
 178     def apply_template(self):
 179         template_file = open(self.document.settings.template, 'rb')
 180         template = unicode(template_file.read(), 'utf-8')
 181         template_file.close()
 182         subs = self.interpolation_dict()
 183         return template % subs
 184
 185     def interpolation_dict(self):
 186         subs = {}
 187         settings = self.document.settings
 188         for attr in self.visitor_attributes:
 189             subs[attr] = ''.join(getattr(self, attr)).rstrip('\n')
 190         subs['encoding'] = settings.output_encoding
 191         subs['version'] = docutils.__version__
 192         return subs
 193
 194     def assemble_parts(self):
 195         writers.Writer.assemble_parts(self)
 196         for part in self.visitor_attributes:
 197             self.parts[part] = ''.join(getattr(self, part))
 198
 199
 200 class HTMLTranslator(nodes.NodeVisitor):
 201
 202     """
 203     This HTML writer has been optimized to produce visually compact
 204     lists (less vertical whitespace).  HTML's mixed content models
 205     allow list items to contain "<li><p>body elements</p></li>" or
 206     "<li>just text</li>" or even "<li>text<p>and body
 207     elements</p>combined</li>", each with different effects.  It would
 208     be best to stick with strict body elements in list items, but they
 209     affect vertical spacing in browsers (although they really
 210     shouldn't).
 211
 212     Here is an outline of the optimization:
 213
 214     - Check for and omit <p> tags in "simple" lists: list items
 215       contain either a single paragraph, a nested simple list, or a
 216       paragraph followed by a nested simple list.  This means that
 217       this list can be compact:
 218
 219           - Item 1.
 220           - Item 2.
 221
 222       But this list cannot be compact:
 223
 224           - Item 1.
 225
 226             This second paragraph forces space between list items.
 227
 228           - Item 2.
 229
 230     - In non-list contexts, omit <p> tags on a paragraph if that
 231       paragraph is the only child of its parent (footnotes & citations
 232       are allowed a label first).
 233
 234     - Regardless of the above, in definitions, table cells, field bodies,
 235       option descriptions, and list items, mark the first child with
 236       'class="first"' and the last child with 'class="last"'.  The stylesheet
 237       sets the margins (top & bottom respectively) to 0 for these elements.
 238
 239     The ``no_compact_lists`` setting (``--no-compact-lists`` command-line
 240     option) disables list whitespace optimization.
 241     """
 242
 243     xml_declaration = '<?xml version="1.0" encoding="%s" ?>\n'
 244     doctype = (
 245         '<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"'
 246         ' "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">\n')
 247     doctype_mathml = doctype
 248
 249     head_prefix_template = ('<html xmlns="http://www.w3.org/1999/xhtml"'
 250                             ' xml:lang="%(lang)s" lang="%(lang)s">\n<head>\n')
 251     content_type = ('<meta http-equiv="Content-Type"'
 252                     ' content="text/html; charset=%s" />\n')
 253     content_type_mathml = ('<meta http-equiv="Content-Type"'
 254                            ' content="application/xhtml+xml; charset=%s" />\n')
 255
 256     generator = ('<meta name="generator" content="Docutils %s: '
 257                  'http://docutils.sourceforge.net/" />\n')
 258
 259     # Template for the MathJax script in the header:
 260     mathjax_script = '<script type="text/javascript" src="%s"></script>\n'
 261     # The latest version of MathJax from the distributed server:
  262     # available to the public under the `MathJax CDN Terms of Service`__
 263     # __http://www.mathjax.org/download/mathjax-cdn-terms-of-service/
 264     mathjax_url = ('http://cdn.mathjax.org/mathjax/latest/MathJax.js?'
 265                    'config=TeX-AMS-MML_HTMLorMML')
 266     # may be overwritten by custom URL appended to "mathjax"
 267
 268     stylesheet_link = '<link rel="stylesheet" href="%s" type="text/css" />\n'
 269     embedded_stylesheet = '<style type="text/css">\n\n%s\n</style>\n'
 270     words_and_spaces = re.compile(r'\S+| +|\n')
 271     sollbruchstelle = re.compile(r'.+\W\W.+|[-?].+', re.U) # wrap point inside word
 272     lang_attribute = 'lang' # name changes to 'xml:lang' in XHTML 1.1
 273
 274     def __init__(self, document):
 275         nodes.NodeVisitor.__init__(self, document)
 276         self.settings = settings = document.settings
 277         lcode = settings.language_code
 278         self.language = languages.get_language(lcode, document.reporter)
 279         self.meta = [self.generator % docutils.__version__]
 280         self.head_prefix = []
 281         self.html_prolog = []
 282         if settings.xml_declaration:
 283             self.head_prefix.append(self.xml_declaration
 284                                     % settings.output_encoding)
 285             # encoding not interpolated:
 286             self.html_prolog.append(self.xml_declaration)
 287         self.head = self.meta[:]
 288         self.stylesheet = [self.stylesheet_call(path)
 289                            for path in utils.get_stylesheet_list(settings)]
 290         self.body_prefix = ['</head>\n<body>\n']
 291         # document title, subtitle display
 292         self.body_pre_docinfo = []
 293         # author, date, etc.
 294         self.docinfo = []
 295         self.body = []
 296         self.fragment = []
 297         self.body_suffix = ['</body>\n</html>\n']
 298         self.section_level = 0
 299         self.initial_header_level = int(settings.initial_header_level)
 300
 301         self.math_output = settings.math_output.split()
 302         self.math_output_options = self.math_output[1:]
 303         self.math_output = self.math_output[0].lower()
 304
 305         # A heterogenous stack used in conjunction with the tree traversal.
 306         # Make sure that the pops correspond to the pushes:
 307         self.context = []
 308         self.topic_classes = []
 309         self.colspecs = []
 310         self.compact_p = True
 311         self.compact_simple = False
 312         self.compact_field_list = False
 313         self.in_docinfo = False
 314         self.in_sidebar = False
 315         self.title = []
 316         self.subtitle = []
 317         self.header = []
 318         self.footer = []
 319         self.html_head = [self.content_type] # charset not interpolated
 320         self.html_title = []
 321         self.html_subtitle = []
 322         self.html_body = []
 323         self.in_document_title = 0   # len(self.body) or 0
 324         self.in_mailto = False
 325         self.author_in_authors = False
 326         self.math_header = []
 327
 328     def astext(self):
 329         return ''.join(self.head_prefix + self.head
 330                        + self.stylesheet + self.body_prefix
 331                        + self.body_pre_docinfo + self.docinfo
 332                        + self.body + self.body_suffix)
 333
 334     def encode(self, text):
 335         """Encode special characters in `text` & return."""
 336         # @@@ A codec to do these and all other HTML entities would be nice.
 337         text = unicode(text)
 338         return text.translate({
 339             ord('&'): u'&amp;',
 340             ord('<'): u'&lt;',
 341             ord('"'): u'&quot;',
 342             ord('>'): u'&gt;',
 343             ord('@'): u'&#64;', # may thwart some address harvesters
 344             # TODO: convert non-breaking space only if needed?
 345             0xa0: u'&nbsp;'}) # non-breaking space
 346
 347     def cloak_mailto(self, uri):
 348         """Try to hide a mailto: URL from harvesters."""
 349         # Encode "@" using a URL octet reference (see RFC 1738).
 350         # Further cloaking with HTML entities will be done in the
 351         # `attval` function.
 352         return uri.replace('@', '%40')
 353
 354     def cloak_email(self, addr):
 355         """Try to hide the link text of a email link from harversters."""
 356         # Surround at-signs and periods with <span> tags.  ("@" has
 357         # already been encoded to "&#64;" by the `encode` method.)
 358         addr = addr.replace('&#64;', '<span>&#64;</span>')
 359         addr = addr.replace('.', '<span>&#46;</span>')
 360         return addr
 361
 362     def attval(self, text,
 363                whitespace=re.compile('[\n\r\t\v\f]')):
 364         """Cleanse, HTML encode, and return attribute value text."""
 365         encoded = self.encode(whitespace.sub(' ', text))
 366         if self.in_mailto and self.settings.cloak_email_addresses:
 367             # Cloak at-signs ("%40") and periods with HTML entities.
 368             encoded = encoded.replace('%40', '&#37;&#52;&#48;')
 369             encoded = encoded.replace('.', '&#46;')
 370         return encoded
 371
 372     def stylesheet_call(self, path):
 373         """Return code to reference or embed stylesheet file `path`"""
 374         if self.settings.embed_stylesheet:
 375             try:
 376                 content = io.FileInput(source_path=path,
 377                                        encoding='utf-8').read()
 378                 self.settings.record_dependencies.add(path)
 379             except IOError, err:
 380                 msg = u"Cannot embed stylesheet '%s': %s." % (
 381                                 path, SafeString(err.strerror))
 382                 self.document.reporter.error(msg)
 383                 return '<--- %s --->\n' % msg
 384             return self.embedded_stylesheet % content
 385         # else link to style file:
 386         if self.settings.stylesheet_path:
 387             # adapt path relative to output (cf. config.html#stylesheet-path)
 388             path = utils.relative_path(self.settings._destination, path)
 389         return self.stylesheet_link % self.encode(path)
 390
 391     def starttag(self, node, tagname, suffix='\n', empty=False, **attributes):
 392         """
 393         Construct and return a start tag given a node (id & class attributes
 394         are extracted), tag name, and optional attributes.
 395         """
 396         tagname = tagname.lower()
 397         prefix = []
 398         atts = {}
 399         ids = []
 400         for (name, value) in attributes.items():
 401             atts[name.lower()] = value
 402         classes = []
 403         languages = []
 404         # unify class arguments and move language specification
 405         for cls in node.get('classes', []) + atts.pop('class', '').split() :
 406             if cls.startswith('language-'):
 407                 languages.append(cls[9:])
 408             elif cls.strip() and cls not in classes:
 409                 classes.append(cls)
 410         if languages:
 411             # attribute name is 'lang' in XHTML 1.0 but 'xml:lang' in 1.1
 412             atts[self.lang_attribute] = languages[0]
 413         if classes:
 414             atts['class'] = ' '.join(classes)
 415         assert 'id' not in atts
 416         ids.extend(node.get('ids', []))
 417         if 'ids' in atts:
 418             ids.extend(atts['ids'])
 419             del atts['ids']
 420         if ids:
 421             atts['id'] = ids[0]
 422             for id in ids[1:]:
 423                 # Add empty "span" elements for additional IDs.  Note
 424                 # that we cannot use empty "a" elements because there
 425                 # may be targets inside of references, but nested "a"
 426                 # elements aren't allowed in XHTML (even if they do
 427                 # not all have a "href" attribute).
 428                 if empty:
 429                     # Empty tag.  Insert target right in front of element.
 430                     prefix.append('<span id="%s"></span>' % id)
 431                 else:
 432                     # Non-empty tag.  Place the auxiliary <span> tag
 433                     # *inside* the element, as the first child.
 434                     suffix += '<span id="%s"></span>' % id
 435         attlist = atts.items()
 436         attlist.sort()
 437         parts = [tagname]
 438         for name, value in attlist:
 439             # value=None was used for boolean attributes without
 440             # value, but this isn't supported by XHTML.
 441             assert value is not None
 442             if isinstance(value, list):
 443                 values = [unicode(v) for v in value]
 444                 parts.append('%s="%s"' % (name.lower(),
 445                                           self.attval(' '.join(values))))
 446             else:
 447                 parts.append('%s="%s"' % (name.lower(),
 448                                           self.attval(unicode(value))))
 449         if empty:
 450             infix = ' /'
 451         else:
 452             infix = ''
 453         return ''.join(prefix) + '<%s%s>' % (' '.join(parts), infix) + suffix
 454
 455     def emptytag(self, node, tagname, suffix='\n', **attributes):
 456         """Construct and return an XML-compatible empty tag."""
 457         return self.starttag(node, tagname, suffix, empty=True, **attributes)
 458
 459     def set_class_on_child(self, node, class_, index=0):
 460         """
 461         Set class `class_` on the visible child no. index of `node`.
 462         Do nothing if node has fewer children than `index`.
 463         """
 464         children = [n for n in node if not isinstance(n, nodes.Invisible)]
 465         try:
 466             child = children[index]
 467         except IndexError:
 468             return
 469         child['classes'].append(class_)
 470
 471     def set_first_last(self, node):
 472         self.set_class_on_child(node, 'first', 0)
 473         self.set_class_on_child(node, 'last', -1)
 474
 475     def visit_Text(self, node):
 476         text = node.astext()
 477         encoded = self.encode(text)
 478         if self.in_mailto and self.settings.cloak_email_addresses:
 479             encoded = self.cloak_email(encoded)
 480         self.body.append(encoded)
 481
 482     def depart_Text(self, node):
 483         pass
 484
 485     def visit_abbreviation(self, node):
 486         # @@@ implementation incomplete ("title" attribute)
 487         self.body.append(self.starttag(node, 'abbr', ''))
 488
 489     def depart_abbreviation(self, node):
 490         self.body.append('</abbr>')
 491
 492     def visit_acronym(self, node):
 493         # @@@ implementation incomplete ("title" attribute)
 494         self.body.append(self.starttag(node, 'acronym', ''))
 495
 496     def depart_acronym(self, node):
 497         self.body.append('</acronym>')
 498
 499     def visit_address(self, node):
 500         self.visit_docinfo_item(node, 'address', meta=False)
 501         self.body.append(self.starttag(node, 'pre', CLASS='address'))
 502
 503     def depart_address(self, node):
 504         self.body.append('\n</pre>\n')
 505         self.depart_docinfo_item()
 506
 507     def visit_admonition(self, node):
 508         self.body.append(self.starttag(node, 'div'))
 509         self.set_first_last(node)
 510
 511     def depart_admonition(self, node=None):
 512         self.body.append('</div>\n')
 513
 514     attribution_formats = {'dash': ('&mdash;', ''),
 515                            'parentheses': ('(', ')'),
 516                            'parens': ('(', ')'),
 517                            'none': ('', '')}
 518
 519     def visit_attribution(self, node):
 520         prefix, suffix = self.attribution_formats[self.settings.attribution]
 521         self.context.append(suffix)
 522         self.body.append(
 523             self.starttag(node, 'p', prefix, CLASS='attribution'))
 524
 525     def depart_attribution(self, node):
 526         self.body.append(self.context.pop() + '</p>\n')
 527
 528     def visit_author(self, node):
 529         if isinstance(node.parent, nodes.authors):
 530             if self.author_in_authors:
 531                 self.body.append('\n<br />')
 532         else:
 533             self.visit_docinfo_item(node, 'author')
 534
 535     def depart_author(self, node):
 536         if isinstance(node.parent, nodes.authors):
 537             self.author_in_authors = True
 538         else:
 539             self.depart_docinfo_item()
 540
 541     def visit_authors(self, node):
 542         self.visit_docinfo_item(node, 'authors')
 543         self.author_in_authors = False  # initialize
 544
 545     def depart_authors(self, node):
 546         self.depart_docinfo_item()
 547
 548     def visit_block_quote(self, node):
 549         self.body.append(self.starttag(node, 'blockquote'))
 550
 551     def depart_block_quote(self, node):
 552         self.body.append('</blockquote>\n')
 553
 554     def check_simple_list(self, node):
 555         """Check for a simple list that can be rendered compactly."""
 556         visitor = SimpleListChecker(self.document)
 557         try:
 558             node.walk(visitor)
 559         except nodes.NodeFound:
 560             return None
 561         else:
 562             return 1
 563
 564     def is_compactable(self, node):
 565         return ('compact' in node['classes']
 566                 or (self.settings.compact_lists
 567                     and 'open' not in node['classes']
 568                     and (self.compact_simple
 569                          or self.topic_classes == ['contents']
 570                          or self.check_simple_list(node))))
 571
 572     def visit_bullet_list(self, node):
 573         atts = {}
 574         old_compact_simple = self.compact_simple
 575         self.context.append((self.compact_simple, self.compact_p))
 576         self.compact_p = None
 577         self.compact_simple = self.is_compactable(node)
 578         if self.compact_simple and not old_compact_simple:
 579             atts['class'] = 'simple'
 580         self.body.append(self.starttag(node, 'ul', **atts))
 581
 582     def depart_bullet_list(self, node):
 583         self.compact_simple, self.compact_p = self.context.pop()
 584         self.body.append('</ul>\n')
 585
 586     def visit_caption(self, node):
 587         self.body.append(self.starttag(node, 'p', '', CLASS='caption'))
 588
 589     def depart_caption(self, node):
 590         self.body.append('</p>\n')
 591
 592     def visit_citation(self, node):
 593         self.body.append(self.starttag(node, 'table',
 594                                        CLASS='docutils citation',
 595                                        frame="void", rules="none"))
 596         self.body.append('<colgroup><col class="label" /><col /></colgroup>\n'
 597                          '<tbody valign="top">\n'
 598                          '<tr>')
 599         self.footnote_backrefs(node)
 600
 601     def depart_citation(self, node):
 602         self.body.append('</td></tr>\n'
 603                          '</tbody>\n</table>\n')
 604
 605     def visit_citation_reference(self, node):
 606         href = '#'
 607         if 'refid' in node:
 608             href += node['refid']
 609         elif 'refname' in node:
 610             href += self.document.nameids[node['refname']]
 611         # else: # TODO system message (or already in the transform)?
 612         # 'Citation reference missing.'
 613         self.body.append(self.starttag(
 614             node, 'a', '[', CLASS='citation-reference', href=href))
 615
 616     def depart_citation_reference(self, node):
 617         self.body.append(']</a>')
 618
 619     def visit_classifier(self, node):
 620         self.body.append(' <span class="classifier-delimiter">:</span> ')
 621         self.body.append(self.starttag(node, 'span', '', CLASS='classifier'))
 622
 623     def depart_classifier(self, node):
 624         self.body.append('</span>')
 625
 626     def visit_colspec(self, node):
 627         self.colspecs.append(node)
 628         # "stubs" list is an attribute of the tgroup element:
 629         node.parent.stubs.append(node.attributes.get('stub'))
 630
 631     def depart_colspec(self, node):
 632         pass
 633
 634     def write_colspecs(self):
 635         width = 0
 636         for node in self.colspecs:
 637             width += node['colwidth']
 638         for node in self.colspecs:
 639             colwidth = int(node['colwidth'] * 100.0 / width + 0.5)
 640             self.body.append(self.emptytag(node, 'col',
 641                                            width='%i%%' % colwidth))
 642         self.colspecs = []
 643
 644     def visit_comment(self, node,
 645                       sub=re.compile('-(?=-)').sub):
 646         """Escape double-dashes in comment text."""
 647         self.body.append('<!-- %s -->\n' % sub('- ', node.astext()))
 648         # Content already processed:
 649         raise nodes.SkipNode
 650
 651     def visit_compound(self, node):
 652         self.body.append(self.starttag(node, 'div', CLASS='compound'))
 653         if len(node) > 1:
 654             node[0]['classes'].append('compound-first')
 655             node[-1]['classes'].append('compound-last')
 656             for child in node[1:-1]:
 657                 child['classes'].append('compound-middle')
 658
 659     def depart_compound(self, node):
 660         self.body.append('</div>\n')
 661
 662     def visit_container(self, node):
 663         self.body.append(self.starttag(node, 'div', CLASS='docutils container'))
 664
 665     def depart_container(self, node):
 666         self.body.append('</div>\n')
 667
 668     def visit_contact(self, node):
 669         self.visit_docinfo_item(node, 'contact', meta=False)
 670
 671     def depart_contact(self, node):
 672         self.depart_docinfo_item()
 673
 674     def visit_copyright(self, node):
 675         self.visit_docinfo_item(node, 'copyright')
 676
 677     def depart_copyright(self, node):
 678         self.depart_docinfo_item()
 679
 680     def visit_date(self, node):
 681         self.visit_docinfo_item(node, 'date')
 682
 683     def depart_date(self, node):
 684         self.depart_docinfo_item()
 685
 686     def visit_decoration(self, node):
 687         pass
 688
 689     def depart_decoration(self, node):
 690         pass
 691
 692     def visit_definition(self, node):
 693         self.body.append('</dt>\n')
 694         self.body.append(self.starttag(node, 'dd', ''))
 695         self.set_first_last(node)
 696
 697     def depart_definition(self, node):
 698         self.body.append('</dd>\n')
 699
 700     def visit_definition_list(self, node):
 701         self.body.append(self.starttag(node, 'dl', CLASS='docutils'))
 702
 703     def depart_definition_list(self, node):
 704         self.body.append('</dl>\n')
 705
 706     def visit_definition_list_item(self, node):
 707         pass
 708
 709     def depart_definition_list_item(self, node):
 710         pass
 711
 712     def visit_description(self, node):
 713         self.body.append(self.starttag(node, 'td', ''))
 714         self.set_first_last(node)
 715
 716     def depart_description(self, node):
 717         self.body.append('</td>')
 718
 719     def visit_docinfo(self, node):
 720         self.context.append(len(self.body))
 721         self.body.append(self.starttag(node, 'table',
 722                                        CLASS='docinfo',
 723                                        frame="void", rules="none"))
 724         self.body.append('<col class="docinfo-name" />\n'
 725                          '<col class="docinfo-content" />\n'
 726                          '<tbody valign="top">\n')
 727         self.in_docinfo = True
 728
 729     def depart_docinfo(self, node):
 730         self.body.append('</tbody>\n</table>\n')
 731         self.in_docinfo = False
 732         start = self.context.pop()
 733         self.docinfo = self.body[start:]
 734         self.body = []
 735
 736     def visit_docinfo_item(self, node, name, meta=True):
 737         if meta:
 738             meta_tag = '<meta name="%s" content="%s" />\n' \
 739                        % (name, self.attval(node.astext()))
 740             self.add_meta(meta_tag)
 741         self.body.append(self.starttag(node, 'tr', ''))
 742         self.body.append('<th class="docinfo-name">%s:</th>\n<td>'
 743                          % self.language.labels[name])
 744         if len(node):
 745             if isinstance(node[0], nodes.Element):
 746                 node[0]['classes'].append('first')
 747             if isinstance(node[-1], nodes.Element):
 748                 node[-1]['classes'].append('last')
 749
 750     def depart_docinfo_item(self):
 751         self.body.append('</td></tr>\n')
 752
 753     def visit_doctest_block(self, node):
 754         self.body.append(self.starttag(node, 'pre', CLASS='doctest-block'))
 755
 756     def depart_doctest_block(self, node):
 757         self.body.append('\n</pre>\n')
 758
 759     def visit_document(self, node):
 760         self.head.append('<title>%s</title>\n'
 761                          % self.encode(node.get('title', '')))
 762
 763     def depart_document(self, node):
 764         self.head_prefix.extend([self.doctype,
 765                                  self.head_prefix_template %
 766                                  {'lang': self.settings.language_code}])
 767         self.html_prolog.append(self.doctype)
 768         self.meta.insert(0, self.content_type % self.settings.output_encoding)
 769         self.head.insert(0, self.content_type % self.settings.output_encoding)
 770         if self.math_header:
 771             if self.math_output == 'mathjax':
 772                 self.head.extend(self.math_header)
 773             else:
 774                 self.stylesheet.extend(self.math_header)
 775         # skip content-type meta tag with interpolated charset value:
 776         self.html_head.extend(self.head[1:])
 777         self.body_prefix.append(self.starttag(node, 'div', CLASS='document'))
 778         self.body_suffix.insert(0, '</div>\n')
 779         self.fragment.extend(self.body) # self.fragment is the "naked" body
 780         self.html_body.extend(self.body_prefix[1:] + self.body_pre_docinfo
 781                               + self.docinfo + self.body
 782                               + self.body_suffix[:-1])
 783         assert not self.context, 'len(context) = %s' % len(self.context)
 784
 785     def visit_emphasis(self, node):
 786         self.body.append(self.starttag(node, 'em', ''))
 787
 788     def depart_emphasis(self, node):
 789         self.body.append('</em>')
 790
 791     def visit_entry(self, node):
 792         atts = {'class': []}
 793         if isinstance(node.parent.parent, nodes.thead):
 794             atts['class'].append('head')
 795         if node.parent.parent.parent.stubs[node.parent.column]:
 796             # "stubs" list is an attribute of the tgroup element
 797             atts['class'].append('stub')
 798         if atts['class']:
 799             tagname = 'th'
 800             atts['class'] = ' '.join(atts['class'])
 801         else:
 802             tagname = 'td'
 803             del atts['class']
 804         node.parent.column += 1
 805         if 'morerows' in node:
 806             atts['rowspan'] = node['morerows'] + 1
 807         if 'morecols' in node:
 808             atts['colspan'] = node['morecols'] + 1
 809             node.parent.column += node['morecols']
 810         self.body.append(self.starttag(node, tagname, '', **atts))
 811         self.context.append('</%s>\n' % tagname.lower())
 812         if len(node) == 0:              # empty cell
 813             self.body.append('&nbsp;')
 814         self.set_first_last(node)
 815
 816     def depart_entry(self, node):
 817         self.body.append(self.context.pop())
 818
 819     def visit_enumerated_list(self, node):
 820         """
 821         The 'start' attribute does not conform to HTML 4.01's strict.dtd, but
 822         CSS1 doesn't help. CSS2 isn't widely enough supported yet to be
 823         usable.
 824         """
 825         atts = {}
 826         if 'start' in node:
 827             atts['start'] = node['start']
 828         if 'enumtype' in node:
 829             atts['class'] = node['enumtype']
 830         # @@@ To do: prefix, suffix. How? Change prefix/suffix to a
 831         # single "format" attribute? Use CSS2?
 832         old_compact_simple = self.compact_simple
 833         self.context.append((self.compact_simple, self.compact_p))
 834         self.compact_p = None
 835         self.compact_simple = self.is_compactable(node)
 836         if self.compact_simple and not old_compact_simple:
 837             atts['class'] = (atts.get('class', '') + ' simple').strip()
 838         self.body.append(self.starttag(node, 'ol', **atts))
 839
 840     def depart_enumerated_list(self, node):
 841         self.compact_simple, self.compact_p = self.context.pop()
 842         self.body.append('</ol>\n')
 843
 844     def visit_field(self, node):
 845         self.body.append(self.starttag(node, 'tr', '', CLASS='field'))
 846
 847     def depart_field(self, node):
 848         self.body.append('</tr>\n')
 849
 850     def visit_field_body(self, node):
 851         self.body.append(self.starttag(node, 'td', '', CLASS='field-body'))
 852         self.set_class_on_child(node, 'first', 0)
 853         field = node.parent
 854         if (self.compact_field_list or
 855             isinstance(field.parent, nodes.docinfo) or
 856             field.parent.index(field) == len(field.parent) - 1):
 857             # If we are in a compact list, the docinfo, or if this is
 858             # the last field of the field list, do not add vertical
 859             # space after last element.
 860             self.set_class_on_child(node, 'last', -1)
 861
 862     def depart_field_body(self, node):
 863         self.body.append('</td>\n')
 864
 865     def visit_field_list(self, node):
 866         self.context.append((self.compact_field_list, self.compact_p))
 867         self.compact_p = None
 868         if 'compact' in node['classes']:
 869             self.compact_field_list = True
 870         elif (self.settings.compact_field_lists
 871               and 'open' not in node['classes']):
 872             self.compact_field_list = True
 873         if self.compact_field_list:
 874             for field in node:
 875                 field_body = field[-1]
 876                 assert isinstance(field_body, nodes.field_body)
 877                 children = [n for n in field_body
 878                             if not isinstance(n, nodes.Invisible)]
 879                 if not (len(children) == 0 or
 880                         len(children) == 1 and
 881                         isinstance(children[0],
 882                                    (nodes.paragraph, nodes.line_block))):
 883                     self.compact_field_list = False
 884                     break
 885         self.body.append(self.starttag(node, 'table', frame='void',
 886                                        rules='none',
 887                                        CLASS='docutils field-list'))
 888         self.body.append('<col class="field-name" />\n'
 889                          '<col class="field-body" />\n'
 890                          '<tbody valign="top">\n')
 891
 892     def depart_field_list(self, node):
 893         self.body.append('</tbody>\n</table>\n')
 894         self.compact_field_list, self.compact_p = self.context.pop()
 895
 896     def visit_field_name(self, node):
 897         atts = {}
 898         if self.in_docinfo:
 899             atts['class'] = 'docinfo-name'
 900         else:
 901             atts['class'] = 'field-name'
 902         if ( self.settings.field_name_limit
 903              and len(node.astext()) > self.settings.field_name_limit):
 904             atts['colspan'] = 2
 905             self.context.append('</tr>\n'
 906                                 + self.starttag(node.parent, 'tr', '',
 907                                                 CLASS='field')
 908                                 + '<td>&nbsp;</td>')
 909         else:
 910             self.context.append('')
 911         self.body.append(self.starttag(node, 'th', '', **atts))
 912
 913     def depart_field_name(self, node):
 914         self.body.append(':</th>')
 915         self.body.append(self.context.pop())
 916
 917     def visit_figure(self, node):
 918         atts = {'class': 'figure'}
 919         if node.get('width'):
 920             atts['style'] = 'width: %s' % node['width']
 921         if node.get('align'):
 922             atts['class'] += " align-" + node['align']
 923         self.body.append(self.starttag(node, 'div', **atts))
 924
 925     def depart_figure(self, node):
 926         self.body.append('</div>\n')
 927
 928     def visit_footer(self, node):
 929         self.context.append(len(self.body))
 930
 931     def depart_footer(self, node):
 932         start = self.context.pop()
 933         footer = [self.starttag(node, 'div', CLASS='footer'),
 934                   '<hr class="footer" />\n']
 935         footer.extend(self.body[start:])
 936         footer.append('\n</div>\n')
 937         self.footer.extend(footer)
 938         self.body_suffix[:0] = footer
 939         del self.body[start:]
 940
 941     def visit_footnote(self, node):
 942         self.body.append(self.starttag(node, 'table',
 943                                        CLASS='docutils footnote',
 944                                        frame="void", rules="none"))
 945         self.body.append('<colgroup><col class="label" /><col /></colgroup>\n'
 946                          '<tbody valign="top">\n'
 947                          '<tr>')
 948         self.footnote_backrefs(node)
 949
 950     def footnote_backrefs(self, node):
 951         backlinks = []
 952         backrefs = node['backrefs']
 953         if self.settings.footnote_backlinks and backrefs:
 954             if len(backrefs) == 1:
 955                 self.context.append('')
 956                 self.context.append('</a>')
 957                 self.context.append('<a class="fn-backref" href="#%s">'
 958                                     % backrefs[0])
 959             else:
 960                 i = 1
 961                 for backref in backrefs:
 962                     backlinks.append('<a class="fn-backref" href="#%s">%s</a>'
 963                                      % (backref, i))
 964                     i += 1
 965                 self.context.append('<em>(%s)</em> ' % ', '.join(backlinks))
 966                 self.context += ['', '']
 967         else:
 968             self.context.append('')
 969             self.context += ['', '']
 970         # If the node does not only consist of a label.
 971         if len(node) > 1:
 972             # If there are preceding backlinks, we do not set class
 973             # 'first', because we need to retain the top-margin.
 974             if not backlinks:
 975                 node[1]['classes'].append('first')
 976             node[-1]['classes'].append('last')
 977
 978     def depart_footnote(self, node):
 979         self.body.append('</td></tr>\n'
 980                          '</tbody>\n</table>\n')
 981
 982     def visit_footnote_reference(self, node):
 983         href = '#' + node['refid']
 984         format = self.settings.footnote_references
 985         if format == 'brackets':
 986             suffix = '['
 987             self.context.append(']')
 988         else:
 989             assert format == 'superscript'
 990             suffix = '<sup>'
 991             self.context.append('</sup>')
 992         self.body.append(self.starttag(node, 'a', suffix,
 993                                        CLASS='footnote-reference', href=href))
 994
 995     def depart_footnote_reference(self, node):
 996         self.body.append(self.context.pop() + '</a>')
 997
 998     def visit_generated(self, node):
 999         pass
1000
1001     def depart_generated(self, node):
1002         pass
1003
1004     def visit_header(self, node):
1005         self.context.append(len(self.body))
1006
1007     def depart_header(self, node):
1008         start = self.context.pop()
1009         header = [self.starttag(node, 'div', CLASS='header')]
1010         header.extend(self.body[start:])
1011         header.append('\n<hr class="header"/>\n</div>\n')
1012         self.body_prefix.extend(header)
1013         self.header.extend(header)
1014         del self.body[start:]
1015
1016     # Image types to place in an <object> element
1017     # SVG not supported by IE up to version 8
1018     # (html4css1 strives for IE6 compatibility)
1019     object_image_types = {'.svg': 'image/svg+xml',
1020                          '.swf': 'application/x-shockwave-flash'}
1021
1022     def visit_image(self, node):
1023         atts = {}
1024         uri = node['uri']
1025         ext = os.path.splitext(uri)[1].lower()
1026         if ext in self.object_image_types: # ('.svg', '.swf'):
1027             atts['data'] = uri
1028             atts['type'] = self.object_image_types[ext]
1029         else:
1030             atts['src'] = uri
1031             atts['alt'] = node.get('alt', uri)
1032         # image size
1033         if 'width' in node:
1034             atts['width'] = node['width']
1035         if 'height' in node:
1036             atts['height'] = node['height']
1037         if 'scale' in node:
1038             if (PIL and not ('width' in node and 'height' in node)
1039                 and self.settings.file_insertion_enabled):
1040                 imagepath = urllib.url2pathname(uri)
1041                 try:
1042                     img = PIL.Image.open(
1043                             imagepath.encode(sys.getfilesystemencoding()))
1044                 except (IOError, UnicodeEncodeError):
1045                     pass # TODO: warn?
1046                 else:
1047                     self.settings.record_dependencies.add(
1048                         imagepath.replace('\\', '/'))
1049                     if 'width' not in atts:
1050                         atts['width'] = '%dpx' % img.size[0]
1051                     if 'height' not in atts:
1052                         atts['height'] = '%dpx' % img.size[1]
1053                     del img
1054             for att_name in 'width', 'height':
1055                 if att_name in atts:
1056                     match = re.match(r'([0-9.]+)(\S*)$', atts[att_name])
1057                     assert match
1058                     atts[att_name] = '%s%s' % (
1059                         float(match.group(1)) * (float(node['scale']) / 100),
1060                         match.group(2))
1061         style = []
1062         for att_name in 'width', 'height':
1063             if att_name in atts:
1064                 if re.match(r'^[0-9.]+$', atts[att_name]):
1065                     # Interpret unitless values as pixels.
1066                     atts[att_name] += 'px'
1067                 style.append('%s: %s;' % (att_name, atts[att_name]))
1068                 del atts[att_name]
1069         if style:
1070             atts['style'] = ' '.join(style)
1071         if (isinstance(node.parent, nodes.TextElement) or
1072             (isinstance(node.parent, nodes.reference) and
1073              not isinstance(node.parent.parent, nodes.TextElement))):
1074             # Inline context or surrounded by <a>...</a>.
1075             suffix = ''
1076         else:
1077             suffix = '\n'
1078         if 'align' in node:
1079             atts['class'] = 'align-%s' % node['align']
1080         if ext in self.object_image_types: # ('.svg', '.swf')
1081             # do NOT use an empty tag: incorrect rendering in browsers
1082             self.body.append(self.starttag(node, 'object', suffix, **atts) +
1083                              node.get('alt', uri) + '</object>' + suffix)
1084         else:
1085             self.body.append(self.emptytag(node, 'img', suffix, **atts))
1086
1087     def depart_image(self, node):
1088         # self.body.append(self.context.pop())
1089         pass
1090
1091     def visit_inline(self, node):
1092         self.body.append(self.starttag(node, 'span', ''))
1093
1094     def depart_inline(self, node):
1095         self.body.append('</span>')
1096
1097     def visit_label(self, node):
1098         # Context added in footnote_backrefs.
1099         self.body.append(self.starttag(node, 'td', '%s[' % self.context.pop(),
1100                                        CLASS='label'))
1101
1102     def depart_label(self, node):
1103         # Context added in footnote_backrefs.
1104         self.body.append(']%s</td><td>%s' % (self.context.pop(), self.context.pop()))
1105
1106     def visit_legend(self, node):
1107         self.body.append(self.starttag(node, 'div', CLASS='legend'))
1108
1109     def depart_legend(self, node):
1110         self.body.append('</div>\n')
1111
1112     def visit_line(self, node):
1113         self.body.append(self.starttag(node, 'div', suffix='', CLASS='line'))
1114         if not len(node):
1115             self.body.append('<br />')
1116
1117     def depart_line(self, node):
1118         self.body.append('</div>\n')
1119
1120     def visit_line_block(self, node):
1121         self.body.append(self.starttag(node, 'div', CLASS='line-block'))
1122
1123     def depart_line_block(self, node):
1124         self.body.append('</div>\n')
1125
1126     def visit_list_item(self, node):
1127         self.body.append(self.starttag(node, 'li', ''))
1128         if len(node):
1129             node[0]['classes'].append('first')
1130
1131     def depart_list_item(self, node):
1132         self.body.append('</li>\n')
1133
1134     def visit_literal(self, node):
1135         # special case: "code" role
1136         classes = node.get('classes', [])
1137         if 'code' in classes:
1138             # filter 'code' from class arguments
1139             node['classes'] = [cls for cls in classes if cls != 'code']
1140             self.body.append(self.starttag(node, 'code', ''))
1141             return
1142         self.body.append(
1143             self.starttag(node, 'tt', '', CLASS='docutils literal'))
1144         text = node.astext()
1145         for token in self.words_and_spaces.findall(text):
1146             if token.strip():
1147                 # Protect text like "--an-option" and the regular expression
1148                 # ``[+]?(\d+(\.\d*)?|\.\d+)`` from bad line wrapping
1149                 if self.sollbruchstelle.search(token):
1150                     self.body.append('<span class="pre">%s</span>'
1151                                      % self.encode(token))
1152                 else:
1153                     self.body.append(self.encode(token))
1154             elif token in ('\n', ' '):
1155                 # Allow breaks at whitespace:
1156                 self.body.append(token)
1157             else:
1158                 # Protect runs of multiple spaces; the last space can wrap:
1159                 self.body.append('&nbsp;' * (len(token) - 1) + ' ')
1160         self.body.append('</tt>')
1161         # Content already processed:
1162         raise nodes.SkipNode
1163
1164     def depart_literal(self, node):
1165         # skipped unless literal element is from "code" role:
1166         self.body.append('</code>')
1167
1168     def visit_literal_block(self, node):
1169         self.body.append(self.starttag(node, 'pre', CLASS='literal-block'))
1170
1171     def depart_literal_block(self, node):
1172         self.body.append('\n</pre>\n')
1173
    def visit_math(self, node, math_env=''):
        """Write a math node in the format selected by ``self.math_output``.

        `math_env` is the empty string for inline math; when the method
        is called from ``visit_math_block()`` it is the name of the LaTeX
        environment and the output is formatted as a block.

        An unsupported ``math_output`` value is reported as an error and
        replaced by "latex".  The method always ends by raising
        ``nodes.SkipNode`` because the node content is written here.
        """
        # If the method is called from visit_math_block(), math_env != ''.

        # As there is no native HTML math support, we provide alternatives:
        # LaTeX and MathJax math_output modes simply wrap the content,
        # HTML and MathML math_output modes also convert the math_code.
        if self.math_output not in ('mathml', 'html', 'mathjax', 'latex'):
            self.document.reporter.error(
                'math-output format "%s" not supported '
                'falling back to "latex"'% self.math_output)
            self.math_output = 'latex'
        #
        # HTML container
        tags = {# math_output: (block, inline, class-arguments)
                'mathml':      ('div', '', ''),
                'html':        ('div', 'span', 'formula'),
                'mathjax':     ('div', 'span', 'math'),
                'latex':       ('pre', 'tt',   'math'),
               }
        # The boolean is used as index: 0 = block tag, 1 = inline tag.
        tag = tags[self.math_output][math_env == '']
        clsarg = tags[self.math_output][2]
        # LaTeX container
        wrappers = {# math_output: (inline, block)
                    'mathml':  (None,     None),
                    'html':    ('$%s$',   u'\\begin{%s}\n%s\n\\end{%s}'),
                    'mathjax': ('\(%s\)', u'\\begin{%s}\n%s\n\\end{%s}'),
                    'latex':   (None,     None),
                   }
        # The boolean is used as index: 0 = inline wrapper, 1 = block wrapper.
        wrapper = wrappers[self.math_output][math_env != '']
        # get and wrap content
        math_code = node.astext().translate(unichar2tex.uni2tex_table)
        if wrapper and math_env:
            math_code = wrapper % (math_env, math_code, math_env)
        elif wrapper:
            math_code = wrapper % math_code
        # settings and conversion
        if self.math_output in ('latex', 'mathjax'):
            math_code = self.encode(math_code)
        if self.math_output == 'mathjax' and not self.math_header:
            # First MathJax formula: set up the script header, using the
            # URL from the math output options if one is given.
            if self.math_output_options:
                self.mathjax_url = self.math_output_options[0]
            self.math_header = [self.mathjax_script % self.mathjax_url]
        elif self.math_output == 'html':
            # The first option is a comma-separated list of style sheets
            # that are looked up in the stylesheet directories.
            if self.math_output_options and not self.math_header:
                self.math_header = [self.stylesheet_call(
                    utils.find_file_in_dirs(s, self.settings.stylesheet_dirs))
                    for s in self.math_output_options[0].split(',')]
            # TODO: fix display mode in matrices and fractions
            math2html.DocumentParameters.displaymode = (math_env != '')
            math_code = math2html.math2html(math_code)
        elif self.math_output == 'mathml':
            self.doctype = self.doctype_mathml
            self.content_type = self.content_type_mathml
            try:
                mathml_tree = parse_latex_math(math_code, inline=not(math_env))
                math_code = ''.join(mathml_tree.xml())
            except SyntaxError, err:
                # Conversion failed: write a system message that shows
                # the error and the LaTeX source instead of the formula.
                # NOTE(review): the error arguments are appended without
                # self.encode() -- confirm they cannot contain markup.
                err_node = self.document.reporter.error(err, base_node=node)
                self.visit_system_message(err_node)
                self.body.append(self.starttag(node, 'p'))
                self.body.append(u','.join(err.args))
                self.body.append('</p>\n')
                self.body.append(self.starttag(node, 'pre',
                                               CLASS='literal-block'))
                self.body.append(self.encode(math_code))
                self.body.append('\n</pre>\n')
                self.depart_system_message(err_node)
                raise nodes.SkipNode
        # append to document body
        if tag:
            # The start tag is followed by a newline in block mode only.
            self.body.append(self.starttag(node, tag,
                                           suffix='\n'*bool(math_env),
                                           CLASS=clsarg))
        self.body.append(math_code)
        if math_env: # block mode (equation, display)
            self.body.append('\n')
        if tag:
            self.body.append('</%s>' % tag)
        if math_env:
            self.body.append('\n')
        # Content already processed:
        raise nodes.SkipNode
1256
1257     def depart_math(self, node):
1258         pass # never reached
1259
1260     def visit_math_block(self, node):
1261         # print node.astext().encode('utf8')
1262         math_env = pick_math_environment(node.astext())
1263         self.visit_math(node, math_env=math_env)
1264
1265     def depart_math_block(self, node):
1266         pass # never reached
1267
1268     def visit_meta(self, node):
1269         meta = self.emptytag(node, 'meta', **node.non_default_attributes())
1270         self.add_meta(meta)
1271
1272     def depart_meta(self, node):
1273         pass
1274
1275     def add_meta(self, tag):
1276         self.meta.append(tag)
1277         self.head.append(tag)
1278
1279     def visit_option(self, node):
1280         if self.context[-1]:
1281             self.body.append(', ')
1282         self.body.append(self.starttag(node, 'span', '', CLASS='option'))
1283
1284     def depart_option(self, node):
1285         self.body.append('</span>')
1286         self.context[-1] += 1
1287
1288     def visit_option_argument(self, node):
1289         self.body.append(node.get('delimiter', ' '))
1290         self.body.append(self.starttag(node, 'var', ''))
1291
1292     def depart_option_argument(self, node):
1293         self.body.append('</var>')
1294
1295     def visit_option_group(self, node):
1296         atts = {}
1297         if ( self.settings.option_limit
1298              and len(node.astext()) > self.settings.option_limit):
1299             atts['colspan'] = 2
1300             self.context.append('</tr>\n<tr><td>&nbsp;</td>')
1301         else:
1302             self.context.append('')
1303         self.body.append(
1304             self.starttag(node, 'td', CLASS='option-group', **atts))
1305         self.body.append('<kbd>')
1306         self.context.append(0)          # count number of options
1307
1308     def depart_option_group(self, node):
1309         self.context.pop()
1310         self.body.append('</kbd></td>\n')
1311         self.body.append(self.context.pop())
1312
1313     def visit_option_list(self, node):
1314         self.body.append(
1315               self.starttag(node, 'table', CLASS='docutils option-list',
1316                             frame="void", rules="none"))
1317         self.body.append('<col class="option" />\n'
1318                          '<col class="description" />\n'
1319                          '<tbody valign="top">\n')
1320
1321     def depart_option_list(self, node):
1322         self.body.append('</tbody>\n</table>\n')
1323
1324     def visit_option_list_item(self, node):
1325         self.body.append(self.starttag(node, 'tr', ''))
1326
1327     def depart_option_list_item(self, node):
1328         self.body.append('</tr>\n')
1329
1330     def visit_option_string(self, node):
1331         pass
1332
1333     def depart_option_string(self, node):
1334         pass
1335
1336     def visit_organization(self, node):
1337         self.visit_docinfo_item(node, 'organization')
1338
1339     def depart_organization(self, node):
1340         self.depart_docinfo_item()
1341
1342     def should_be_compact_paragraph(self, node):
1343         """
1344         Determine if the <p> tags around paragraph ``node`` can be omitted.
1345         """
1346         if (isinstance(node.parent, nodes.document) or
1347             isinstance(node.parent, nodes.compound)):
1348             # Never compact paragraphs in document or compound.
1349             return False
1350         for key, value in node.attlist():
1351             if (node.is_not_default(key) and
1352                 not (key == 'classes' and value in
1353                      ([], ['first'], ['last'], ['first', 'last']))):
1354                 # Attribute which needs to survive.
1355                 return False
1356         first = isinstance(node.parent[0], nodes.label) # skip label
1357         for child in node.parent.children[first:]:
1358             # only first paragraph can be compact
1359             if isinstance(child, nodes.Invisible):
1360                 continue
1361             if child is node:
1362                 break
1363             return False
1364         parent_length = len([n for n in node.parent if not isinstance(
1365             n, (nodes.Invisible, nodes.label))])
1366         if ( self.compact_simple
1367              or self.compact_field_list
1368              or self.compact_p and parent_length == 1):
1369             return True
1370         return False
1371
1372     def visit_paragraph(self, node):
1373         if self.should_be_compact_paragraph(node):
1374             self.context.append('')
1375         else:
1376             self.body.append(self.starttag(node, 'p', ''))
1377             self.context.append('</p>\n')
1378
1379     def depart_paragraph(self, node):
1380         self.body.append(self.context.pop())
1381
1382     def visit_problematic(self, node):
1383         if node.hasattr('refid'):
1384             self.body.append('<a href="#%s">' % node['refid'])
1385             self.context.append('</a>')
1386         else:
1387             self.context.append('')
1388         self.body.append(self.starttag(node, 'span', '', CLASS='problematic'))
1389
1390     def depart_problematic(self, node):
1391         self.body.append('</span>')
1392         self.body.append(self.context.pop())
1393
1394     def visit_raw(self, node):
1395         if 'html' in node.get('format', '').split():
1396             t = isinstance(node.parent, nodes.TextElement) and 'span' or 'div'
1397             if node['classes']:
1398                 self.body.append(self.starttag(node, t, suffix=''))
1399             self.body.append(node.astext())
1400             if node['classes']:
1401                 self.body.append('</%s>' % t)
1402         # Keep non-HTML raw text out of output:
1403         raise nodes.SkipNode
1404
1405     def visit_reference(self, node):
1406         atts = {'class': 'reference'}
1407         if 'refuri' in node:
1408             atts['href'] = node['refuri']
1409             if ( self.settings.cloak_email_addresses
1410                  and atts['href'].startswith('mailto:')):
1411                 atts['href'] = self.cloak_mailto(atts['href'])
1412                 self.in_mailto = True
1413             atts['class'] += ' external'
1414         else:
1415             assert 'refid' in node, \
1416                    'References must have "refuri" or "refid" attribute.'
1417             atts['href'] = '#' + node['refid']
1418             atts['class'] += ' internal'
1419         if not isinstance(node.parent, nodes.TextElement):
1420             assert len(node) == 1 and isinstance(node[0], nodes.image)
1421             atts['class'] += ' image-reference'
1422         self.body.append(self.starttag(node, 'a', '', **atts))
1423
1424     def depart_reference(self, node):
1425         self.body.append('</a>')
1426         if not isinstance(node.parent, nodes.TextElement):
1427             self.body.append('\n')
1428         self.in_mailto = False
1429
1430     def visit_revision(self, node):
1431         self.visit_docinfo_item(node, 'revision', meta=False)
1432
1433     def depart_revision(self, node):
1434         self.depart_docinfo_item()
1435
1436     def visit_row(self, node):
1437         self.body.append(self.starttag(node, 'tr', ''))
1438         node.column = 0
1439
1440     def depart_row(self, node):
1441         self.body.append('</tr>\n')
1442
1443     def visit_rubric(self, node):
1444         self.body.append(self.starttag(node, 'p', '', CLASS='rubric'))
1445
1446     def depart_rubric(self, node):
1447         self.body.append('</p>\n')
1448
1449     def visit_section(self, node):
1450         self.section_level += 1
1451         self.body.append(
1452             self.starttag(node, 'div', CLASS='section'))
1453
1454     def depart_section(self, node):
1455         self.section_level -= 1
1456         self.body.append('</div>\n')
1457
1458     def visit_sidebar(self, node):
1459         self.body.append(
1460             self.starttag(node, 'div', CLASS='sidebar'))
1461         self.set_first_last(node)
1462         self.in_sidebar = True
1463
1464     def depart_sidebar(self, node):
1465         self.body.append('</div>\n')
1466         self.in_sidebar = False
1467
1468     def visit_status(self, node):
1469         self.visit_docinfo_item(node, 'status', meta=False)
1470
1471     def depart_status(self, node):
1472         self.depart_docinfo_item()
1473
1474     def visit_strong(self, node):
1475         self.body.append(self.starttag(node, 'strong', ''))
1476
1477     def depart_strong(self, node):
1478         self.body.append('</strong>')
1479
1480     def visit_subscript(self, node):
1481         self.body.append(self.starttag(node, 'sub', ''))
1482
1483     def depart_subscript(self, node):
1484         self.body.append('</sub>')
1485
1486     def visit_substitution_definition(self, node):
1487         """Internal only."""
1488         raise nodes.SkipNode
1489
1490     def visit_substitution_reference(self, node):
1491         self.unimplemented_visit(node)
1492
1493     def visit_subtitle(self, node):
1494         if isinstance(node.parent, nodes.sidebar):
1495             self.body.append(self.starttag(node, 'p', '',
1496                                            CLASS='sidebar-subtitle'))
1497             self.context.append('</p>\n')
1498         elif isinstance(node.parent, nodes.document):
1499             self.body.append(self.starttag(node, 'h2', '', CLASS='subtitle'))
1500             self.context.append('</h2>\n')
1501             self.in_document_title = len(self.body)
1502         elif isinstance(node.parent, nodes.section):
1503             tag = 'h%s' % (self.section_level + self.initial_header_level - 1)
1504             self.body.append(
1505                 self.starttag(node, tag, '', CLASS='section-subtitle') +
1506                 self.starttag({}, 'span', '', CLASS='section-subtitle'))
1507             self.context.append('</span></%s>\n' % tag)
1508
1509     def depart_subtitle(self, node):
1510         self.body.append(self.context.pop())
1511         if self.in_document_title:
1512             self.subtitle = self.body[self.in_document_title:-1]
1513             self.in_document_title = 0
1514             self.body_pre_docinfo.extend(self.body)
1515             self.html_subtitle.extend(self.body)
1516             del self.body[:]
1517
1518     def visit_superscript(self, node):
1519         self.body.append(self.starttag(node, 'sup', ''))
1520
1521     def depart_superscript(self, node):
1522         self.body.append('</sup>')
1523
1524     def visit_system_message(self, node):
1525         self.body.append(self.starttag(node, 'div', CLASS='system-message'))
1526         self.body.append('<p class="system-message-title">')
1527         backref_text = ''
1528         if len(node['backrefs']):
1529             backrefs = node['backrefs']
1530             if len(backrefs) == 1:
1531                 backref_text = ('; <em><a href="#%s">backlink</a></em>'
1532                                 % backrefs[0])
1533             else:
1534                 i = 1
1535                 backlinks = []
1536                 for backref in backrefs:
1537                     backlinks.append('<a href="#%s">%s</a>' % (backref, i))
1538                     i += 1
1539                 backref_text = ('; <em>backlinks: %s</em>'
1540                                 % ', '.join(backlinks))
1541         if node.hasattr('line'):
1542             line = ', line %s' % node['line']
1543         else:
1544             line = ''
1545         self.body.append('System Message: %s/%s '
1546                          '(<tt class="docutils">%s</tt>%s)%s</p>\n'
1547                          % (node['type'], node['level'],
1548                             self.encode(node['source']), line, backref_text))
1549
1550     def depart_system_message(self, node):
1551         self.body.append('</div>\n')
1552
1553     def visit_table(self, node):
1554         self.context.append(self.compact_p)
1555         self.compact_p = True
1556         classes = ' '.join(['docutils', self.settings.table_style]).strip()
1557         self.body.append(
1558             self.starttag(node, 'table', CLASS=classes, border="1"))
1559
1560     def depart_table(self, node):
1561         self.compact_p = self.context.pop()
1562         self.body.append('</table>\n')
1563
1564     def visit_target(self, node):
1565         if not ('refuri' in node or 'refid' in node
1566                 or 'refname' in node):
1567             self.body.append(self.starttag(node, 'span', '', CLASS='target'))
1568             self.context.append('</span>')
1569         else:
1570             self.context.append('')
1571
1572     def depart_target(self, node):
1573         self.body.append(self.context.pop())
1574
1575     def visit_tbody(self, node):
1576         self.write_colspecs()
1577         self.body.append(self.context.pop()) # '</colgroup>\n' or ''
1578         self.body.append(self.starttag(node, 'tbody', valign='top'))
1579
1580     def depart_tbody(self, node):
1581         self.body.append('</tbody>\n')
1582
1583     def visit_term(self, node):
1584         self.body.append(self.starttag(node, 'dt', ''))
1585
1586     def depart_term(self, node):
1587         """
1588         Leave the end tag to `self.visit_definition()`, in case there's a
1589         classifier.
1590         """
1591         pass
1592
1593     def visit_tgroup(self, node):
1594         # Mozilla needs <colgroup>:
1595         self.body.append(self.starttag(node, 'colgroup'))
1596         # Appended by thead or tbody:
1597         self.context.append('</colgroup>\n')
1598         node.stubs = []
1599
1600     def depart_tgroup(self, node):
1601         pass
1602
1603     def visit_thead(self, node):
1604         self.write_colspecs()
1605         self.body.append(self.context.pop()) # '</colgroup>\n'
1606         # There may or may not be a <thead>; this is for <tbody> to use:
1607         self.context.append('')
1608         self.body.append(self.starttag(node, 'thead', valign='bottom'))
1609
1610     def depart_thead(self, node):
1611         self.body.append('</thead>\n')
1612
1613     def visit_title(self, node):
1614         """Only 6 section levels are supported by HTML."""
1615         check_id = 0  # TODO: is this a bool (False) or a counter?
1616         close_tag = '</p>\n'
1617         if isinstance(node.parent, nodes.topic):
1618             self.body.append(
1619                   self.starttag(node, 'p', '', CLASS='topic-title first'))
1620         elif isinstance(node.parent, nodes.sidebar):
1621             self.body.append(
1622                   self.starttag(node, 'p', '', CLASS='sidebar-title'))
1623         elif isinstance(node.parent, nodes.Admonition):
1624             self.body.append(
1625                   self.starttag(node, 'p', '', CLASS='admonition-title'))
1626         elif isinstance(node.parent, nodes.table):
1627             self.body.append(
1628                   self.starttag(node, 'caption', ''))
1629             close_tag = '</caption>\n'
1630         elif isinstance(node.parent, nodes.document):
1631             self.body.append(self.starttag(node, 'h1', '', CLASS='title'))
1632             close_tag = '</h1>\n'
1633             self.in_document_title = len(self.body)
1634         else:
1635             assert isinstance(node.parent, nodes.section)
1636             h_level = self.section_level + self.initial_header_level - 1
1637             atts = {}
1638             if (len(node.parent) >= 2 and
1639                 isinstance(node.parent[1], nodes.subtitle)):
1640                 atts['CLASS'] = 'with-subtitle'
1641             self.body.append(
1642                   self.starttag(node, 'h%s' % h_level, '', **atts))
1643             atts = {}
1644             if node.hasattr('refid'):
1645                 atts['class'] = 'toc-backref'
1646                 atts['href'] = '#' + node['refid']
1647             if atts:
1648                 self.body.append(self.starttag({}, 'a', '', **atts))
1649                 close_tag = '</a></h%s>\n' % (h_level)
1650             else:
1651                 close_tag = '</h%s>\n' % (h_level)
1652         self.context.append(close_tag)
1653
1654     def depart_title(self, node):
1655         self.body.append(self.context.pop())
1656         if self.in_document_title:
1657             self.title = self.body[self.in_document_title:-1]
1658             self.in_document_title = 0
1659             self.body_pre_docinfo.extend(self.body)
1660             self.html_title.extend(self.body)
1661             del self.body[:]
1662
1663     def visit_title_reference(self, node):
1664         self.body.append(self.starttag(node, 'cite', ''))
1665
1666     def depart_title_reference(self, node):
1667         self.body.append('</cite>')
1668
1669     def visit_topic(self, node):
1670         self.body.append(self.starttag(node, 'div', CLASS='topic'))
1671         self.topic_classes = node['classes']
1672
1673     def depart_topic(self, node):
1674         self.body.append('</div>\n')
1675         self.topic_classes = []
1676
1677     def visit_transition(self, node):
1678         self.body.append(self.emptytag(node, 'hr', CLASS='docutils'))
1679
1680     def depart_transition(self, node):
1681         pass
1682
1683     def visit_version(self, node):
1684         self.visit_docinfo_item(node, 'version', meta=False)
1685
1686     def depart_version(self, node):
1687         self.depart_docinfo_item()
1688
1689     def unimplemented_visit(self, node):
1690         raise NotImplementedError('visiting unimplemented node type: %s'
1691                                   % node.__class__.__name__)
1692
1693
class SimpleListChecker(nodes.GenericNodeVisitor):

    """
    Raise `nodes.NodeFound` if non-simple list item is encountered.

    Here "simple" means a list item containing nothing other than a single
    paragraph, a simple list, or a paragraph followed by a simple list.
    """

    def default_visit(self, node):
        """Any node type without its own handler makes the list non-simple."""
        raise nodes.NodeFound

    def visit_bullet_list(self, node):
        """Bullet lists are allowed; their items are checked individually."""
        pass

    def visit_enumerated_list(self, node):
        """Enumerated lists are allowed; their items are checked individually."""
        pass

    def visit_list_item(self, node):
        """
        Raise `nodes.NodeFound` unless the item's visible children are at
        most one node, or a paragraph followed by a single nested list.
        """
        visible = [child for child in node.children
                   if not isinstance(child, nodes.Invisible)]
        # A trailing nested list after a leading paragraph does not count.
        if (visible and isinstance(visible[0], nodes.paragraph)
            and isinstance(visible[-1],
                           (nodes.bullet_list, nodes.enumerated_list))):
            del visible[-1]
        if len(visible) > 1:
            raise nodes.NodeFound

    def visit_paragraph(self, node):
        """Paragraphs are allowed; their content is not inspected."""
        raise nodes.SkipNode

    def invisible_visit(self, node):
        """Invisible nodes should be ignored."""
        raise nodes.SkipNode

    visit_comment = invisible_visit
    visit_substitution_definition = invisible_visit
    visit_target = invisible_visit
    visit_pending = invisible_visit