genshi/genshi-test: genshi/output.py comparison

comparison genshi/output.py @ 784:67d324a62cc0 experimental-match-fastpaths

Update to the 0.5.x branch, up through r907. I don't know how this fits in with the SoC work, but I wanted to do due diligence and keep this branch working in case it someday gets considered for trunk.

author	aflett
date	Mon, 21 Jul 2008 23:17:52 +0000
parents	8f2c7023af94
children

comparison

equal deleted inserted replaced

-:8f2c7023af94
+:67d324a62cc0
 'html', '-//W3C//DTD XHTML 1.0 Frameset//EN',
 'http://www.w3.org/TR/xhtml1/DTD/xhtml1-frameset.dtd'
 )
 XHTML = XHTML_STRICT
+XHTML11 = (
+'html', '-//W3C//DTD XHTML 1.1//EN',
+'http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd'
+)
 SVG_FULL = (
 'svg', '-//W3C//DTD SVG 1.1//EN',
 'http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd'
 )
 SVG_BASIC = (
 declaration for the specified name.
 The following names are recognized in this version:
 * "html" or "html-strict" for the HTML 4.01 strict DTD
 * "html-transitional" for the HTML 4.01 transitional DTD
-* "html-transitional" for the HTML 4.01 frameset DTD
+* "html-frameset" for the HTML 4.01 frameset DTD
 * "html5" for the ``DOCTYPE`` proposed for HTML5
 * "xhtml" or "xhtml-strict" for the XHTML 1.0 strict DTD
 * "xhtml-transitional" for the XHTML 1.0 transitional DTD
 * "xhtml-frameset" for the XHTML 1.0 frameset DTD
+* "xhtml11" for the XHTML 1.1 DTD
 * "svg" or "svg-full" for the SVG 1.1 DTD
 * "svg-basic" for the SVG Basic 1.1 DTD
 * "svg-tiny" for the SVG Tiny 1.1 DTD
 :param name: the name of the ``DOCTYPE``
 'html-frameset': DocType.HTML_FRAMESET,
 'html5': cls.HTML5,
 'xhtml': cls.XHTML, 'xhtml-strict': cls.XHTML_STRICT,
 'xhtml-transitional': cls.XHTML_TRANSITIONAL,
 'xhtml-frameset': cls.XHTML_FRAMESET,
+'xhtml11': cls.XHTML11,
 'svg': cls.SVG, 'svg-full': cls.SVG_FULL,
 'svg-basic': cls.SVG_BASIC,
 'svg-tiny': cls.SVG_TINY
 }.get(name.lower())
 get = classmethod(get)
 QName('pre'), QName('http://www.w3.org/1999/xhtml}pre'),
 QName('textarea'), QName('http://www.w3.org/1999/xhtml}textarea')
 ])
 def __init__(self, doctype=None, strip_whitespace=True,
-namespace_prefixes=None):
+namespace_prefixes=None, drop_xml_decl=True):
 super(XHTMLSerializer, self).__init__(doctype, False)
 self.filters = [EmptyTagFilter()]
 if strip_whitespace:
 self.filters.append(WhitespaceFilter(self._PRESERVE_SPACE))
 namespace_prefixes = namespace_prefixes or {}
 namespace_prefixes['http://www.w3.org/1999/xhtml'] = ''
 self.filters.append(NamespaceFlattener(prefixes=namespace_prefixes))
 if doctype:
 self.filters.append(DocTypeInserter(doctype))
+self.drop_xml_decl = drop_xml_decl
 def __call__(self, stream):
 boolean_attrs = self._BOOLEAN_ATTRS
 empty_elems = self._EMPTY_ELEMS
-have_doctype = False
+drop_xml_decl = self.drop_xml_decl
+have_decl = have_doctype = False
 in_cdata = False
 for filter_ in self.filters:
 stream = filter_(stream)
 for kind, data, pos in stream:
 buf.append(' "%s"')
 buf.append('>\n')
 yield Markup(u''.join(buf)) % filter(None, data)
 have_doctype = True
+elif kind is XML_DECL and not have_decl and not drop_xml_decl:
+version, encoding, standalone = data
+buf = ['<?xml version="%s"' % version]
+if encoding:
+buf.append(' encoding="%s"' % encoding)
+if standalone != -1:
+standalone = standalone and 'yes' or 'no'
+buf.append(' standalone="%s"' % standalone)
+buf.append('?>\n')
+yield Markup(u''.join(buf))
+have_decl = True
 elif kind is START_CDATA:
 yield Markup('<![CDATA[')
 in_cdata = True
 elif kind is END_CDATA:
 >>> elem = tag.div(Markup('<a href="foo">Hello &amp; Bye!</a><br/>'))
 >>> print elem.generate().render(TextSerializer)
 <a href="foo">Hello &amp; Bye!</a><br/>
-You can use the `strip_markup` to change this behavior, so that tags and
+You can use the ``strip_markup`` to change this behavior, so that tags and
 entities are stripped from the output (or in the case of entities,
 replaced with the equivalent character):
 >>> print elem.generate().render(TextSerializer, strip_markup=True)
 Hello & Bye!
 """
 def __init__(self, strip_markup=False):
+"""Create the serializer.
+:param strip_markup: whether markup (tags and encoded characters) found
+in the text should be removed
+"""
 self.strip_markup = strip_markup
 def __call__(self, stream):
 strip_markup = self.strip_markup
 for event in stream:

Mercurial > genshi > genshi-test

comparison genshi/output.py @ 784:67d324a62cc0 experimental-match-fastpaths